diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,151271 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.06875, + "eval_steps": 500, + "global_step": 13750, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "global_step": 1, + "learning_rate": 2.5e-06, + "loss": 6.0015, + "loss_base2": 8.6583, + "loss_pixel": 0.7156, + "loss_text": 5.2858, + "ppl": 404.0344, + "step": 1 + }, + { + "epoch": 0.0, + "global_step": 2, + "learning_rate": 5e-06, + "loss": 6.0018, + "loss_base2": 8.6588, + "loss_pixel": 0.7157, + "loss_text": 5.2861, + "ppl": 404.1556, + "step": 2 + }, + { + "epoch": 0.0, + "global_step": 3, + "learning_rate": 7.5e-06, + "loss": 5.9599, + "loss_base2": 8.5983, + "loss_pixel": 0.6826, + "loss_text": 5.2772, + "ppl": 387.5714, + "step": 3 + }, + { + "epoch": 0.0, + "global_step": 4, + "learning_rate": 1e-05, + "loss": 5.8847, + "loss_base2": 8.4898, + "loss_pixel": 0.6266, + "loss_text": 5.2581, + "ppl": 359.4949, + "step": 4 + }, + { + "epoch": 0.0, + "global_step": 5, + "learning_rate": 1.25e-05, + "loss": 5.799, + "loss_base2": 8.3662, + "loss_pixel": 0.5689, + "loss_text": 5.2301, + "ppl": 329.9694, + "step": 5 + }, + { + "epoch": 0.0, + "global_step": 6, + "learning_rate": 1.5e-05, + "loss": 5.7186, + "loss_base2": 8.2502, + "loss_pixel": 0.5278, + "loss_text": 5.1908, + "ppl": 304.4784, + "step": 6 + }, + { + "epoch": 0.0, + "global_step": 7, + "learning_rate": 1.7500000000000002e-05, + "loss": 5.6337, + "loss_base2": 8.1277, + "loss_pixel": 0.5006, + "loss_text": 5.1331, + "ppl": 279.6951, + "step": 7 + }, + { + "epoch": 0.0, + "global_step": 8, + "learning_rate": 2e-05, + "loss": 5.536, + "loss_base2": 7.9868, + "loss_pixel": 0.4794, + "loss_text": 5.0565, + "ppl": 253.6613, + "step": 8 + }, + { + "epoch": 0.0, + "global_step": 9, + "learning_rate": 2.2499999999999998e-05, + "loss": 5.4228, + "loss_base2": 7.8234, + "loss_pixel": 0.4617, + "loss_text": 4.9611, + "ppl": 226.5125, + "step": 9 + }, + { + "epoch": 0.0, + "global_step": 10, + "learning_rate": 2.5e-05, + "loss": 5.3213, + "loss_base2": 7.677, + "loss_pixel": 0.4483, + "loss_text": 4.873, + "ppl": 204.6498, + "step": 10 + }, + { + "epoch": 0.0, + "global_step": 11, + "learning_rate": 2.75e-05, + "loss": 5.217, + "loss_base2": 7.5265, + "loss_pixel": 0.4363, + "loss_text": 4.7807, + "ppl": 184.3802, + "step": 11 + }, + { + "epoch": 0.0, + "global_step": 12, + "learning_rate": 3e-05, + "loss": 5.1381, + "loss_base2": 7.4127, + "loss_pixel": 0.4261, + "loss_text": 4.712, + "ppl": 170.3917, + "step": 12 + }, + { + "epoch": 0.0, + "global_step": 13, + "learning_rate": 3.2500000000000004e-05, + "loss": 5.0797, + "loss_base2": 7.3285, + "loss_pixel": 0.4157, + "loss_text": 4.6641, + "ppl": 160.7258, + "step": 13 + }, + { + "epoch": 0.0, + "global_step": 14, + "learning_rate": 3.5000000000000004e-05, + "loss": 5.0206, + "loss_base2": 7.2432, + "loss_pixel": 0.4068, + "loss_text": 4.6137, + "ppl": 151.5022, + "step": 14 + }, + { + "epoch": 0.0, + "global_step": 15, + "learning_rate": 3.75e-05, + "loss": 4.9759, + "loss_base2": 7.1787, + "loss_pixel": 0.4011, + "loss_text": 4.5748, + "ppl": 144.8792, + "step": 15 + }, + { + "epoch": 0.0, + "global_step": 16, + "learning_rate": 4e-05, + "loss": 4.9438, + "loss_base2": 7.1324, + "loss_pixel": 0.3966, + "loss_text": 4.5472, + "ppl": 140.3024, + "step": 16 + }, + { + "epoch": 0.0, + "global_step": 17, + "learning_rate": 4.25e-05, + "loss": 4.9132, + "loss_base2": 7.0882, + "loss_pixel": 0.3926, + "loss_text": 4.5206, + "ppl": 136.0742, + "step": 17 + }, + { + "epoch": 0.0, + "global_step": 18, + "learning_rate": 4.4999999999999996e-05, + "loss": 4.8813, + "loss_base2": 7.0422, + "loss_pixel": 0.3898, + "loss_text": 4.4915, + "ppl": 131.8019, + "step": 18 + }, + { + "epoch": 0.0, + "global_step": 19, + "learning_rate": 4.75e-05, + "loss": 4.853, + "loss_base2": 7.0014, + "loss_pixel": 0.3877, + "loss_text": 4.4652, + "ppl": 128.1242, + "step": 19 + }, + { + "epoch": 0.0, + "global_step": 20, + "learning_rate": 5e-05, + "loss": 4.8239, + "loss_base2": 6.9594, + "loss_pixel": 0.3859, + "loss_text": 4.438, + "ppl": 124.4495, + "step": 20 + }, + { + "epoch": 0.0, + "global_step": 21, + "learning_rate": 5.25e-05, + "loss": 4.8015, + "loss_base2": 6.9271, + "loss_pixel": 0.3853, + "loss_text": 4.4161, + "ppl": 121.6928, + "step": 21 + }, + { + "epoch": 0.0, + "global_step": 22, + "learning_rate": 5.5e-05, + "loss": 4.7777, + "loss_base2": 6.8928, + "loss_pixel": 0.3845, + "loss_text": 4.3932, + "ppl": 118.8307, + "step": 22 + }, + { + "epoch": 0.0, + "global_step": 23, + "learning_rate": 5.75e-05, + "loss": 4.7395, + "loss_base2": 6.8377, + "loss_pixel": 0.3841, + "loss_text": 4.3554, + "ppl": 114.377, + "step": 23 + }, + { + "epoch": 0.0, + "global_step": 24, + "learning_rate": 6e-05, + "loss": 4.7171, + "loss_base2": 6.8053, + "loss_pixel": 0.3846, + "loss_text": 4.3325, + "ppl": 111.8434, + "step": 24 + }, + { + "epoch": 0.0, + "global_step": 25, + "learning_rate": 6.25e-05, + "loss": 4.693, + "loss_base2": 6.7706, + "loss_pixel": 0.3845, + "loss_text": 4.3085, + "ppl": 109.1802, + "step": 25 + }, + { + "epoch": 0.0, + "global_step": 26, + "learning_rate": 6.500000000000001e-05, + "loss": 4.6667, + "loss_base2": 6.7326, + "loss_pixel": 0.3853, + "loss_text": 4.2814, + "ppl": 106.3462, + "step": 26 + }, + { + "epoch": 0.0, + "global_step": 27, + "learning_rate": 6.75e-05, + "loss": 4.6428, + "loss_base2": 6.6981, + "loss_pixel": 0.3853, + "loss_text": 4.2576, + "ppl": 103.8347, + "step": 27 + }, + { + "epoch": 0.0, + "global_step": 28, + "learning_rate": 7.000000000000001e-05, + "loss": 4.6076, + "loss_base2": 6.6474, + "loss_pixel": 0.3862, + "loss_text": 4.2214, + "ppl": 100.2433, + "step": 28 + }, + { + "epoch": 0.0, + "global_step": 29, + "learning_rate": 7.25e-05, + "loss": 4.5756, + "loss_base2": 6.6012, + "loss_pixel": 0.3849, + "loss_text": 4.1907, + "ppl": 97.0863, + "step": 29 + }, + { + "epoch": 0.0, + "global_step": 30, + "learning_rate": 7.5e-05, + "loss": 4.5488, + "loss_base2": 6.5625, + "loss_pixel": 0.3851, + "loss_text": 4.1637, + "ppl": 94.5189, + "step": 30 + }, + { + "epoch": 0.0, + "global_step": 31, + "learning_rate": 7.75e-05, + "loss": 4.513, + "loss_base2": 6.5109, + "loss_pixel": 0.3837, + "loss_text": 4.1293, + "ppl": 91.195, + "step": 31 + }, + { + "epoch": 0.0, + "global_step": 32, + "learning_rate": 8e-05, + "loss": 4.4795, + "loss_base2": 6.4626, + "loss_pixel": 0.3832, + "loss_text": 4.0962, + "ppl": 88.1906, + "step": 32 + }, + { + "epoch": 0.0, + "global_step": 33, + "learning_rate": 8.25e-05, + "loss": 4.4519, + "loss_base2": 6.4227, + "loss_pixel": 0.383, + "loss_text": 4.0689, + "ppl": 85.7898, + "step": 33 + }, + { + "epoch": 0.0, + "global_step": 34, + "learning_rate": 8.5e-05, + "loss": 4.4144, + "loss_base2": 6.3686, + "loss_pixel": 0.3822, + "loss_text": 4.0322, + "ppl": 82.6322, + "step": 34 + }, + { + "epoch": 0.0, + "global_step": 35, + "learning_rate": 8.75e-05, + "loss": 4.3992, + "loss_base2": 6.3467, + "loss_pixel": 0.3816, + "loss_text": 4.0175, + "ppl": 81.3857, + "step": 35 + }, + { + "epoch": 0.0, + "global_step": 36, + "learning_rate": 8.999999999999999e-05, + "loss": 4.3634, + "loss_base2": 6.2951, + "loss_pixel": 0.3814, + "loss_text": 3.982, + "ppl": 78.5237, + "step": 36 + }, + { + "epoch": 0.0, + "global_step": 37, + "learning_rate": 9.25e-05, + "loss": 4.3384, + "loss_base2": 6.259, + "loss_pixel": 0.3816, + "loss_text": 3.9568, + "ppl": 76.5849, + "step": 37 + }, + { + "epoch": 0.0, + "global_step": 38, + "learning_rate": 9.5e-05, + "loss": 4.3119, + "loss_base2": 6.2208, + "loss_pixel": 0.3806, + "loss_text": 3.9313, + "ppl": 74.5821, + "step": 38 + }, + { + "epoch": 0.0, + "global_step": 39, + "learning_rate": 9.750000000000001e-05, + "loss": 4.2996, + "loss_base2": 6.203, + "loss_pixel": 0.3808, + "loss_text": 3.9188, + "ppl": 73.6703, + "step": 39 + }, + { + "epoch": 0.0, + "global_step": 40, + "learning_rate": 0.0001, + "loss": 4.2666, + "loss_base2": 6.1554, + "loss_pixel": 0.3805, + "loss_text": 3.8861, + "ppl": 71.2789, + "step": 40 + }, + { + "epoch": 0.0, + "global_step": 41, + "learning_rate": 0.0001025, + "loss": 4.2494, + "loss_base2": 6.1306, + "loss_pixel": 0.381, + "loss_text": 3.8683, + "ppl": 70.0634, + "step": 41 + }, + { + "epoch": 0.0, + "global_step": 42, + "learning_rate": 0.000105, + "loss": 4.2234, + "loss_base2": 6.0931, + "loss_pixel": 0.3806, + "loss_text": 3.8428, + "ppl": 68.2652, + "step": 42 + }, + { + "epoch": 0.0, + "global_step": 43, + "learning_rate": 0.0001075, + "loss": 4.2088, + "loss_base2": 6.072, + "loss_pixel": 0.3812, + "loss_text": 3.8276, + "ppl": 67.2758, + "step": 43 + }, + { + "epoch": 0.0, + "global_step": 44, + "learning_rate": 0.00011, + "loss": 4.1889, + "loss_base2": 6.0433, + "loss_pixel": 0.3808, + "loss_text": 3.8081, + "ppl": 65.9502, + "step": 44 + }, + { + "epoch": 0.0, + "global_step": 45, + "learning_rate": 0.00011250000000000001, + "loss": 4.1737, + "loss_base2": 6.0214, + "loss_pixel": 0.381, + "loss_text": 3.7927, + "ppl": 64.9553, + "step": 45 + }, + { + "epoch": 0.0, + "global_step": 46, + "learning_rate": 0.000115, + "loss": 4.2223, + "loss_base2": 6.0915, + "loss_pixel": 0.3818, + "loss_text": 3.8405, + "ppl": 68.1901, + "step": 46 + }, + { + "epoch": 0.0, + "global_step": 47, + "learning_rate": 0.0001175, + "loss": 4.2372, + "loss_base2": 6.113, + "loss_pixel": 0.3807, + "loss_text": 3.8565, + "ppl": 69.2138, + "step": 47 + }, + { + "epoch": 0.0, + "global_step": 48, + "learning_rate": 0.00012, + "loss": 4.2087, + "loss_base2": 6.0719, + "loss_pixel": 0.3804, + "loss_text": 3.8284, + "ppl": 67.269, + "step": 48 + }, + { + "epoch": 0.0, + "global_step": 49, + "learning_rate": 0.0001225, + "loss": 4.1838, + "loss_base2": 6.0359, + "loss_pixel": 0.3802, + "loss_text": 3.8037, + "ppl": 65.6147, + "step": 49 + }, + { + "epoch": 0.0, + "global_step": 50, + "learning_rate": 0.000125, + "loss": 4.1626, + "loss_base2": 6.0054, + "loss_pixel": 0.3799, + "loss_text": 3.7827, + "ppl": 64.2383, + "step": 50 + }, + { + "epoch": 0.0, + "global_step": 51, + "learning_rate": 0.0001275, + "loss": 4.1453, + "loss_base2": 5.9804, + "loss_pixel": 0.3794, + "loss_text": 3.7658, + "ppl": 63.1366, + "step": 51 + }, + { + "epoch": 0.0, + "global_step": 52, + "learning_rate": 0.00013000000000000002, + "loss": 4.1279, + "loss_base2": 5.9553, + "loss_pixel": 0.3797, + "loss_text": 3.7482, + "ppl": 62.0475, + "step": 52 + }, + { + "epoch": 0.0, + "global_step": 53, + "learning_rate": 0.00013250000000000002, + "loss": 4.1225, + "loss_base2": 5.9475, + "loss_pixel": 0.3792, + "loss_text": 3.7433, + "ppl": 61.7133, + "step": 53 + }, + { + "epoch": 0.0, + "global_step": 54, + "learning_rate": 0.000135, + "loss": 4.1726, + "loss_base2": 6.0198, + "loss_pixel": 0.3794, + "loss_text": 3.7932, + "ppl": 64.8839, + "step": 54 + }, + { + "epoch": 0.0, + "global_step": 55, + "learning_rate": 0.0001375, + "loss": 4.1576, + "loss_base2": 5.9981, + "loss_pixel": 0.3802, + "loss_text": 3.7774, + "ppl": 63.9179, + "step": 55 + }, + { + "epoch": 0.0, + "global_step": 56, + "learning_rate": 0.00014000000000000001, + "loss": 4.1421, + "loss_base2": 5.9758, + "loss_pixel": 0.3792, + "loss_text": 3.7628, + "ppl": 62.9348, + "step": 56 + }, + { + "epoch": 0.0, + "global_step": 57, + "learning_rate": 0.0001425, + "loss": 4.1346, + "loss_base2": 5.965, + "loss_pixel": 0.3794, + "loss_text": 3.7552, + "ppl": 62.4646, + "step": 57 + }, + { + "epoch": 0.0, + "global_step": 58, + "learning_rate": 0.000145, + "loss": 4.1477, + "loss_base2": 5.9839, + "loss_pixel": 0.3786, + "loss_text": 3.7691, + "ppl": 63.2883, + "step": 58 + }, + { + "epoch": 0.0, + "global_step": 59, + "learning_rate": 0.0001475, + "loss": 4.1242, + "loss_base2": 5.95, + "loss_pixel": 0.379, + "loss_text": 3.7452, + "ppl": 61.8183, + "step": 59 + }, + { + "epoch": 0.0, + "global_step": 60, + "learning_rate": 0.00015, + "loss": 4.1092, + "loss_base2": 5.9283, + "loss_pixel": 0.3798, + "loss_text": 3.7294, + "ppl": 60.898, + "step": 60 + }, + { + "epoch": 0.0, + "global_step": 61, + "learning_rate": 0.0001525, + "loss": 4.1017, + "loss_base2": 5.9175, + "loss_pixel": 0.3787, + "loss_text": 3.7231, + "ppl": 60.443, + "step": 61 + }, + { + "epoch": 0.0, + "global_step": 62, + "learning_rate": 0.000155, + "loss": 4.0881, + "loss_base2": 5.8979, + "loss_pixel": 0.3782, + "loss_text": 3.7099, + "ppl": 59.6265, + "step": 62 + }, + { + "epoch": 0.0, + "global_step": 63, + "learning_rate": 0.0001575, + "loss": 4.0798, + "loss_base2": 5.8859, + "loss_pixel": 0.378, + "loss_text": 3.7018, + "ppl": 59.1336, + "step": 63 + }, + { + "epoch": 0.0, + "global_step": 64, + "learning_rate": 0.00016, + "loss": 4.0695, + "loss_base2": 5.871, + "loss_pixel": 0.3793, + "loss_text": 3.6903, + "ppl": 58.5277, + "step": 64 + }, + { + "epoch": 0.0, + "global_step": 65, + "learning_rate": 0.00016250000000000002, + "loss": 4.0675, + "loss_base2": 5.8682, + "loss_pixel": 0.3816, + "loss_text": 3.686, + "ppl": 58.4108, + "step": 65 + }, + { + "epoch": 0.0, + "global_step": 66, + "learning_rate": 0.000165, + "loss": 4.0543, + "loss_base2": 5.8491, + "loss_pixel": 0.3817, + "loss_text": 3.6726, + "ppl": 57.6448, + "step": 66 + }, + { + "epoch": 0.0, + "global_step": 67, + "learning_rate": 0.0001675, + "loss": 4.0428, + "loss_base2": 5.8325, + "loss_pixel": 0.378, + "loss_text": 3.6648, + "ppl": 56.9857, + "step": 67 + }, + { + "epoch": 0.0, + "global_step": 68, + "learning_rate": 0.00017, + "loss": 4.0327, + "loss_base2": 5.818, + "loss_pixel": 0.3761, + "loss_text": 3.6566, + "ppl": 56.413, + "step": 68 + }, + { + "epoch": 0.0, + "global_step": 69, + "learning_rate": 0.0001725, + "loss": 4.023, + "loss_base2": 5.804, + "loss_pixel": 0.3819, + "loss_text": 3.6412, + "ppl": 55.8685, + "step": 69 + }, + { + "epoch": 0.0, + "global_step": 70, + "learning_rate": 0.000175, + "loss": 4.0716, + "loss_base2": 5.8741, + "loss_pixel": 0.4254, + "loss_text": 3.6463, + "ppl": 58.6507, + "step": 70 + }, + { + "epoch": 0.0, + "global_step": 71, + "learning_rate": 0.0001775, + "loss": 4.0159, + "loss_base2": 5.7937, + "loss_pixel": 0.3849, + "loss_text": 3.631, + "ppl": 55.4732, + "step": 71 + }, + { + "epoch": 0.0, + "global_step": 72, + "learning_rate": 0.00017999999999999998, + "loss": 4.0085, + "loss_base2": 5.783, + "loss_pixel": 0.3824, + "loss_text": 3.6261, + "ppl": 55.0642, + "step": 72 + }, + { + "epoch": 0.0, + "global_step": 73, + "learning_rate": 0.0001825, + "loss": 4.0226, + "loss_base2": 5.8034, + "loss_pixel": 0.3797, + "loss_text": 3.643, + "ppl": 55.8461, + "step": 73 + }, + { + "epoch": 0.0, + "global_step": 74, + "learning_rate": 0.000185, + "loss": 3.9813, + "loss_base2": 5.7438, + "loss_pixel": 0.3817, + "loss_text": 3.5996, + "ppl": 53.5867, + "step": 74 + }, + { + "epoch": 0.0, + "global_step": 75, + "learning_rate": 0.0001875, + "loss": 3.9879, + "loss_base2": 5.7533, + "loss_pixel": 0.3822, + "loss_text": 3.6057, + "ppl": 53.9415, + "step": 75 + }, + { + "epoch": 0.0, + "global_step": 76, + "learning_rate": 0.00019, + "loss": 3.966, + "loss_base2": 5.7217, + "loss_pixel": 0.3813, + "loss_text": 3.5847, + "ppl": 52.773, + "step": 76 + }, + { + "epoch": 0.0, + "global_step": 77, + "learning_rate": 0.00019250000000000002, + "loss": 3.955, + "loss_base2": 5.7059, + "loss_pixel": 0.3804, + "loss_text": 3.5747, + "ppl": 52.1957, + "step": 77 + }, + { + "epoch": 0.0, + "global_step": 78, + "learning_rate": 0.00019500000000000002, + "loss": 3.9475, + "loss_base2": 5.695, + "loss_pixel": 0.3803, + "loss_text": 3.5672, + "ppl": 51.8057, + "step": 78 + }, + { + "epoch": 0.0, + "global_step": 79, + "learning_rate": 0.0001975, + "loss": 3.9516, + "loss_base2": 5.701, + "loss_pixel": 0.3793, + "loss_text": 3.5723, + "ppl": 52.0185, + "step": 79 + }, + { + "epoch": 0.0, + "global_step": 80, + "learning_rate": 0.0002, + "loss": 3.9383, + "loss_base2": 5.6818, + "loss_pixel": 0.3789, + "loss_text": 3.5594, + "ppl": 51.3313, + "step": 80 + }, + { + "epoch": 0.0, + "global_step": 81, + "learning_rate": 0.00020250000000000002, + "loss": 3.9163, + "loss_base2": 5.65, + "loss_pixel": 0.3788, + "loss_text": 3.5375, + "ppl": 50.2143, + "step": 81 + }, + { + "epoch": 0.0, + "global_step": 82, + "learning_rate": 0.000205, + "loss": 3.9252, + "loss_base2": 5.6629, + "loss_pixel": 0.3777, + "loss_text": 3.5475, + "ppl": 50.6632, + "step": 82 + }, + { + "epoch": 0.0, + "global_step": 83, + "learning_rate": 0.0002075, + "loss": 3.9026, + "loss_base2": 5.6303, + "loss_pixel": 0.3778, + "loss_text": 3.5247, + "ppl": 49.5311, + "step": 83 + }, + { + "epoch": 0.0, + "global_step": 84, + "learning_rate": 0.00021, + "loss": 3.8938, + "loss_base2": 5.6176, + "loss_pixel": 0.3769, + "loss_text": 3.5169, + "ppl": 49.0971, + "step": 84 + }, + { + "epoch": 0.0, + "global_step": 85, + "learning_rate": 0.0002125, + "loss": 3.8918, + "loss_base2": 5.6147, + "loss_pixel": 0.377, + "loss_text": 3.5149, + "ppl": 48.999, + "step": 85 + }, + { + "epoch": 0.0, + "global_step": 86, + "learning_rate": 0.000215, + "loss": 3.8795, + "loss_base2": 5.5969, + "loss_pixel": 0.3756, + "loss_text": 3.5038, + "ppl": 48.4, + "step": 86 + }, + { + "epoch": 0.0, + "global_step": 87, + "learning_rate": 0.0002175, + "loss": 3.871, + "loss_base2": 5.5847, + "loss_pixel": 0.3744, + "loss_text": 3.4966, + "ppl": 47.9904, + "step": 87 + }, + { + "epoch": 0.0, + "global_step": 88, + "learning_rate": 0.00022, + "loss": 3.8765, + "loss_base2": 5.5926, + "loss_pixel": 0.3743, + "loss_text": 3.5022, + "ppl": 48.255, + "step": 88 + }, + { + "epoch": 0.0, + "global_step": 89, + "learning_rate": 0.00022250000000000001, + "loss": 3.8691, + "loss_base2": 5.5819, + "loss_pixel": 0.3946, + "loss_text": 3.4745, + "ppl": 47.8993, + "step": 89 + }, + { + "epoch": 0.0, + "global_step": 90, + "learning_rate": 0.00022500000000000002, + "loss": 4.0012, + "loss_base2": 5.7725, + "loss_pixel": 0.5244, + "loss_text": 3.4768, + "ppl": 54.6637, + "step": 90 + }, + { + "epoch": 0.0, + "global_step": 91, + "learning_rate": 0.0002275, + "loss": 3.8736, + "loss_base2": 5.5884, + "loss_pixel": 0.4044, + "loss_text": 3.4691, + "ppl": 48.1153, + "step": 91 + }, + { + "epoch": 0.0, + "global_step": 92, + "learning_rate": 0.00023, + "loss": 3.8492, + "loss_base2": 5.5532, + "loss_pixel": 0.3834, + "loss_text": 3.4658, + "ppl": 46.9555, + "step": 92 + }, + { + "epoch": 0.0, + "global_step": 93, + "learning_rate": 0.0002325, + "loss": 3.8508, + "loss_base2": 5.5555, + "loss_pixel": 0.3897, + "loss_text": 3.4611, + "ppl": 47.0307, + "step": 93 + }, + { + "epoch": 0.0, + "global_step": 94, + "learning_rate": 0.000235, + "loss": 3.8389, + "loss_base2": 5.5384, + "loss_pixel": 0.3931, + "loss_text": 3.4458, + "ppl": 46.4743, + "step": 94 + }, + { + "epoch": 0.0, + "global_step": 95, + "learning_rate": 0.0002375, + "loss": 3.8347, + "loss_base2": 5.5323, + "loss_pixel": 0.3921, + "loss_text": 3.4426, + "ppl": 46.2795, + "step": 95 + }, + { + "epoch": 0.0, + "global_step": 96, + "learning_rate": 0.00024, + "loss": 3.8494, + "loss_base2": 5.5535, + "loss_pixel": 0.3892, + "loss_text": 3.4602, + "ppl": 46.9649, + "step": 96 + }, + { + "epoch": 0.0, + "global_step": 97, + "learning_rate": 0.00024249999999999999, + "loss": 3.9233, + "loss_base2": 5.6601, + "loss_pixel": 0.3852, + "loss_text": 3.5382, + "ppl": 50.567, + "step": 97 + }, + { + "epoch": 0.0, + "global_step": 98, + "learning_rate": 0.000245, + "loss": 3.8921, + "loss_base2": 5.6151, + "loss_pixel": 0.3832, + "loss_text": 3.5088, + "ppl": 49.0137, + "step": 98 + }, + { + "epoch": 0.0, + "global_step": 99, + "learning_rate": 0.0002475, + "loss": 3.8663, + "loss_base2": 5.5779, + "loss_pixel": 0.3835, + "loss_text": 3.4829, + "ppl": 47.7653, + "step": 99 + }, + { + "epoch": 0.0, + "global_step": 100, + "learning_rate": 0.00025, + "loss": 3.8408, + "loss_base2": 5.5411, + "loss_pixel": 0.3838, + "loss_text": 3.457, + "ppl": 46.5627, + "step": 100 + }, + { + "epoch": 0.0, + "global_step": 101, + "learning_rate": 0.0002525, + "loss": 3.8075, + "loss_base2": 5.4931, + "loss_pixel": 0.3846, + "loss_text": 3.4229, + "ppl": 45.0377, + "step": 101 + }, + { + "epoch": 0.0, + "global_step": 102, + "learning_rate": 0.000255, + "loss": 3.7758, + "loss_base2": 5.4473, + "loss_pixel": 0.3848, + "loss_text": 3.391, + "ppl": 43.6324, + "step": 102 + }, + { + "epoch": 0.0, + "global_step": 103, + "learning_rate": 0.0002575, + "loss": 3.7572, + "loss_base2": 5.4205, + "loss_pixel": 0.3835, + "loss_text": 3.3737, + "ppl": 42.8283, + "step": 103 + }, + { + "epoch": 0.0, + "global_step": 104, + "learning_rate": 0.00026000000000000003, + "loss": 3.7368, + "loss_base2": 5.3911, + "loss_pixel": 0.3824, + "loss_text": 3.3544, + "ppl": 41.9635, + "step": 104 + }, + { + "epoch": 0.0, + "global_step": 105, + "learning_rate": 0.00026250000000000004, + "loss": 3.7127, + "loss_base2": 5.3563, + "loss_pixel": 0.3826, + "loss_text": 3.3301, + "ppl": 40.9643, + "step": 105 + }, + { + "epoch": 0.0, + "global_step": 106, + "learning_rate": 0.00026500000000000004, + "loss": 3.6868, + "loss_base2": 5.3189, + "loss_pixel": 0.3812, + "loss_text": 3.3056, + "ppl": 39.9169, + "step": 106 + }, + { + "epoch": 0.0, + "global_step": 107, + "learning_rate": 0.0002675, + "loss": 3.6626, + "loss_base2": 5.284, + "loss_pixel": 0.3808, + "loss_text": 3.2818, + "ppl": 38.9625, + "step": 107 + }, + { + "epoch": 0.0, + "global_step": 108, + "learning_rate": 0.00027, + "loss": 3.6359, + "loss_base2": 5.2455, + "loss_pixel": 0.3806, + "loss_text": 3.2553, + "ppl": 37.936, + "step": 108 + }, + { + "epoch": 0.0, + "global_step": 109, + "learning_rate": 0.0002725, + "loss": 3.6217, + "loss_base2": 5.225, + "loss_pixel": 0.3807, + "loss_text": 3.241, + "ppl": 37.4011, + "step": 109 + }, + { + "epoch": 0.0, + "global_step": 110, + "learning_rate": 0.000275, + "loss": 3.59, + "loss_base2": 5.1793, + "loss_pixel": 0.3803, + "loss_text": 3.2097, + "ppl": 36.2341, + "step": 110 + }, + { + "epoch": 0.0, + "global_step": 111, + "learning_rate": 0.0002775, + "loss": 3.5906, + "loss_base2": 5.1801, + "loss_pixel": 0.3797, + "loss_text": 3.2109, + "ppl": 36.2558, + "step": 111 + }, + { + "epoch": 0.0, + "global_step": 112, + "learning_rate": 0.00028000000000000003, + "loss": 3.5783, + "loss_base2": 5.1624, + "loss_pixel": 0.3799, + "loss_text": 3.1985, + "ppl": 35.8126, + "step": 112 + }, + { + "epoch": 0.0, + "global_step": 113, + "learning_rate": 0.0002825, + "loss": 3.9224, + "loss_base2": 5.6588, + "loss_pixel": 0.3802, + "loss_text": 3.5422, + "ppl": 50.5216, + "step": 113 + }, + { + "epoch": 0.0, + "global_step": 114, + "learning_rate": 0.000285, + "loss": 3.8456, + "loss_base2": 5.548, + "loss_pixel": 0.379, + "loss_text": 3.4667, + "ppl": 46.7867, + "step": 114 + }, + { + "epoch": 0.0, + "global_step": 115, + "learning_rate": 0.0002875, + "loss": 3.8397, + "loss_base2": 5.5395, + "loss_pixel": 0.3798, + "loss_text": 3.4599, + "ppl": 46.5115, + "step": 115 + }, + { + "epoch": 0.0, + "global_step": 116, + "learning_rate": 0.00029, + "loss": 3.7928, + "loss_base2": 5.4719, + "loss_pixel": 0.378, + "loss_text": 3.4147, + "ppl": 44.3805, + "step": 116 + }, + { + "epoch": 0.0, + "global_step": 117, + "learning_rate": 0.0002925, + "loss": 3.7708, + "loss_base2": 5.4401, + "loss_pixel": 0.3769, + "loss_text": 3.3938, + "ppl": 43.4148, + "step": 117 + }, + { + "epoch": 0.0, + "global_step": 118, + "learning_rate": 0.000295, + "loss": 3.7713, + "loss_base2": 5.4408, + "loss_pixel": 0.3776, + "loss_text": 3.3937, + "ppl": 43.4365, + "step": 118 + }, + { + "epoch": 0.0, + "global_step": 119, + "learning_rate": 0.00029749999999999997, + "loss": 3.731, + "loss_base2": 5.3827, + "loss_pixel": 0.3776, + "loss_text": 3.3534, + "ppl": 41.7208, + "step": 119 + }, + { + "epoch": 0.0, + "global_step": 120, + "learning_rate": 0.0003, + "loss": 3.7119, + "loss_base2": 5.3551, + "loss_pixel": 0.377, + "loss_text": 3.3349, + "ppl": 40.9315, + "step": 120 + }, + { + "epoch": 0.0, + "global_step": 121, + "learning_rate": 0.0003025, + "loss": 3.7459, + "loss_base2": 5.4042, + "loss_pixel": 0.3814, + "loss_text": 3.3646, + "ppl": 42.3471, + "step": 121 + }, + { + "epoch": 0.0, + "global_step": 122, + "learning_rate": 0.000305, + "loss": 3.7249, + "loss_base2": 5.3739, + "loss_pixel": 0.4016, + "loss_text": 3.3233, + "ppl": 41.4671, + "step": 122 + }, + { + "epoch": 0.0, + "global_step": 123, + "learning_rate": 0.0003075, + "loss": 3.6853, + "loss_base2": 5.3168, + "loss_pixel": 0.3933, + "loss_text": 3.2919, + "ppl": 39.8571, + "step": 123 + }, + { + "epoch": 0.0, + "global_step": 124, + "learning_rate": 0.00031, + "loss": 3.6616, + "loss_base2": 5.2826, + "loss_pixel": 0.3802, + "loss_text": 3.2814, + "ppl": 38.9236, + "step": 124 + }, + { + "epoch": 0.0, + "global_step": 125, + "learning_rate": 0.0003125, + "loss": 3.6682, + "loss_base2": 5.2921, + "loss_pixel": 0.3801, + "loss_text": 3.2881, + "ppl": 39.1813, + "step": 125 + }, + { + "epoch": 0.0, + "global_step": 126, + "learning_rate": 0.000315, + "loss": 3.6423, + "loss_base2": 5.2547, + "loss_pixel": 0.3835, + "loss_text": 3.2587, + "ppl": 38.1795, + "step": 126 + }, + { + "epoch": 0.0, + "global_step": 127, + "learning_rate": 0.0003175, + "loss": 3.6384, + "loss_base2": 5.2491, + "loss_pixel": 0.3839, + "loss_text": 3.2545, + "ppl": 38.0309, + "step": 127 + }, + { + "epoch": 0.0, + "global_step": 128, + "learning_rate": 0.00032, + "loss": 3.626, + "loss_base2": 5.2312, + "loss_pixel": 0.3809, + "loss_text": 3.2451, + "ppl": 37.5623, + "step": 128 + }, + { + "epoch": 0.0, + "global_step": 129, + "learning_rate": 0.00032250000000000003, + "loss": 3.6187, + "loss_base2": 5.2207, + "loss_pixel": 0.3823, + "loss_text": 3.2364, + "ppl": 37.2891, + "step": 129 + }, + { + "epoch": 0.0, + "global_step": 130, + "learning_rate": 0.00032500000000000004, + "loss": 3.6106, + "loss_base2": 5.209, + "loss_pixel": 0.3829, + "loss_text": 3.2278, + "ppl": 36.9882, + "step": 130 + }, + { + "epoch": 0.0, + "global_step": 131, + "learning_rate": 0.00032750000000000005, + "loss": 3.6095, + "loss_base2": 5.2074, + "loss_pixel": 0.3843, + "loss_text": 3.2252, + "ppl": 36.9476, + "step": 131 + }, + { + "epoch": 0.0, + "global_step": 132, + "learning_rate": 0.00033, + "loss": 3.5958, + "loss_base2": 5.1876, + "loss_pixel": 0.3813, + "loss_text": 3.2145, + "ppl": 36.4448, + "step": 132 + }, + { + "epoch": 0.0, + "global_step": 133, + "learning_rate": 0.0003325, + "loss": 3.6018, + "loss_base2": 5.1963, + "loss_pixel": 0.3815, + "loss_text": 3.2203, + "ppl": 36.6642, + "step": 133 + }, + { + "epoch": 0.0, + "global_step": 134, + "learning_rate": 0.000335, + "loss": 3.5729, + "loss_base2": 5.1546, + "loss_pixel": 0.382, + "loss_text": 3.191, + "ppl": 35.6197, + "step": 134 + }, + { + "epoch": 0.0, + "global_step": 135, + "learning_rate": 0.0003375, + "loss": 3.5856, + "loss_base2": 5.1729, + "loss_pixel": 0.3863, + "loss_text": 3.1993, + "ppl": 36.075, + "step": 135 + }, + { + "epoch": 0.0, + "global_step": 136, + "learning_rate": 0.00034, + "loss": 3.5825, + "loss_base2": 5.1685, + "loss_pixel": 0.3827, + "loss_text": 3.1998, + "ppl": 35.9633, + "step": 136 + }, + { + "epoch": 0.0, + "global_step": 137, + "learning_rate": 0.00034250000000000003, + "loss": 3.5764, + "loss_base2": 5.1597, + "loss_pixel": 0.3833, + "loss_text": 3.1931, + "ppl": 35.7446, + "step": 137 + }, + { + "epoch": 0.0, + "global_step": 138, + "learning_rate": 0.000345, + "loss": 3.5469, + "loss_base2": 5.1171, + "loss_pixel": 0.3811, + "loss_text": 3.1659, + "ppl": 34.7056, + "step": 138 + }, + { + "epoch": 0.0, + "global_step": 139, + "learning_rate": 0.0003475, + "loss": 3.5537, + "loss_base2": 5.1269, + "loss_pixel": 0.3822, + "loss_text": 3.1716, + "ppl": 34.9424, + "step": 139 + }, + { + "epoch": 0.0, + "global_step": 140, + "learning_rate": 0.00035, + "loss": 3.5573, + "loss_base2": 5.1321, + "loss_pixel": 0.3822, + "loss_text": 3.1751, + "ppl": 35.0684, + "step": 140 + }, + { + "epoch": 0.0, + "global_step": 141, + "learning_rate": 0.0003525, + "loss": 3.5622, + "loss_base2": 5.1392, + "loss_pixel": 0.3829, + "loss_text": 3.1793, + "ppl": 35.2406, + "step": 141 + }, + { + "epoch": 0.0, + "global_step": 142, + "learning_rate": 0.000355, + "loss": 3.5722, + "loss_base2": 5.1536, + "loss_pixel": 0.3824, + "loss_text": 3.1898, + "ppl": 35.5948, + "step": 142 + }, + { + "epoch": 0.0, + "global_step": 143, + "learning_rate": 0.0003575, + "loss": 3.5453, + "loss_base2": 5.1148, + "loss_pixel": 0.3795, + "loss_text": 3.1657, + "ppl": 34.6501, + "step": 143 + }, + { + "epoch": 0.0, + "global_step": 144, + "learning_rate": 0.00035999999999999997, + "loss": 3.5456, + "loss_base2": 5.1152, + "loss_pixel": 0.3809, + "loss_text": 3.1646, + "ppl": 34.6605, + "step": 144 + }, + { + "epoch": 0.0, + "global_step": 145, + "learning_rate": 0.0003625, + "loss": 3.5258, + "loss_base2": 5.0867, + "loss_pixel": 0.3804, + "loss_text": 3.1454, + "ppl": 33.9809, + "step": 145 + }, + { + "epoch": 0.0, + "global_step": 146, + "learning_rate": 0.000365, + "loss": 3.5203, + "loss_base2": 5.0787, + "loss_pixel": 0.3801, + "loss_text": 3.1402, + "ppl": 33.7946, + "step": 146 + }, + { + "epoch": 0.0, + "global_step": 147, + "learning_rate": 0.0003675, + "loss": 3.5207, + "loss_base2": 5.0793, + "loss_pixel": 0.3798, + "loss_text": 3.1409, + "ppl": 33.8081, + "step": 147 + }, + { + "epoch": 0.0, + "global_step": 148, + "learning_rate": 0.00037, + "loss": 3.522, + "loss_base2": 5.0812, + "loss_pixel": 0.379, + "loss_text": 3.143, + "ppl": 33.8521, + "step": 148 + }, + { + "epoch": 0.0, + "global_step": 149, + "learning_rate": 0.0003725, + "loss": 3.4984, + "loss_base2": 5.0471, + "loss_pixel": 0.3799, + "loss_text": 3.1185, + "ppl": 33.0625, + "step": 149 + }, + { + "epoch": 0.0, + "global_step": 150, + "learning_rate": 0.000375, + "loss": 3.4794, + "loss_base2": 5.0197, + "loss_pixel": 0.3793, + "loss_text": 3.1001, + "ppl": 32.4403, + "step": 150 + }, + { + "epoch": 0.0, + "global_step": 151, + "learning_rate": 0.0003775, + "loss": 3.4851, + "loss_base2": 5.0279, + "loss_pixel": 0.3793, + "loss_text": 3.1058, + "ppl": 32.6257, + "step": 151 + }, + { + "epoch": 0.0, + "global_step": 152, + "learning_rate": 0.00038, + "loss": 3.485, + "loss_base2": 5.0278, + "loss_pixel": 0.3793, + "loss_text": 3.1056, + "ppl": 32.6224, + "step": 152 + }, + { + "epoch": 0.0, + "global_step": 153, + "learning_rate": 0.00038250000000000003, + "loss": 3.4869, + "loss_base2": 5.0305, + "loss_pixel": 0.3793, + "loss_text": 3.1076, + "ppl": 32.6845, + "step": 153 + }, + { + "epoch": 0.0, + "global_step": 154, + "learning_rate": 0.00038500000000000003, + "loss": 3.4787, + "loss_base2": 5.0187, + "loss_pixel": 0.3788, + "loss_text": 3.0998, + "ppl": 32.4176, + "step": 154 + }, + { + "epoch": 0.0, + "global_step": 155, + "learning_rate": 0.00038750000000000004, + "loss": 3.4662, + "loss_base2": 5.0007, + "loss_pixel": 0.3789, + "loss_text": 3.0873, + "ppl": 32.0149, + "step": 155 + }, + { + "epoch": 0.0, + "global_step": 156, + "learning_rate": 0.00039000000000000005, + "loss": 3.4568, + "loss_base2": 4.9871, + "loss_pixel": 0.379, + "loss_text": 3.0778, + "ppl": 31.7153, + "step": 156 + }, + { + "epoch": 0.0, + "global_step": 157, + "learning_rate": 0.0003925, + "loss": 3.4569, + "loss_base2": 4.9873, + "loss_pixel": 0.3789, + "loss_text": 3.0781, + "ppl": 31.7185, + "step": 157 + }, + { + "epoch": 0.0, + "global_step": 158, + "learning_rate": 0.000395, + "loss": 3.4475, + "loss_base2": 4.9737, + "loss_pixel": 0.3785, + "loss_text": 3.069, + "ppl": 31.4217, + "step": 158 + }, + { + "epoch": 0.0, + "global_step": 159, + "learning_rate": 0.0003975, + "loss": 3.4604, + "loss_base2": 4.9923, + "loss_pixel": 0.3784, + "loss_text": 3.082, + "ppl": 31.8297, + "step": 159 + }, + { + "epoch": 0.0, + "global_step": 160, + "learning_rate": 0.0004, + "loss": 3.4557, + "loss_base2": 4.9855, + "loss_pixel": 0.3785, + "loss_text": 3.0772, + "ppl": 31.6805, + "step": 160 + }, + { + "epoch": 0.0, + "global_step": 161, + "learning_rate": 0.0004025, + "loss": 3.4971, + "loss_base2": 5.0452, + "loss_pixel": 0.3784, + "loss_text": 3.1187, + "ppl": 33.0196, + "step": 161 + }, + { + "epoch": 0.0, + "global_step": 162, + "learning_rate": 0.00040500000000000003, + "loss": 3.543, + "loss_base2": 5.1115, + "loss_pixel": 0.3775, + "loss_text": 3.1656, + "ppl": 34.5705, + "step": 162 + }, + { + "epoch": 0.0, + "global_step": 163, + "learning_rate": 0.0004075, + "loss": 3.6593, + "loss_base2": 5.2793, + "loss_pixel": 0.3775, + "loss_text": 3.2818, + "ppl": 38.8341, + "step": 163 + }, + { + "epoch": 0.0, + "global_step": 164, + "learning_rate": 0.00041, + "loss": 3.4828, + "loss_base2": 5.0246, + "loss_pixel": 0.3775, + "loss_text": 3.1053, + "ppl": 32.5507, + "step": 164 + }, + { + "epoch": 0.0, + "global_step": 165, + "learning_rate": 0.0004125, + "loss": 3.4825, + "loss_base2": 5.0242, + "loss_pixel": 0.3777, + "loss_text": 3.1048, + "ppl": 32.541, + "step": 165 + }, + { + "epoch": 0.0, + "global_step": 166, + "learning_rate": 0.000415, + "loss": 3.4516, + "loss_base2": 4.9796, + "loss_pixel": 0.3764, + "loss_text": 3.0751, + "ppl": 31.5508, + "step": 166 + }, + { + "epoch": 0.0, + "global_step": 167, + "learning_rate": 0.0004175, + "loss": 3.4111, + "loss_base2": 4.9212, + "loss_pixel": 0.3757, + "loss_text": 3.0353, + "ppl": 30.2986, + "step": 167 + }, + { + "epoch": 0.0, + "global_step": 168, + "learning_rate": 0.00042, + "loss": 3.3904, + "loss_base2": 4.8913, + "loss_pixel": 0.3759, + "loss_text": 3.0145, + "ppl": 29.6778, + "step": 168 + }, + { + "epoch": 0.0, + "global_step": 169, + "learning_rate": 0.00042249999999999997, + "loss": 3.5964, + "loss_base2": 5.1885, + "loss_pixel": 0.3764, + "loss_text": 3.22, + "ppl": 36.4667, + "step": 169 + }, + { + "epoch": 0.0, + "global_step": 170, + "learning_rate": 0.000425, + "loss": 3.4291, + "loss_base2": 4.9471, + "loss_pixel": 0.3747, + "loss_text": 3.0545, + "ppl": 30.8489, + "step": 170 + }, + { + "epoch": 0.0, + "global_step": 171, + "learning_rate": 0.0004275, + "loss": 3.3753, + "loss_base2": 4.8695, + "loss_pixel": 0.375, + "loss_text": 3.0003, + "ppl": 29.2331, + "step": 171 + }, + { + "epoch": 0.0, + "global_step": 172, + "learning_rate": 0.00043, + "loss": 3.3571, + "loss_base2": 4.8433, + "loss_pixel": 0.3744, + "loss_text": 2.9826, + "ppl": 28.7058, + "step": 172 + }, + { + "epoch": 0.0, + "global_step": 173, + "learning_rate": 0.0004325, + "loss": 3.3334, + "loss_base2": 4.8091, + "loss_pixel": 0.3741, + "loss_text": 2.9593, + "ppl": 28.0335, + "step": 173 + }, + { + "epoch": 0.0, + "global_step": 174, + "learning_rate": 0.000435, + "loss": 3.3242, + "loss_base2": 4.7958, + "loss_pixel": 0.375, + "loss_text": 2.9492, + "ppl": 27.7768, + "step": 174 + }, + { + "epoch": 0.0, + "global_step": 175, + "learning_rate": 0.0004375, + "loss": 3.3141, + "loss_base2": 4.7812, + "loss_pixel": 0.3739, + "loss_text": 2.9401, + "ppl": 27.4976, + "step": 175 + }, + { + "epoch": 0.0, + "global_step": 176, + "learning_rate": 0.00044, + "loss": 3.3093, + "loss_base2": 4.7743, + "loss_pixel": 0.3748, + "loss_text": 2.9345, + "ppl": 27.366, + "step": 176 + }, + { + "epoch": 0.0, + "global_step": 177, + "learning_rate": 0.0004425, + "loss": 3.4203, + "loss_base2": 4.9344, + "loss_pixel": 0.3734, + "loss_text": 3.0469, + "ppl": 30.5786, + "step": 177 + }, + { + "epoch": 0.0, + "global_step": 178, + "learning_rate": 0.00044500000000000003, + "loss": 3.565, + "loss_base2": 5.1432, + "loss_pixel": 0.374, + "loss_text": 3.191, + "ppl": 35.3395, + "step": 178 + }, + { + "epoch": 0.0, + "global_step": 179, + "learning_rate": 0.00044750000000000004, + "loss": 3.5573, + "loss_base2": 5.1321, + "loss_pixel": 0.3737, + "loss_text": 3.1837, + "ppl": 35.0684, + "step": 179 + }, + { + "epoch": 0.0, + "global_step": 180, + "learning_rate": 0.00045000000000000004, + "loss": 3.5001, + "loss_base2": 5.0496, + "loss_pixel": 0.3721, + "loss_text": 3.128, + "ppl": 33.1188, + "step": 180 + }, + { + "epoch": 0.0, + "global_step": 181, + "learning_rate": 0.00045250000000000005, + "loss": 3.4996, + "loss_base2": 5.0489, + "loss_pixel": 0.372, + "loss_text": 3.1275, + "ppl": 33.1022, + "step": 181 + }, + { + "epoch": 0.0, + "global_step": 182, + "learning_rate": 0.000455, + "loss": 3.5246, + "loss_base2": 5.0849, + "loss_pixel": 0.3718, + "loss_text": 3.1529, + "ppl": 33.9402, + "step": 182 + }, + { + "epoch": 0.0, + "global_step": 183, + "learning_rate": 0.0004575, + "loss": 3.455, + "loss_base2": 4.9845, + "loss_pixel": 0.3711, + "loss_text": 3.0838, + "ppl": 31.6583, + "step": 183 + }, + { + "epoch": 0.0, + "global_step": 184, + "learning_rate": 0.00046, + "loss": 3.4509, + "loss_base2": 4.9786, + "loss_pixel": 0.3706, + "loss_text": 3.0803, + "ppl": 31.5288, + "step": 184 + }, + { + "epoch": 0.0, + "global_step": 185, + "learning_rate": 0.0004625, + "loss": 3.4488, + "loss_base2": 4.9756, + "loss_pixel": 0.3706, + "loss_text": 3.0782, + "ppl": 31.4626, + "step": 185 + }, + { + "epoch": 0.0, + "global_step": 186, + "learning_rate": 0.000465, + "loss": 3.4321, + "loss_base2": 4.9515, + "loss_pixel": 0.3704, + "loss_text": 3.0617, + "ppl": 30.9416, + "step": 186 + }, + { + "epoch": 0.0, + "global_step": 187, + "learning_rate": 0.00046750000000000003, + "loss": 3.4353, + "loss_base2": 4.9561, + "loss_pixel": 0.3696, + "loss_text": 3.0657, + "ppl": 31.0407, + "step": 187 + }, + { + "epoch": 0.0, + "global_step": 188, + "learning_rate": 0.00047, + "loss": 3.3677, + "loss_base2": 4.8586, + "loss_pixel": 0.3699, + "loss_text": 2.9978, + "ppl": 29.0117, + "step": 188 + }, + { + "epoch": 0.0, + "global_step": 189, + "learning_rate": 0.0004725, + "loss": 3.4067, + "loss_base2": 4.9148, + "loss_pixel": 0.3698, + "loss_text": 3.0369, + "ppl": 30.1655, + "step": 189 + }, + { + "epoch": 0.0, + "global_step": 190, + "learning_rate": 0.000475, + "loss": 3.397, + "loss_base2": 4.9008, + "loss_pixel": 0.3691, + "loss_text": 3.0279, + "ppl": 29.8743, + "step": 190 + }, + { + "epoch": 0.0, + "global_step": 191, + "learning_rate": 0.0004775, + "loss": 3.3876, + "loss_base2": 4.8873, + "loss_pixel": 0.369, + "loss_text": 3.0185, + "ppl": 29.5948, + "step": 191 + }, + { + "epoch": 0.0, + "global_step": 192, + "learning_rate": 0.00048, + "loss": 3.402, + "loss_base2": 4.908, + "loss_pixel": 0.3677, + "loss_text": 3.0343, + "ppl": 30.0241, + "step": 192 + }, + { + "epoch": 0.0, + "global_step": 193, + "learning_rate": 0.0004825, + "loss": 3.3701, + "loss_base2": 4.862, + "loss_pixel": 0.3665, + "loss_text": 3.0035, + "ppl": 29.0814, + "step": 193 + }, + { + "epoch": 0.0, + "global_step": 194, + "learning_rate": 0.00048499999999999997, + "loss": 3.3727, + "loss_base2": 4.8658, + "loss_pixel": 0.3663, + "loss_text": 3.0065, + "ppl": 29.1571, + "step": 194 + }, + { + "epoch": 0.0, + "global_step": 195, + "learning_rate": 0.0004875, + "loss": 3.3578, + "loss_base2": 4.8443, + "loss_pixel": 0.3652, + "loss_text": 2.9925, + "ppl": 28.7259, + "step": 195 + }, + { + "epoch": 0.0, + "global_step": 196, + "learning_rate": 0.00049, + "loss": 3.3579, + "loss_base2": 4.8444, + "loss_pixel": 0.3644, + "loss_text": 2.9935, + "ppl": 28.7288, + "step": 196 + }, + { + "epoch": 0.0, + "global_step": 197, + "learning_rate": 0.0004925, + "loss": 3.3318, + "loss_base2": 4.8068, + "loss_pixel": 0.3641, + "loss_text": 2.9677, + "ppl": 27.9887, + "step": 197 + }, + { + "epoch": 0.0, + "global_step": 198, + "learning_rate": 0.000495, + "loss": 3.3419, + "loss_base2": 4.8213, + "loss_pixel": 0.3645, + "loss_text": 2.9774, + "ppl": 28.2728, + "step": 198 + }, + { + "epoch": 0.0, + "global_step": 199, + "learning_rate": 0.0004975, + "loss": 3.3508, + "loss_base2": 4.8342, + "loss_pixel": 0.3623, + "loss_text": 2.9885, + "ppl": 28.5255, + "step": 199 + }, + { + "epoch": 0.0, + "global_step": 200, + "learning_rate": 0.0005, + "loss": 3.3253, + "loss_base2": 4.7974, + "loss_pixel": 0.3614, + "loss_text": 2.9639, + "ppl": 27.8073, + "step": 200 + }, + { + "epoch": 0.0, + "global_step": 201, + "learning_rate": 0.0004999958263772955, + "loss": 3.3265, + "loss_base2": 4.7991, + "loss_pixel": 0.3607, + "loss_text": 2.9657, + "ppl": 27.8407, + "step": 201 + }, + { + "epoch": 0.0, + "global_step": 202, + "learning_rate": 0.000499991652754591, + "loss": 3.3189, + "loss_base2": 4.7882, + "loss_pixel": 0.3596, + "loss_text": 2.9593, + "ppl": 27.6299, + "step": 202 + }, + { + "epoch": 0.0, + "global_step": 203, + "learning_rate": 0.0004999874791318864, + "loss": 3.3106, + "loss_base2": 4.7762, + "loss_pixel": 0.3604, + "loss_text": 2.9502, + "ppl": 27.4016, + "step": 203 + }, + { + "epoch": 0.0, + "global_step": 204, + "learning_rate": 0.0004999833055091819, + "loss": 3.3231, + "loss_base2": 4.7942, + "loss_pixel": 0.3716, + "loss_text": 2.9515, + "ppl": 27.7462, + "step": 204 + }, + { + "epoch": 0.0, + "global_step": 205, + "learning_rate": 0.0004999791318864774, + "loss": 3.3096, + "loss_base2": 4.7747, + "loss_pixel": 0.3841, + "loss_text": 2.9256, + "ppl": 27.3742, + "step": 205 + }, + { + "epoch": 0.0, + "global_step": 206, + "learning_rate": 0.000499974958263773, + "loss": 3.3008, + "loss_base2": 4.762, + "loss_pixel": 0.3659, + "loss_text": 2.9349, + "ppl": 27.1343, + "step": 206 + }, + { + "epoch": 0.0, + "global_step": 207, + "learning_rate": 0.0004999707846410685, + "loss": 3.2965, + "loss_base2": 4.7558, + "loss_pixel": 0.3723, + "loss_text": 2.9242, + "ppl": 27.0179, + "step": 207 + }, + { + "epoch": 0.0, + "global_step": 208, + "learning_rate": 0.000499966611018364, + "loss": 3.3042, + "loss_base2": 4.767, + "loss_pixel": 0.3682, + "loss_text": 2.9359, + "ppl": 27.2268, + "step": 208 + }, + { + "epoch": 0.0, + "global_step": 209, + "learning_rate": 0.0004999624373956595, + "loss": 3.2841, + "loss_base2": 4.738, + "loss_pixel": 0.3635, + "loss_text": 2.9206, + "ppl": 26.685, + "step": 209 + }, + { + "epoch": 0.0, + "global_step": 210, + "learning_rate": 0.000499958263772955, + "loss": 3.2685, + "loss_base2": 4.7154, + "loss_pixel": 0.3636, + "loss_text": 2.9049, + "ppl": 26.2719, + "step": 210 + }, + { + "epoch": 0.0, + "global_step": 211, + "learning_rate": 0.0004999540901502505, + "loss": 3.2696, + "loss_base2": 4.717, + "loss_pixel": 0.3636, + "loss_text": 2.9061, + "ppl": 26.3008, + "step": 211 + }, + { + "epoch": 0.0, + "global_step": 212, + "learning_rate": 0.0004999499165275459, + "loss": 3.246, + "loss_base2": 4.683, + "loss_pixel": 0.3625, + "loss_text": 2.8835, + "ppl": 25.6874, + "step": 212 + }, + { + "epoch": 0.0, + "global_step": 213, + "learning_rate": 0.0004999457429048414, + "loss": 3.2579, + "loss_base2": 4.7002, + "loss_pixel": 0.36, + "loss_text": 2.8978, + "ppl": 25.9949, + "step": 213 + }, + { + "epoch": 0.0, + "global_step": 214, + "learning_rate": 0.0004999415692821369, + "loss": 3.25, + "loss_base2": 4.6888, + "loss_pixel": 0.359, + "loss_text": 2.891, + "ppl": 25.7903, + "step": 214 + }, + { + "epoch": 0.0, + "global_step": 215, + "learning_rate": 0.0004999373956594324, + "loss": 3.2656, + "loss_base2": 4.7113, + "loss_pixel": 0.3589, + "loss_text": 2.9067, + "ppl": 26.1958, + "step": 215 + }, + { + "epoch": 0.0, + "global_step": 216, + "learning_rate": 0.0004999332220367279, + "loss": 3.229, + "loss_base2": 4.6585, + "loss_pixel": 0.3585, + "loss_text": 2.8705, + "ppl": 25.2544, + "step": 216 + }, + { + "epoch": 0.0, + "global_step": 217, + "learning_rate": 0.0004999290484140234, + "loss": 3.2431, + "loss_base2": 4.6788, + "loss_pixel": 0.3613, + "loss_text": 2.8819, + "ppl": 25.613, + "step": 217 + }, + { + "epoch": 0.0, + "global_step": 218, + "learning_rate": 0.0004999248747913189, + "loss": 3.3007, + "loss_base2": 4.7619, + "loss_pixel": 0.3782, + "loss_text": 2.9225, + "ppl": 27.1316, + "step": 218 + }, + { + "epoch": 0.0, + "global_step": 219, + "learning_rate": 0.0004999207011686143, + "loss": 3.2636, + "loss_base2": 4.7084, + "loss_pixel": 0.3689, + "loss_text": 2.8947, + "ppl": 26.1435, + "step": 219 + }, + { + "epoch": 0.0, + "global_step": 220, + "learning_rate": 0.0004999165275459098, + "loss": 3.2626, + "loss_base2": 4.7069, + "loss_pixel": 0.3752, + "loss_text": 2.8874, + "ppl": 26.1174, + "step": 220 + }, + { + "epoch": 0.0, + "global_step": 221, + "learning_rate": 0.0004999123539232053, + "loss": 3.2611, + "loss_base2": 4.7048, + "loss_pixel": 0.3666, + "loss_text": 2.8945, + "ppl": 26.0782, + "step": 221 + }, + { + "epoch": 0.0, + "global_step": 222, + "learning_rate": 0.0004999081803005008, + "loss": 3.2605, + "loss_base2": 4.7039, + "loss_pixel": 0.3705, + "loss_text": 2.89, + "ppl": 26.0626, + "step": 222 + }, + { + "epoch": 0.0, + "global_step": 223, + "learning_rate": 0.0004999040066777964, + "loss": 3.2533, + "loss_base2": 4.6935, + "loss_pixel": 0.3691, + "loss_text": 2.8842, + "ppl": 25.8756, + "step": 223 + }, + { + "epoch": 0.0, + "global_step": 224, + "learning_rate": 0.0004998998330550919, + "loss": 3.2464, + "loss_base2": 4.6836, + "loss_pixel": 0.3645, + "loss_text": 2.8819, + "ppl": 25.6977, + "step": 224 + }, + { + "epoch": 0.0, + "global_step": 225, + "learning_rate": 0.0004998956594323873, + "loss": 3.2254, + "loss_base2": 4.6533, + "loss_pixel": 0.3627, + "loss_text": 2.8627, + "ppl": 25.1636, + "step": 225 + }, + { + "epoch": 0.0, + "global_step": 226, + "learning_rate": 0.0004998914858096828, + "loss": 3.2128, + "loss_base2": 4.6351, + "loss_pixel": 0.3634, + "loss_text": 2.8495, + "ppl": 24.8486, + "step": 226 + }, + { + "epoch": 0.0, + "global_step": 227, + "learning_rate": 0.0004998873121869783, + "loss": 3.2545, + "loss_base2": 4.6953, + "loss_pixel": 0.3603, + "loss_text": 2.8942, + "ppl": 25.9067, + "step": 227 + }, + { + "epoch": 0.0, + "global_step": 228, + "learning_rate": 0.0004998831385642738, + "loss": 3.2208, + "loss_base2": 4.6466, + "loss_pixel": 0.3594, + "loss_text": 2.8614, + "ppl": 25.0482, + "step": 228 + }, + { + "epoch": 0.0, + "global_step": 229, + "learning_rate": 0.0004998789649415693, + "loss": 3.2133, + "loss_base2": 4.6358, + "loss_pixel": 0.3592, + "loss_text": 2.8541, + "ppl": 24.861, + "step": 229 + }, + { + "epoch": 0.0, + "global_step": 230, + "learning_rate": 0.0004998747913188648, + "loss": 3.1869, + "loss_base2": 4.5977, + "loss_pixel": 0.3578, + "loss_text": 2.8291, + "ppl": 24.2132, + "step": 230 + }, + { + "epoch": 0.0, + "global_step": 231, + "learning_rate": 0.0004998706176961603, + "loss": 3.1824, + "loss_base2": 4.5912, + "loss_pixel": 0.3562, + "loss_text": 2.8261, + "ppl": 24.1045, + "step": 231 + }, + { + "epoch": 0.0, + "global_step": 232, + "learning_rate": 0.0004998664440734558, + "loss": 3.1707, + "loss_base2": 4.5744, + "loss_pixel": 0.3544, + "loss_text": 2.8164, + "ppl": 23.8242, + "step": 232 + }, + { + "epoch": 0.0, + "global_step": 233, + "learning_rate": 0.0004998622704507513, + "loss": 3.1743, + "loss_base2": 4.5795, + "loss_pixel": 0.3535, + "loss_text": 2.8208, + "ppl": 23.9101, + "step": 233 + }, + { + "epoch": 0.0, + "global_step": 234, + "learning_rate": 0.0004998580968280468, + "loss": 3.1682, + "loss_base2": 4.5707, + "loss_pixel": 0.3531, + "loss_text": 2.815, + "ppl": 23.7647, + "step": 234 + }, + { + "epoch": 0.0, + "global_step": 235, + "learning_rate": 0.0004998539232053422, + "loss": 3.1664, + "loss_base2": 4.5681, + "loss_pixel": 0.3507, + "loss_text": 2.8157, + "ppl": 23.7219, + "step": 235 + }, + { + "epoch": 0.0, + "global_step": 236, + "learning_rate": 0.0004998497495826377, + "loss": 3.1547, + "loss_base2": 4.5513, + "loss_pixel": 0.3495, + "loss_text": 2.8052, + "ppl": 23.446, + "step": 236 + }, + { + "epoch": 0.0, + "global_step": 237, + "learning_rate": 0.0004998455759599332, + "loss": 3.1588, + "loss_base2": 4.5572, + "loss_pixel": 0.3489, + "loss_text": 2.8099, + "ppl": 23.5423, + "step": 237 + }, + { + "epoch": 0.0, + "global_step": 238, + "learning_rate": 0.0004998414023372287, + "loss": 3.1535, + "loss_base2": 4.5495, + "loss_pixel": 0.3469, + "loss_text": 2.8066, + "ppl": 23.4179, + "step": 238 + }, + { + "epoch": 0.0, + "global_step": 239, + "learning_rate": 0.0004998372287145241, + "loss": 3.1463, + "loss_base2": 4.5392, + "loss_pixel": 0.3464, + "loss_text": 2.7999, + "ppl": 23.2499, + "step": 239 + }, + { + "epoch": 0.0, + "global_step": 240, + "learning_rate": 0.0004998330550918197, + "loss": 3.1405, + "loss_base2": 4.5308, + "loss_pixel": 0.3464, + "loss_text": 2.7941, + "ppl": 23.1154, + "step": 240 + }, + { + "epoch": 0.0, + "global_step": 241, + "learning_rate": 0.0004998288814691152, + "loss": 3.1233, + "loss_base2": 4.506, + "loss_pixel": 0.3447, + "loss_text": 2.7786, + "ppl": 22.7212, + "step": 241 + }, + { + "epoch": 0.0, + "global_step": 242, + "learning_rate": 0.0004998247078464107, + "loss": 3.1368, + "loss_base2": 4.5254, + "loss_pixel": 0.3426, + "loss_text": 2.7941, + "ppl": 23.0301, + "step": 242 + }, + { + "epoch": 0.0, + "global_step": 243, + "learning_rate": 0.0004998205342237062, + "loss": 3.1204, + "loss_base2": 4.5018, + "loss_pixel": 0.3428, + "loss_text": 2.7776, + "ppl": 22.6554, + "step": 243 + }, + { + "epoch": 0.0, + "global_step": 244, + "learning_rate": 0.0004998163606010017, + "loss": 3.1167, + "loss_base2": 4.4964, + "loss_pixel": 0.3411, + "loss_text": 2.7756, + "ppl": 22.5718, + "step": 244 + }, + { + "epoch": 0.0, + "global_step": 245, + "learning_rate": 0.0004998121869782972, + "loss": 3.1124, + "loss_base2": 4.4902, + "loss_pixel": 0.3395, + "loss_text": 2.7729, + "ppl": 22.4749, + "step": 245 + }, + { + "epoch": 0.0, + "global_step": 246, + "learning_rate": 0.0004998080133555927, + "loss": 3.1048, + "loss_base2": 4.4793, + "loss_pixel": 0.339, + "loss_text": 2.7658, + "ppl": 22.3048, + "step": 246 + }, + { + "epoch": 0.0, + "global_step": 247, + "learning_rate": 0.0004998038397328882, + "loss": 3.0983, + "loss_base2": 4.4699, + "loss_pixel": 0.3387, + "loss_text": 2.7596, + "ppl": 22.1602, + "step": 247 + }, + { + "epoch": 0.0, + "global_step": 248, + "learning_rate": 0.0004997996661101836, + "loss": 3.09, + "loss_base2": 4.4579, + "loss_pixel": 0.337, + "loss_text": 2.753, + "ppl": 21.9771, + "step": 248 + }, + { + "epoch": 0.0, + "global_step": 249, + "learning_rate": 0.0004997954924874791, + "loss": 3.1555, + "loss_base2": 4.5524, + "loss_pixel": 0.3364, + "loss_text": 2.8191, + "ppl": 23.4648, + "step": 249 + }, + { + "epoch": 0.0, + "global_step": 250, + "learning_rate": 0.0004997913188647746, + "loss": 3.1501, + "loss_base2": 4.5446, + "loss_pixel": 0.3368, + "loss_text": 2.8133, + "ppl": 23.3384, + "step": 250 + }, + { + "epoch": 0.0, + "global_step": 251, + "learning_rate": 0.0004997871452420701, + "loss": 3.1609, + "loss_base2": 4.5602, + "loss_pixel": 0.3434, + "loss_text": 2.8175, + "ppl": 23.5918, + "step": 251 + }, + { + "epoch": 0.0, + "global_step": 252, + "learning_rate": 0.0004997829716193656, + "loss": 3.1493, + "loss_base2": 4.5435, + "loss_pixel": 0.3639, + "loss_text": 2.7854, + "ppl": 23.3197, + "step": 252 + }, + { + "epoch": 0.0, + "global_step": 253, + "learning_rate": 0.0004997787979966611, + "loss": 3.4537, + "loss_base2": 4.9826, + "loss_pixel": 0.7014, + "loss_text": 2.7523, + "ppl": 31.6172, + "step": 253 + }, + { + "epoch": 0.0, + "global_step": 254, + "learning_rate": 0.0004997746243739566, + "loss": 3.1729, + "loss_base2": 4.5775, + "loss_pixel": 0.3754, + "loss_text": 2.7976, + "ppl": 23.8766, + "step": 254 + }, + { + "epoch": 0.0, + "global_step": 255, + "learning_rate": 0.0004997704507512522, + "loss": 3.1472, + "loss_base2": 4.5404, + "loss_pixel": 0.3737, + "loss_text": 2.7735, + "ppl": 23.2708, + "step": 255 + }, + { + "epoch": 0.0, + "global_step": 256, + "learning_rate": 0.0004997662771285477, + "loss": 3.2093, + "loss_base2": 4.63, + "loss_pixel": 0.3741, + "loss_text": 2.8352, + "ppl": 24.7617, + "step": 256 + }, + { + "epoch": 0.0, + "global_step": 257, + "learning_rate": 0.0004997621035058431, + "loss": 3.2454, + "loss_base2": 4.6821, + "loss_pixel": 0.3737, + "loss_text": 2.8717, + "ppl": 25.672, + "step": 257 + }, + { + "epoch": 0.0, + "global_step": 258, + "learning_rate": 0.0004997579298831386, + "loss": 3.2377, + "loss_base2": 4.671, + "loss_pixel": 0.369, + "loss_text": 2.8687, + "ppl": 25.4751, + "step": 258 + }, + { + "epoch": 0.0, + "global_step": 259, + "learning_rate": 0.0004997537562604341, + "loss": 3.2157, + "loss_base2": 4.6393, + "loss_pixel": 0.3706, + "loss_text": 2.8451, + "ppl": 24.9207, + "step": 259 + }, + { + "epoch": 0.0, + "global_step": 260, + "learning_rate": 0.0004997495826377296, + "loss": 3.2125, + "loss_base2": 4.6347, + "loss_pixel": 0.3705, + "loss_text": 2.842, + "ppl": 24.8411, + "step": 260 + }, + { + "epoch": 0.0, + "global_step": 261, + "learning_rate": 0.0004997454090150251, + "loss": 3.1863, + "loss_base2": 4.5969, + "loss_pixel": 0.3752, + "loss_text": 2.8111, + "ppl": 24.1987, + "step": 261 + }, + { + "epoch": 0.0, + "global_step": 262, + "learning_rate": 0.0004997412353923205, + "loss": 3.1891, + "loss_base2": 4.6009, + "loss_pixel": 0.3838, + "loss_text": 2.8052, + "ppl": 24.2666, + "step": 262 + }, + { + "epoch": 0.0, + "global_step": 263, + "learning_rate": 0.000499737061769616, + "loss": 3.1821, + "loss_base2": 4.5908, + "loss_pixel": 0.3785, + "loss_text": 2.8036, + "ppl": 24.0973, + "step": 263 + }, + { + "epoch": 0.0, + "global_step": 264, + "learning_rate": 0.0004997328881469115, + "loss": 3.1859, + "loss_base2": 4.5963, + "loss_pixel": 0.3869, + "loss_text": 2.799, + "ppl": 24.189, + "step": 264 + }, + { + "epoch": 0.0, + "global_step": 265, + "learning_rate": 0.000499728714524207, + "loss": 3.1803, + "loss_base2": 4.5882, + "loss_pixel": 0.3934, + "loss_text": 2.7869, + "ppl": 24.054, + "step": 265 + }, + { + "epoch": 0.0, + "global_step": 266, + "learning_rate": 0.0004997245409015025, + "loss": 3.1601, + "loss_base2": 4.5591, + "loss_pixel": 0.3883, + "loss_text": 2.7718, + "ppl": 23.573, + "step": 266 + }, + { + "epoch": 0.0, + "global_step": 267, + "learning_rate": 0.000499720367278798, + "loss": 3.1588, + "loss_base2": 4.5572, + "loss_pixel": 0.3865, + "loss_text": 2.7724, + "ppl": 23.5423, + "step": 267 + }, + { + "epoch": 0.0, + "global_step": 268, + "learning_rate": 0.0004997161936560935, + "loss": 3.1546, + "loss_base2": 4.5511, + "loss_pixel": 0.3876, + "loss_text": 2.767, + "ppl": 23.4437, + "step": 268 + }, + { + "epoch": 0.0, + "global_step": 269, + "learning_rate": 0.000499712020033389, + "loss": 3.1391, + "loss_base2": 4.5288, + "loss_pixel": 0.387, + "loss_text": 2.7521, + "ppl": 23.0831, + "step": 269 + }, + { + "epoch": 0.0, + "global_step": 270, + "learning_rate": 0.0004997078464106845, + "loss": 3.1377, + "loss_base2": 4.5267, + "loss_pixel": 0.3875, + "loss_text": 2.7503, + "ppl": 23.0508, + "step": 270 + }, + { + "epoch": 0.0, + "global_step": 271, + "learning_rate": 0.00049970367278798, + "loss": 3.1204, + "loss_base2": 4.5018, + "loss_pixel": 0.3845, + "loss_text": 2.7358, + "ppl": 22.6554, + "step": 271 + }, + { + "epoch": 0.0, + "global_step": 272, + "learning_rate": 0.0004996994991652755, + "loss": 3.1238, + "loss_base2": 4.5067, + "loss_pixel": 0.3839, + "loss_text": 2.7399, + "ppl": 22.7326, + "step": 272 + }, + { + "epoch": 0.0, + "global_step": 273, + "learning_rate": 0.000499695325542571, + "loss": 3.1072, + "loss_base2": 4.4827, + "loss_pixel": 0.385, + "loss_text": 2.7222, + "ppl": 22.3584, + "step": 273 + }, + { + "epoch": 0.0, + "global_step": 274, + "learning_rate": 0.0004996911519198665, + "loss": 3.122, + "loss_base2": 4.5041, + "loss_pixel": 0.3823, + "loss_text": 2.7397, + "ppl": 22.6917, + "step": 274 + }, + { + "epoch": 0.0, + "global_step": 275, + "learning_rate": 0.0004996869782971619, + "loss": 3.1195, + "loss_base2": 4.5005, + "loss_pixel": 0.3832, + "loss_text": 2.7363, + "ppl": 22.6351, + "step": 275 + }, + { + "epoch": 0.0, + "global_step": 276, + "learning_rate": 0.0004996828046744574, + "loss": 3.1135, + "loss_base2": 4.4918, + "loss_pixel": 0.3829, + "loss_text": 2.7305, + "ppl": 22.4997, + "step": 276 + }, + { + "epoch": 0.0, + "global_step": 277, + "learning_rate": 0.0004996786310517529, + "loss": 3.0952, + "loss_base2": 4.4654, + "loss_pixel": 0.3816, + "loss_text": 2.7136, + "ppl": 22.0917, + "step": 277 + }, + { + "epoch": 0.0, + "global_step": 278, + "learning_rate": 0.0004996744574290484, + "loss": 3.1008, + "loss_base2": 4.4735, + "loss_pixel": 0.3822, + "loss_text": 2.7186, + "ppl": 22.2157, + "step": 278 + }, + { + "epoch": 0.0, + "global_step": 279, + "learning_rate": 0.0004996702838063439, + "loss": 3.1031, + "loss_base2": 4.4768, + "loss_pixel": 0.3817, + "loss_text": 2.7213, + "ppl": 22.2669, + "step": 279 + }, + { + "epoch": 0.0, + "global_step": 280, + "learning_rate": 0.0004996661101836394, + "loss": 3.1239, + "loss_base2": 4.5068, + "loss_pixel": 0.3821, + "loss_text": 2.7418, + "ppl": 22.7349, + "step": 280 + }, + { + "epoch": 0.0, + "global_step": 281, + "learning_rate": 0.0004996619365609349, + "loss": 3.0724, + "loss_base2": 4.4325, + "loss_pixel": 0.3808, + "loss_text": 2.6916, + "ppl": 21.5937, + "step": 281 + }, + { + "epoch": 0.0, + "global_step": 282, + "learning_rate": 0.0004996577629382304, + "loss": 3.0578, + "loss_base2": 4.4115, + "loss_pixel": 0.3807, + "loss_text": 2.6771, + "ppl": 21.2807, + "step": 282 + }, + { + "epoch": 0.0, + "global_step": 283, + "learning_rate": 0.0004996535893155259, + "loss": 3.0344, + "loss_base2": 4.3777, + "loss_pixel": 0.3877, + "loss_text": 2.6467, + "ppl": 20.7885, + "step": 283 + }, + { + "epoch": 0.0, + "global_step": 284, + "learning_rate": 0.0004996494156928213, + "loss": 3.0462, + "loss_base2": 4.3947, + "loss_pixel": 0.4175, + "loss_text": 2.6287, + "ppl": 21.0353, + "step": 284 + }, + { + "epoch": 0.0, + "global_step": 285, + "learning_rate": 0.0004996452420701168, + "loss": 3.0207, + "loss_base2": 4.3579, + "loss_pixel": 0.3937, + "loss_text": 2.627, + "ppl": 20.5056, + "step": 285 + }, + { + "epoch": 0.0, + "global_step": 286, + "learning_rate": 0.0004996410684474123, + "loss": 2.9827, + "loss_base2": 4.3031, + "loss_pixel": 0.3845, + "loss_text": 2.5983, + "ppl": 19.741, + "step": 286 + }, + { + "epoch": 0.0, + "global_step": 287, + "learning_rate": 0.0004996368948247078, + "loss": 2.9718, + "loss_base2": 4.2874, + "loss_pixel": 0.3912, + "loss_text": 2.5806, + "ppl": 19.527, + "step": 287 + }, + { + "epoch": 0.0, + "global_step": 288, + "learning_rate": 0.0004996327212020034, + "loss": 2.9572, + "loss_base2": 4.2663, + "loss_pixel": 0.3951, + "loss_text": 2.5621, + "ppl": 19.244, + "step": 288 + }, + { + "epoch": 0.0, + "global_step": 289, + "learning_rate": 0.0004996285475792989, + "loss": 2.961, + "loss_base2": 4.2718, + "loss_pixel": 0.3922, + "loss_text": 2.5687, + "ppl": 19.3173, + "step": 289 + }, + { + "epoch": 0.0, + "global_step": 290, + "learning_rate": 0.0004996243739565944, + "loss": 2.9248, + "loss_base2": 4.2196, + "loss_pixel": 0.3878, + "loss_text": 2.537, + "ppl": 18.6305, + "step": 290 + }, + { + "epoch": 0.0, + "global_step": 291, + "learning_rate": 0.0004996202003338899, + "loss": 2.9296, + "loss_base2": 4.2265, + "loss_pixel": 0.3844, + "loss_text": 2.5451, + "ppl": 18.7201, + "step": 291 + }, + { + "epoch": 0.0, + "global_step": 292, + "learning_rate": 0.0004996160267111854, + "loss": 2.905, + "loss_base2": 4.191, + "loss_pixel": 0.384, + "loss_text": 2.521, + "ppl": 18.2652, + "step": 292 + }, + { + "epoch": 0.0, + "global_step": 293, + "learning_rate": 0.0004996118530884809, + "loss": 2.9046, + "loss_base2": 4.1905, + "loss_pixel": 0.3876, + "loss_text": 2.517, + "ppl": 18.2579, + "step": 293 + }, + { + "epoch": 0.0, + "global_step": 294, + "learning_rate": 0.0004996076794657763, + "loss": 2.9035, + "loss_base2": 4.1889, + "loss_pixel": 0.387, + "loss_text": 2.5165, + "ppl": 18.2379, + "step": 294 + }, + { + "epoch": 0.0, + "global_step": 295, + "learning_rate": 0.0004996035058430718, + "loss": 2.9, + "loss_base2": 4.1838, + "loss_pixel": 0.3852, + "loss_text": 2.5148, + "ppl": 18.1741, + "step": 295 + }, + { + "epoch": 0.0, + "global_step": 296, + "learning_rate": 0.0004995993322203673, + "loss": 3.0979, + "loss_base2": 4.4693, + "loss_pixel": 0.3839, + "loss_text": 2.714, + "ppl": 22.1514, + "step": 296 + }, + { + "epoch": 0.0, + "global_step": 297, + "learning_rate": 0.0004995951585976628, + "loss": 3.067, + "loss_base2": 4.4247, + "loss_pixel": 0.3805, + "loss_text": 2.6865, + "ppl": 21.4774, + "step": 297 + }, + { + "epoch": 0.0, + "global_step": 298, + "learning_rate": 0.0004995909849749582, + "loss": 2.9303, + "loss_base2": 4.2275, + "loss_pixel": 0.3815, + "loss_text": 2.5488, + "ppl": 18.7332, + "step": 298 + }, + { + "epoch": 0.0, + "global_step": 299, + "learning_rate": 0.0004995868113522537, + "loss": 2.9543, + "loss_base2": 4.2622, + "loss_pixel": 0.3814, + "loss_text": 2.5729, + "ppl": 19.1883, + "step": 299 + }, + { + "epoch": 0.0, + "global_step": 300, + "learning_rate": 0.0004995826377295492, + "loss": 3.0093, + "loss_base2": 4.3415, + "loss_pixel": 0.3803, + "loss_text": 2.629, + "ppl": 20.2732, + "step": 300 + }, + { + "epoch": 0.0, + "global_step": 301, + "learning_rate": 0.0004995784641068447, + "loss": 2.952, + "loss_base2": 4.2588, + "loss_pixel": 0.3802, + "loss_text": 2.5718, + "ppl": 19.1442, + "step": 301 + }, + { + "epoch": 0.0, + "global_step": 302, + "learning_rate": 0.0004995742904841402, + "loss": 2.9579, + "loss_base2": 4.2673, + "loss_pixel": 0.3799, + "loss_text": 2.5781, + "ppl": 19.2575, + "step": 302 + }, + { + "epoch": 0.0, + "global_step": 303, + "learning_rate": 0.0004995701168614357, + "loss": 2.9298, + "loss_base2": 4.2268, + "loss_pixel": 0.3776, + "loss_text": 2.5522, + "ppl": 18.7239, + "step": 303 + }, + { + "epoch": 0.0, + "global_step": 304, + "learning_rate": 0.0004995659432387313, + "loss": 2.9306, + "loss_base2": 4.228, + "loss_pixel": 0.3773, + "loss_text": 2.5533, + "ppl": 18.7389, + "step": 304 + }, + { + "epoch": 0.0, + "global_step": 305, + "learning_rate": 0.0004995617696160268, + "loss": 2.9199, + "loss_base2": 4.2125, + "loss_pixel": 0.3767, + "loss_text": 2.5432, + "ppl": 18.5394, + "step": 305 + }, + { + "epoch": 0.0, + "global_step": 306, + "learning_rate": 0.0004995575959933223, + "loss": 2.9007, + "loss_base2": 4.1848, + "loss_pixel": 0.376, + "loss_text": 2.5247, + "ppl": 18.1869, + "step": 306 + }, + { + "epoch": 0.0, + "global_step": 307, + "learning_rate": 0.0004995534223706177, + "loss": 2.8685, + "loss_base2": 4.1384, + "loss_pixel": 0.3748, + "loss_text": 2.4938, + "ppl": 17.6106, + "step": 307 + }, + { + "epoch": 0.0, + "global_step": 308, + "learning_rate": 0.0004995492487479132, + "loss": 2.8902, + "loss_base2": 4.1697, + "loss_pixel": 0.3749, + "loss_text": 2.5153, + "ppl": 17.9969, + "step": 308 + }, + { + "epoch": 0.0, + "global_step": 309, + "learning_rate": 0.0004995450751252087, + "loss": 2.8798, + "loss_base2": 4.1547, + "loss_pixel": 0.3822, + "loss_text": 2.4976, + "ppl": 17.8107, + "step": 309 + }, + { + "epoch": 0.0, + "global_step": 310, + "learning_rate": 0.0004995409015025042, + "loss": 2.9186, + "loss_base2": 4.2106, + "loss_pixel": 0.4436, + "loss_text": 2.4749, + "ppl": 18.5153, + "step": 310 + }, + { + "epoch": 0.0, + "global_step": 311, + "learning_rate": 0.0004995367278797997, + "loss": 2.8782, + "loss_base2": 4.1524, + "loss_pixel": 0.407, + "loss_text": 2.4712, + "ppl": 17.7822, + "step": 311 + }, + { + "epoch": 0.0, + "global_step": 312, + "learning_rate": 0.0004995325542570952, + "loss": 2.8506, + "loss_base2": 4.1125, + "loss_pixel": 0.401, + "loss_text": 2.4496, + "ppl": 17.2982, + "step": 312 + }, + { + "epoch": 0.0, + "global_step": 313, + "learning_rate": 0.0004995283806343906, + "loss": 2.8407, + "loss_base2": 4.0983, + "loss_pixel": 0.384, + "loss_text": 2.4566, + "ppl": 17.1278, + "step": 313 + }, + { + "epoch": 0.0, + "global_step": 314, + "learning_rate": 0.0004995242070116861, + "loss": 2.841, + "loss_base2": 4.0987, + "loss_pixel": 0.3828, + "loss_text": 2.4582, + "ppl": 17.1329, + "step": 314 + }, + { + "epoch": 0.0, + "global_step": 315, + "learning_rate": 0.0004995200333889816, + "loss": 2.8286, + "loss_base2": 4.0808, + "loss_pixel": 0.388, + "loss_text": 2.4406, + "ppl": 16.9218, + "step": 315 + }, + { + "epoch": 0.0, + "global_step": 316, + "learning_rate": 0.0004995158597662771, + "loss": 2.8152, + "loss_base2": 4.0615, + "loss_pixel": 0.3917, + "loss_text": 2.4235, + "ppl": 16.6965, + "step": 316 + }, + { + "epoch": 0.0, + "global_step": 317, + "learning_rate": 0.0004995116861435726, + "loss": 2.8132, + "loss_base2": 4.0586, + "loss_pixel": 0.3891, + "loss_text": 2.4241, + "ppl": 16.6632, + "step": 317 + }, + { + "epoch": 0.0, + "global_step": 318, + "learning_rate": 0.0004995075125208681, + "loss": 2.7896, + "loss_base2": 4.0245, + "loss_pixel": 0.3864, + "loss_text": 2.4033, + "ppl": 16.2745, + "step": 318 + }, + { + "epoch": 0.0, + "global_step": 319, + "learning_rate": 0.0004995033388981636, + "loss": 2.7988, + "loss_base2": 4.0378, + "loss_pixel": 0.3832, + "loss_text": 2.4156, + "ppl": 16.4249, + "step": 319 + }, + { + "epoch": 0.0, + "global_step": 320, + "learning_rate": 0.0004994991652754592, + "loss": 2.7755, + "loss_base2": 4.0042, + "loss_pixel": 0.3826, + "loss_text": 2.3928, + "ppl": 16.0466, + "step": 320 + }, + { + "epoch": 0.0, + "global_step": 321, + "learning_rate": 0.0004994949916527546, + "loss": 3.1493, + "loss_base2": 4.5435, + "loss_pixel": 0.3835, + "loss_text": 2.7658, + "ppl": 23.3197, + "step": 321 + }, + { + "epoch": 0.0, + "global_step": 322, + "learning_rate": 0.0004994908180300501, + "loss": 2.9505, + "loss_base2": 4.2567, + "loss_pixel": 0.3849, + "loss_text": 2.5657, + "ppl": 19.1155, + "step": 322 + }, + { + "epoch": 0.0, + "global_step": 323, + "learning_rate": 0.0004994866444073456, + "loss": 2.8208, + "loss_base2": 4.0696, + "loss_pixel": 0.3849, + "loss_text": 2.436, + "ppl": 16.7903, + "step": 323 + }, + { + "epoch": 0.0, + "global_step": 324, + "learning_rate": 0.0004994824707846411, + "loss": 2.8125, + "loss_base2": 4.0576, + "loss_pixel": 0.3829, + "loss_text": 2.4296, + "ppl": 16.6515, + "step": 324 + }, + { + "epoch": 0.0, + "global_step": 325, + "learning_rate": 0.0004994782971619366, + "loss": 2.7943, + "loss_base2": 4.0313, + "loss_pixel": 0.382, + "loss_text": 2.4124, + "ppl": 16.3512, + "step": 325 + }, + { + "epoch": 0.0, + "global_step": 326, + "learning_rate": 0.0004994741235392321, + "loss": 2.7888, + "loss_base2": 4.0234, + "loss_pixel": 0.3812, + "loss_text": 2.4076, + "ppl": 16.2615, + "step": 326 + }, + { + "epoch": 0.0, + "global_step": 327, + "learning_rate": 0.0004994699499165276, + "loss": 2.772, + "loss_base2": 3.9992, + "loss_pixel": 0.3821, + "loss_text": 2.3899, + "ppl": 15.9906, + "step": 327 + }, + { + "epoch": 0.0, + "global_step": 328, + "learning_rate": 0.0004994657762938231, + "loss": 2.7827, + "loss_base2": 4.0146, + "loss_pixel": 0.3821, + "loss_text": 2.4006, + "ppl": 16.1626, + "step": 328 + }, + { + "epoch": 0.0, + "global_step": 329, + "learning_rate": 0.0004994616026711186, + "loss": 2.776, + "loss_base2": 4.0049, + "loss_pixel": 0.3816, + "loss_text": 2.3944, + "ppl": 16.0547, + "step": 329 + }, + { + "epoch": 0.0, + "global_step": 330, + "learning_rate": 0.000499457429048414, + "loss": 2.7789, + "loss_base2": 4.0091, + "loss_pixel": 0.3822, + "loss_text": 2.3967, + "ppl": 16.1013, + "step": 330 + }, + { + "epoch": 0.0, + "global_step": 331, + "learning_rate": 0.0004994532554257095, + "loss": 3.1214, + "loss_base2": 4.5032, + "loss_pixel": 0.381, + "loss_text": 2.7404, + "ppl": 22.6781, + "step": 331 + }, + { + "epoch": 0.0, + "global_step": 332, + "learning_rate": 0.000499449081803005, + "loss": 2.8526, + "loss_base2": 4.1154, + "loss_pixel": 0.3814, + "loss_text": 2.4712, + "ppl": 17.3328, + "step": 332 + }, + { + "epoch": 0.0, + "global_step": 333, + "learning_rate": 0.0004994449081803005, + "loss": 2.7735, + "loss_base2": 4.0013, + "loss_pixel": 0.3803, + "loss_text": 2.3932, + "ppl": 16.0146, + "step": 333 + }, + { + "epoch": 0.0, + "global_step": 334, + "learning_rate": 0.0004994407345575959, + "loss": 2.7545, + "loss_base2": 3.9739, + "loss_pixel": 0.38, + "loss_text": 2.3745, + "ppl": 15.7132, + "step": 334 + }, + { + "epoch": 0.0, + "global_step": 335, + "learning_rate": 0.0004994365609348914, + "loss": 2.7506, + "loss_base2": 3.9683, + "loss_pixel": 0.3802, + "loss_text": 2.3703, + "ppl": 15.652, + "step": 335 + }, + { + "epoch": 0.0, + "global_step": 336, + "learning_rate": 0.0004994323873121869, + "loss": 2.7342, + "loss_base2": 3.9446, + "loss_pixel": 0.3803, + "loss_text": 2.3539, + "ppl": 15.3974, + "step": 336 + }, + { + "epoch": 0.0, + "global_step": 337, + "learning_rate": 0.0004994282136894825, + "loss": 2.7397, + "loss_base2": 3.9526, + "loss_pixel": 0.381, + "loss_text": 2.3587, + "ppl": 15.4823, + "step": 337 + }, + { + "epoch": 0.0, + "global_step": 338, + "learning_rate": 0.000499424040066778, + "loss": 2.7442, + "loss_base2": 3.959, + "loss_pixel": 0.3798, + "loss_text": 2.3644, + "ppl": 15.5522, + "step": 338 + }, + { + "epoch": 0.0, + "global_step": 339, + "learning_rate": 0.0004994198664440735, + "loss": 2.7051, + "loss_base2": 3.9026, + "loss_pixel": 0.3797, + "loss_text": 2.3254, + "ppl": 14.9558, + "step": 339 + }, + { + "epoch": 0.0, + "global_step": 340, + "learning_rate": 0.000499415692821369, + "loss": 3.079, + "loss_base2": 4.4421, + "loss_pixel": 0.3811, + "loss_text": 2.6979, + "ppl": 21.7367, + "step": 340 + }, + { + "epoch": 0.0, + "global_step": 341, + "learning_rate": 0.0004994115191986645, + "loss": 3.1559, + "loss_base2": 4.553, + "loss_pixel": 0.3794, + "loss_text": 2.7764, + "ppl": 23.4742, + "step": 341 + }, + { + "epoch": 0.0, + "global_step": 342, + "learning_rate": 0.00049940734557596, + "loss": 3.1536, + "loss_base2": 4.5497, + "loss_pixel": 0.38, + "loss_text": 2.7736, + "ppl": 23.4202, + "step": 342 + }, + { + "epoch": 0.0, + "global_step": 343, + "learning_rate": 0.0004994031719532554, + "loss": 3.1262, + "loss_base2": 4.5102, + "loss_pixel": 0.3787, + "loss_text": 2.7475, + "ppl": 22.7872, + "step": 343 + }, + { + "epoch": 0.0, + "global_step": 344, + "learning_rate": 0.0004993989983305509, + "loss": 3.1355, + "loss_base2": 4.5236, + "loss_pixel": 0.379, + "loss_text": 2.7565, + "ppl": 23.0001, + "step": 344 + }, + { + "epoch": 0.0, + "global_step": 345, + "learning_rate": 0.0004993948247078464, + "loss": 3.103, + "loss_base2": 4.4767, + "loss_pixel": 0.3788, + "loss_text": 2.7242, + "ppl": 22.2646, + "step": 345 + }, + { + "epoch": 0.0, + "global_step": 346, + "learning_rate": 0.0004993906510851419, + "loss": 3.0951, + "loss_base2": 4.4653, + "loss_pixel": 0.3787, + "loss_text": 2.7164, + "ppl": 22.0894, + "step": 346 + }, + { + "epoch": 0.0, + "global_step": 347, + "learning_rate": 0.0004993864774624374, + "loss": 3.0779, + "loss_base2": 4.4405, + "loss_pixel": 0.3786, + "loss_text": 2.6993, + "ppl": 21.7128, + "step": 347 + }, + { + "epoch": 0.0, + "global_step": 348, + "learning_rate": 0.0004993823038397329, + "loss": 3.0683, + "loss_base2": 4.4266, + "loss_pixel": 0.3792, + "loss_text": 2.6891, + "ppl": 21.5053, + "step": 348 + }, + { + "epoch": 0.0, + "global_step": 349, + "learning_rate": 0.0004993781302170284, + "loss": 3.0565, + "loss_base2": 4.4096, + "loss_pixel": 0.3777, + "loss_text": 2.6788, + "ppl": 21.253, + "step": 349 + }, + { + "epoch": 0.0, + "global_step": 350, + "learning_rate": 0.0004993739565943239, + "loss": 3.05, + "loss_base2": 4.4002, + "loss_pixel": 0.3775, + "loss_text": 2.6725, + "ppl": 21.1153, + "step": 350 + }, + { + "epoch": 0.0, + "global_step": 351, + "learning_rate": 0.0004993697829716193, + "loss": 3.0366, + "loss_base2": 4.3809, + "loss_pixel": 0.3767, + "loss_text": 2.6599, + "ppl": 20.8343, + "step": 351 + }, + { + "epoch": 0.0, + "global_step": 352, + "learning_rate": 0.0004993656093489148, + "loss": 3.042, + "loss_base2": 4.3887, + "loss_pixel": 0.3778, + "loss_text": 2.6642, + "ppl": 20.9471, + "step": 352 + }, + { + "epoch": 0.0, + "global_step": 353, + "learning_rate": 0.0004993614357262104, + "loss": 3.0378, + "loss_base2": 4.3826, + "loss_pixel": 0.3763, + "loss_text": 2.6615, + "ppl": 20.8593, + "step": 353 + }, + { + "epoch": 0.0, + "global_step": 354, + "learning_rate": 0.0004993572621035059, + "loss": 3.0161, + "loss_base2": 4.3513, + "loss_pixel": 0.3756, + "loss_text": 2.6405, + "ppl": 20.4115, + "step": 354 + }, + { + "epoch": 0.0, + "global_step": 355, + "learning_rate": 0.0004993530884808014, + "loss": 3.0199, + "loss_base2": 4.3568, + "loss_pixel": 0.3745, + "loss_text": 2.6453, + "ppl": 20.4892, + "step": 355 + }, + { + "epoch": 0.0, + "global_step": 356, + "learning_rate": 0.0004993489148580969, + "loss": 3.0046, + "loss_base2": 4.3347, + "loss_pixel": 0.3748, + "loss_text": 2.6298, + "ppl": 20.1781, + "step": 356 + }, + { + "epoch": 0.0, + "global_step": 357, + "learning_rate": 0.0004993447412353923, + "loss": 3.0046, + "loss_base2": 4.3347, + "loss_pixel": 0.3748, + "loss_text": 2.6298, + "ppl": 20.1781, + "step": 357 + }, + { + "epoch": 0.0, + "global_step": 358, + "learning_rate": 0.0004993405676126878, + "loss": 3.0041, + "loss_base2": 4.334, + "loss_pixel": 0.3756, + "loss_text": 2.6284, + "ppl": 20.1681, + "step": 358 + }, + { + "epoch": 0.0, + "global_step": 359, + "learning_rate": 0.0004993363939899833, + "loss": 3.0059, + "loss_base2": 4.3366, + "loss_pixel": 0.3987, + "loss_text": 2.6072, + "ppl": 20.2044, + "step": 359 + }, + { + "epoch": 0.0, + "global_step": 360, + "learning_rate": 0.0004993322203672788, + "loss": 3.0023, + "loss_base2": 4.3314, + "loss_pixel": 0.3803, + "loss_text": 2.622, + "ppl": 20.1318, + "step": 360 + }, + { + "epoch": 0.0, + "global_step": 361, + "learning_rate": 0.0004993280467445743, + "loss": 2.9892, + "loss_base2": 4.3125, + "loss_pixel": 0.3877, + "loss_text": 2.6015, + "ppl": 19.8698, + "step": 361 + }, + { + "epoch": 0.0, + "global_step": 362, + "learning_rate": 0.0004993238731218698, + "loss": 2.9698, + "loss_base2": 4.2845, + "loss_pixel": 0.3763, + "loss_text": 2.5934, + "ppl": 19.488, + "step": 362 + }, + { + "epoch": 0.0, + "global_step": 363, + "learning_rate": 0.0004993196994991653, + "loss": 2.978, + "loss_base2": 4.2963, + "loss_pixel": 0.3794, + "loss_text": 2.5986, + "ppl": 19.6485, + "step": 363 + }, + { + "epoch": 0.0, + "global_step": 364, + "learning_rate": 0.0004993155258764608, + "loss": 2.9284, + "loss_base2": 4.2248, + "loss_pixel": 0.3806, + "loss_text": 2.5478, + "ppl": 18.6977, + "step": 364 + }, + { + "epoch": 0.0, + "global_step": 365, + "learning_rate": 0.0004993113522537563, + "loss": 2.7765, + "loss_base2": 4.0056, + "loss_pixel": 0.3806, + "loss_text": 2.3959, + "ppl": 16.0627, + "step": 365 + }, + { + "epoch": 0.0, + "global_step": 366, + "learning_rate": 0.0004993071786310517, + "loss": 2.7443, + "loss_base2": 3.9592, + "loss_pixel": 0.378, + "loss_text": 2.3663, + "ppl": 15.5537, + "step": 366 + }, + { + "epoch": 0.0, + "global_step": 367, + "learning_rate": 0.0004993030050083472, + "loss": 2.7314, + "loss_base2": 3.9406, + "loss_pixel": 0.3786, + "loss_text": 2.3528, + "ppl": 15.3544, + "step": 367 + }, + { + "epoch": 0.0, + "global_step": 368, + "learning_rate": 0.0004992988313856427, + "loss": 2.7326, + "loss_base2": 3.9423, + "loss_pixel": 0.3795, + "loss_text": 2.3531, + "ppl": 15.3728, + "step": 368 + }, + { + "epoch": 0.0, + "global_step": 369, + "learning_rate": 0.0004992946577629383, + "loss": 2.7004, + "loss_base2": 3.8959, + "loss_pixel": 0.3796, + "loss_text": 2.3208, + "ppl": 14.8857, + "step": 369 + }, + { + "epoch": 0.0, + "global_step": 370, + "learning_rate": 0.0004992904841402338, + "loss": 2.6922, + "loss_base2": 3.884, + "loss_pixel": 0.3779, + "loss_text": 2.3142, + "ppl": 14.7641, + "step": 370 + }, + { + "epoch": 0.0, + "global_step": 371, + "learning_rate": 0.0004992863105175292, + "loss": 2.6899, + "loss_base2": 3.8807, + "loss_pixel": 0.3769, + "loss_text": 2.313, + "ppl": 14.7302, + "step": 371 + }, + { + "epoch": 0.0, + "global_step": 372, + "learning_rate": 0.0004992821368948247, + "loss": 2.8585, + "loss_base2": 4.1239, + "loss_pixel": 0.3776, + "loss_text": 2.4809, + "ppl": 17.4354, + "step": 372 + }, + { + "epoch": 0.0, + "global_step": 373, + "learning_rate": 0.0004992779632721202, + "loss": 3.0017, + "loss_base2": 4.3305, + "loss_pixel": 0.3771, + "loss_text": 2.6246, + "ppl": 20.1197, + "step": 373 + }, + { + "epoch": 0.0, + "global_step": 374, + "learning_rate": 0.0004992737896494157, + "loss": 3.0216, + "loss_base2": 4.3592, + "loss_pixel": 0.376, + "loss_text": 2.6456, + "ppl": 20.5241, + "step": 374 + }, + { + "epoch": 0.0, + "global_step": 375, + "learning_rate": 0.0004992696160267112, + "loss": 3.0005, + "loss_base2": 4.3288, + "loss_pixel": 0.3752, + "loss_text": 2.6253, + "ppl": 20.0956, + "step": 375 + }, + { + "epoch": 0.0, + "global_step": 376, + "learning_rate": 0.0004992654424040067, + "loss": 2.9862, + "loss_base2": 4.3082, + "loss_pixel": 0.3752, + "loss_text": 2.611, + "ppl": 19.8103, + "step": 376 + }, + { + "epoch": 0.0, + "global_step": 377, + "learning_rate": 0.0004992612687813022, + "loss": 2.9606, + "loss_base2": 4.2712, + "loss_pixel": 0.3743, + "loss_text": 2.5863, + "ppl": 19.3096, + "step": 377 + }, + { + "epoch": 0.0, + "global_step": 378, + "learning_rate": 0.0004992570951585977, + "loss": 2.9665, + "loss_base2": 4.2798, + "loss_pixel": 0.3741, + "loss_text": 2.5924, + "ppl": 19.4238, + "step": 378 + }, + { + "epoch": 0.0, + "global_step": 379, + "learning_rate": 0.0004992529215358932, + "loss": 2.9628, + "loss_base2": 4.2744, + "loss_pixel": 0.3733, + "loss_text": 2.5894, + "ppl": 19.3521, + "step": 379 + }, + { + "epoch": 0.0, + "global_step": 380, + "learning_rate": 0.0004992487479131886, + "loss": 2.9689, + "loss_base2": 4.2832, + "loss_pixel": 0.3729, + "loss_text": 2.596, + "ppl": 19.4705, + "step": 380 + }, + { + "epoch": 0.0, + "global_step": 381, + "learning_rate": 0.0004992445742904841, + "loss": 2.9444, + "loss_base2": 4.2479, + "loss_pixel": 0.3733, + "loss_text": 2.5711, + "ppl": 18.9993, + "step": 381 + }, + { + "epoch": 0.0, + "global_step": 382, + "learning_rate": 0.0004992404006677796, + "loss": 2.9446, + "loss_base2": 4.2482, + "loss_pixel": 0.384, + "loss_text": 2.5606, + "ppl": 19.0031, + "step": 382 + }, + { + "epoch": 0.0, + "global_step": 383, + "learning_rate": 0.0004992362270450751, + "loss": 2.9643, + "loss_base2": 4.2766, + "loss_pixel": 0.4011, + "loss_text": 2.5633, + "ppl": 19.3811, + "step": 383 + }, + { + "epoch": 0.0, + "global_step": 384, + "learning_rate": 0.0004992320534223706, + "loss": 2.966, + "loss_base2": 4.279, + "loss_pixel": 0.4048, + "loss_text": 2.5612, + "ppl": 19.4141, + "step": 384 + }, + { + "epoch": 0.0, + "global_step": 385, + "learning_rate": 0.0004992278797996662, + "loss": 2.9589, + "loss_base2": 4.2688, + "loss_pixel": 0.3957, + "loss_text": 2.5632, + "ppl": 19.2768, + "step": 385 + }, + { + "epoch": 0.0, + "global_step": 386, + "learning_rate": 0.0004992237061769617, + "loss": 2.9313, + "loss_base2": 4.229, + "loss_pixel": 0.3805, + "loss_text": 2.5508, + "ppl": 18.752, + "step": 386 + }, + { + "epoch": 0.0, + "global_step": 387, + "learning_rate": 0.0004992195325542572, + "loss": 2.9266, + "loss_base2": 4.2222, + "loss_pixel": 0.3819, + "loss_text": 2.5447, + "ppl": 18.6641, + "step": 387 + }, + { + "epoch": 0.0, + "global_step": 388, + "learning_rate": 0.0004992153589315526, + "loss": 2.9262, + "loss_base2": 4.2216, + "loss_pixel": 0.3877, + "loss_text": 2.5385, + "ppl": 18.6566, + "step": 388 + }, + { + "epoch": 0.0, + "global_step": 389, + "learning_rate": 0.0004992111853088481, + "loss": 2.9159, + "loss_base2": 4.2068, + "loss_pixel": 0.388, + "loss_text": 2.5279, + "ppl": 18.4654, + "step": 389 + }, + { + "epoch": 0.0, + "global_step": 390, + "learning_rate": 0.0004992070116861436, + "loss": 2.907, + "loss_base2": 4.1939, + "loss_pixel": 0.3859, + "loss_text": 2.5211, + "ppl": 18.3018, + "step": 390 + }, + { + "epoch": 0.0, + "global_step": 391, + "learning_rate": 0.0004992028380634391, + "loss": 2.9415, + "loss_base2": 4.2437, + "loss_pixel": 0.3833, + "loss_text": 2.5581, + "ppl": 18.9442, + "step": 391 + }, + { + "epoch": 0.0, + "global_step": 392, + "learning_rate": 0.0004991986644407346, + "loss": 2.9032, + "loss_base2": 4.1884, + "loss_pixel": 0.3816, + "loss_text": 2.5216, + "ppl": 18.2324, + "step": 392 + }, + { + "epoch": 0.0, + "global_step": 393, + "learning_rate": 0.00049919449081803, + "loss": 2.8973, + "loss_base2": 4.1799, + "loss_pixel": 0.3816, + "loss_text": 2.5157, + "ppl": 18.1251, + "step": 393 + }, + { + "epoch": 0.0, + "global_step": 394, + "learning_rate": 0.0004991903171953255, + "loss": 2.8991, + "loss_base2": 4.1825, + "loss_pixel": 0.3818, + "loss_text": 2.5173, + "ppl": 18.1578, + "step": 394 + }, + { + "epoch": 0.0, + "global_step": 395, + "learning_rate": 0.000499186143572621, + "loss": 2.8939, + "loss_base2": 4.175, + "loss_pixel": 0.3821, + "loss_text": 2.5117, + "ppl": 18.0636, + "step": 395 + }, + { + "epoch": 0.0, + "global_step": 396, + "learning_rate": 0.0004991819699499165, + "loss": 2.8847, + "loss_base2": 4.1617, + "loss_pixel": 0.3817, + "loss_text": 2.503, + "ppl": 17.8982, + "step": 396 + }, + { + "epoch": 0.0, + "global_step": 397, + "learning_rate": 0.000499177796327212, + "loss": 2.9152, + "loss_base2": 4.2057, + "loss_pixel": 0.3812, + "loss_text": 2.5341, + "ppl": 18.4525, + "step": 397 + }, + { + "epoch": 0.0, + "global_step": 398, + "learning_rate": 0.0004991736227045075, + "loss": 2.8763, + "loss_base2": 4.1496, + "loss_pixel": 0.38, + "loss_text": 2.4963, + "ppl": 17.7485, + "step": 398 + }, + { + "epoch": 0.0, + "global_step": 399, + "learning_rate": 0.000499169449081803, + "loss": 2.8887, + "loss_base2": 4.1675, + "loss_pixel": 0.3798, + "loss_text": 2.5089, + "ppl": 17.9699, + "step": 399 + }, + { + "epoch": 0.0, + "global_step": 400, + "learning_rate": 0.0004991652754590985, + "loss": 2.8573, + "loss_base2": 4.1222, + "loss_pixel": 0.3791, + "loss_text": 2.4782, + "ppl": 17.4144, + "step": 400 + }, + { + "epoch": 0.0, + "global_step": 401, + "learning_rate": 0.000499161101836394, + "loss": 2.8665, + "loss_base2": 4.1355, + "loss_pixel": 0.3789, + "loss_text": 2.4875, + "ppl": 17.5754, + "step": 401 + }, + { + "epoch": 0.0, + "global_step": 402, + "learning_rate": 0.0004991569282136895, + "loss": 2.8622, + "loss_base2": 4.1293, + "loss_pixel": 0.3787, + "loss_text": 2.4835, + "ppl": 17.5, + "step": 402 + }, + { + "epoch": 0.0, + "global_step": 403, + "learning_rate": 0.000499152754590985, + "loss": 2.8476, + "loss_base2": 4.1082, + "loss_pixel": 0.3782, + "loss_text": 2.4695, + "ppl": 17.2463, + "step": 403 + }, + { + "epoch": 0.0, + "global_step": 404, + "learning_rate": 0.0004991485809682805, + "loss": 2.861, + "loss_base2": 4.1276, + "loss_pixel": 0.3787, + "loss_text": 2.4823, + "ppl": 17.479, + "step": 404 + }, + { + "epoch": 0.0, + "global_step": 405, + "learning_rate": 0.000499144407345576, + "loss": 2.8727, + "loss_base2": 4.1444, + "loss_pixel": 0.378, + "loss_text": 2.4947, + "ppl": 17.6847, + "step": 405 + }, + { + "epoch": 0.0, + "global_step": 406, + "learning_rate": 0.0004991402337228715, + "loss": 2.8568, + "loss_base2": 4.1215, + "loss_pixel": 0.3772, + "loss_text": 2.4795, + "ppl": 17.4057, + "step": 406 + }, + { + "epoch": 0.0, + "global_step": 407, + "learning_rate": 0.0004991360601001669, + "loss": 2.8347, + "loss_base2": 4.0896, + "loss_pixel": 0.3763, + "loss_text": 2.4584, + "ppl": 17.0253, + "step": 407 + }, + { + "epoch": 0.0, + "global_step": 408, + "learning_rate": 0.0004991318864774624, + "loss": 2.8526, + "loss_base2": 4.1154, + "loss_pixel": 0.3767, + "loss_text": 2.4759, + "ppl": 17.3328, + "step": 408 + }, + { + "epoch": 0.0, + "global_step": 409, + "learning_rate": 0.0004991277128547579, + "loss": 2.8517, + "loss_base2": 4.1141, + "loss_pixel": 0.376, + "loss_text": 2.4757, + "ppl": 17.3172, + "step": 409 + }, + { + "epoch": 0.0, + "global_step": 410, + "learning_rate": 0.0004991235392320534, + "loss": 2.8329, + "loss_base2": 4.087, + "loss_pixel": 0.3757, + "loss_text": 2.4572, + "ppl": 16.9947, + "step": 410 + }, + { + "epoch": 0.0, + "global_step": 411, + "learning_rate": 0.0004991193656093489, + "loss": 2.8411, + "loss_base2": 4.0988, + "loss_pixel": 0.3756, + "loss_text": 2.4655, + "ppl": 17.1346, + "step": 411 + }, + { + "epoch": 0.0, + "global_step": 412, + "learning_rate": 0.0004991151919866444, + "loss": 2.8368, + "loss_base2": 4.0926, + "loss_pixel": 0.375, + "loss_text": 2.4618, + "ppl": 17.0611, + "step": 412 + }, + { + "epoch": 0.0, + "global_step": 413, + "learning_rate": 0.0004991110183639399, + "loss": 2.832, + "loss_base2": 4.0857, + "loss_pixel": 0.3741, + "loss_text": 2.4579, + "ppl": 16.9794, + "step": 413 + }, + { + "epoch": 0.0, + "global_step": 414, + "learning_rate": 0.0004991068447412354, + "loss": 2.8291, + "loss_base2": 4.0815, + "loss_pixel": 0.3745, + "loss_text": 2.4546, + "ppl": 16.9302, + "step": 414 + }, + { + "epoch": 0.0, + "global_step": 415, + "learning_rate": 0.0004991026711185309, + "loss": 2.8273, + "loss_base2": 4.0789, + "loss_pixel": 0.3743, + "loss_text": 2.453, + "ppl": 16.8998, + "step": 415 + }, + { + "epoch": 0.0, + "global_step": 416, + "learning_rate": 0.0004990984974958263, + "loss": 2.8232, + "loss_base2": 4.073, + "loss_pixel": 0.3738, + "loss_text": 2.4494, + "ppl": 16.8306, + "step": 416 + }, + { + "epoch": 0.0, + "global_step": 417, + "learning_rate": 0.0004990943238731218, + "loss": 2.8218, + "loss_base2": 4.071, + "loss_pixel": 0.3734, + "loss_text": 2.4484, + "ppl": 16.8071, + "step": 417 + }, + { + "epoch": 0.0, + "global_step": 418, + "learning_rate": 0.0004990901502504174, + "loss": 2.8124, + "loss_base2": 4.0574, + "loss_pixel": 0.3728, + "loss_text": 2.4397, + "ppl": 16.6498, + "step": 418 + }, + { + "epoch": 0.0, + "global_step": 419, + "learning_rate": 0.0004990859766277129, + "loss": 2.8121, + "loss_base2": 4.057, + "loss_pixel": 0.3728, + "loss_text": 2.4393, + "ppl": 16.6448, + "step": 419 + }, + { + "epoch": 0.0, + "global_step": 420, + "learning_rate": 0.0004990818030050084, + "loss": 2.8135, + "loss_base2": 4.059, + "loss_pixel": 0.3724, + "loss_text": 2.4412, + "ppl": 16.6682, + "step": 420 + }, + { + "epoch": 0.0, + "global_step": 421, + "learning_rate": 0.0004990776293823039, + "loss": 2.8209, + "loss_base2": 4.0697, + "loss_pixel": 0.3721, + "loss_text": 2.4489, + "ppl": 16.792, + "step": 421 + }, + { + "epoch": 0.0, + "global_step": 422, + "learning_rate": 0.0004990734557595994, + "loss": 2.8056, + "loss_base2": 4.0476, + "loss_pixel": 0.3722, + "loss_text": 2.4334, + "ppl": 16.537, + "step": 422 + }, + { + "epoch": 0.0, + "global_step": 423, + "learning_rate": 0.0004990692821368949, + "loss": 2.805, + "loss_base2": 4.0468, + "loss_pixel": 0.3714, + "loss_text": 2.4336, + "ppl": 16.5271, + "step": 423 + }, + { + "epoch": 0.0, + "global_step": 424, + "learning_rate": 0.0004990651085141904, + "loss": 2.7958, + "loss_base2": 4.0335, + "loss_pixel": 0.3718, + "loss_text": 2.4239, + "ppl": 16.3757, + "step": 424 + }, + { + "epoch": 0.0, + "global_step": 425, + "learning_rate": 0.0004990609348914858, + "loss": 2.7934, + "loss_base2": 4.03, + "loss_pixel": 0.3709, + "loss_text": 2.4225, + "ppl": 16.3365, + "step": 425 + }, + { + "epoch": 0.0, + "global_step": 426, + "learning_rate": 0.0004990567612687813, + "loss": 2.7846, + "loss_base2": 4.0173, + "loss_pixel": 0.3705, + "loss_text": 2.4141, + "ppl": 16.1933, + "step": 426 + }, + { + "epoch": 0.0, + "global_step": 427, + "learning_rate": 0.0004990525876460768, + "loss": 2.776, + "loss_base2": 4.0049, + "loss_pixel": 0.3704, + "loss_text": 2.4056, + "ppl": 16.0547, + "step": 427 + }, + { + "epoch": 0.0, + "global_step": 428, + "learning_rate": 0.0004990484140233723, + "loss": 2.7833, + "loss_base2": 4.0155, + "loss_pixel": 0.3725, + "loss_text": 2.4108, + "ppl": 16.1723, + "step": 428 + }, + { + "epoch": 0.0, + "global_step": 429, + "learning_rate": 0.0004990442404006678, + "loss": 2.7924, + "loss_base2": 4.0286, + "loss_pixel": 0.3759, + "loss_text": 2.4165, + "ppl": 16.3201, + "step": 429 + }, + { + "epoch": 0.0, + "global_step": 430, + "learning_rate": 0.0004990400667779632, + "loss": 2.7893, + "loss_base2": 4.0241, + "loss_pixel": 0.3756, + "loss_text": 2.4137, + "ppl": 16.2696, + "step": 430 + }, + { + "epoch": 0.0, + "global_step": 431, + "learning_rate": 0.0004990358931552587, + "loss": 2.7736, + "loss_base2": 4.0015, + "loss_pixel": 0.3732, + "loss_text": 2.4004, + "ppl": 16.0162, + "step": 431 + }, + { + "epoch": 0.0, + "global_step": 432, + "learning_rate": 0.0004990317195325542, + "loss": 2.7834, + "loss_base2": 4.0156, + "loss_pixel": 0.3717, + "loss_text": 2.4117, + "ppl": 16.1739, + "step": 432 + }, + { + "epoch": 0.0, + "global_step": 433, + "learning_rate": 0.0004990275459098497, + "loss": 2.7858, + "loss_base2": 4.0191, + "loss_pixel": 0.3724, + "loss_text": 2.4134, + "ppl": 16.2128, + "step": 433 + }, + { + "epoch": 0.0, + "global_step": 434, + "learning_rate": 0.0004990233722871453, + "loss": 2.7575, + "loss_base2": 3.9782, + "loss_pixel": 0.3719, + "loss_text": 2.3857, + "ppl": 15.7604, + "step": 434 + }, + { + "epoch": 0.0, + "global_step": 435, + "learning_rate": 0.0004990191986644408, + "loss": 2.7682, + "loss_base2": 3.9937, + "loss_pixel": 0.3716, + "loss_text": 2.3966, + "ppl": 15.9299, + "step": 435 + }, + { + "epoch": 0.0, + "global_step": 436, + "learning_rate": 0.0004990150250417363, + "loss": 2.762, + "loss_base2": 3.9847, + "loss_pixel": 0.3719, + "loss_text": 2.39, + "ppl": 15.8315, + "step": 436 + }, + { + "epoch": 0.0, + "global_step": 437, + "learning_rate": 0.0004990108514190318, + "loss": 2.7722, + "loss_base2": 3.9994, + "loss_pixel": 0.3692, + "loss_text": 2.403, + "ppl": 15.9938, + "step": 437 + }, + { + "epoch": 0.0, + "global_step": 438, + "learning_rate": 0.0004990066777963273, + "loss": 2.7478, + "loss_base2": 3.9642, + "loss_pixel": 0.3711, + "loss_text": 2.3767, + "ppl": 15.6083, + "step": 438 + }, + { + "epoch": 0.0, + "global_step": 439, + "learning_rate": 0.0004990025041736227, + "loss": 2.7713, + "loss_base2": 3.9981, + "loss_pixel": 0.3688, + "loss_text": 2.4025, + "ppl": 15.9794, + "step": 439 + }, + { + "epoch": 0.0, + "global_step": 440, + "learning_rate": 0.0004989983305509182, + "loss": 2.7852, + "loss_base2": 4.0182, + "loss_pixel": 0.3722, + "loss_text": 2.413, + "ppl": 16.2031, + "step": 440 + }, + { + "epoch": 0.0, + "global_step": 441, + "learning_rate": 0.0004989941569282137, + "loss": 2.7661, + "loss_base2": 3.9906, + "loss_pixel": 0.371, + "loss_text": 2.3951, + "ppl": 15.8965, + "step": 441 + }, + { + "epoch": 0.0, + "global_step": 442, + "learning_rate": 0.0004989899833055092, + "loss": 2.7855, + "loss_base2": 4.0186, + "loss_pixel": 0.3696, + "loss_text": 2.4159, + "ppl": 16.2079, + "step": 442 + }, + { + "epoch": 0.0, + "global_step": 443, + "learning_rate": 0.0004989858096828047, + "loss": 2.7758, + "loss_base2": 4.0046, + "loss_pixel": 0.3709, + "loss_text": 2.4049, + "ppl": 16.0515, + "step": 443 + }, + { + "epoch": 0.0, + "global_step": 444, + "learning_rate": 0.0004989816360601001, + "loss": 2.7569, + "loss_base2": 3.9774, + "loss_pixel": 0.3689, + "loss_text": 2.388, + "ppl": 15.7509, + "step": 444 + }, + { + "epoch": 0.0, + "global_step": 445, + "learning_rate": 0.0004989774624373956, + "loss": 2.7757, + "loss_base2": 4.0045, + "loss_pixel": 0.3674, + "loss_text": 2.4083, + "ppl": 16.0499, + "step": 445 + }, + { + "epoch": 0.0, + "global_step": 446, + "learning_rate": 0.0004989732888146911, + "loss": 2.7871, + "loss_base2": 4.0209, + "loss_pixel": 0.368, + "loss_text": 2.4191, + "ppl": 16.2339, + "step": 446 + }, + { + "epoch": 0.0, + "global_step": 447, + "learning_rate": 0.0004989691151919866, + "loss": 2.762, + "loss_base2": 3.9847, + "loss_pixel": 0.3717, + "loss_text": 2.3903, + "ppl": 15.8315, + "step": 447 + }, + { + "epoch": 0.0, + "global_step": 448, + "learning_rate": 0.0004989649415692821, + "loss": 2.7518, + "loss_base2": 3.97, + "loss_pixel": 0.3707, + "loss_text": 2.3812, + "ppl": 15.6708, + "step": 448 + }, + { + "epoch": 0.0, + "global_step": 449, + "learning_rate": 0.0004989607679465776, + "loss": 2.7597, + "loss_base2": 3.9814, + "loss_pixel": 0.3686, + "loss_text": 2.3911, + "ppl": 15.7951, + "step": 449 + }, + { + "epoch": 0.0, + "global_step": 450, + "learning_rate": 0.0004989565943238732, + "loss": 2.7417, + "loss_base2": 3.9554, + "loss_pixel": 0.3677, + "loss_text": 2.3739, + "ppl": 15.5133, + "step": 450 + }, + { + "epoch": 0.0, + "global_step": 451, + "learning_rate": 0.0004989524207011687, + "loss": 2.7256, + "loss_base2": 3.9322, + "loss_pixel": 0.3662, + "loss_text": 2.3594, + "ppl": 15.2656, + "step": 451 + }, + { + "epoch": 0.0, + "global_step": 452, + "learning_rate": 0.0004989482470784641, + "loss": 2.7233, + "loss_base2": 3.9289, + "loss_pixel": 0.3642, + "loss_text": 2.3591, + "ppl": 15.2305, + "step": 452 + }, + { + "epoch": 0.0, + "global_step": 453, + "learning_rate": 0.0004989440734557596, + "loss": 2.7244, + "loss_base2": 3.9305, + "loss_pixel": 0.3662, + "loss_text": 2.3582, + "ppl": 15.2473, + "step": 453 + }, + { + "epoch": 0.0, + "global_step": 454, + "learning_rate": 0.0004989398998330551, + "loss": 2.7182, + "loss_base2": 3.9215, + "loss_pixel": 0.3641, + "loss_text": 2.3541, + "ppl": 15.153, + "step": 454 + }, + { + "epoch": 0.0, + "global_step": 455, + "learning_rate": 0.0004989357262103506, + "loss": 2.7226, + "loss_base2": 3.9279, + "loss_pixel": 0.3657, + "loss_text": 2.3568, + "ppl": 15.2198, + "step": 455 + }, + { + "epoch": 0.0, + "global_step": 456, + "learning_rate": 0.0004989315525876461, + "loss": 2.7089, + "loss_base2": 3.9081, + "loss_pixel": 0.3642, + "loss_text": 2.3448, + "ppl": 15.0128, + "step": 456 + }, + { + "epoch": 0.0, + "global_step": 457, + "learning_rate": 0.0004989273789649416, + "loss": 2.7017, + "loss_base2": 3.8977, + "loss_pixel": 0.3649, + "loss_text": 2.3369, + "ppl": 14.905, + "step": 457 + }, + { + "epoch": 0.0, + "global_step": 458, + "learning_rate": 0.0004989232053422371, + "loss": 2.72, + "loss_base2": 3.9241, + "loss_pixel": 0.3641, + "loss_text": 2.3559, + "ppl": 15.1803, + "step": 458 + }, + { + "epoch": 0.0, + "global_step": 459, + "learning_rate": 0.0004989190317195326, + "loss": 2.7035, + "loss_base2": 3.9003, + "loss_pixel": 0.3629, + "loss_text": 2.3406, + "ppl": 14.9319, + "step": 459 + }, + { + "epoch": 0.0, + "global_step": 460, + "learning_rate": 0.0004989148580968281, + "loss": 2.6943, + "loss_base2": 3.8871, + "loss_pixel": 0.366, + "loss_text": 2.3283, + "ppl": 14.7952, + "step": 460 + }, + { + "epoch": 0.0, + "global_step": 461, + "learning_rate": 0.0004989106844741236, + "loss": 2.6831, + "loss_base2": 3.8709, + "loss_pixel": 0.363, + "loss_text": 2.3201, + "ppl": 14.6304, + "step": 461 + }, + { + "epoch": 0.0, + "global_step": 462, + "learning_rate": 0.000498906510851419, + "loss": 2.6983, + "loss_base2": 3.8928, + "loss_pixel": 0.3654, + "loss_text": 2.3329, + "ppl": 14.8545, + "step": 462 + }, + { + "epoch": 0.0, + "global_step": 463, + "learning_rate": 0.0004989023372287145, + "loss": 2.6991, + "loss_base2": 3.894, + "loss_pixel": 0.3634, + "loss_text": 2.3357, + "ppl": 14.8663, + "step": 463 + }, + { + "epoch": 0.0, + "global_step": 464, + "learning_rate": 0.00049889816360601, + "loss": 2.6699, + "loss_base2": 3.8519, + "loss_pixel": 0.361, + "loss_text": 2.3088, + "ppl": 14.4385, + "step": 464 + }, + { + "epoch": 0.0, + "global_step": 465, + "learning_rate": 0.0004988939899833055, + "loss": 2.6806, + "loss_base2": 3.8673, + "loss_pixel": 0.361, + "loss_text": 2.3195, + "ppl": 14.5938, + "step": 465 + }, + { + "epoch": 0.0, + "global_step": 466, + "learning_rate": 0.0004988898163606009, + "loss": 2.6915, + "loss_base2": 3.883, + "loss_pixel": 0.3611, + "loss_text": 2.3304, + "ppl": 14.7538, + "step": 466 + }, + { + "epoch": 0.0, + "global_step": 467, + "learning_rate": 0.0004988856427378965, + "loss": 2.7015, + "loss_base2": 3.8974, + "loss_pixel": 0.3594, + "loss_text": 2.3421, + "ppl": 14.9021, + "step": 467 + }, + { + "epoch": 0.0, + "global_step": 468, + "learning_rate": 0.000498881469115192, + "loss": 2.6555, + "loss_base2": 3.8311, + "loss_pixel": 0.3589, + "loss_text": 2.2966, + "ppl": 14.2321, + "step": 468 + }, + { + "epoch": 0.0, + "global_step": 469, + "learning_rate": 0.0004988772954924875, + "loss": 2.6742, + "loss_base2": 3.8581, + "loss_pixel": 0.3586, + "loss_text": 2.3155, + "ppl": 14.5007, + "step": 469 + }, + { + "epoch": 0.0, + "global_step": 470, + "learning_rate": 0.000498873121869783, + "loss": 2.6587, + "loss_base2": 3.8357, + "loss_pixel": 0.3586, + "loss_text": 2.3001, + "ppl": 14.2777, + "step": 470 + }, + { + "epoch": 0.0, + "global_step": 471, + "learning_rate": 0.0004988689482470785, + "loss": 2.6455, + "loss_base2": 3.8166, + "loss_pixel": 0.3594, + "loss_text": 2.286, + "ppl": 14.0905, + "step": 471 + }, + { + "epoch": 0.0, + "global_step": 472, + "learning_rate": 0.000498864774624374, + "loss": 2.6845, + "loss_base2": 3.8729, + "loss_pixel": 0.3627, + "loss_text": 2.3218, + "ppl": 14.6509, + "step": 472 + }, + { + "epoch": 0.0, + "global_step": 473, + "learning_rate": 0.0004988606010016695, + "loss": 2.7073, + "loss_base2": 3.9058, + "loss_pixel": 0.3753, + "loss_text": 2.332, + "ppl": 14.9888, + "step": 473 + }, + { + "epoch": 0.0, + "global_step": 474, + "learning_rate": 0.000498856427378965, + "loss": 2.6851, + "loss_base2": 3.8738, + "loss_pixel": 0.3631, + "loss_text": 2.3221, + "ppl": 14.6597, + "step": 474 + }, + { + "epoch": 0.0, + "global_step": 475, + "learning_rate": 0.0004988522537562604, + "loss": 2.7128, + "loss_base2": 3.9137, + "loss_pixel": 0.3663, + "loss_text": 2.3465, + "ppl": 15.0714, + "step": 475 + }, + { + "epoch": 0.0, + "global_step": 476, + "learning_rate": 0.0004988480801335559, + "loss": 2.7182, + "loss_base2": 3.9215, + "loss_pixel": 0.3675, + "loss_text": 2.3506, + "ppl": 15.153, + "step": 476 + }, + { + "epoch": 0.0, + "global_step": 477, + "learning_rate": 0.0004988439065108514, + "loss": 2.7078, + "loss_base2": 3.9065, + "loss_pixel": 0.3632, + "loss_text": 2.3446, + "ppl": 14.9962, + "step": 477 + }, + { + "epoch": 0.0, + "global_step": 478, + "learning_rate": 0.0004988397328881469, + "loss": 2.7432, + "loss_base2": 3.9576, + "loss_pixel": 0.3635, + "loss_text": 2.3796, + "ppl": 15.5366, + "step": 478 + }, + { + "epoch": 0.0, + "global_step": 479, + "learning_rate": 0.0004988355592654424, + "loss": 2.7201, + "loss_base2": 3.9243, + "loss_pixel": 0.3639, + "loss_text": 2.3562, + "ppl": 15.1818, + "step": 479 + }, + { + "epoch": 0.0, + "global_step": 480, + "learning_rate": 0.0004988313856427379, + "loss": 2.7471, + "loss_base2": 3.9632, + "loss_pixel": 0.3639, + "loss_text": 2.3832, + "ppl": 15.5973, + "step": 480 + }, + { + "epoch": 0.0, + "global_step": 481, + "learning_rate": 0.0004988272120200334, + "loss": 2.7535, + "loss_base2": 3.9725, + "loss_pixel": 0.3615, + "loss_text": 2.392, + "ppl": 15.6975, + "step": 481 + }, + { + "epoch": 0.0, + "global_step": 482, + "learning_rate": 0.0004988230383973288, + "loss": 2.7615, + "loss_base2": 3.984, + "loss_pixel": 0.3607, + "loss_text": 2.4009, + "ppl": 15.8236, + "step": 482 + }, + { + "epoch": 0.0, + "global_step": 483, + "learning_rate": 0.0004988188647746244, + "loss": 2.6783, + "loss_base2": 3.864, + "loss_pixel": 0.3605, + "loss_text": 2.3178, + "ppl": 14.5603, + "step": 483 + }, + { + "epoch": 0.0, + "global_step": 484, + "learning_rate": 0.0004988146911519199, + "loss": 2.6513, + "loss_base2": 3.825, + "loss_pixel": 0.36, + "loss_text": 2.2913, + "ppl": 14.1725, + "step": 484 + }, + { + "epoch": 0.0, + "global_step": 485, + "learning_rate": 0.0004988105175292154, + "loss": 2.7558, + "loss_base2": 3.9758, + "loss_pixel": 0.3587, + "loss_text": 2.397, + "ppl": 15.7336, + "step": 485 + }, + { + "epoch": 0.0, + "global_step": 486, + "learning_rate": 0.0004988063439065109, + "loss": 2.6873, + "loss_base2": 3.877, + "loss_pixel": 0.3576, + "loss_text": 2.3298, + "ppl": 14.692, + "step": 486 + }, + { + "epoch": 0.0, + "global_step": 487, + "learning_rate": 0.0004988021702838064, + "loss": 2.8417, + "loss_base2": 4.0997, + "loss_pixel": 0.3569, + "loss_text": 2.4848, + "ppl": 17.1449, + "step": 487 + }, + { + "epoch": 0.0, + "global_step": 488, + "learning_rate": 0.0004987979966611019, + "loss": 2.7708, + "loss_base2": 3.9974, + "loss_pixel": 0.3567, + "loss_text": 2.414, + "ppl": 15.9714, + "step": 488 + }, + { + "epoch": 0.0, + "global_step": 489, + "learning_rate": 0.0004987938230383973, + "loss": 2.7788, + "loss_base2": 4.009, + "loss_pixel": 0.3571, + "loss_text": 2.4218, + "ppl": 16.0997, + "step": 489 + }, + { + "epoch": 0.0, + "global_step": 490, + "learning_rate": 0.0004987896494156928, + "loss": 2.7816, + "loss_base2": 4.013, + "loss_pixel": 0.3554, + "loss_text": 2.4262, + "ppl": 16.1448, + "step": 490 + }, + { + "epoch": 0.0, + "global_step": 491, + "learning_rate": 0.0004987854757929883, + "loss": 2.8123, + "loss_base2": 4.0573, + "loss_pixel": 0.3547, + "loss_text": 2.4576, + "ppl": 16.6482, + "step": 491 + }, + { + "epoch": 0.0, + "global_step": 492, + "learning_rate": 0.0004987813021702838, + "loss": 2.9406, + "loss_base2": 4.2424, + "loss_pixel": 0.3537, + "loss_text": 2.5869, + "ppl": 18.9272, + "step": 492 + }, + { + "epoch": 0.0, + "global_step": 493, + "learning_rate": 0.0004987771285475793, + "loss": 2.9154, + "loss_base2": 4.206, + "loss_pixel": 0.3537, + "loss_text": 2.5617, + "ppl": 18.4562, + "step": 493 + }, + { + "epoch": 0.0, + "global_step": 494, + "learning_rate": 0.0004987729549248748, + "loss": 2.8858, + "loss_base2": 4.1633, + "loss_pixel": 0.3556, + "loss_text": 2.5301, + "ppl": 17.9179, + "step": 494 + }, + { + "epoch": 0.0, + "global_step": 495, + "learning_rate": 0.0004987687813021703, + "loss": 2.8735, + "loss_base2": 4.1456, + "loss_pixel": 0.3517, + "loss_text": 2.5218, + "ppl": 17.6989, + "step": 495 + }, + { + "epoch": 0.0, + "global_step": 496, + "learning_rate": 0.0004987646076794658, + "loss": 2.8508, + "loss_base2": 4.1128, + "loss_pixel": 0.3507, + "loss_text": 2.5001, + "ppl": 17.3016, + "step": 496 + }, + { + "epoch": 0.0, + "global_step": 497, + "learning_rate": 0.0004987604340567613, + "loss": 2.823, + "loss_base2": 4.0727, + "loss_pixel": 0.3505, + "loss_text": 2.4725, + "ppl": 16.8273, + "step": 497 + }, + { + "epoch": 0.0, + "global_step": 498, + "learning_rate": 0.0004987562604340567, + "loss": 2.8154, + "loss_base2": 4.0618, + "loss_pixel": 0.3502, + "loss_text": 2.4652, + "ppl": 16.6999, + "step": 498 + }, + { + "epoch": 0.0, + "global_step": 499, + "learning_rate": 0.0004987520868113523, + "loss": 2.8188, + "loss_base2": 4.0667, + "loss_pixel": 0.3482, + "loss_text": 2.4706, + "ppl": 16.7567, + "step": 499 + }, + { + "epoch": 0.0, + "global_step": 500, + "learning_rate": 0.0004987479131886478, + "loss": 2.7731, + "loss_base2": 4.0007, + "loss_pixel": 0.3484, + "loss_text": 2.4247, + "ppl": 16.0082, + "step": 500 + }, + { + "epoch": 0.0, + "global_step": 501, + "learning_rate": 0.0004987437395659433, + "loss": 2.774, + "loss_base2": 4.002, + "loss_pixel": 0.3477, + "loss_text": 2.4263, + "ppl": 16.0226, + "step": 501 + }, + { + "epoch": 0.0, + "global_step": 502, + "learning_rate": 0.0004987395659432387, + "loss": 2.7628, + "loss_base2": 3.9859, + "loss_pixel": 0.3469, + "loss_text": 2.4159, + "ppl": 15.8441, + "step": 502 + }, + { + "epoch": 0.0, + "global_step": 503, + "learning_rate": 0.0004987353923205342, + "loss": 2.7557, + "loss_base2": 3.9756, + "loss_pixel": 0.3468, + "loss_text": 2.4089, + "ppl": 15.732, + "step": 503 + }, + { + "epoch": 0.0, + "global_step": 504, + "learning_rate": 0.0004987312186978297, + "loss": 2.7444, + "loss_base2": 3.9593, + "loss_pixel": 0.3509, + "loss_text": 2.3935, + "ppl": 15.5553, + "step": 504 + }, + { + "epoch": 0.0, + "global_step": 505, + "learning_rate": 0.0004987270450751252, + "loss": 2.749, + "loss_base2": 3.966, + "loss_pixel": 0.357, + "loss_text": 2.3921, + "ppl": 15.627, + "step": 505 + }, + { + "epoch": 0.0, + "global_step": 506, + "learning_rate": 0.0004987228714524207, + "loss": 2.748, + "loss_base2": 3.9645, + "loss_pixel": 0.3592, + "loss_text": 2.3889, + "ppl": 15.6114, + "step": 506 + }, + { + "epoch": 0.0, + "global_step": 507, + "learning_rate": 0.0004987186978297162, + "loss": 2.7238, + "loss_base2": 3.9296, + "loss_pixel": 0.3559, + "loss_text": 2.368, + "ppl": 15.2381, + "step": 507 + }, + { + "epoch": 0.0, + "global_step": 508, + "learning_rate": 0.0004987145242070117, + "loss": 2.716, + "loss_base2": 3.9184, + "loss_pixel": 0.3569, + "loss_text": 2.3591, + "ppl": 15.1197, + "step": 508 + }, + { + "epoch": 0.0, + "global_step": 509, + "learning_rate": 0.0004987103505843072, + "loss": 2.7131, + "loss_base2": 3.9142, + "loss_pixel": 0.3537, + "loss_text": 2.3593, + "ppl": 15.0759, + "step": 509 + }, + { + "epoch": 0.0, + "global_step": 510, + "learning_rate": 0.0004987061769616027, + "loss": 2.7099, + "loss_base2": 3.9096, + "loss_pixel": 0.3502, + "loss_text": 2.3597, + "ppl": 15.0278, + "step": 510 + }, + { + "epoch": 0.0, + "global_step": 511, + "learning_rate": 0.0004987020033388981, + "loss": 2.6913, + "loss_base2": 3.8827, + "loss_pixel": 0.3496, + "loss_text": 2.3417, + "ppl": 14.7508, + "step": 511 + }, + { + "epoch": 0.0, + "global_step": 512, + "learning_rate": 0.0004986978297161936, + "loss": 2.6942, + "loss_base2": 3.8869, + "loss_pixel": 0.3492, + "loss_text": 2.3451, + "ppl": 14.7937, + "step": 512 + }, + { + "epoch": 0.0, + "global_step": 513, + "learning_rate": 0.0004986936560934891, + "loss": 2.6791, + "loss_base2": 3.8651, + "loss_pixel": 0.3479, + "loss_text": 2.3312, + "ppl": 14.572, + "step": 513 + }, + { + "epoch": 0.0, + "global_step": 514, + "learning_rate": 0.0004986894824707846, + "loss": 2.6709, + "loss_base2": 3.8533, + "loss_pixel": 0.3469, + "loss_text": 2.324, + "ppl": 14.453, + "step": 514 + }, + { + "epoch": 0.0, + "global_step": 515, + "learning_rate": 0.0004986853088480802, + "loss": 2.6556, + "loss_base2": 3.8312, + "loss_pixel": 0.3459, + "loss_text": 2.3097, + "ppl": 14.2335, + "step": 515 + }, + { + "epoch": 0.0, + "global_step": 516, + "learning_rate": 0.0004986811352253757, + "loss": 2.656, + "loss_base2": 3.8318, + "loss_pixel": 0.3455, + "loss_text": 2.3104, + "ppl": 14.2392, + "step": 516 + }, + { + "epoch": 0.0, + "global_step": 517, + "learning_rate": 0.0004986769616026712, + "loss": 2.6618, + "loss_base2": 3.8402, + "loss_pixel": 0.3448, + "loss_text": 2.317, + "ppl": 14.322, + "step": 517 + }, + { + "epoch": 0.0, + "global_step": 518, + "learning_rate": 0.0004986727879799667, + "loss": 2.6463, + "loss_base2": 3.8178, + "loss_pixel": 0.3438, + "loss_text": 2.3025, + "ppl": 14.1018, + "step": 518 + }, + { + "epoch": 0.0, + "global_step": 519, + "learning_rate": 0.0004986686143572622, + "loss": 2.6395, + "loss_base2": 3.808, + "loss_pixel": 0.3431, + "loss_text": 2.2965, + "ppl": 14.0062, + "step": 519 + }, + { + "epoch": 0.0, + "global_step": 520, + "learning_rate": 0.0004986644407345576, + "loss": 2.6527, + "loss_base2": 3.827, + "loss_pixel": 0.3445, + "loss_text": 2.3082, + "ppl": 14.1923, + "step": 520 + }, + { + "epoch": 0.0, + "global_step": 521, + "learning_rate": 0.0004986602671118531, + "loss": 2.6474, + "loss_base2": 3.8194, + "loss_pixel": 0.354, + "loss_text": 2.2934, + "ppl": 14.1173, + "step": 521 + }, + { + "epoch": 0.0, + "global_step": 522, + "learning_rate": 0.0004986560934891486, + "loss": 2.6452, + "loss_base2": 3.8162, + "loss_pixel": 0.3496, + "loss_text": 2.2956, + "ppl": 14.0863, + "step": 522 + }, + { + "epoch": 0.0, + "global_step": 523, + "learning_rate": 0.0004986519198664441, + "loss": 2.634, + "loss_base2": 3.8001, + "loss_pixel": 0.3473, + "loss_text": 2.2867, + "ppl": 13.9294, + "step": 523 + }, + { + "epoch": 0.0, + "global_step": 524, + "learning_rate": 0.0004986477462437396, + "loss": 2.6307, + "loss_base2": 3.7953, + "loss_pixel": 0.3461, + "loss_text": 2.2846, + "ppl": 13.8835, + "step": 524 + }, + { + "epoch": 0.0, + "global_step": 525, + "learning_rate": 0.000498643572621035, + "loss": 2.6248, + "loss_base2": 3.7868, + "loss_pixel": 0.3449, + "loss_text": 2.2799, + "ppl": 13.8018, + "step": 525 + }, + { + "epoch": 0.0, + "global_step": 526, + "learning_rate": 0.0004986393989983305, + "loss": 2.6273, + "loss_base2": 3.7904, + "loss_pixel": 0.344, + "loss_text": 2.2833, + "ppl": 13.8364, + "step": 526 + }, + { + "epoch": 0.0, + "global_step": 527, + "learning_rate": 0.000498635225375626, + "loss": 2.6256, + "loss_base2": 3.7879, + "loss_pixel": 0.3427, + "loss_text": 2.2829, + "ppl": 13.8129, + "step": 527 + }, + { + "epoch": 0.0, + "global_step": 528, + "learning_rate": 0.0004986310517529215, + "loss": 2.6134, + "loss_base2": 3.7703, + "loss_pixel": 0.3427, + "loss_text": 2.2707, + "ppl": 13.6454, + "step": 528 + }, + { + "epoch": 0.0, + "global_step": 529, + "learning_rate": 0.000498626878130217, + "loss": 2.6083, + "loss_base2": 3.763, + "loss_pixel": 0.3428, + "loss_text": 2.2656, + "ppl": 13.576, + "step": 529 + }, + { + "epoch": 0.0, + "global_step": 530, + "learning_rate": 0.0004986227045075125, + "loss": 2.5855, + "loss_base2": 3.7301, + "loss_pixel": 0.3413, + "loss_text": 2.2442, + "ppl": 13.2699, + "step": 530 + }, + { + "epoch": 0.0, + "global_step": 531, + "learning_rate": 0.000498618530884808, + "loss": 2.6073, + "loss_base2": 3.7615, + "loss_pixel": 0.3413, + "loss_text": 2.2661, + "ppl": 13.5624, + "step": 531 + }, + { + "epoch": 0.0, + "global_step": 532, + "learning_rate": 0.0004986143572621036, + "loss": 2.5935, + "loss_base2": 3.7416, + "loss_pixel": 0.3396, + "loss_text": 2.2539, + "ppl": 13.3765, + "step": 532 + }, + { + "epoch": 0.0, + "global_step": 533, + "learning_rate": 0.0004986101836393991, + "loss": 2.5952, + "loss_base2": 3.7441, + "loss_pixel": 0.3405, + "loss_text": 2.2547, + "ppl": 13.3993, + "step": 533 + }, + { + "epoch": 0.0, + "global_step": 534, + "learning_rate": 0.0004986060100166945, + "loss": 2.5793, + "loss_base2": 3.7211, + "loss_pixel": 0.3379, + "loss_text": 2.2414, + "ppl": 13.1879, + "step": 534 + }, + { + "epoch": 0.0, + "global_step": 535, + "learning_rate": 0.00049860183639399, + "loss": 2.5878, + "loss_base2": 3.7334, + "loss_pixel": 0.3375, + "loss_text": 2.2503, + "ppl": 13.3005, + "step": 535 + }, + { + "epoch": 0.0, + "global_step": 536, + "learning_rate": 0.0004985976627712855, + "loss": 2.5814, + "loss_base2": 3.7242, + "loss_pixel": 0.3376, + "loss_text": 2.2438, + "ppl": 13.2156, + "step": 536 + }, + { + "epoch": 0.0, + "global_step": 537, + "learning_rate": 0.000498593489148581, + "loss": 2.5775, + "loss_base2": 3.7185, + "loss_pixel": 0.3375, + "loss_text": 2.2401, + "ppl": 13.1642, + "step": 537 + }, + { + "epoch": 0.0, + "global_step": 538, + "learning_rate": 0.0004985893155258765, + "loss": 2.5745, + "loss_base2": 3.7142, + "loss_pixel": 0.3361, + "loss_text": 2.2385, + "ppl": 13.1248, + "step": 538 + }, + { + "epoch": 0.0, + "global_step": 539, + "learning_rate": 0.0004985851419031719, + "loss": 2.5963, + "loss_base2": 3.7457, + "loss_pixel": 0.3348, + "loss_text": 2.2615, + "ppl": 13.414, + "step": 539 + }, + { + "epoch": 0.0, + "global_step": 540, + "learning_rate": 0.0004985809682804674, + "loss": 2.5703, + "loss_base2": 3.7082, + "loss_pixel": 0.3357, + "loss_text": 2.2346, + "ppl": 13.0697, + "step": 540 + }, + { + "epoch": 0.0, + "global_step": 541, + "learning_rate": 0.0004985767946577629, + "loss": 2.5762, + "loss_base2": 3.7167, + "loss_pixel": 0.3352, + "loss_text": 2.241, + "ppl": 13.1471, + "step": 541 + }, + { + "epoch": 0.0, + "global_step": 542, + "learning_rate": 0.0004985726210350584, + "loss": 2.5586, + "loss_base2": 3.6913, + "loss_pixel": 0.3336, + "loss_text": 2.2251, + "ppl": 12.9177, + "step": 542 + }, + { + "epoch": 0.0, + "global_step": 543, + "learning_rate": 0.0004985684474123539, + "loss": 2.5508, + "loss_base2": 3.68, + "loss_pixel": 0.3336, + "loss_text": 2.2172, + "ppl": 12.8174, + "step": 543 + }, + { + "epoch": 0.0, + "global_step": 544, + "learning_rate": 0.0004985642737896494, + "loss": 2.5554, + "loss_base2": 3.6867, + "loss_pixel": 0.3331, + "loss_text": 2.2223, + "ppl": 12.8764, + "step": 544 + }, + { + "epoch": 0.0, + "global_step": 545, + "learning_rate": 0.0004985601001669449, + "loss": 2.5557, + "loss_base2": 3.6871, + "loss_pixel": 0.3315, + "loss_text": 2.2241, + "ppl": 12.8803, + "step": 545 + }, + { + "epoch": 0.0, + "global_step": 546, + "learning_rate": 0.0004985559265442404, + "loss": 2.5679, + "loss_base2": 3.7047, + "loss_pixel": 0.3324, + "loss_text": 2.2355, + "ppl": 13.0384, + "step": 546 + }, + { + "epoch": 0.0, + "global_step": 547, + "learning_rate": 0.000498551752921536, + "loss": 2.5509, + "loss_base2": 3.6802, + "loss_pixel": 0.3311, + "loss_text": 2.2198, + "ppl": 12.8186, + "step": 547 + }, + { + "epoch": 0.0, + "global_step": 548, + "learning_rate": 0.0004985475792988314, + "loss": 2.5393, + "loss_base2": 3.6634, + "loss_pixel": 0.331, + "loss_text": 2.2083, + "ppl": 12.6708, + "step": 548 + }, + { + "epoch": 0.0, + "global_step": 549, + "learning_rate": 0.0004985434056761269, + "loss": 2.5378, + "loss_base2": 3.6613, + "loss_pixel": 0.3306, + "loss_text": 2.2072, + "ppl": 12.6518, + "step": 549 + }, + { + "epoch": 0.0, + "global_step": 550, + "learning_rate": 0.0004985392320534224, + "loss": 2.5439, + "loss_base2": 3.6701, + "loss_pixel": 0.3301, + "loss_text": 2.2138, + "ppl": 12.7292, + "step": 550 + }, + { + "epoch": 0.0, + "global_step": 551, + "learning_rate": 0.0004985350584307179, + "loss": 2.5319, + "loss_base2": 3.6528, + "loss_pixel": 0.3295, + "loss_text": 2.2024, + "ppl": 12.5774, + "step": 551 + }, + { + "epoch": 0.0, + "global_step": 552, + "learning_rate": 0.0004985308848080134, + "loss": 2.5448, + "loss_base2": 3.6714, + "loss_pixel": 0.3286, + "loss_text": 2.2163, + "ppl": 12.7407, + "step": 552 + }, + { + "epoch": 0.0, + "global_step": 553, + "learning_rate": 0.0004985267111853089, + "loss": 2.5311, + "loss_base2": 3.6516, + "loss_pixel": 0.328, + "loss_text": 2.2031, + "ppl": 12.5673, + "step": 553 + }, + { + "epoch": 0.0, + "global_step": 554, + "learning_rate": 0.0004985225375626044, + "loss": 2.5226, + "loss_base2": 3.6393, + "loss_pixel": 0.3277, + "loss_text": 2.1949, + "ppl": 12.461, + "step": 554 + }, + { + "epoch": 0.0, + "global_step": 555, + "learning_rate": 0.0004985183639398999, + "loss": 2.53, + "loss_base2": 3.65, + "loss_pixel": 0.3278, + "loss_text": 2.2022, + "ppl": 12.5535, + "step": 555 + }, + { + "epoch": 0.0, + "global_step": 556, + "learning_rate": 0.0004985141903171954, + "loss": 2.5175, + "loss_base2": 3.632, + "loss_pixel": 0.3261, + "loss_text": 2.1914, + "ppl": 12.3976, + "step": 556 + }, + { + "epoch": 0.0, + "global_step": 557, + "learning_rate": 0.0004985100166944908, + "loss": 2.5392, + "loss_base2": 3.6633, + "loss_pixel": 0.326, + "loss_text": 2.2131, + "ppl": 12.6695, + "step": 557 + }, + { + "epoch": 0.0, + "global_step": 558, + "learning_rate": 0.0004985058430717863, + "loss": 2.5358, + "loss_base2": 3.6584, + "loss_pixel": 0.327, + "loss_text": 2.2087, + "ppl": 12.6265, + "step": 558 + }, + { + "epoch": 0.0, + "global_step": 559, + "learning_rate": 0.0004985016694490818, + "loss": 2.5382, + "loss_base2": 3.6618, + "loss_pixel": 0.3275, + "loss_text": 2.2106, + "ppl": 12.6569, + "step": 559 + }, + { + "epoch": 0.0, + "global_step": 560, + "learning_rate": 0.0004984974958263773, + "loss": 2.5279, + "loss_base2": 3.647, + "loss_pixel": 0.3265, + "loss_text": 2.2014, + "ppl": 12.5272, + "step": 560 + }, + { + "epoch": 0.0, + "global_step": 561, + "learning_rate": 0.0004984933222036727, + "loss": 2.5279, + "loss_base2": 3.647, + "loss_pixel": 0.3248, + "loss_text": 2.203, + "ppl": 12.5272, + "step": 561 + }, + { + "epoch": 0.0, + "global_step": 562, + "learning_rate": 0.0004984891485809682, + "loss": 2.5186, + "loss_base2": 3.6336, + "loss_pixel": 0.3244, + "loss_text": 2.1941, + "ppl": 12.4112, + "step": 562 + }, + { + "epoch": 0.0, + "global_step": 563, + "learning_rate": 0.0004984849749582637, + "loss": 2.4605, + "loss_base2": 3.5498, + "loss_pixel": 0.3246, + "loss_text": 2.1359, + "ppl": 11.7107, + "step": 563 + }, + { + "epoch": 0.0, + "global_step": 564, + "learning_rate": 0.0004984808013355593, + "loss": 2.4524, + "loss_base2": 3.5381, + "loss_pixel": 0.3256, + "loss_text": 2.1268, + "ppl": 11.6162, + "step": 564 + }, + { + "epoch": 0.0, + "global_step": 565, + "learning_rate": 0.0004984766277128548, + "loss": 2.4727, + "loss_base2": 3.5674, + "loss_pixel": 0.3324, + "loss_text": 2.1403, + "ppl": 11.8544, + "step": 565 + }, + { + "epoch": 0.0, + "global_step": 566, + "learning_rate": 0.0004984724540901503, + "loss": 2.4474, + "loss_base2": 3.5309, + "loss_pixel": 0.3322, + "loss_text": 2.1152, + "ppl": 11.5583, + "step": 566 + }, + { + "epoch": 0.0, + "global_step": 567, + "learning_rate": 0.0004984682804674458, + "loss": 2.4356, + "loss_base2": 3.5138, + "loss_pixel": 0.3308, + "loss_text": 2.1048, + "ppl": 11.4227, + "step": 567 + }, + { + "epoch": 0.0, + "global_step": 568, + "learning_rate": 0.0004984641068447413, + "loss": 2.4139, + "loss_base2": 3.4825, + "loss_pixel": 0.3303, + "loss_text": 2.0835, + "ppl": 11.1775, + "step": 568 + }, + { + "epoch": 0.0, + "global_step": 569, + "learning_rate": 0.0004984599332220368, + "loss": 2.3993, + "loss_base2": 3.4615, + "loss_pixel": 0.3292, + "loss_text": 2.0701, + "ppl": 11.0155, + "step": 569 + }, + { + "epoch": 0.0, + "global_step": 570, + "learning_rate": 0.0004984557595993322, + "loss": 2.4004, + "loss_base2": 3.463, + "loss_pixel": 0.3291, + "loss_text": 2.0713, + "ppl": 11.0276, + "step": 570 + }, + { + "epoch": 0.0, + "global_step": 571, + "learning_rate": 0.0004984515859766277, + "loss": 2.4386, + "loss_base2": 3.5182, + "loss_pixel": 0.3293, + "loss_text": 2.1093, + "ppl": 11.457, + "step": 571 + }, + { + "epoch": 0.0, + "global_step": 572, + "learning_rate": 0.0004984474123539232, + "loss": 2.6162, + "loss_base2": 3.7744, + "loss_pixel": 0.3258, + "loss_text": 2.2904, + "ppl": 13.6836, + "step": 572 + }, + { + "epoch": 0.0, + "global_step": 573, + "learning_rate": 0.0004984432387312187, + "loss": 2.6145, + "loss_base2": 3.7719, + "loss_pixel": 0.3251, + "loss_text": 2.2894, + "ppl": 13.6604, + "step": 573 + }, + { + "epoch": 0.0, + "global_step": 574, + "learning_rate": 0.0004984390651085142, + "loss": 2.624, + "loss_base2": 3.7856, + "loss_pixel": 0.3261, + "loss_text": 2.298, + "ppl": 13.7908, + "step": 574 + }, + { + "epoch": 0.0, + "global_step": 575, + "learning_rate": 0.0004984348914858097, + "loss": 2.6073, + "loss_base2": 3.7615, + "loss_pixel": 0.3258, + "loss_text": 2.2815, + "ppl": 13.5624, + "step": 575 + }, + { + "epoch": 0.0, + "global_step": 576, + "learning_rate": 0.0004984307178631051, + "loss": 2.5757, + "loss_base2": 3.7159, + "loss_pixel": 0.3245, + "loss_text": 2.2511, + "ppl": 13.1405, + "step": 576 + }, + { + "epoch": 0.0, + "global_step": 577, + "learning_rate": 0.0004984265442404006, + "loss": 2.5627, + "loss_base2": 3.6972, + "loss_pixel": 0.3228, + "loss_text": 2.2399, + "ppl": 12.9708, + "step": 577 + }, + { + "epoch": 0.0, + "global_step": 578, + "learning_rate": 0.0004984223706176961, + "loss": 2.5837, + "loss_base2": 3.7275, + "loss_pixel": 0.3262, + "loss_text": 2.2575, + "ppl": 13.2461, + "step": 578 + }, + { + "epoch": 0.0, + "global_step": 579, + "learning_rate": 0.0004984181969949916, + "loss": 2.566, + "loss_base2": 3.702, + "loss_pixel": 0.3253, + "loss_text": 2.2407, + "ppl": 13.0137, + "step": 579 + }, + { + "epoch": 0.0, + "global_step": 580, + "learning_rate": 0.0004984140233722872, + "loss": 2.5538, + "loss_base2": 3.6844, + "loss_pixel": 0.324, + "loss_text": 2.2298, + "ppl": 12.8559, + "step": 580 + }, + { + "epoch": 0.0, + "global_step": 581, + "learning_rate": 0.0004984098497495827, + "loss": 2.5445, + "loss_base2": 3.6709, + "loss_pixel": 0.3219, + "loss_text": 2.2226, + "ppl": 12.7369, + "step": 581 + }, + { + "epoch": 0.0, + "global_step": 582, + "learning_rate": 0.0004984056761268782, + "loss": 2.5336, + "loss_base2": 3.6552, + "loss_pixel": 0.3227, + "loss_text": 2.211, + "ppl": 12.5988, + "step": 582 + }, + { + "epoch": 0.0, + "global_step": 583, + "learning_rate": 0.0004984015025041737, + "loss": 2.5333, + "loss_base2": 3.6548, + "loss_pixel": 0.3204, + "loss_text": 2.2129, + "ppl": 12.595, + "step": 583 + }, + { + "epoch": 0.0, + "global_step": 584, + "learning_rate": 0.0004983973288814691, + "loss": 2.5385, + "loss_base2": 3.6623, + "loss_pixel": 0.3196, + "loss_text": 2.2189, + "ppl": 12.6607, + "step": 584 + }, + { + "epoch": 0.0, + "global_step": 585, + "learning_rate": 0.0004983931552587646, + "loss": 2.5281, + "loss_base2": 3.6473, + "loss_pixel": 0.3194, + "loss_text": 2.2087, + "ppl": 12.5297, + "step": 585 + }, + { + "epoch": 0.0, + "global_step": 586, + "learning_rate": 0.0004983889816360601, + "loss": 2.517, + "loss_base2": 3.6313, + "loss_pixel": 0.3185, + "loss_text": 2.1985, + "ppl": 12.3914, + "step": 586 + }, + { + "epoch": 0.0, + "global_step": 587, + "learning_rate": 0.0004983848080133556, + "loss": 2.5192, + "loss_base2": 3.6344, + "loss_pixel": 0.3188, + "loss_text": 2.2003, + "ppl": 12.4187, + "step": 587 + }, + { + "epoch": 0.0, + "global_step": 588, + "learning_rate": 0.0004983806343906511, + "loss": 2.5049, + "loss_base2": 3.6138, + "loss_pixel": 0.3194, + "loss_text": 2.1855, + "ppl": 12.2423, + "step": 588 + }, + { + "epoch": 0.0, + "global_step": 589, + "learning_rate": 0.0004983764607679466, + "loss": 2.5001, + "loss_base2": 3.6069, + "loss_pixel": 0.319, + "loss_text": 2.1811, + "ppl": 12.1837, + "step": 589 + }, + { + "epoch": 0.0, + "global_step": 590, + "learning_rate": 0.0004983722871452421, + "loss": 2.4894, + "loss_base2": 3.5914, + "loss_pixel": 0.3228, + "loss_text": 2.1666, + "ppl": 12.054, + "step": 590 + }, + { + "epoch": 0.0, + "global_step": 591, + "learning_rate": 0.0004983681135225376, + "loss": 2.4991, + "loss_base2": 3.6054, + "loss_pixel": 0.3176, + "loss_text": 2.1815, + "ppl": 12.1715, + "step": 591 + }, + { + "epoch": 0.0, + "global_step": 592, + "learning_rate": 0.0004983639398998331, + "loss": 2.4789, + "loss_base2": 3.5763, + "loss_pixel": 0.3194, + "loss_text": 2.1595, + "ppl": 11.9281, + "step": 592 + }, + { + "epoch": 0.0, + "global_step": 593, + "learning_rate": 0.0004983597662771285, + "loss": 2.497, + "loss_base2": 3.6024, + "loss_pixel": 0.3147, + "loss_text": 2.1823, + "ppl": 12.146, + "step": 593 + }, + { + "epoch": 0.0, + "global_step": 594, + "learning_rate": 0.000498355592654424, + "loss": 2.4771, + "loss_base2": 3.5737, + "loss_pixel": 0.3152, + "loss_text": 2.1619, + "ppl": 11.9067, + "step": 594 + }, + { + "epoch": 0.0, + "global_step": 595, + "learning_rate": 0.0004983514190317195, + "loss": 2.4825, + "loss_base2": 3.5815, + "loss_pixel": 0.3144, + "loss_text": 2.168, + "ppl": 11.9712, + "step": 595 + }, + { + "epoch": 0.0, + "global_step": 596, + "learning_rate": 0.000498347245409015, + "loss": 2.3696, + "loss_base2": 3.4186, + "loss_pixel": 0.3181, + "loss_text": 2.0516, + "ppl": 10.6931, + "step": 596 + }, + { + "epoch": 0.0, + "global_step": 597, + "learning_rate": 0.0004983430717863106, + "loss": 2.3506, + "loss_base2": 3.3912, + "loss_pixel": 0.3154, + "loss_text": 2.0352, + "ppl": 10.4919, + "step": 597 + }, + { + "epoch": 0.0, + "global_step": 598, + "learning_rate": 0.000498338898163606, + "loss": 2.3351, + "loss_base2": 3.3688, + "loss_pixel": 0.3147, + "loss_text": 2.0204, + "ppl": 10.3305, + "step": 598 + }, + { + "epoch": 0.0, + "global_step": 599, + "learning_rate": 0.0004983347245409015, + "loss": 2.3199, + "loss_base2": 3.3469, + "loss_pixel": 0.3137, + "loss_text": 2.0062, + "ppl": 10.1747, + "step": 599 + }, + { + "epoch": 0.0, + "global_step": 600, + "learning_rate": 0.000498330550918197, + "loss": 2.334, + "loss_base2": 3.3673, + "loss_pixel": 0.3163, + "loss_text": 2.0178, + "ppl": 10.3191, + "step": 600 + }, + { + "epoch": 0.0, + "global_step": 601, + "learning_rate": 0.0004983263772954925, + "loss": 2.2919, + "loss_base2": 3.3065, + "loss_pixel": 0.3162, + "loss_text": 1.9757, + "ppl": 9.8937, + "step": 601 + }, + { + "epoch": 0.0, + "global_step": 602, + "learning_rate": 0.000498322203672788, + "loss": 2.3009, + "loss_base2": 3.3195, + "loss_pixel": 0.3162, + "loss_text": 1.9847, + "ppl": 9.9832, + "step": 602 + }, + { + "epoch": 0.0, + "global_step": 603, + "learning_rate": 0.0004983180300500835, + "loss": 2.3057, + "loss_base2": 3.3264, + "loss_pixel": 0.3131, + "loss_text": 1.9926, + "ppl": 10.0312, + "step": 603 + }, + { + "epoch": 0.0, + "global_step": 604, + "learning_rate": 0.000498313856427379, + "loss": 2.2846, + "loss_base2": 3.296, + "loss_pixel": 0.3171, + "loss_text": 1.9675, + "ppl": 9.8218, + "step": 604 + }, + { + "epoch": 0.0, + "global_step": 605, + "learning_rate": 0.0004983096828046745, + "loss": 2.2688, + "loss_base2": 3.2732, + "loss_pixel": 0.3103, + "loss_text": 1.9585, + "ppl": 9.6678, + "step": 605 + }, + { + "epoch": 0.0, + "global_step": 606, + "learning_rate": 0.00049830550918197, + "loss": 2.2773, + "loss_base2": 3.2854, + "loss_pixel": 0.3092, + "loss_text": 1.9681, + "ppl": 9.7503, + "step": 606 + }, + { + "epoch": 0.0, + "global_step": 607, + "learning_rate": 0.0004983013355592654, + "loss": 2.2796, + "loss_base2": 3.2888, + "loss_pixel": 0.3105, + "loss_text": 1.9691, + "ppl": 9.7728, + "step": 607 + }, + { + "epoch": 0.0, + "global_step": 608, + "learning_rate": 0.0004982971619365609, + "loss": 2.2522, + "loss_base2": 3.2492, + "loss_pixel": 0.3077, + "loss_text": 1.9445, + "ppl": 9.5086, + "step": 608 + }, + { + "epoch": 0.0, + "global_step": 609, + "learning_rate": 0.0004982929883138564, + "loss": 2.2519, + "loss_base2": 3.2488, + "loss_pixel": 0.306, + "loss_text": 1.9459, + "ppl": 9.5058, + "step": 609 + }, + { + "epoch": 0.0, + "global_step": 610, + "learning_rate": 0.0004982888146911519, + "loss": 2.2369, + "loss_base2": 3.2272, + "loss_pixel": 0.3056, + "loss_text": 1.9313, + "ppl": 9.3643, + "step": 610 + }, + { + "epoch": 0.0, + "global_step": 611, + "learning_rate": 0.0004982846410684474, + "loss": 2.2522, + "loss_base2": 3.2492, + "loss_pixel": 0.3051, + "loss_text": 1.9471, + "ppl": 9.5086, + "step": 611 + }, + { + "epoch": 0.0, + "global_step": 612, + "learning_rate": 0.000498280467445743, + "loss": 2.4338, + "loss_base2": 3.5112, + "loss_pixel": 0.3048, + "loss_text": 2.129, + "ppl": 11.4021, + "step": 612 + }, + { + "epoch": 0.0, + "global_step": 613, + "learning_rate": 0.0004982762938230384, + "loss": 2.5036, + "loss_base2": 3.6119, + "loss_pixel": 0.3043, + "loss_text": 2.1993, + "ppl": 12.2264, + "step": 613 + }, + { + "epoch": 0.0, + "global_step": 614, + "learning_rate": 0.0004982721202003339, + "loss": 2.4944, + "loss_base2": 3.5987, + "loss_pixel": 0.3035, + "loss_text": 2.1909, + "ppl": 12.1145, + "step": 614 + }, + { + "epoch": 0.0, + "global_step": 615, + "learning_rate": 0.0004982679465776294, + "loss": 2.4945, + "loss_base2": 3.5988, + "loss_pixel": 0.3021, + "loss_text": 2.1923, + "ppl": 12.1157, + "step": 615 + }, + { + "epoch": 0.0, + "global_step": 616, + "learning_rate": 0.0004982637729549249, + "loss": 2.4799, + "loss_base2": 3.5777, + "loss_pixel": 0.3014, + "loss_text": 2.1786, + "ppl": 11.9401, + "step": 616 + }, + { + "epoch": 0.0, + "global_step": 617, + "learning_rate": 0.0004982595993322204, + "loss": 2.4849, + "loss_base2": 3.585, + "loss_pixel": 0.3003, + "loss_text": 2.1847, + "ppl": 11.9999, + "step": 617 + }, + { + "epoch": 0.0, + "global_step": 618, + "learning_rate": 0.0004982554257095159, + "loss": 2.4742, + "loss_base2": 3.5695, + "loss_pixel": 0.3001, + "loss_text": 2.1741, + "ppl": 11.8722, + "step": 618 + }, + { + "epoch": 0.0, + "global_step": 619, + "learning_rate": 0.0004982512520868114, + "loss": 2.4679, + "loss_base2": 3.5604, + "loss_pixel": 0.3006, + "loss_text": 2.1674, + "ppl": 11.7976, + "step": 619 + }, + { + "epoch": 0.0, + "global_step": 620, + "learning_rate": 0.0004982470784641068, + "loss": 2.4653, + "loss_base2": 3.5567, + "loss_pixel": 0.3005, + "loss_text": 2.1648, + "ppl": 11.767, + "step": 620 + }, + { + "epoch": 0.0, + "global_step": 621, + "learning_rate": 0.0004982429048414023, + "loss": 2.4598, + "loss_base2": 3.5487, + "loss_pixel": 0.3, + "loss_text": 2.1598, + "ppl": 11.7025, + "step": 621 + }, + { + "epoch": 0.0, + "global_step": 622, + "learning_rate": 0.0004982387312186978, + "loss": 2.4561, + "loss_base2": 3.5434, + "loss_pixel": 0.2998, + "loss_text": 2.1563, + "ppl": 11.6593, + "step": 622 + }, + { + "epoch": 0.0, + "global_step": 623, + "learning_rate": 0.0004982345575959933, + "loss": 2.4585, + "loss_base2": 3.5469, + "loss_pixel": 0.3015, + "loss_text": 2.157, + "ppl": 11.6873, + "step": 623 + }, + { + "epoch": 0.0, + "global_step": 624, + "learning_rate": 0.0004982303839732888, + "loss": 2.4602, + "loss_base2": 3.5493, + "loss_pixel": 0.3147, + "loss_text": 2.1455, + "ppl": 11.7072, + "step": 624 + }, + { + "epoch": 0.0, + "global_step": 625, + "learning_rate": 0.0004982262103505843, + "loss": 2.4892, + "loss_base2": 3.5912, + "loss_pixel": 0.3264, + "loss_text": 2.1628, + "ppl": 12.0516, + "step": 625 + }, + { + "epoch": 0.0, + "global_step": 626, + "learning_rate": 0.0004982220367278798, + "loss": 2.4662, + "loss_base2": 3.558, + "loss_pixel": 0.32, + "loss_text": 2.1462, + "ppl": 11.7776, + "step": 626 + }, + { + "epoch": 0.0, + "global_step": 627, + "learning_rate": 0.0004982178631051753, + "loss": 2.4588, + "loss_base2": 3.5473, + "loss_pixel": 0.3163, + "loss_text": 2.1425, + "ppl": 11.6908, + "step": 627 + }, + { + "epoch": 0.0, + "global_step": 628, + "learning_rate": 0.0004982136894824709, + "loss": 2.458, + "loss_base2": 3.5461, + "loss_pixel": 0.3139, + "loss_text": 2.1441, + "ppl": 11.6814, + "step": 628 + }, + { + "epoch": 0.0, + "global_step": 629, + "learning_rate": 0.0004982095158597663, + "loss": 2.4624, + "loss_base2": 3.5525, + "loss_pixel": 0.3139, + "loss_text": 2.1484, + "ppl": 11.7329, + "step": 629 + }, + { + "epoch": 0.0, + "global_step": 630, + "learning_rate": 0.0004982053422370618, + "loss": 2.4565, + "loss_base2": 3.544, + "loss_pixel": 0.3111, + "loss_text": 2.1454, + "ppl": 11.6639, + "step": 630 + }, + { + "epoch": 0.0, + "global_step": 631, + "learning_rate": 0.0004982011686143573, + "loss": 2.4371, + "loss_base2": 3.516, + "loss_pixel": 0.3095, + "loss_text": 2.1276, + "ppl": 11.4398, + "step": 631 + }, + { + "epoch": 0.0, + "global_step": 632, + "learning_rate": 0.0004981969949916528, + "loss": 2.4345, + "loss_base2": 3.5122, + "loss_pixel": 0.3072, + "loss_text": 2.1273, + "ppl": 11.4101, + "step": 632 + }, + { + "epoch": 0.0, + "global_step": 633, + "learning_rate": 0.0004981928213689483, + "loss": 2.4231, + "loss_base2": 3.4958, + "loss_pixel": 0.3052, + "loss_text": 2.1179, + "ppl": 11.2808, + "step": 633 + }, + { + "epoch": 0.0, + "global_step": 634, + "learning_rate": 0.0004981886477462437, + "loss": 2.4399, + "loss_base2": 3.52, + "loss_pixel": 0.3032, + "loss_text": 2.1367, + "ppl": 11.4719, + "step": 634 + }, + { + "epoch": 0.0, + "global_step": 635, + "learning_rate": 0.0004981844741235392, + "loss": 2.4351, + "loss_base2": 3.5131, + "loss_pixel": 0.3027, + "loss_text": 2.1324, + "ppl": 11.417, + "step": 635 + }, + { + "epoch": 0.0, + "global_step": 636, + "learning_rate": 0.0004981803005008347, + "loss": 2.4184, + "loss_base2": 3.489, + "loss_pixel": 0.3011, + "loss_text": 2.1173, + "ppl": 11.2279, + "step": 636 + }, + { + "epoch": 0.0, + "global_step": 637, + "learning_rate": 0.0004981761268781302, + "loss": 2.4223, + "loss_base2": 3.4946, + "loss_pixel": 0.301, + "loss_text": 2.1213, + "ppl": 11.2718, + "step": 637 + }, + { + "epoch": 0.0, + "global_step": 638, + "learning_rate": 0.0004981719532554257, + "loss": 2.4245, + "loss_base2": 3.4978, + "loss_pixel": 0.2983, + "loss_text": 2.1262, + "ppl": 11.2966, + "step": 638 + }, + { + "epoch": 0.0, + "global_step": 639, + "learning_rate": 0.0004981677796327212, + "loss": 2.4113, + "loss_base2": 3.4788, + "loss_pixel": 0.2984, + "loss_text": 2.1129, + "ppl": 11.1484, + "step": 639 + }, + { + "epoch": 0.0, + "global_step": 640, + "learning_rate": 0.0004981636060100167, + "loss": 2.4037, + "loss_base2": 3.4678, + "loss_pixel": 0.2983, + "loss_text": 2.1054, + "ppl": 11.064, + "step": 640 + }, + { + "epoch": 0.0, + "global_step": 641, + "learning_rate": 0.0004981594323873122, + "loss": 2.4072, + "loss_base2": 3.4729, + "loss_pixel": 0.2967, + "loss_text": 2.1104, + "ppl": 11.1028, + "step": 641 + }, + { + "epoch": 0.0, + "global_step": 642, + "learning_rate": 0.0004981552587646077, + "loss": 2.4037, + "loss_base2": 3.4678, + "loss_pixel": 0.2968, + "loss_text": 2.1069, + "ppl": 11.064, + "step": 642 + }, + { + "epoch": 0.0, + "global_step": 643, + "learning_rate": 0.0004981510851419031, + "loss": 2.3973, + "loss_base2": 3.4586, + "loss_pixel": 0.2957, + "loss_text": 2.1016, + "ppl": 10.9935, + "step": 643 + }, + { + "epoch": 0.0, + "global_step": 644, + "learning_rate": 0.0004981469115191986, + "loss": 2.3897, + "loss_base2": 3.4476, + "loss_pixel": 0.2959, + "loss_text": 2.0939, + "ppl": 10.9102, + "step": 644 + }, + { + "epoch": 0.0, + "global_step": 645, + "learning_rate": 0.0004981427378964942, + "loss": 2.3874, + "loss_base2": 3.4443, + "loss_pixel": 0.2978, + "loss_text": 2.0896, + "ppl": 10.8852, + "step": 645 + }, + { + "epoch": 0.0, + "global_step": 646, + "learning_rate": 0.0004981385642737897, + "loss": 2.3934, + "loss_base2": 3.4529, + "loss_pixel": 0.297, + "loss_text": 2.0965, + "ppl": 10.9507, + "step": 646 + }, + { + "epoch": 0.0, + "global_step": 647, + "learning_rate": 0.0004981343906510852, + "loss": 2.3936, + "loss_base2": 3.4532, + "loss_pixel": 0.2945, + "loss_text": 2.0991, + "ppl": 10.9529, + "step": 647 + }, + { + "epoch": 0.0, + "global_step": 648, + "learning_rate": 0.0004981302170283807, + "loss": 2.388, + "loss_base2": 3.4452, + "loss_pixel": 0.294, + "loss_text": 2.094, + "ppl": 10.8917, + "step": 648 + }, + { + "epoch": 0.0, + "global_step": 649, + "learning_rate": 0.0004981260434056762, + "loss": 2.4112, + "loss_base2": 3.4786, + "loss_pixel": 0.2933, + "loss_text": 2.118, + "ppl": 11.1473, + "step": 649 + }, + { + "epoch": 0.0, + "global_step": 650, + "learning_rate": 0.0004981218697829717, + "loss": 2.4091, + "loss_base2": 3.4756, + "loss_pixel": 0.2941, + "loss_text": 2.115, + "ppl": 11.1239, + "step": 650 + }, + { + "epoch": 0.0, + "global_step": 651, + "learning_rate": 0.0004981176961602671, + "loss": 2.3809, + "loss_base2": 3.4349, + "loss_pixel": 0.293, + "loss_text": 2.0879, + "ppl": 10.8146, + "step": 651 + }, + { + "epoch": 0.0, + "global_step": 652, + "learning_rate": 0.0004981135225375626, + "loss": 2.3754, + "loss_base2": 3.427, + "loss_pixel": 0.292, + "loss_text": 2.0833, + "ppl": 10.7553, + "step": 652 + }, + { + "epoch": 0.0, + "global_step": 653, + "learning_rate": 0.0004981093489148581, + "loss": 2.3768, + "loss_base2": 3.429, + "loss_pixel": 0.2908, + "loss_text": 2.086, + "ppl": 10.7704, + "step": 653 + }, + { + "epoch": 0.0, + "global_step": 654, + "learning_rate": 0.0004981051752921536, + "loss": 2.3683, + "loss_base2": 3.4167, + "loss_pixel": 0.2924, + "loss_text": 2.0759, + "ppl": 10.6792, + "step": 654 + }, + { + "epoch": 0.0, + "global_step": 655, + "learning_rate": 0.0004981010016694491, + "loss": 2.3833, + "loss_base2": 3.4384, + "loss_pixel": 0.2897, + "loss_text": 2.0936, + "ppl": 10.8406, + "step": 655 + }, + { + "epoch": 0.0, + "global_step": 656, + "learning_rate": 0.0004980968280467446, + "loss": 2.3763, + "loss_base2": 3.4283, + "loss_pixel": 0.2913, + "loss_text": 2.0851, + "ppl": 10.765, + "step": 656 + }, + { + "epoch": 0.0, + "global_step": 657, + "learning_rate": 0.00049809265442404, + "loss": 2.3535, + "loss_base2": 3.3954, + "loss_pixel": 0.2901, + "loss_text": 2.0634, + "ppl": 10.5223, + "step": 657 + }, + { + "epoch": 0.0, + "global_step": 658, + "learning_rate": 0.0004980884808013355, + "loss": 2.2166, + "loss_base2": 3.1979, + "loss_pixel": 0.2897, + "loss_text": 1.9269, + "ppl": 9.1761, + "step": 658 + }, + { + "epoch": 0.0, + "global_step": 659, + "learning_rate": 0.000498084307178631, + "loss": 2.1914, + "loss_base2": 3.1615, + "loss_pixel": 0.2891, + "loss_text": 1.9023, + "ppl": 8.9477, + "step": 659 + }, + { + "epoch": 0.0, + "global_step": 660, + "learning_rate": 0.0004980801335559265, + "loss": 2.2251, + "loss_base2": 3.2101, + "loss_pixel": 0.2887, + "loss_text": 1.9364, + "ppl": 9.2544, + "step": 660 + }, + { + "epoch": 0.0, + "global_step": 661, + "learning_rate": 0.000498075959933222, + "loss": 2.2293, + "loss_base2": 3.2162, + "loss_pixel": 0.2881, + "loss_text": 1.9412, + "ppl": 9.2934, + "step": 661 + }, + { + "epoch": 0.0, + "global_step": 662, + "learning_rate": 0.0004980717863105176, + "loss": 2.2303, + "loss_base2": 3.2176, + "loss_pixel": 0.2881, + "loss_text": 1.9422, + "ppl": 9.3027, + "step": 662 + }, + { + "epoch": 0.0, + "global_step": 663, + "learning_rate": 0.0004980676126878131, + "loss": 2.207, + "loss_base2": 3.184, + "loss_pixel": 0.2889, + "loss_text": 1.9181, + "ppl": 9.0884, + "step": 663 + }, + { + "epoch": 0.0, + "global_step": 664, + "learning_rate": 0.0004980634390651086, + "loss": 2.1983, + "loss_base2": 3.1715, + "loss_pixel": 0.2912, + "loss_text": 1.907, + "ppl": 9.0097, + "step": 664 + }, + { + "epoch": 0.0, + "global_step": 665, + "learning_rate": 0.0004980592654424041, + "loss": 2.2012, + "loss_base2": 3.1757, + "loss_pixel": 0.2902, + "loss_text": 1.911, + "ppl": 9.0359, + "step": 665 + }, + { + "epoch": 0.0, + "global_step": 666, + "learning_rate": 0.0004980550918196995, + "loss": 2.4096, + "loss_base2": 3.4763, + "loss_pixel": 0.2913, + "loss_text": 2.1183, + "ppl": 11.1295, + "step": 666 + }, + { + "epoch": 0.0, + "global_step": 667, + "learning_rate": 0.000498050918196995, + "loss": 2.4457, + "loss_base2": 3.5284, + "loss_pixel": 0.2896, + "loss_text": 2.1561, + "ppl": 11.5386, + "step": 667 + }, + { + "epoch": 0.0, + "global_step": 668, + "learning_rate": 0.0004980467445742905, + "loss": 2.46, + "loss_base2": 3.549, + "loss_pixel": 0.2874, + "loss_text": 2.1725, + "ppl": 11.7048, + "step": 668 + }, + { + "epoch": 0.0, + "global_step": 669, + "learning_rate": 0.000498042570951586, + "loss": 2.457, + "loss_base2": 3.5447, + "loss_pixel": 0.2866, + "loss_text": 2.1704, + "ppl": 11.6697, + "step": 669 + }, + { + "epoch": 0.0, + "global_step": 670, + "learning_rate": 0.0004980383973288814, + "loss": 2.4339, + "loss_base2": 3.5114, + "loss_pixel": 0.2877, + "loss_text": 2.1462, + "ppl": 11.4033, + "step": 670 + }, + { + "epoch": 0.0, + "global_step": 671, + "learning_rate": 0.0004980342237061769, + "loss": 2.426, + "loss_base2": 3.5, + "loss_pixel": 0.2872, + "loss_text": 2.1388, + "ppl": 11.3135, + "step": 671 + }, + { + "epoch": 0.0, + "global_step": 672, + "learning_rate": 0.0004980300500834724, + "loss": 2.4298, + "loss_base2": 3.5055, + "loss_pixel": 0.2847, + "loss_text": 2.1451, + "ppl": 11.3566, + "step": 672 + }, + { + "epoch": 0.0, + "global_step": 673, + "learning_rate": 0.0004980258764607679, + "loss": 2.4056, + "loss_base2": 3.4705, + "loss_pixel": 0.2864, + "loss_text": 2.1192, + "ppl": 11.0851, + "step": 673 + }, + { + "epoch": 0.0, + "global_step": 674, + "learning_rate": 0.0004980217028380634, + "loss": 2.3963, + "loss_base2": 3.4571, + "loss_pixel": 0.2862, + "loss_text": 2.1101, + "ppl": 10.9825, + "step": 674 + }, + { + "epoch": 0.0, + "global_step": 675, + "learning_rate": 0.0004980175292153589, + "loss": 2.3936, + "loss_base2": 3.4532, + "loss_pixel": 0.2865, + "loss_text": 2.107, + "ppl": 10.9529, + "step": 675 + }, + { + "epoch": 0.0, + "global_step": 676, + "learning_rate": 0.0004980133555926544, + "loss": 2.3911, + "loss_base2": 3.4496, + "loss_pixel": 0.2862, + "loss_text": 2.105, + "ppl": 10.9255, + "step": 676 + }, + { + "epoch": 0.0, + "global_step": 677, + "learning_rate": 0.00049800918196995, + "loss": 2.4072, + "loss_base2": 3.4729, + "loss_pixel": 0.2858, + "loss_text": 2.1214, + "ppl": 11.1028, + "step": 677 + }, + { + "epoch": 0.0, + "global_step": 678, + "learning_rate": 0.0004980050083472455, + "loss": 2.3925, + "loss_base2": 3.4516, + "loss_pixel": 0.2856, + "loss_text": 2.1069, + "ppl": 10.9408, + "step": 678 + }, + { + "epoch": 0.0, + "global_step": 679, + "learning_rate": 0.0004980008347245409, + "loss": 2.3695, + "loss_base2": 3.4185, + "loss_pixel": 0.2842, + "loss_text": 2.0853, + "ppl": 10.692, + "step": 679 + }, + { + "epoch": 0.0, + "global_step": 680, + "learning_rate": 0.0004979966611018364, + "loss": 2.3947, + "loss_base2": 3.4548, + "loss_pixel": 0.2835, + "loss_text": 2.1112, + "ppl": 10.9649, + "step": 680 + }, + { + "epoch": 0.0, + "global_step": 681, + "learning_rate": 0.0004979924874791319, + "loss": 2.3821, + "loss_base2": 3.4366, + "loss_pixel": 0.283, + "loss_text": 2.0991, + "ppl": 10.8276, + "step": 681 + }, + { + "epoch": 0.0, + "global_step": 682, + "learning_rate": 0.0004979883138564274, + "loss": 2.372, + "loss_base2": 3.4221, + "loss_pixel": 0.2822, + "loss_text": 2.0898, + "ppl": 10.7188, + "step": 682 + }, + { + "epoch": 0.0, + "global_step": 683, + "learning_rate": 0.0004979841402337229, + "loss": 2.3741, + "loss_base2": 3.4251, + "loss_pixel": 0.282, + "loss_text": 2.0921, + "ppl": 10.7413, + "step": 683 + }, + { + "epoch": 0.0, + "global_step": 684, + "learning_rate": 0.0004979799666110184, + "loss": 2.3641, + "loss_base2": 3.4107, + "loss_pixel": 0.2818, + "loss_text": 2.0823, + "ppl": 10.6345, + "step": 684 + }, + { + "epoch": 0.0, + "global_step": 685, + "learning_rate": 0.0004979757929883139, + "loss": 2.3758, + "loss_base2": 3.4276, + "loss_pixel": 0.281, + "loss_text": 2.0948, + "ppl": 10.7596, + "step": 685 + }, + { + "epoch": 0.0, + "global_step": 686, + "learning_rate": 0.0004979716193656094, + "loss": 2.3715, + "loss_base2": 3.4214, + "loss_pixel": 0.2806, + "loss_text": 2.0909, + "ppl": 10.7135, + "step": 686 + }, + { + "epoch": 0.0, + "global_step": 687, + "learning_rate": 0.0004979674457429049, + "loss": 2.341, + "loss_base2": 3.3773, + "loss_pixel": 0.2799, + "loss_text": 2.0611, + "ppl": 10.3916, + "step": 687 + }, + { + "epoch": 0.0, + "global_step": 688, + "learning_rate": 0.0004979632721202003, + "loss": 2.3496, + "loss_base2": 3.3898, + "loss_pixel": 0.2797, + "loss_text": 2.07, + "ppl": 10.4814, + "step": 688 + }, + { + "epoch": 0.0, + "global_step": 689, + "learning_rate": 0.0004979590984974958, + "loss": 2.3592, + "loss_base2": 3.4036, + "loss_pixel": 0.2786, + "loss_text": 2.0806, + "ppl": 10.5825, + "step": 689 + }, + { + "epoch": 0.0, + "global_step": 690, + "learning_rate": 0.0004979549248747913, + "loss": 2.3643, + "loss_base2": 3.411, + "loss_pixel": 0.2789, + "loss_text": 2.0854, + "ppl": 10.6366, + "step": 690 + }, + { + "epoch": 0.0, + "global_step": 691, + "learning_rate": 0.0004979507512520868, + "loss": 2.3383, + "loss_base2": 3.3735, + "loss_pixel": 0.2777, + "loss_text": 2.0606, + "ppl": 10.3636, + "step": 691 + }, + { + "epoch": 0.0, + "global_step": 692, + "learning_rate": 0.0004979465776293823, + "loss": 2.3465, + "loss_base2": 3.3853, + "loss_pixel": 0.2773, + "loss_text": 2.0693, + "ppl": 10.4489, + "step": 692 + }, + { + "epoch": 0.0, + "global_step": 693, + "learning_rate": 0.0004979424040066777, + "loss": 2.3299, + "loss_base2": 3.3613, + "loss_pixel": 0.2765, + "loss_text": 2.0533, + "ppl": 10.2769, + "step": 693 + }, + { + "epoch": 0.0, + "global_step": 694, + "learning_rate": 0.0004979382303839733, + "loss": 2.3317, + "loss_base2": 3.3639, + "loss_pixel": 0.2771, + "loss_text": 2.0546, + "ppl": 10.2954, + "step": 694 + }, + { + "epoch": 0.0, + "global_step": 695, + "learning_rate": 0.0004979340567612688, + "loss": 2.3323, + "loss_base2": 3.3648, + "loss_pixel": 0.2774, + "loss_text": 2.0549, + "ppl": 10.3016, + "step": 695 + }, + { + "epoch": 0.0, + "global_step": 696, + "learning_rate": 0.0004979298831385643, + "loss": 2.334, + "loss_base2": 3.3673, + "loss_pixel": 0.2783, + "loss_text": 2.0557, + "ppl": 10.3191, + "step": 696 + }, + { + "epoch": 0.0, + "global_step": 697, + "learning_rate": 0.0004979257095158598, + "loss": 2.3404, + "loss_base2": 3.3765, + "loss_pixel": 0.28, + "loss_text": 2.0604, + "ppl": 10.3854, + "step": 697 + }, + { + "epoch": 0.0, + "global_step": 698, + "learning_rate": 0.0004979215358931553, + "loss": 2.356, + "loss_base2": 3.399, + "loss_pixel": 0.2842, + "loss_text": 2.0718, + "ppl": 10.5487, + "step": 698 + }, + { + "epoch": 0.0, + "global_step": 699, + "learning_rate": 0.0004979173622704508, + "loss": 2.3171, + "loss_base2": 3.3429, + "loss_pixel": 0.2796, + "loss_text": 2.0375, + "ppl": 10.1462, + "step": 699 + }, + { + "epoch": 0.0, + "global_step": 700, + "learning_rate": 0.0004979131886477463, + "loss": 2.3285, + "loss_base2": 3.3593, + "loss_pixel": 0.2811, + "loss_text": 2.0474, + "ppl": 10.2625, + "step": 700 + }, + { + "epoch": 0.0, + "global_step": 701, + "learning_rate": 0.0004979090150250418, + "loss": 2.3287, + "loss_base2": 3.3596, + "loss_pixel": 0.2783, + "loss_text": 2.0504, + "ppl": 10.2646, + "step": 701 + }, + { + "epoch": 0.0, + "global_step": 702, + "learning_rate": 0.0004979048414023372, + "loss": 2.3364, + "loss_base2": 3.3707, + "loss_pixel": 0.2779, + "loss_text": 2.0585, + "ppl": 10.3439, + "step": 702 + }, + { + "epoch": 0.0, + "global_step": 703, + "learning_rate": 0.0004979006677796327, + "loss": 2.3341, + "loss_base2": 3.3674, + "loss_pixel": 0.2778, + "loss_text": 2.0562, + "ppl": 10.3202, + "step": 703 + }, + { + "epoch": 0.0, + "global_step": 704, + "learning_rate": 0.0004978964941569282, + "loss": 2.3227, + "loss_base2": 3.3509, + "loss_pixel": 0.2767, + "loss_text": 2.046, + "ppl": 10.2032, + "step": 704 + }, + { + "epoch": 0.0, + "global_step": 705, + "learning_rate": 0.0004978923205342237, + "loss": 2.3138, + "loss_base2": 3.3381, + "loss_pixel": 0.277, + "loss_text": 2.0367, + "ppl": 10.1128, + "step": 705 + }, + { + "epoch": 0.0, + "global_step": 706, + "learning_rate": 0.0004978881469115192, + "loss": 2.3095, + "loss_base2": 3.3319, + "loss_pixel": 0.2758, + "loss_text": 2.0337, + "ppl": 10.0694, + "step": 706 + }, + { + "epoch": 0.0, + "global_step": 707, + "learning_rate": 0.0004978839732888146, + "loss": 2.3143, + "loss_base2": 3.3388, + "loss_pixel": 0.2757, + "loss_text": 2.0387, + "ppl": 10.1178, + "step": 707 + }, + { + "epoch": 0.0, + "global_step": 708, + "learning_rate": 0.0004978797996661101, + "loss": 2.3198, + "loss_base2": 3.3468, + "loss_pixel": 0.2766, + "loss_text": 2.0431, + "ppl": 10.1736, + "step": 708 + }, + { + "epoch": 0.0, + "global_step": 709, + "learning_rate": 0.0004978756260434056, + "loss": 2.3176, + "loss_base2": 3.3436, + "loss_pixel": 0.276, + "loss_text": 2.0415, + "ppl": 10.1513, + "step": 709 + }, + { + "epoch": 0.0, + "global_step": 710, + "learning_rate": 0.0004978714524207012, + "loss": 2.3179, + "loss_base2": 3.344, + "loss_pixel": 0.2744, + "loss_text": 2.0434, + "ppl": 10.1543, + "step": 710 + }, + { + "epoch": 0.0, + "global_step": 711, + "learning_rate": 0.0004978672787979967, + "loss": 2.3088, + "loss_base2": 3.3309, + "loss_pixel": 0.2753, + "loss_text": 2.0336, + "ppl": 10.0623, + "step": 711 + }, + { + "epoch": 0.0, + "global_step": 712, + "learning_rate": 0.0004978631051752922, + "loss": 2.3321, + "loss_base2": 3.3645, + "loss_pixel": 0.2811, + "loss_text": 2.0509, + "ppl": 10.2995, + "step": 712 + }, + { + "epoch": 0.0, + "global_step": 713, + "learning_rate": 0.0004978589315525877, + "loss": 2.3168, + "loss_base2": 3.3424, + "loss_pixel": 0.2799, + "loss_text": 2.0369, + "ppl": 10.1432, + "step": 713 + }, + { + "epoch": 0.0, + "global_step": 714, + "learning_rate": 0.0004978547579298832, + "loss": 2.3162, + "loss_base2": 3.3416, + "loss_pixel": 0.2799, + "loss_text": 2.0362, + "ppl": 10.1371, + "step": 714 + }, + { + "epoch": 0.0, + "global_step": 715, + "learning_rate": 0.0004978505843071787, + "loss": 2.2969, + "loss_base2": 3.3137, + "loss_pixel": 0.2763, + "loss_text": 2.0206, + "ppl": 9.9433, + "step": 715 + }, + { + "epoch": 0.0, + "global_step": 716, + "learning_rate": 0.0004978464106844741, + "loss": 2.311, + "loss_base2": 3.3341, + "loss_pixel": 0.2777, + "loss_text": 2.0333, + "ppl": 10.0845, + "step": 716 + }, + { + "epoch": 0.0, + "global_step": 717, + "learning_rate": 0.0004978422370617696, + "loss": 2.3156, + "loss_base2": 3.3407, + "loss_pixel": 0.276, + "loss_text": 2.0397, + "ppl": 10.131, + "step": 717 + }, + { + "epoch": 0.0, + "global_step": 718, + "learning_rate": 0.0004978380634390651, + "loss": 2.3157, + "loss_base2": 3.3408, + "loss_pixel": 0.2771, + "loss_text": 2.0386, + "ppl": 10.132, + "step": 718 + }, + { + "epoch": 0.0, + "global_step": 719, + "learning_rate": 0.0004978338898163606, + "loss": 2.3595, + "loss_base2": 3.404, + "loss_pixel": 0.2774, + "loss_text": 2.0821, + "ppl": 10.5857, + "step": 719 + }, + { + "epoch": 0.0, + "global_step": 720, + "learning_rate": 0.0004978297161936561, + "loss": 2.3318, + "loss_base2": 3.3641, + "loss_pixel": 0.2755, + "loss_text": 2.0562, + "ppl": 10.2965, + "step": 720 + }, + { + "epoch": 0.0, + "global_step": 721, + "learning_rate": 0.0004978255425709516, + "loss": 2.34, + "loss_base2": 3.3759, + "loss_pixel": 0.2743, + "loss_text": 2.0657, + "ppl": 10.3812, + "step": 721 + }, + { + "epoch": 0.0, + "global_step": 722, + "learning_rate": 0.0004978213689482471, + "loss": 2.3215, + "loss_base2": 3.3492, + "loss_pixel": 0.2737, + "loss_text": 2.0478, + "ppl": 10.1909, + "step": 722 + }, + { + "epoch": 0.0, + "global_step": 723, + "learning_rate": 0.0004978171953255426, + "loss": 2.3552, + "loss_base2": 3.3978, + "loss_pixel": 0.2733, + "loss_text": 2.0819, + "ppl": 10.5402, + "step": 723 + }, + { + "epoch": 0.0, + "global_step": 724, + "learning_rate": 0.0004978130217028381, + "loss": 2.3404, + "loss_base2": 3.3765, + "loss_pixel": 0.2726, + "loss_text": 2.0677, + "ppl": 10.3854, + "step": 724 + }, + { + "epoch": 0.0, + "global_step": 725, + "learning_rate": 0.0004978088480801335, + "loss": 2.3251, + "loss_base2": 3.3544, + "loss_pixel": 0.2718, + "loss_text": 2.0533, + "ppl": 10.2277, + "step": 725 + }, + { + "epoch": 0.0, + "global_step": 726, + "learning_rate": 0.000497804674457429, + "loss": 2.3438, + "loss_base2": 3.3814, + "loss_pixel": 0.2709, + "loss_text": 2.0729, + "ppl": 10.4208, + "step": 726 + }, + { + "epoch": 0.0, + "global_step": 727, + "learning_rate": 0.0004978005008347246, + "loss": 2.3455, + "loss_base2": 3.3838, + "loss_pixel": 0.2707, + "loss_text": 2.0748, + "ppl": 10.4385, + "step": 727 + }, + { + "epoch": 0.0, + "global_step": 728, + "learning_rate": 0.0004977963272120201, + "loss": 2.3218, + "loss_base2": 3.3496, + "loss_pixel": 0.2696, + "loss_text": 2.0522, + "ppl": 10.194, + "step": 728 + }, + { + "epoch": 0.0, + "global_step": 729, + "learning_rate": 0.0004977921535893155, + "loss": 2.3013, + "loss_base2": 3.3201, + "loss_pixel": 0.2708, + "loss_text": 2.0305, + "ppl": 9.9872, + "step": 729 + }, + { + "epoch": 0.0, + "global_step": 730, + "learning_rate": 0.000497787979966611, + "loss": 2.3321, + "loss_base2": 3.3645, + "loss_pixel": 0.2735, + "loss_text": 2.0586, + "ppl": 10.2995, + "step": 730 + }, + { + "epoch": 0.0, + "global_step": 731, + "learning_rate": 0.0004977838063439065, + "loss": 2.3207, + "loss_base2": 3.3481, + "loss_pixel": 0.2775, + "loss_text": 2.0432, + "ppl": 10.1828, + "step": 731 + }, + { + "epoch": 0.0, + "global_step": 732, + "learning_rate": 0.000497779632721202, + "loss": 2.3109, + "loss_base2": 3.3339, + "loss_pixel": 0.274, + "loss_text": 2.0369, + "ppl": 10.0835, + "step": 732 + }, + { + "epoch": 0.0, + "global_step": 733, + "learning_rate": 0.0004977754590984975, + "loss": 2.3257, + "loss_base2": 3.3553, + "loss_pixel": 0.2743, + "loss_text": 2.0514, + "ppl": 10.2338, + "step": 733 + }, + { + "epoch": 0.0, + "global_step": 734, + "learning_rate": 0.000497771285475793, + "loss": 2.2998, + "loss_base2": 3.3179, + "loss_pixel": 0.2734, + "loss_text": 2.0264, + "ppl": 9.9722, + "step": 734 + }, + { + "epoch": 0.0, + "global_step": 735, + "learning_rate": 0.0004977671118530885, + "loss": 2.2965, + "loss_base2": 3.3131, + "loss_pixel": 0.2712, + "loss_text": 2.0253, + "ppl": 9.9393, + "step": 735 + }, + { + "epoch": 0.0, + "global_step": 736, + "learning_rate": 0.000497762938230384, + "loss": 2.3037, + "loss_base2": 3.3235, + "loss_pixel": 0.2707, + "loss_text": 2.033, + "ppl": 10.0112, + "step": 736 + }, + { + "epoch": 0.0, + "global_step": 737, + "learning_rate": 0.0004977587646076795, + "loss": 2.2863, + "loss_base2": 3.2984, + "loss_pixel": 0.2701, + "loss_text": 2.0162, + "ppl": 9.8385, + "step": 737 + }, + { + "epoch": 0.0, + "global_step": 738, + "learning_rate": 0.0004977545909849749, + "loss": 2.3082, + "loss_base2": 3.33, + "loss_pixel": 0.2695, + "loss_text": 2.0387, + "ppl": 10.0563, + "step": 738 + }, + { + "epoch": 0.0, + "global_step": 739, + "learning_rate": 0.0004977504173622704, + "loss": 2.2889, + "loss_base2": 3.3022, + "loss_pixel": 0.2702, + "loss_text": 2.0188, + "ppl": 9.8641, + "step": 739 + }, + { + "epoch": 0.0, + "global_step": 740, + "learning_rate": 0.0004977462437395659, + "loss": 2.2901, + "loss_base2": 3.3039, + "loss_pixel": 0.2679, + "loss_text": 2.0222, + "ppl": 9.8759, + "step": 740 + }, + { + "epoch": 0.0, + "global_step": 741, + "learning_rate": 0.0004977420701168614, + "loss": 2.2688, + "loss_base2": 3.2732, + "loss_pixel": 0.2681, + "loss_text": 2.0008, + "ppl": 9.6678, + "step": 741 + }, + { + "epoch": 0.0, + "global_step": 742, + "learning_rate": 0.000497737896494157, + "loss": 2.2904, + "loss_base2": 3.3043, + "loss_pixel": 0.2687, + "loss_text": 2.0216, + "ppl": 9.8789, + "step": 742 + }, + { + "epoch": 0.0, + "global_step": 743, + "learning_rate": 0.0004977337228714525, + "loss": 2.2821, + "loss_base2": 3.2924, + "loss_pixel": 0.268, + "loss_text": 2.0141, + "ppl": 9.7972, + "step": 743 + }, + { + "epoch": 0.0, + "global_step": 744, + "learning_rate": 0.000497729549248748, + "loss": 2.2814, + "loss_base2": 3.2914, + "loss_pixel": 0.2705, + "loss_text": 2.0109, + "ppl": 9.7904, + "step": 744 + }, + { + "epoch": 0.0, + "global_step": 745, + "learning_rate": 0.0004977253756260434, + "loss": 2.2907, + "loss_base2": 3.3048, + "loss_pixel": 0.2741, + "loss_text": 2.0165, + "ppl": 9.8819, + "step": 745 + }, + { + "epoch": 0.0, + "global_step": 746, + "learning_rate": 0.0004977212020033389, + "loss": 2.2783, + "loss_base2": 3.2869, + "loss_pixel": 0.2732, + "loss_text": 2.0052, + "ppl": 9.7601, + "step": 746 + }, + { + "epoch": 0.0, + "global_step": 747, + "learning_rate": 0.0004977170283806344, + "loss": 2.2851, + "loss_base2": 3.2967, + "loss_pixel": 0.2741, + "loss_text": 2.011, + "ppl": 9.8267, + "step": 747 + }, + { + "epoch": 0.0, + "global_step": 748, + "learning_rate": 0.0004977128547579299, + "loss": 2.2752, + "loss_base2": 3.2824, + "loss_pixel": 0.2749, + "loss_text": 2.0003, + "ppl": 9.7299, + "step": 748 + }, + { + "epoch": 0.0, + "global_step": 749, + "learning_rate": 0.0004977086811352254, + "loss": 2.2772, + "loss_base2": 3.2853, + "loss_pixel": 0.2744, + "loss_text": 2.0028, + "ppl": 9.7493, + "step": 749 + }, + { + "epoch": 0.0, + "global_step": 750, + "learning_rate": 0.0004977045075125209, + "loss": 2.2683, + "loss_base2": 3.2725, + "loss_pixel": 0.2739, + "loss_text": 1.9944, + "ppl": 9.663, + "step": 750 + }, + { + "epoch": 0.0, + "global_step": 751, + "learning_rate": 0.0004977003338898164, + "loss": 2.283, + "loss_base2": 3.2937, + "loss_pixel": 0.2722, + "loss_text": 2.0108, + "ppl": 9.8061, + "step": 751 + }, + { + "epoch": 0.0, + "global_step": 752, + "learning_rate": 0.0004976961602671118, + "loss": 2.2806, + "loss_base2": 3.2902, + "loss_pixel": 0.2696, + "loss_text": 2.0111, + "ppl": 9.7825, + "step": 752 + }, + { + "epoch": 0.0, + "global_step": 753, + "learning_rate": 0.0004976919866444073, + "loss": 2.2804, + "loss_base2": 3.2899, + "loss_pixel": 0.2716, + "loss_text": 2.0088, + "ppl": 9.7806, + "step": 753 + }, + { + "epoch": 0.0, + "global_step": 754, + "learning_rate": 0.0004976878130217028, + "loss": 2.2766, + "loss_base2": 3.2844, + "loss_pixel": 0.2707, + "loss_text": 2.0059, + "ppl": 9.7435, + "step": 754 + }, + { + "epoch": 0.0, + "global_step": 755, + "learning_rate": 0.0004976836393989983, + "loss": 2.2652, + "loss_base2": 3.268, + "loss_pixel": 0.2693, + "loss_text": 1.9959, + "ppl": 9.6331, + "step": 755 + }, + { + "epoch": 0.0, + "global_step": 756, + "learning_rate": 0.0004976794657762938, + "loss": 2.2617, + "loss_base2": 3.2629, + "loss_pixel": 0.2685, + "loss_text": 1.9932, + "ppl": 9.5994, + "step": 756 + }, + { + "epoch": 0.0, + "global_step": 757, + "learning_rate": 0.0004976752921535893, + "loss": 2.2678, + "loss_base2": 3.2717, + "loss_pixel": 0.2676, + "loss_text": 2.0002, + "ppl": 9.6581, + "step": 757 + }, + { + "epoch": 0.0, + "global_step": 758, + "learning_rate": 0.0004976711185308849, + "loss": 2.2657, + "loss_base2": 3.2687, + "loss_pixel": 0.2671, + "loss_text": 1.9986, + "ppl": 9.6379, + "step": 758 + }, + { + "epoch": 0.0, + "global_step": 759, + "learning_rate": 0.0004976669449081804, + "loss": 2.264, + "loss_base2": 3.2663, + "loss_pixel": 0.2667, + "loss_text": 1.9973, + "ppl": 9.6215, + "step": 759 + }, + { + "epoch": 0.0, + "global_step": 760, + "learning_rate": 0.0004976627712854759, + "loss": 2.2682, + "loss_base2": 3.2723, + "loss_pixel": 0.2667, + "loss_text": 2.0016, + "ppl": 9.662, + "step": 760 + }, + { + "epoch": 0.0, + "global_step": 761, + "learning_rate": 0.0004976585976627713, + "loss": 2.265, + "loss_base2": 3.2677, + "loss_pixel": 0.2657, + "loss_text": 1.9993, + "ppl": 9.6311, + "step": 761 + }, + { + "epoch": 0.0, + "global_step": 762, + "learning_rate": 0.0004976544240400668, + "loss": 2.2556, + "loss_base2": 3.2541, + "loss_pixel": 0.2656, + "loss_text": 1.9901, + "ppl": 9.541, + "step": 762 + }, + { + "epoch": 0.0, + "global_step": 763, + "learning_rate": 0.0004976502504173623, + "loss": 2.2617, + "loss_base2": 3.2629, + "loss_pixel": 0.2644, + "loss_text": 1.9973, + "ppl": 9.5994, + "step": 763 + }, + { + "epoch": 0.0, + "global_step": 764, + "learning_rate": 0.0004976460767946578, + "loss": 2.2593, + "loss_base2": 3.2595, + "loss_pixel": 0.2673, + "loss_text": 1.992, + "ppl": 9.5764, + "step": 764 + }, + { + "epoch": 0.0, + "global_step": 765, + "learning_rate": 0.0004976419031719533, + "loss": 2.2553, + "loss_base2": 3.2537, + "loss_pixel": 0.2643, + "loss_text": 1.991, + "ppl": 9.5382, + "step": 765 + }, + { + "epoch": 0.0, + "global_step": 766, + "learning_rate": 0.0004976377295492487, + "loss": 2.2019, + "loss_base2": 3.1767, + "loss_pixel": 0.2646, + "loss_text": 1.9373, + "ppl": 9.0422, + "step": 766 + }, + { + "epoch": 0.0, + "global_step": 767, + "learning_rate": 0.0004976335559265442, + "loss": 2.1301, + "loss_base2": 3.0731, + "loss_pixel": 0.2652, + "loss_text": 1.865, + "ppl": 8.4157, + "step": 767 + }, + { + "epoch": 0.0, + "global_step": 768, + "learning_rate": 0.0004976293823038397, + "loss": 2.1026, + "loss_base2": 3.0334, + "loss_pixel": 0.2625, + "loss_text": 1.8401, + "ppl": 8.1874, + "step": 768 + }, + { + "epoch": 0.0, + "global_step": 769, + "learning_rate": 0.0004976252086811352, + "loss": 2.1112, + "loss_base2": 3.0458, + "loss_pixel": 0.2637, + "loss_text": 1.8475, + "ppl": 8.2581, + "step": 769 + }, + { + "epoch": 0.0, + "global_step": 770, + "learning_rate": 0.0004976210350584307, + "loss": 2.1255, + "loss_base2": 3.0664, + "loss_pixel": 0.2634, + "loss_text": 1.8621, + "ppl": 8.3771, + "step": 770 + }, + { + "epoch": 0.0, + "global_step": 771, + "learning_rate": 0.0004976168614357262, + "loss": 2.1066, + "loss_base2": 3.0392, + "loss_pixel": 0.2626, + "loss_text": 1.844, + "ppl": 8.2202, + "step": 771 + }, + { + "epoch": 0.0, + "global_step": 772, + "learning_rate": 0.0004976126878130217, + "loss": 2.1049, + "loss_base2": 3.0367, + "loss_pixel": 0.2646, + "loss_text": 1.8403, + "ppl": 8.2063, + "step": 772 + }, + { + "epoch": 0.0, + "global_step": 773, + "learning_rate": 0.0004976085141903172, + "loss": 2.0881, + "loss_base2": 3.0125, + "loss_pixel": 0.2653, + "loss_text": 1.8227, + "ppl": 8.0696, + "step": 773 + }, + { + "epoch": 0.0, + "global_step": 774, + "learning_rate": 0.0004976043405676128, + "loss": 2.1439, + "loss_base2": 3.093, + "loss_pixel": 0.2627, + "loss_text": 1.8812, + "ppl": 8.5327, + "step": 774 + }, + { + "epoch": 0.0, + "global_step": 775, + "learning_rate": 0.0004976001669449082, + "loss": 2.3199, + "loss_base2": 3.3469, + "loss_pixel": 0.2645, + "loss_text": 2.0554, + "ppl": 10.1747, + "step": 775 + }, + { + "epoch": 0.0, + "global_step": 776, + "learning_rate": 0.0004975959933222037, + "loss": 2.2968, + "loss_base2": 3.3136, + "loss_pixel": 0.2649, + "loss_text": 2.0319, + "ppl": 9.9423, + "step": 776 + }, + { + "epoch": 0.0, + "global_step": 777, + "learning_rate": 0.0004975918196994992, + "loss": 2.2986, + "loss_base2": 3.3162, + "loss_pixel": 0.2658, + "loss_text": 2.0328, + "ppl": 9.9602, + "step": 777 + }, + { + "epoch": 0.0, + "global_step": 778, + "learning_rate": 0.0004975876460767947, + "loss": 2.2975, + "loss_base2": 3.3146, + "loss_pixel": 0.2701, + "loss_text": 2.0274, + "ppl": 9.9493, + "step": 778 + }, + { + "epoch": 0.0, + "global_step": 779, + "learning_rate": 0.0004975834724540902, + "loss": 2.3091, + "loss_base2": 3.3313, + "loss_pixel": 0.2712, + "loss_text": 2.0378, + "ppl": 10.0654, + "step": 779 + }, + { + "epoch": 0.0, + "global_step": 780, + "learning_rate": 0.0004975792988313857, + "loss": 2.2952, + "loss_base2": 3.3113, + "loss_pixel": 0.2719, + "loss_text": 2.0233, + "ppl": 9.9264, + "step": 780 + }, + { + "epoch": 0.0, + "global_step": 781, + "learning_rate": 0.0004975751252086812, + "loss": 2.2857, + "loss_base2": 3.2976, + "loss_pixel": 0.2685, + "loss_text": 2.0172, + "ppl": 9.8326, + "step": 781 + }, + { + "epoch": 0.0, + "global_step": 782, + "learning_rate": 0.0004975709515859766, + "loss": 2.2883, + "loss_base2": 3.3013, + "loss_pixel": 0.2666, + "loss_text": 2.0218, + "ppl": 9.8582, + "step": 782 + }, + { + "epoch": 0.0, + "global_step": 783, + "learning_rate": 0.0004975667779632721, + "loss": 2.2783, + "loss_base2": 3.2869, + "loss_pixel": 0.2657, + "loss_text": 2.0127, + "ppl": 9.7601, + "step": 783 + }, + { + "epoch": 0.0, + "global_step": 784, + "learning_rate": 0.0004975626043405676, + "loss": 2.2765, + "loss_base2": 3.2843, + "loss_pixel": 0.2653, + "loss_text": 2.0112, + "ppl": 9.7425, + "step": 784 + }, + { + "epoch": 0.0, + "global_step": 785, + "learning_rate": 0.0004975584307178631, + "loss": 2.2539, + "loss_base2": 3.2517, + "loss_pixel": 0.2619, + "loss_text": 1.992, + "ppl": 9.5248, + "step": 785 + }, + { + "epoch": 0.0, + "global_step": 786, + "learning_rate": 0.0004975542570951586, + "loss": 2.2615, + "loss_base2": 3.2627, + "loss_pixel": 0.2617, + "loss_text": 1.9997, + "ppl": 9.5975, + "step": 786 + }, + { + "epoch": 0.0, + "global_step": 787, + "learning_rate": 0.0004975500834724541, + "loss": 2.2536, + "loss_base2": 3.2513, + "loss_pixel": 0.2618, + "loss_text": 1.9919, + "ppl": 9.522, + "step": 787 + }, + { + "epoch": 0.0, + "global_step": 788, + "learning_rate": 0.0004975459098497495, + "loss": 2.266, + "loss_base2": 3.2691, + "loss_pixel": 0.2602, + "loss_text": 2.0058, + "ppl": 9.6408, + "step": 788 + }, + { + "epoch": 0.0, + "global_step": 789, + "learning_rate": 0.000497541736227045, + "loss": 2.276, + "loss_base2": 3.2836, + "loss_pixel": 0.2605, + "loss_text": 2.0156, + "ppl": 9.7377, + "step": 789 + }, + { + "epoch": 0.0, + "global_step": 790, + "learning_rate": 0.0004975375626043405, + "loss": 2.2515, + "loss_base2": 3.2482, + "loss_pixel": 0.2605, + "loss_text": 1.9909, + "ppl": 9.502, + "step": 790 + }, + { + "epoch": 0.0, + "global_step": 791, + "learning_rate": 0.000497533388981636, + "loss": 2.2453, + "loss_base2": 3.2393, + "loss_pixel": 0.2597, + "loss_text": 1.9856, + "ppl": 9.4432, + "step": 791 + }, + { + "epoch": 0.0, + "global_step": 792, + "learning_rate": 0.0004975292153589316, + "loss": 2.2478, + "loss_base2": 3.2429, + "loss_pixel": 0.259, + "loss_text": 1.9888, + "ppl": 9.4669, + "step": 792 + }, + { + "epoch": 0.0, + "global_step": 793, + "learning_rate": 0.0004975250417362271, + "loss": 2.241, + "loss_base2": 3.2331, + "loss_pixel": 0.2576, + "loss_text": 1.9834, + "ppl": 9.4027, + "step": 793 + }, + { + "epoch": 0.0, + "global_step": 794, + "learning_rate": 0.0004975208681135226, + "loss": 2.2286, + "loss_base2": 3.2152, + "loss_pixel": 0.2587, + "loss_text": 1.9699, + "ppl": 9.2869, + "step": 794 + }, + { + "epoch": 0.0, + "global_step": 795, + "learning_rate": 0.0004975166944908181, + "loss": 2.2537, + "loss_base2": 3.2514, + "loss_pixel": 0.2576, + "loss_text": 1.9962, + "ppl": 9.5229, + "step": 795 + }, + { + "epoch": 0.0, + "global_step": 796, + "learning_rate": 0.0004975125208681136, + "loss": 2.2508, + "loss_base2": 3.2472, + "loss_pixel": 0.2589, + "loss_text": 1.9919, + "ppl": 9.4953, + "step": 796 + }, + { + "epoch": 0.0, + "global_step": 797, + "learning_rate": 0.000497508347245409, + "loss": 2.2631, + "loss_base2": 3.265, + "loss_pixel": 0.2609, + "loss_text": 2.0022, + "ppl": 9.6128, + "step": 797 + }, + { + "epoch": 0.0, + "global_step": 798, + "learning_rate": 0.0004975041736227045, + "loss": 2.2352, + "loss_base2": 3.2247, + "loss_pixel": 0.2582, + "loss_text": 1.977, + "ppl": 9.3484, + "step": 798 + }, + { + "epoch": 0.0, + "global_step": 799, + "learning_rate": 0.0004975, + "loss": 2.2078, + "loss_base2": 3.1852, + "loss_pixel": 0.2579, + "loss_text": 1.9498, + "ppl": 9.0957, + "step": 799 + }, + { + "epoch": 0.0, + "global_step": 800, + "learning_rate": 0.0004974958263772955, + "loss": 2.2276, + "loss_base2": 3.2137, + "loss_pixel": 0.2582, + "loss_text": 1.9694, + "ppl": 9.2776, + "step": 800 + }, + { + "epoch": 0.0, + "global_step": 801, + "learning_rate": 0.000497491652754591, + "loss": 2.2438, + "loss_base2": 3.2371, + "loss_pixel": 0.2564, + "loss_text": 1.9874, + "ppl": 9.4291, + "step": 801 + }, + { + "epoch": 0.0, + "global_step": 802, + "learning_rate": 0.0004974874791318864, + "loss": 2.2244, + "loss_base2": 3.2091, + "loss_pixel": 0.2559, + "loss_text": 1.9685, + "ppl": 9.2479, + "step": 802 + }, + { + "epoch": 0.0, + "global_step": 803, + "learning_rate": 0.0004974833055091819, + "loss": 2.2326, + "loss_base2": 3.221, + "loss_pixel": 0.2556, + "loss_text": 1.977, + "ppl": 9.3241, + "step": 803 + }, + { + "epoch": 0.0, + "global_step": 804, + "learning_rate": 0.0004974791318864774, + "loss": 2.2447, + "loss_base2": 3.2384, + "loss_pixel": 0.2561, + "loss_text": 1.9886, + "ppl": 9.4376, + "step": 804 + }, + { + "epoch": 0.0, + "global_step": 805, + "learning_rate": 0.0004974749582637729, + "loss": 2.2224, + "loss_base2": 3.2062, + "loss_pixel": 0.2569, + "loss_text": 1.9654, + "ppl": 9.2295, + "step": 805 + }, + { + "epoch": 0.0, + "global_step": 806, + "learning_rate": 0.0004974707846410684, + "loss": 2.23, + "loss_base2": 3.2172, + "loss_pixel": 0.2558, + "loss_text": 1.9743, + "ppl": 9.2999, + "step": 806 + }, + { + "epoch": 0.0, + "global_step": 807, + "learning_rate": 0.000497466611018364, + "loss": 2.2308, + "loss_base2": 3.2184, + "loss_pixel": 0.2544, + "loss_text": 1.9764, + "ppl": 9.3073, + "step": 807 + }, + { + "epoch": 0.0, + "global_step": 808, + "learning_rate": 0.0004974624373956595, + "loss": 2.2255, + "loss_base2": 3.2107, + "loss_pixel": 0.2546, + "loss_text": 1.9709, + "ppl": 9.2581, + "step": 808 + }, + { + "epoch": 0.0, + "global_step": 809, + "learning_rate": 0.000497458263772955, + "loss": 2.2133, + "loss_base2": 3.1931, + "loss_pixel": 0.2576, + "loss_text": 1.9557, + "ppl": 9.1458, + "step": 809 + }, + { + "epoch": 0.0, + "global_step": 810, + "learning_rate": 0.0004974540901502505, + "loss": 2.233, + "loss_base2": 3.2215, + "loss_pixel": 0.2549, + "loss_text": 1.9781, + "ppl": 9.3278, + "step": 810 + }, + { + "epoch": 0.0, + "global_step": 811, + "learning_rate": 0.0004974499165275459, + "loss": 2.2189, + "loss_base2": 3.2012, + "loss_pixel": 0.2533, + "loss_text": 1.9657, + "ppl": 9.1972, + "step": 811 + }, + { + "epoch": 0.0, + "global_step": 812, + "learning_rate": 0.0004974457429048414, + "loss": 2.2109, + "loss_base2": 3.1897, + "loss_pixel": 0.2559, + "loss_text": 1.955, + "ppl": 9.1239, + "step": 812 + }, + { + "epoch": 0.0, + "global_step": 813, + "learning_rate": 0.0004974415692821369, + "loss": 2.2013, + "loss_base2": 3.1758, + "loss_pixel": 0.2529, + "loss_text": 1.9484, + "ppl": 9.0368, + "step": 813 + }, + { + "epoch": 0.0, + "global_step": 814, + "learning_rate": 0.0004974373956594324, + "loss": 2.2281, + "loss_base2": 3.2145, + "loss_pixel": 0.2531, + "loss_text": 1.9749, + "ppl": 9.2822, + "step": 814 + }, + { + "epoch": 0.0, + "global_step": 815, + "learning_rate": 0.0004974332220367279, + "loss": 2.2279, + "loss_base2": 3.2142, + "loss_pixel": 0.2536, + "loss_text": 1.9743, + "ppl": 9.2804, + "step": 815 + }, + { + "epoch": 0.0, + "global_step": 816, + "learning_rate": 0.0004974290484140234, + "loss": 2.2091, + "loss_base2": 3.1871, + "loss_pixel": 0.2531, + "loss_text": 1.9559, + "ppl": 9.1075, + "step": 816 + }, + { + "epoch": 0.0, + "global_step": 817, + "learning_rate": 0.0004974248747913189, + "loss": 2.2043, + "loss_base2": 3.1801, + "loss_pixel": 0.2513, + "loss_text": 1.953, + "ppl": 9.0639, + "step": 817 + }, + { + "epoch": 0.0, + "global_step": 818, + "learning_rate": 0.0004974207011686144, + "loss": 2.2124, + "loss_base2": 3.1918, + "loss_pixel": 0.254, + "loss_text": 1.9584, + "ppl": 9.1376, + "step": 818 + }, + { + "epoch": 0.0, + "global_step": 819, + "learning_rate": 0.0004974165275459099, + "loss": 2.2148, + "loss_base2": 3.1953, + "loss_pixel": 0.255, + "loss_text": 1.9598, + "ppl": 9.1596, + "step": 819 + }, + { + "epoch": 0.0, + "global_step": 820, + "learning_rate": 0.0004974123539232053, + "loss": 2.2057, + "loss_base2": 3.1822, + "loss_pixel": 0.2525, + "loss_text": 1.9532, + "ppl": 9.0766, + "step": 820 + }, + { + "epoch": 0.0, + "global_step": 821, + "learning_rate": 0.0004974081803005008, + "loss": 2.2142, + "loss_base2": 3.1944, + "loss_pixel": 0.2566, + "loss_text": 1.9577, + "ppl": 9.1541, + "step": 821 + }, + { + "epoch": 0.0, + "global_step": 822, + "learning_rate": 0.0004974040066777963, + "loss": 2.2099, + "loss_base2": 3.1882, + "loss_pixel": 0.2557, + "loss_text": 1.9542, + "ppl": 9.1148, + "step": 822 + }, + { + "epoch": 0.0, + "global_step": 823, + "learning_rate": 0.0004973998330550919, + "loss": 2.1951, + "loss_base2": 3.1669, + "loss_pixel": 0.2544, + "loss_text": 1.9407, + "ppl": 8.9809, + "step": 823 + }, + { + "epoch": 0.0, + "global_step": 824, + "learning_rate": 0.0004973956594323874, + "loss": 2.1985, + "loss_base2": 3.1718, + "loss_pixel": 0.2529, + "loss_text": 1.9456, + "ppl": 9.0115, + "step": 824 + }, + { + "epoch": 0.0, + "global_step": 825, + "learning_rate": 0.0004973914858096828, + "loss": 2.2415, + "loss_base2": 3.2338, + "loss_pixel": 0.2513, + "loss_text": 1.9902, + "ppl": 9.4074, + "step": 825 + }, + { + "epoch": 0.0, + "global_step": 826, + "learning_rate": 0.0004973873121869783, + "loss": 2.2523, + "loss_base2": 3.2494, + "loss_pixel": 0.2516, + "loss_text": 2.0007, + "ppl": 9.5096, + "step": 826 + }, + { + "epoch": 0.0, + "global_step": 827, + "learning_rate": 0.0004973831385642738, + "loss": 2.244, + "loss_base2": 3.2374, + "loss_pixel": 0.2512, + "loss_text": 1.9928, + "ppl": 9.431, + "step": 827 + }, + { + "epoch": 0.0, + "global_step": 828, + "learning_rate": 0.0004973789649415693, + "loss": 2.2499, + "loss_base2": 3.2459, + "loss_pixel": 0.2516, + "loss_text": 1.9983, + "ppl": 9.4868, + "step": 828 + }, + { + "epoch": 0.0, + "global_step": 829, + "learning_rate": 0.0004973747913188648, + "loss": 2.2535, + "loss_base2": 3.2511, + "loss_pixel": 0.2537, + "loss_text": 1.9998, + "ppl": 9.521, + "step": 829 + }, + { + "epoch": 0.0, + "global_step": 830, + "learning_rate": 0.0004973706176961603, + "loss": 2.256, + "loss_base2": 3.2547, + "loss_pixel": 0.262, + "loss_text": 1.994, + "ppl": 9.5448, + "step": 830 + }, + { + "epoch": 0.0, + "global_step": 831, + "learning_rate": 0.0004973664440734558, + "loss": 2.2588, + "loss_base2": 3.2588, + "loss_pixel": 0.2609, + "loss_text": 1.9979, + "ppl": 9.5716, + "step": 831 + }, + { + "epoch": 0.0, + "global_step": 832, + "learning_rate": 0.0004973622704507513, + "loss": 2.2447, + "loss_base2": 3.2384, + "loss_pixel": 0.2541, + "loss_text": 1.9906, + "ppl": 9.4376, + "step": 832 + }, + { + "epoch": 0.0, + "global_step": 833, + "learning_rate": 0.0004973580968280468, + "loss": 2.247, + "loss_base2": 3.2417, + "loss_pixel": 0.2543, + "loss_text": 1.9928, + "ppl": 9.4593, + "step": 833 + }, + { + "epoch": 0.0, + "global_step": 834, + "learning_rate": 0.0004973539232053422, + "loss": 2.2556, + "loss_base2": 3.2541, + "loss_pixel": 0.2504, + "loss_text": 2.0052, + "ppl": 9.541, + "step": 834 + }, + { + "epoch": 0.0, + "global_step": 835, + "learning_rate": 0.0004973497495826377, + "loss": 2.2156, + "loss_base2": 3.1964, + "loss_pixel": 0.2492, + "loss_text": 1.9665, + "ppl": 9.1669, + "step": 835 + }, + { + "epoch": 0.0, + "global_step": 836, + "learning_rate": 0.0004973455759599332, + "loss": 2.2076, + "loss_base2": 3.1849, + "loss_pixel": 0.2481, + "loss_text": 1.9595, + "ppl": 9.0939, + "step": 836 + }, + { + "epoch": 0.0, + "global_step": 837, + "learning_rate": 0.0004973414023372287, + "loss": 2.2167, + "loss_base2": 3.198, + "loss_pixel": 0.2497, + "loss_text": 1.967, + "ppl": 9.177, + "step": 837 + }, + { + "epoch": 0.0, + "global_step": 838, + "learning_rate": 0.0004973372287145241, + "loss": 2.2022, + "loss_base2": 3.1771, + "loss_pixel": 0.2491, + "loss_text": 1.9532, + "ppl": 9.0449, + "step": 838 + }, + { + "epoch": 0.0, + "global_step": 839, + "learning_rate": 0.0004973330550918196, + "loss": 2.2022, + "loss_base2": 3.1771, + "loss_pixel": 0.2497, + "loss_text": 1.9525, + "ppl": 9.0449, + "step": 839 + }, + { + "epoch": 0.0, + "global_step": 840, + "learning_rate": 0.0004973288814691152, + "loss": 2.2168, + "loss_base2": 3.1982, + "loss_pixel": 0.2533, + "loss_text": 1.9635, + "ppl": 9.1779, + "step": 840 + }, + { + "epoch": 0.0, + "global_step": 841, + "learning_rate": 0.0004973247078464107, + "loss": 2.2045, + "loss_base2": 3.1804, + "loss_pixel": 0.2559, + "loss_text": 1.9486, + "ppl": 9.0657, + "step": 841 + }, + { + "epoch": 0.0, + "global_step": 842, + "learning_rate": 0.0004973205342237062, + "loss": 2.2098, + "loss_base2": 3.1881, + "loss_pixel": 0.253, + "loss_text": 1.9568, + "ppl": 9.1139, + "step": 842 + }, + { + "epoch": 0.0, + "global_step": 843, + "learning_rate": 0.0004973163606010017, + "loss": 2.2088, + "loss_base2": 3.1866, + "loss_pixel": 0.2543, + "loss_text": 1.9545, + "ppl": 9.1048, + "step": 843 + }, + { + "epoch": 0.0, + "global_step": 844, + "learning_rate": 0.0004973121869782972, + "loss": 2.1936, + "loss_base2": 3.1647, + "loss_pixel": 0.2542, + "loss_text": 1.9394, + "ppl": 8.9674, + "step": 844 + }, + { + "epoch": 0.0, + "global_step": 845, + "learning_rate": 0.0004973080133555927, + "loss": 2.205, + "loss_base2": 3.1811, + "loss_pixel": 0.2563, + "loss_text": 1.9487, + "ppl": 9.0703, + "step": 845 + }, + { + "epoch": 0.0, + "global_step": 846, + "learning_rate": 0.0004973038397328882, + "loss": 2.2077, + "loss_base2": 3.185, + "loss_pixel": 0.2526, + "loss_text": 1.9551, + "ppl": 9.0948, + "step": 846 + }, + { + "epoch": 0.0, + "global_step": 847, + "learning_rate": 0.0004972996661101836, + "loss": 2.1988, + "loss_base2": 3.1722, + "loss_pixel": 0.2524, + "loss_text": 1.9464, + "ppl": 9.0142, + "step": 847 + }, + { + "epoch": 0.0, + "global_step": 848, + "learning_rate": 0.0004972954924874791, + "loss": 2.2031, + "loss_base2": 3.1784, + "loss_pixel": 0.252, + "loss_text": 1.9511, + "ppl": 9.053, + "step": 848 + }, + { + "epoch": 0.0, + "global_step": 849, + "learning_rate": 0.0004972913188647746, + "loss": 2.1935, + "loss_base2": 3.1646, + "loss_pixel": 0.251, + "loss_text": 1.9425, + "ppl": 8.9665, + "step": 849 + }, + { + "epoch": 0.0, + "global_step": 850, + "learning_rate": 0.0004972871452420701, + "loss": 2.1792, + "loss_base2": 3.1439, + "loss_pixel": 0.2519, + "loss_text": 1.9272, + "ppl": 8.8392, + "step": 850 + }, + { + "epoch": 0.0, + "global_step": 851, + "learning_rate": 0.0004972829716193656, + "loss": 2.2007, + "loss_base2": 3.1749, + "loss_pixel": 0.2596, + "loss_text": 1.9412, + "ppl": 9.0313, + "step": 851 + }, + { + "epoch": 0.0, + "global_step": 852, + "learning_rate": 0.0004972787979966611, + "loss": 2.2023, + "loss_base2": 3.1772, + "loss_pixel": 0.2587, + "loss_text": 1.9436, + "ppl": 9.0458, + "step": 852 + }, + { + "epoch": 0.0, + "global_step": 853, + "learning_rate": 0.0004972746243739566, + "loss": 2.1903, + "loss_base2": 3.1599, + "loss_pixel": 0.2517, + "loss_text": 1.9386, + "ppl": 8.9379, + "step": 853 + }, + { + "epoch": 0.0, + "global_step": 854, + "learning_rate": 0.0004972704507512521, + "loss": 2.1874, + "loss_base2": 3.1558, + "loss_pixel": 0.2504, + "loss_text": 1.937, + "ppl": 8.912, + "step": 854 + }, + { + "epoch": 0.0, + "global_step": 855, + "learning_rate": 0.0004972662771285477, + "loss": 2.1958, + "loss_base2": 3.1679, + "loss_pixel": 0.2483, + "loss_text": 1.9475, + "ppl": 8.9872, + "step": 855 + }, + { + "epoch": 0.0, + "global_step": 856, + "learning_rate": 0.000497262103505843, + "loss": 2.2059, + "loss_base2": 3.1824, + "loss_pixel": 0.2493, + "loss_text": 1.9566, + "ppl": 9.0784, + "step": 856 + }, + { + "epoch": 0.0, + "global_step": 857, + "learning_rate": 0.0004972579298831386, + "loss": 2.1912, + "loss_base2": 3.1612, + "loss_pixel": 0.2477, + "loss_text": 1.9436, + "ppl": 8.9459, + "step": 857 + }, + { + "epoch": 0.0, + "global_step": 858, + "learning_rate": 0.0004972537562604341, + "loss": 2.1634, + "loss_base2": 3.1211, + "loss_pixel": 0.2501, + "loss_text": 1.9133, + "ppl": 8.7007, + "step": 858 + }, + { + "epoch": 0.0, + "global_step": 859, + "learning_rate": 0.0004972495826377296, + "loss": 2.1943, + "loss_base2": 3.1657, + "loss_pixel": 0.2524, + "loss_text": 1.9419, + "ppl": 8.9737, + "step": 859 + }, + { + "epoch": 0.0, + "global_step": 860, + "learning_rate": 0.0004972454090150251, + "loss": 2.1696, + "loss_base2": 3.1301, + "loss_pixel": 0.2514, + "loss_text": 1.9182, + "ppl": 8.7548, + "step": 860 + }, + { + "epoch": 0.0, + "global_step": 861, + "learning_rate": 0.0004972412353923205, + "loss": 2.1931, + "loss_base2": 3.164, + "loss_pixel": 0.2478, + "loss_text": 1.9453, + "ppl": 8.963, + "step": 861 + }, + { + "epoch": 0.0, + "global_step": 862, + "learning_rate": 0.000497237061769616, + "loss": 2.1754, + "loss_base2": 3.1384, + "loss_pixel": 0.2474, + "loss_text": 1.928, + "ppl": 8.8057, + "step": 862 + }, + { + "epoch": 0.0, + "global_step": 863, + "learning_rate": 0.0004972328881469115, + "loss": 2.1924, + "loss_base2": 3.163, + "loss_pixel": 0.248, + "loss_text": 1.9444, + "ppl": 8.9567, + "step": 863 + }, + { + "epoch": 0.0, + "global_step": 864, + "learning_rate": 0.000497228714524207, + "loss": 2.1619, + "loss_base2": 3.119, + "loss_pixel": 0.2469, + "loss_text": 1.915, + "ppl": 8.6876, + "step": 864 + }, + { + "epoch": 0.0, + "global_step": 865, + "learning_rate": 0.0004972245409015025, + "loss": 2.166, + "loss_base2": 3.1249, + "loss_pixel": 0.2481, + "loss_text": 1.9179, + "ppl": 8.7233, + "step": 865 + }, + { + "epoch": 0.0, + "global_step": 866, + "learning_rate": 0.000497220367278798, + "loss": 2.1685, + "loss_base2": 3.1285, + "loss_pixel": 0.2456, + "loss_text": 1.9229, + "ppl": 8.7452, + "step": 866 + }, + { + "epoch": 0.0, + "global_step": 867, + "learning_rate": 0.0004972161936560935, + "loss": 2.1672, + "loss_base2": 3.1266, + "loss_pixel": 0.2465, + "loss_text": 1.9208, + "ppl": 8.7338, + "step": 867 + }, + { + "epoch": 0.0, + "global_step": 868, + "learning_rate": 0.000497212020033389, + "loss": 2.1533, + "loss_base2": 3.1066, + "loss_pixel": 0.2425, + "loss_text": 1.9108, + "ppl": 8.6132, + "step": 868 + }, + { + "epoch": 0.0, + "global_step": 869, + "learning_rate": 0.0004972078464106845, + "loss": 2.1953, + "loss_base2": 3.1671, + "loss_pixel": 0.2476, + "loss_text": 1.9477, + "ppl": 8.9827, + "step": 869 + }, + { + "epoch": 0.0, + "global_step": 870, + "learning_rate": 0.0004972036727879799, + "loss": 2.1838, + "loss_base2": 3.1506, + "loss_pixel": 0.2545, + "loss_text": 1.9293, + "ppl": 8.88, + "step": 870 + }, + { + "epoch": 0.0, + "global_step": 871, + "learning_rate": 0.0004971994991652754, + "loss": 2.1896, + "loss_base2": 3.1589, + "loss_pixel": 0.2539, + "loss_text": 1.9357, + "ppl": 8.9316, + "step": 871 + }, + { + "epoch": 0.0, + "global_step": 872, + "learning_rate": 0.000497195325542571, + "loss": 2.157, + "loss_base2": 3.1119, + "loss_pixel": 0.2522, + "loss_text": 1.9048, + "ppl": 8.6452, + "step": 872 + }, + { + "epoch": 0.0, + "global_step": 873, + "learning_rate": 0.0004971911519198665, + "loss": 2.1072, + "loss_base2": 3.04, + "loss_pixel": 0.2506, + "loss_text": 1.8566, + "ppl": 8.2252, + "step": 873 + }, + { + "epoch": 0.0, + "global_step": 874, + "learning_rate": 0.000497186978297162, + "loss": 2.0765, + "loss_base2": 2.9958, + "loss_pixel": 0.2492, + "loss_text": 1.8272, + "ppl": 7.9765, + "step": 874 + }, + { + "epoch": 0.0, + "global_step": 875, + "learning_rate": 0.0004971828046744575, + "loss": 2.0481, + "loss_base2": 2.9548, + "loss_pixel": 0.2486, + "loss_text": 1.7995, + "ppl": 7.7532, + "step": 875 + }, + { + "epoch": 0.0, + "global_step": 876, + "learning_rate": 0.0004971786310517529, + "loss": 2.0484, + "loss_base2": 2.9552, + "loss_pixel": 0.2478, + "loss_text": 1.8006, + "ppl": 7.7555, + "step": 876 + }, + { + "epoch": 0.0, + "global_step": 877, + "learning_rate": 0.0004971744574290484, + "loss": 2.0836, + "loss_base2": 3.006, + "loss_pixel": 0.2476, + "loss_text": 1.836, + "ppl": 8.0333, + "step": 877 + }, + { + "epoch": 0.0, + "global_step": 878, + "learning_rate": 0.0004971702838063439, + "loss": 2.0709, + "loss_base2": 2.9877, + "loss_pixel": 0.2497, + "loss_text": 1.8211, + "ppl": 7.932, + "step": 878 + }, + { + "epoch": 0.0, + "global_step": 879, + "learning_rate": 0.0004971661101836394, + "loss": 2.0782, + "loss_base2": 2.9982, + "loss_pixel": 0.2557, + "loss_text": 1.8224, + "ppl": 7.9901, + "step": 879 + }, + { + "epoch": 0.0, + "global_step": 880, + "learning_rate": 0.0004971619365609349, + "loss": 2.0649, + "loss_base2": 2.979, + "loss_pixel": 0.2618, + "loss_text": 1.8031, + "ppl": 7.8845, + "step": 880 + }, + { + "epoch": 0.0, + "global_step": 881, + "learning_rate": 0.0004971577629382304, + "loss": 2.0816, + "loss_base2": 3.0031, + "loss_pixel": 0.2794, + "loss_text": 1.8021, + "ppl": 8.0173, + "step": 881 + }, + { + "epoch": 0.0, + "global_step": 882, + "learning_rate": 0.0004971535893155259, + "loss": 2.066, + "loss_base2": 2.9806, + "loss_pixel": 0.2745, + "loss_text": 1.7915, + "ppl": 7.8932, + "step": 882 + }, + { + "epoch": 0.0, + "global_step": 883, + "learning_rate": 0.0004971494156928214, + "loss": 2.0923, + "loss_base2": 3.0186, + "loss_pixel": 0.2726, + "loss_text": 1.8197, + "ppl": 8.1035, + "step": 883 + }, + { + "epoch": 0.0, + "global_step": 884, + "learning_rate": 0.0004971452420701168, + "loss": 2.0491, + "loss_base2": 2.9562, + "loss_pixel": 0.2714, + "loss_text": 1.7777, + "ppl": 7.7609, + "step": 884 + }, + { + "epoch": 0.0, + "global_step": 885, + "learning_rate": 0.0004971410684474123, + "loss": 2.0547, + "loss_base2": 2.9643, + "loss_pixel": 0.276, + "loss_text": 1.7787, + "ppl": 7.8045, + "step": 885 + }, + { + "epoch": 0.0, + "global_step": 886, + "learning_rate": 0.0004971368948247078, + "loss": 2.0622, + "loss_base2": 2.9751, + "loss_pixel": 0.2829, + "loss_text": 1.7793, + "ppl": 7.8632, + "step": 886 + }, + { + "epoch": 0.0, + "global_step": 887, + "learning_rate": 0.0004971327212020033, + "loss": 2.0414, + "loss_base2": 2.9451, + "loss_pixel": 0.2786, + "loss_text": 1.7628, + "ppl": 7.7014, + "step": 887 + }, + { + "epoch": 0.0, + "global_step": 888, + "learning_rate": 0.0004971285475792989, + "loss": 2.0446, + "loss_base2": 2.9497, + "loss_pixel": 0.278, + "loss_text": 1.7666, + "ppl": 7.7261, + "step": 888 + }, + { + "epoch": 0.0, + "global_step": 889, + "learning_rate": 0.0004971243739565944, + "loss": 2.0693, + "loss_base2": 2.9854, + "loss_pixel": 0.2749, + "loss_text": 1.7944, + "ppl": 7.9193, + "step": 889 + }, + { + "epoch": 0.0, + "global_step": 890, + "learning_rate": 0.0004971202003338899, + "loss": 2.2122, + "loss_base2": 3.1915, + "loss_pixel": 0.2687, + "loss_text": 1.9435, + "ppl": 9.1358, + "step": 890 + }, + { + "epoch": 0.0, + "global_step": 891, + "learning_rate": 0.0004971160267111854, + "loss": 2.2074, + "loss_base2": 3.1846, + "loss_pixel": 0.2675, + "loss_text": 1.9399, + "ppl": 9.092, + "step": 891 + }, + { + "epoch": 0.0, + "global_step": 892, + "learning_rate": 0.0004971118530884809, + "loss": 2.2621, + "loss_base2": 3.2635, + "loss_pixel": 0.2662, + "loss_text": 1.996, + "ppl": 9.6032, + "step": 892 + }, + { + "epoch": 0.0, + "global_step": 893, + "learning_rate": 0.0004971076794657763, + "loss": 2.2406, + "loss_base2": 3.2325, + "loss_pixel": 0.2625, + "loss_text": 1.9781, + "ppl": 9.399, + "step": 893 + }, + { + "epoch": 0.0, + "global_step": 894, + "learning_rate": 0.0004971035058430718, + "loss": 2.2482, + "loss_base2": 3.2435, + "loss_pixel": 0.2611, + "loss_text": 1.9871, + "ppl": 9.4707, + "step": 894 + }, + { + "epoch": 0.0, + "global_step": 895, + "learning_rate": 0.0004970993322203673, + "loss": 2.2467, + "loss_base2": 3.2413, + "loss_pixel": 0.2616, + "loss_text": 1.9852, + "ppl": 9.4565, + "step": 895 + }, + { + "epoch": 0.0, + "global_step": 896, + "learning_rate": 0.0004970951585976628, + "loss": 2.2182, + "loss_base2": 3.2002, + "loss_pixel": 0.2593, + "loss_text": 1.9589, + "ppl": 9.1908, + "step": 896 + }, + { + "epoch": 0.0, + "global_step": 897, + "learning_rate": 0.0004970909849749582, + "loss": 2.2268, + "loss_base2": 3.2126, + "loss_pixel": 0.2582, + "loss_text": 1.9686, + "ppl": 9.2702, + "step": 897 + }, + { + "epoch": 0.0, + "global_step": 898, + "learning_rate": 0.0004970868113522537, + "loss": 2.212, + "loss_base2": 3.1912, + "loss_pixel": 0.2571, + "loss_text": 1.9549, + "ppl": 9.134, + "step": 898 + }, + { + "epoch": 0.0, + "global_step": 899, + "learning_rate": 0.0004970826377295492, + "loss": 2.2081, + "loss_base2": 3.1856, + "loss_pixel": 0.256, + "loss_text": 1.9521, + "ppl": 9.0984, + "step": 899 + }, + { + "epoch": 0.0, + "global_step": 900, + "learning_rate": 0.0004970784641068447, + "loss": 2.2092, + "loss_base2": 3.1872, + "loss_pixel": 0.2552, + "loss_text": 1.954, + "ppl": 9.1084, + "step": 900 + }, + { + "epoch": 0.0, + "global_step": 901, + "learning_rate": 0.0004970742904841402, + "loss": 2.2147, + "loss_base2": 3.1951, + "loss_pixel": 0.2544, + "loss_text": 1.9603, + "ppl": 9.1587, + "step": 901 + }, + { + "epoch": 0.0, + "global_step": 902, + "learning_rate": 0.0004970701168614357, + "loss": 2.1924, + "loss_base2": 3.163, + "loss_pixel": 0.2533, + "loss_text": 1.9391, + "ppl": 8.9567, + "step": 902 + }, + { + "epoch": 0.0, + "global_step": 903, + "learning_rate": 0.0004970659432387312, + "loss": 2.1953, + "loss_base2": 3.1671, + "loss_pixel": 0.2524, + "loss_text": 1.9429, + "ppl": 8.9827, + "step": 903 + }, + { + "epoch": 0.0, + "global_step": 904, + "learning_rate": 0.0004970617696160268, + "loss": 2.2038, + "loss_base2": 3.1794, + "loss_pixel": 0.252, + "loss_text": 1.9519, + "ppl": 9.0594, + "step": 904 + }, + { + "epoch": 0.0, + "global_step": 905, + "learning_rate": 0.0004970575959933223, + "loss": 2.186, + "loss_base2": 3.1537, + "loss_pixel": 0.2521, + "loss_text": 1.9339, + "ppl": 8.8995, + "step": 905 + }, + { + "epoch": 0.0, + "global_step": 906, + "learning_rate": 0.0004970534223706177, + "loss": 2.1899, + "loss_base2": 3.1594, + "loss_pixel": 0.2522, + "loss_text": 1.9376, + "ppl": 8.9343, + "step": 906 + }, + { + "epoch": 0.0, + "global_step": 907, + "learning_rate": 0.0004970492487479132, + "loss": 2.2046, + "loss_base2": 3.1806, + "loss_pixel": 0.2521, + "loss_text": 1.9525, + "ppl": 9.0666, + "step": 907 + }, + { + "epoch": 0.0, + "global_step": 908, + "learning_rate": 0.0004970450751252087, + "loss": 2.194, + "loss_base2": 3.1653, + "loss_pixel": 0.2522, + "loss_text": 1.9418, + "ppl": 8.971, + "step": 908 + }, + { + "epoch": 0.0, + "global_step": 909, + "learning_rate": 0.0004970409015025042, + "loss": 2.2013, + "loss_base2": 3.1758, + "loss_pixel": 0.2507, + "loss_text": 1.9507, + "ppl": 9.0368, + "step": 909 + }, + { + "epoch": 0.0, + "global_step": 910, + "learning_rate": 0.0004970367278797997, + "loss": 2.1723, + "loss_base2": 3.134, + "loss_pixel": 0.2499, + "loss_text": 1.9223, + "ppl": 8.7785, + "step": 910 + }, + { + "epoch": 0.0, + "global_step": 911, + "learning_rate": 0.0004970325542570952, + "loss": 2.1704, + "loss_base2": 3.1312, + "loss_pixel": 0.2497, + "loss_text": 1.9207, + "ppl": 8.7618, + "step": 911 + }, + { + "epoch": 0.0, + "global_step": 912, + "learning_rate": 0.0004970283806343907, + "loss": 2.1641, + "loss_base2": 3.1221, + "loss_pixel": 0.2486, + "loss_text": 1.9155, + "ppl": 8.7068, + "step": 912 + }, + { + "epoch": 0.0, + "global_step": 913, + "learning_rate": 0.0004970242070116862, + "loss": 2.1739, + "loss_base2": 3.1363, + "loss_pixel": 0.2483, + "loss_text": 1.9256, + "ppl": 8.7925, + "step": 913 + }, + { + "epoch": 0.0, + "global_step": 914, + "learning_rate": 0.0004970200333889816, + "loss": 2.1584, + "loss_base2": 3.1139, + "loss_pixel": 0.2478, + "loss_text": 1.9106, + "ppl": 8.6573, + "step": 914 + }, + { + "epoch": 0.0, + "global_step": 915, + "learning_rate": 0.0004970158597662771, + "loss": 2.1634, + "loss_base2": 3.1211, + "loss_pixel": 0.2474, + "loss_text": 1.916, + "ppl": 8.7007, + "step": 915 + }, + { + "epoch": 0.0, + "global_step": 916, + "learning_rate": 0.0004970116861435726, + "loss": 2.1621, + "loss_base2": 3.1193, + "loss_pixel": 0.2461, + "loss_text": 1.916, + "ppl": 8.6894, + "step": 916 + }, + { + "epoch": 0.0, + "global_step": 917, + "learning_rate": 0.0004970075125208681, + "loss": 2.0096, + "loss_base2": 2.8992, + "loss_pixel": 0.2474, + "loss_text": 1.7622, + "ppl": 7.4603, + "step": 917 + }, + { + "epoch": 0.0, + "global_step": 918, + "learning_rate": 0.0004970033388981636, + "loss": 2.0149, + "loss_base2": 2.9069, + "loss_pixel": 0.2453, + "loss_text": 1.7696, + "ppl": 7.5, + "step": 918 + }, + { + "epoch": 0.0, + "global_step": 919, + "learning_rate": 0.0004969991652754591, + "loss": 1.9994, + "loss_base2": 2.8845, + "loss_pixel": 0.2457, + "loss_text": 1.7537, + "ppl": 7.3846, + "step": 919 + }, + { + "epoch": 0.0, + "global_step": 920, + "learning_rate": 0.0004969949916527545, + "loss": 2.0033, + "loss_base2": 2.8902, + "loss_pixel": 0.2454, + "loss_text": 1.7579, + "ppl": 7.4135, + "step": 920 + }, + { + "epoch": 0.0, + "global_step": 921, + "learning_rate": 0.00049699081803005, + "loss": 1.9842, + "loss_base2": 2.8626, + "loss_pixel": 0.2445, + "loss_text": 1.7397, + "ppl": 7.2732, + "step": 921 + }, + { + "epoch": 0.0, + "global_step": 922, + "learning_rate": 0.0004969866444073456, + "loss": 1.9919, + "loss_base2": 2.8737, + "loss_pixel": 0.2438, + "loss_text": 1.7481, + "ppl": 7.3294, + "step": 922 + }, + { + "epoch": 0.0, + "global_step": 923, + "learning_rate": 0.0004969824707846411, + "loss": 1.9787, + "loss_base2": 2.8547, + "loss_pixel": 0.2443, + "loss_text": 1.7344, + "ppl": 7.2333, + "step": 923 + }, + { + "epoch": 0.0, + "global_step": 924, + "learning_rate": 0.0004969782971619366, + "loss": 1.9587, + "loss_base2": 2.8258, + "loss_pixel": 0.2456, + "loss_text": 1.7131, + "ppl": 7.0901, + "step": 924 + }, + { + "epoch": 0.0, + "global_step": 925, + "learning_rate": 0.0004969741235392321, + "loss": 1.9475, + "loss_base2": 2.8096, + "loss_pixel": 0.2474, + "loss_text": 1.7, + "ppl": 7.0111, + "step": 925 + }, + { + "epoch": 0.0, + "global_step": 926, + "learning_rate": 0.0004969699499165276, + "loss": 1.9799, + "loss_base2": 2.8564, + "loss_pixel": 0.2474, + "loss_text": 1.7325, + "ppl": 7.242, + "step": 926 + }, + { + "epoch": 0.0, + "global_step": 927, + "learning_rate": 0.0004969657762938231, + "loss": 1.9679, + "loss_base2": 2.8391, + "loss_pixel": 0.2519, + "loss_text": 1.716, + "ppl": 7.1556, + "step": 927 + }, + { + "epoch": 0.0, + "global_step": 928, + "learning_rate": 0.0004969616026711186, + "loss": 1.9587, + "loss_base2": 2.8258, + "loss_pixel": 0.2546, + "loss_text": 1.704, + "ppl": 7.0901, + "step": 928 + }, + { + "epoch": 0.0, + "global_step": 929, + "learning_rate": 0.000496957429048414, + "loss": 1.9601, + "loss_base2": 2.8278, + "loss_pixel": 0.2547, + "loss_text": 1.7054, + "ppl": 7.1, + "step": 929 + }, + { + "epoch": 0.0, + "global_step": 930, + "learning_rate": 0.0004969532554257095, + "loss": 1.9476, + "loss_base2": 2.8098, + "loss_pixel": 0.2529, + "loss_text": 1.6947, + "ppl": 7.0118, + "step": 930 + }, + { + "epoch": 0.0, + "global_step": 931, + "learning_rate": 0.000496949081803005, + "loss": 1.9666, + "loss_base2": 2.8372, + "loss_pixel": 0.2505, + "loss_text": 1.7161, + "ppl": 7.1463, + "step": 931 + }, + { + "epoch": 0.0, + "global_step": 932, + "learning_rate": 0.0004969449081803005, + "loss": 2.0767, + "loss_base2": 2.996, + "loss_pixel": 0.2502, + "loss_text": 1.8265, + "ppl": 7.9781, + "step": 932 + }, + { + "epoch": 0.0, + "global_step": 933, + "learning_rate": 0.000496940734557596, + "loss": 2.1447, + "loss_base2": 3.0941, + "loss_pixel": 0.25, + "loss_text": 1.8948, + "ppl": 8.5395, + "step": 933 + }, + { + "epoch": 0.0, + "global_step": 934, + "learning_rate": 0.0004969365609348914, + "loss": 2.023, + "loss_base2": 2.9186, + "loss_pixel": 0.2496, + "loss_text": 1.7734, + "ppl": 7.561, + "step": 934 + }, + { + "epoch": 0.0, + "global_step": 935, + "learning_rate": 0.0004969323873121869, + "loss": 1.9577, + "loss_base2": 2.8244, + "loss_pixel": 0.2475, + "loss_text": 1.7102, + "ppl": 7.083, + "step": 935 + }, + { + "epoch": 0.0, + "global_step": 936, + "learning_rate": 0.0004969282136894824, + "loss": 1.9554, + "loss_base2": 2.821, + "loss_pixel": 0.2463, + "loss_text": 1.7091, + "ppl": 7.0667, + "step": 936 + }, + { + "epoch": 0.0, + "global_step": 937, + "learning_rate": 0.000496924040066778, + "loss": 1.9419, + "loss_base2": 2.8016, + "loss_pixel": 0.2458, + "loss_text": 1.6961, + "ppl": 6.972, + "step": 937 + }, + { + "epoch": 0.0, + "global_step": 938, + "learning_rate": 0.0004969198664440735, + "loss": 1.9411, + "loss_base2": 2.8004, + "loss_pixel": 0.2453, + "loss_text": 1.6958, + "ppl": 6.9664, + "step": 938 + }, + { + "epoch": 0.0, + "global_step": 939, + "learning_rate": 0.000496915692821369, + "loss": 1.9578, + "loss_base2": 2.8245, + "loss_pixel": 0.2462, + "loss_text": 1.7116, + "ppl": 7.0837, + "step": 939 + }, + { + "epoch": 0.0, + "global_step": 940, + "learning_rate": 0.0004969115191986645, + "loss": 1.9339, + "loss_base2": 2.79, + "loss_pixel": 0.2456, + "loss_text": 1.6883, + "ppl": 6.9164, + "step": 940 + }, + { + "epoch": 0.0, + "global_step": 941, + "learning_rate": 0.00049690734557596, + "loss": 2.0375, + "loss_base2": 2.9395, + "loss_pixel": 0.2435, + "loss_text": 1.7939, + "ppl": 7.6714, + "step": 941 + }, + { + "epoch": 0.0, + "global_step": 942, + "learning_rate": 0.0004969031719532555, + "loss": 2.0268, + "loss_base2": 2.9241, + "loss_pixel": 0.2453, + "loss_text": 1.7816, + "ppl": 7.5898, + "step": 942 + }, + { + "epoch": 0.0, + "global_step": 943, + "learning_rate": 0.0004968989983305509, + "loss": 1.9399, + "loss_base2": 2.7987, + "loss_pixel": 0.2465, + "loss_text": 1.6934, + "ppl": 6.9581, + "step": 943 + }, + { + "epoch": 0.0, + "global_step": 944, + "learning_rate": 0.0004968948247078464, + "loss": 1.918, + "loss_base2": 2.7671, + "loss_pixel": 0.2439, + "loss_text": 1.6741, + "ppl": 6.8073, + "step": 944 + }, + { + "epoch": 0.0, + "global_step": 945, + "learning_rate": 0.0004968906510851419, + "loss": 1.9345, + "loss_base2": 2.7909, + "loss_pixel": 0.2431, + "loss_text": 1.6913, + "ppl": 6.9206, + "step": 945 + }, + { + "epoch": 0.0, + "global_step": 946, + "learning_rate": 0.0004968864774624374, + "loss": 1.9075, + "loss_base2": 2.7519, + "loss_pixel": 0.2435, + "loss_text": 1.664, + "ppl": 6.7362, + "step": 946 + }, + { + "epoch": 0.0, + "global_step": 947, + "learning_rate": 0.0004968823038397329, + "loss": 1.9343, + "loss_base2": 2.7906, + "loss_pixel": 0.247, + "loss_text": 1.6872, + "ppl": 6.9192, + "step": 947 + }, + { + "epoch": 0.0, + "global_step": 948, + "learning_rate": 0.0004968781302170284, + "loss": 1.9375, + "loss_base2": 2.7952, + "loss_pixel": 0.2521, + "loss_text": 1.6854, + "ppl": 6.9414, + "step": 948 + }, + { + "epoch": 0.0, + "global_step": 949, + "learning_rate": 0.0004968739565943239, + "loss": 1.9318, + "loss_base2": 2.787, + "loss_pixel": 0.249, + "loss_text": 1.6829, + "ppl": 6.9019, + "step": 949 + }, + { + "epoch": 0.0, + "global_step": 950, + "learning_rate": 0.0004968697829716194, + "loss": 2.0947, + "loss_base2": 3.022, + "loss_pixel": 0.2474, + "loss_text": 1.8473, + "ppl": 8.123, + "step": 950 + }, + { + "epoch": 0.0, + "global_step": 951, + "learning_rate": 0.0004968656093489148, + "loss": 1.9615, + "loss_base2": 2.8298, + "loss_pixel": 0.2456, + "loss_text": 1.7159, + "ppl": 7.11, + "step": 951 + }, + { + "epoch": 0.0, + "global_step": 952, + "learning_rate": 0.0004968614357262103, + "loss": 1.9275, + "loss_base2": 2.7808, + "loss_pixel": 0.2465, + "loss_text": 1.681, + "ppl": 6.8723, + "step": 952 + }, + { + "epoch": 0.0, + "global_step": 953, + "learning_rate": 0.0004968572621035059, + "loss": 1.9129, + "loss_base2": 2.7597, + "loss_pixel": 0.244, + "loss_text": 1.6689, + "ppl": 6.7727, + "step": 953 + }, + { + "epoch": 0.0, + "global_step": 954, + "learning_rate": 0.0004968530884808014, + "loss": 1.9214, + "loss_base2": 2.772, + "loss_pixel": 0.2464, + "loss_text": 1.675, + "ppl": 6.8305, + "step": 954 + }, + { + "epoch": 0.0, + "global_step": 955, + "learning_rate": 0.0004968489148580969, + "loss": 1.9141, + "loss_base2": 2.7615, + "loss_pixel": 0.2489, + "loss_text": 1.6652, + "ppl": 6.7808, + "step": 955 + }, + { + "epoch": 0.0, + "global_step": 956, + "learning_rate": 0.0004968447412353923, + "loss": 1.8984, + "loss_base2": 2.7388, + "loss_pixel": 0.2462, + "loss_text": 1.6522, + "ppl": 6.6752, + "step": 956 + }, + { + "epoch": 0.0, + "global_step": 957, + "learning_rate": 0.0004968405676126878, + "loss": 1.9235, + "loss_base2": 2.775, + "loss_pixel": 0.2463, + "loss_text": 1.6772, + "ppl": 6.8449, + "step": 957 + }, + { + "epoch": 0.0, + "global_step": 958, + "learning_rate": 0.0004968363939899833, + "loss": 1.9173, + "loss_base2": 2.7661, + "loss_pixel": 0.2457, + "loss_text": 1.6716, + "ppl": 6.8026, + "step": 958 + }, + { + "epoch": 0.0, + "global_step": 959, + "learning_rate": 0.0004968322203672788, + "loss": 1.8905, + "loss_base2": 2.7274, + "loss_pixel": 0.245, + "loss_text": 1.6454, + "ppl": 6.6227, + "step": 959 + }, + { + "epoch": 0.0, + "global_step": 960, + "learning_rate": 0.0004968280467445743, + "loss": 1.8893, + "loss_base2": 2.7257, + "loss_pixel": 0.245, + "loss_text": 1.6443, + "ppl": 6.6147, + "step": 960 + }, + { + "epoch": 0.0, + "global_step": 961, + "learning_rate": 0.0004968238731218698, + "loss": 1.8853, + "loss_base2": 2.7199, + "loss_pixel": 0.2441, + "loss_text": 1.6412, + "ppl": 6.5883, + "step": 961 + }, + { + "epoch": 0.0, + "global_step": 962, + "learning_rate": 0.0004968196994991653, + "loss": 1.8827, + "loss_base2": 2.7162, + "loss_pixel": 0.2451, + "loss_text": 1.6376, + "ppl": 6.5712, + "step": 962 + }, + { + "epoch": 0.0, + "global_step": 963, + "learning_rate": 0.0004968155258764608, + "loss": 1.8812, + "loss_base2": 2.714, + "loss_pixel": 0.2454, + "loss_text": 1.6357, + "ppl": 6.5614, + "step": 963 + }, + { + "epoch": 0.0, + "global_step": 964, + "learning_rate": 0.0004968113522537563, + "loss": 1.8775, + "loss_base2": 2.7087, + "loss_pixel": 0.2462, + "loss_text": 1.6313, + "ppl": 6.5371, + "step": 964 + }, + { + "epoch": 0.0, + "global_step": 965, + "learning_rate": 0.0004968071786310517, + "loss": 1.8826, + "loss_base2": 2.716, + "loss_pixel": 0.2426, + "loss_text": 1.64, + "ppl": 6.5706, + "step": 965 + }, + { + "epoch": 0.0, + "global_step": 966, + "learning_rate": 0.0004968030050083472, + "loss": 1.8989, + "loss_base2": 2.7395, + "loss_pixel": 0.2428, + "loss_text": 1.6561, + "ppl": 6.6785, + "step": 966 + }, + { + "epoch": 0.0, + "global_step": 967, + "learning_rate": 0.0004967988313856427, + "loss": 1.8913, + "loss_base2": 2.7286, + "loss_pixel": 0.2426, + "loss_text": 1.6487, + "ppl": 6.628, + "step": 967 + }, + { + "epoch": 0.0, + "global_step": 968, + "learning_rate": 0.0004967946577629382, + "loss": 1.8843, + "loss_base2": 2.7185, + "loss_pixel": 0.2416, + "loss_text": 1.6428, + "ppl": 6.5817, + "step": 968 + }, + { + "epoch": 0.0, + "global_step": 969, + "learning_rate": 0.0004967904841402338, + "loss": 1.874, + "loss_base2": 2.7036, + "loss_pixel": 0.2409, + "loss_text": 1.6332, + "ppl": 6.5143, + "step": 969 + }, + { + "epoch": 0.0, + "global_step": 970, + "learning_rate": 0.0004967863105175292, + "loss": 1.8628, + "loss_base2": 2.6875, + "loss_pixel": 0.2409, + "loss_text": 1.6219, + "ppl": 6.4417, + "step": 970 + }, + { + "epoch": 0.0, + "global_step": 971, + "learning_rate": 0.0004967821368948247, + "loss": 1.8861, + "loss_base2": 2.7211, + "loss_pixel": 0.2407, + "loss_text": 1.6454, + "ppl": 6.5936, + "step": 971 + }, + { + "epoch": 0.0, + "global_step": 972, + "learning_rate": 0.0004967779632721202, + "loss": 1.8618, + "loss_base2": 2.686, + "loss_pixel": 0.2392, + "loss_text": 1.6226, + "ppl": 6.4353, + "step": 972 + }, + { + "epoch": 0.0, + "global_step": 973, + "learning_rate": 0.0004967737896494157, + "loss": 1.8683, + "loss_base2": 2.6954, + "loss_pixel": 0.2388, + "loss_text": 1.6295, + "ppl": 6.4773, + "step": 973 + }, + { + "epoch": 0.0, + "global_step": 974, + "learning_rate": 0.0004967696160267112, + "loss": 1.8468, + "loss_base2": 2.6644, + "loss_pixel": 0.238, + "loss_text": 1.6088, + "ppl": 6.3395, + "step": 974 + }, + { + "epoch": 0.0, + "global_step": 975, + "learning_rate": 0.0004967654424040067, + "loss": 2.088, + "loss_base2": 3.0123, + "loss_pixel": 0.2393, + "loss_text": 1.8488, + "ppl": 8.0688, + "step": 975 + }, + { + "epoch": 0.0, + "global_step": 976, + "learning_rate": 0.0004967612687813022, + "loss": 2.2203, + "loss_base2": 3.2032, + "loss_pixel": 0.242, + "loss_text": 1.9783, + "ppl": 9.2101, + "step": 976 + }, + { + "epoch": 0.0, + "global_step": 977, + "learning_rate": 0.0004967570951585977, + "loss": 2.2294, + "loss_base2": 3.2163, + "loss_pixel": 0.2625, + "loss_text": 1.9669, + "ppl": 9.2943, + "step": 977 + }, + { + "epoch": 0.0, + "global_step": 978, + "learning_rate": 0.0004967529215358932, + "loss": 2.2014, + "loss_base2": 3.1759, + "loss_pixel": 0.2627, + "loss_text": 1.9388, + "ppl": 9.0377, + "step": 978 + }, + { + "epoch": 0.0, + "global_step": 979, + "learning_rate": 0.0004967487479131886, + "loss": 2.2324, + "loss_base2": 3.2207, + "loss_pixel": 0.2727, + "loss_text": 1.9597, + "ppl": 9.3222, + "step": 979 + }, + { + "epoch": 0.0, + "global_step": 980, + "learning_rate": 0.0004967445742904841, + "loss": 2.2345, + "loss_base2": 3.2237, + "loss_pixel": 0.2718, + "loss_text": 1.9627, + "ppl": 9.3418, + "step": 980 + }, + { + "epoch": 0.0, + "global_step": 981, + "learning_rate": 0.0004967404006677796, + "loss": 2.2191, + "loss_base2": 3.2015, + "loss_pixel": 0.273, + "loss_text": 1.9462, + "ppl": 9.199, + "step": 981 + }, + { + "epoch": 0.0, + "global_step": 982, + "learning_rate": 0.0004967362270450751, + "loss": 2.2099, + "loss_base2": 3.1882, + "loss_pixel": 0.2667, + "loss_text": 1.9432, + "ppl": 9.1148, + "step": 982 + }, + { + "epoch": 0.0, + "global_step": 983, + "learning_rate": 0.0004967320534223706, + "loss": 2.1921, + "loss_base2": 3.1625, + "loss_pixel": 0.2646, + "loss_text": 1.9275, + "ppl": 8.954, + "step": 983 + }, + { + "epoch": 0.0, + "global_step": 984, + "learning_rate": 0.0004967278797996661, + "loss": 2.2043, + "loss_base2": 3.1801, + "loss_pixel": 0.2631, + "loss_text": 1.9411, + "ppl": 9.0639, + "step": 984 + }, + { + "epoch": 0.0, + "global_step": 985, + "learning_rate": 0.0004967237061769617, + "loss": 2.1861, + "loss_base2": 3.1539, + "loss_pixel": 0.2608, + "loss_text": 1.9253, + "ppl": 8.9004, + "step": 985 + }, + { + "epoch": 0.0, + "global_step": 986, + "learning_rate": 0.0004967195325542572, + "loss": 2.1876, + "loss_base2": 3.156, + "loss_pixel": 0.2566, + "loss_text": 1.931, + "ppl": 8.9138, + "step": 986 + }, + { + "epoch": 0.0, + "global_step": 987, + "learning_rate": 0.0004967153589315527, + "loss": 2.1743, + "loss_base2": 3.1369, + "loss_pixel": 0.2563, + "loss_text": 1.918, + "ppl": 8.796, + "step": 987 + }, + { + "epoch": 0.0, + "global_step": 988, + "learning_rate": 0.0004967111853088481, + "loss": 2.1649, + "loss_base2": 3.1233, + "loss_pixel": 0.254, + "loss_text": 1.9109, + "ppl": 8.7137, + "step": 988 + }, + { + "epoch": 0.0, + "global_step": 989, + "learning_rate": 0.0004967070116861436, + "loss": 2.161, + "loss_base2": 3.1177, + "loss_pixel": 0.2539, + "loss_text": 1.9072, + "ppl": 8.6798, + "step": 989 + }, + { + "epoch": 0.0, + "global_step": 990, + "learning_rate": 0.0004967028380634391, + "loss": 2.1599, + "loss_base2": 3.1161, + "loss_pixel": 0.2516, + "loss_text": 1.9083, + "ppl": 8.6703, + "step": 990 + }, + { + "epoch": 0.0, + "global_step": 991, + "learning_rate": 0.0004966986644407346, + "loss": 2.1595, + "loss_base2": 3.1155, + "loss_pixel": 0.2502, + "loss_text": 1.9093, + "ppl": 8.6668, + "step": 991 + }, + { + "epoch": 0.0, + "global_step": 992, + "learning_rate": 0.0004966944908180301, + "loss": 2.1636, + "loss_base2": 3.1214, + "loss_pixel": 0.2514, + "loss_text": 1.9122, + "ppl": 8.7024, + "step": 992 + }, + { + "epoch": 0.0, + "global_step": 993, + "learning_rate": 0.0004966903171953255, + "loss": 2.1603, + "loss_base2": 3.1167, + "loss_pixel": 0.2489, + "loss_text": 1.9114, + "ppl": 8.6737, + "step": 993 + }, + { + "epoch": 0.0, + "global_step": 994, + "learning_rate": 0.000496686143572621, + "loss": 2.1386, + "loss_base2": 3.0853, + "loss_pixel": 0.2474, + "loss_text": 1.8912, + "ppl": 8.4875, + "step": 994 + }, + { + "epoch": 0.0, + "global_step": 995, + "learning_rate": 0.0004966819699499165, + "loss": 2.1453, + "loss_base2": 3.095, + "loss_pixel": 0.2458, + "loss_text": 1.8995, + "ppl": 8.5446, + "step": 995 + }, + { + "epoch": 0.0, + "global_step": 996, + "learning_rate": 0.000496677796327212, + "loss": 2.1362, + "loss_base2": 3.0819, + "loss_pixel": 0.2447, + "loss_text": 1.8915, + "ppl": 8.4672, + "step": 996 + }, + { + "epoch": 0.0, + "global_step": 997, + "learning_rate": 0.0004966736227045075, + "loss": 2.1351, + "loss_base2": 3.0803, + "loss_pixel": 0.2431, + "loss_text": 1.892, + "ppl": 8.4579, + "step": 997 + }, + { + "epoch": 0.0, + "global_step": 998, + "learning_rate": 0.000496669449081803, + "loss": 2.1522, + "loss_base2": 3.105, + "loss_pixel": 0.2427, + "loss_text": 1.9096, + "ppl": 8.6038, + "step": 998 + }, + { + "epoch": 0.0, + "global_step": 999, + "learning_rate": 0.0004966652754590985, + "loss": 2.1514, + "loss_base2": 3.1038, + "loss_pixel": 0.2437, + "loss_text": 1.9077, + "ppl": 8.5969, + "step": 999 + }, + { + "epoch": 0.0, + "global_step": 1000, + "learning_rate": 0.000496661101836394, + "loss": 2.036, + "loss_base2": 2.9373, + "loss_pixel": 0.2436, + "loss_text": 1.7924, + "ppl": 7.6599, + "step": 1000 + }, + { + "epoch": 0.0, + "global_step": 1001, + "learning_rate": 0.0004966569282136896, + "loss": 1.8847, + "loss_base2": 2.719, + "loss_pixel": 0.2425, + "loss_text": 1.6422, + "ppl": 6.5844, + "step": 1001 + }, + { + "epoch": 0.0, + "global_step": 1002, + "learning_rate": 0.000496652754590985, + "loss": 1.8986, + "loss_base2": 2.7391, + "loss_pixel": 0.244, + "loss_text": 1.6546, + "ppl": 6.6765, + "step": 1002 + }, + { + "epoch": 0.0, + "global_step": 1003, + "learning_rate": 0.0004966485809682805, + "loss": 1.8913, + "loss_base2": 2.7286, + "loss_pixel": 0.2405, + "loss_text": 1.6508, + "ppl": 6.628, + "step": 1003 + }, + { + "epoch": 0.0, + "global_step": 1004, + "learning_rate": 0.000496644407345576, + "loss": 1.8728, + "loss_base2": 2.7019, + "loss_pixel": 0.2404, + "loss_text": 1.6324, + "ppl": 6.5065, + "step": 1004 + }, + { + "epoch": 0.0, + "global_step": 1005, + "learning_rate": 0.0004966402337228715, + "loss": 1.8755, + "loss_base2": 2.7058, + "loss_pixel": 0.2404, + "loss_text": 1.6351, + "ppl": 6.5241, + "step": 1005 + }, + { + "epoch": 0.0, + "global_step": 1006, + "learning_rate": 0.000496636060100167, + "loss": 1.8768, + "loss_base2": 2.7077, + "loss_pixel": 0.2396, + "loss_text": 1.6372, + "ppl": 6.5326, + "step": 1006 + }, + { + "epoch": 0.0, + "global_step": 1007, + "learning_rate": 0.0004966318864774624, + "loss": 1.8648, + "loss_base2": 2.6903, + "loss_pixel": 0.2406, + "loss_text": 1.6242, + "ppl": 6.4546, + "step": 1007 + }, + { + "epoch": 0.0, + "global_step": 1008, + "learning_rate": 0.0004966277128547579, + "loss": 1.9016, + "loss_base2": 2.7434, + "loss_pixel": 0.2392, + "loss_text": 1.6624, + "ppl": 6.6966, + "step": 1008 + }, + { + "epoch": 0.0, + "global_step": 1009, + "learning_rate": 0.0004966235392320534, + "loss": 1.8805, + "loss_base2": 2.713, + "loss_pixel": 0.2392, + "loss_text": 1.6413, + "ppl": 6.5568, + "step": 1009 + }, + { + "epoch": 0.0, + "global_step": 1010, + "learning_rate": 0.0004966193656093489, + "loss": 1.8561, + "loss_base2": 2.6778, + "loss_pixel": 0.2381, + "loss_text": 1.6179, + "ppl": 6.3987, + "step": 1010 + }, + { + "epoch": 0.0, + "global_step": 1011, + "learning_rate": 0.0004966151919866444, + "loss": 1.8688, + "loss_base2": 2.6961, + "loss_pixel": 0.238, + "loss_text": 1.6307, + "ppl": 6.4805, + "step": 1011 + }, + { + "epoch": 0.0, + "global_step": 1012, + "learning_rate": 0.0004966110183639399, + "loss": 1.8689, + "loss_base2": 2.6963, + "loss_pixel": 0.237, + "loss_text": 1.6319, + "ppl": 6.4812, + "step": 1012 + }, + { + "epoch": 0.0, + "global_step": 1013, + "learning_rate": 0.0004966068447412354, + "loss": 1.8771, + "loss_base2": 2.7081, + "loss_pixel": 0.2377, + "loss_text": 1.6393, + "ppl": 6.5345, + "step": 1013 + }, + { + "epoch": 0.0, + "global_step": 1014, + "learning_rate": 0.0004966026711185309, + "loss": 1.834, + "loss_base2": 2.6459, + "loss_pixel": 0.2364, + "loss_text": 1.5976, + "ppl": 6.2589, + "step": 1014 + }, + { + "epoch": 0.0, + "global_step": 1015, + "learning_rate": 0.0004965984974958263, + "loss": 1.8375, + "loss_base2": 2.651, + "loss_pixel": 0.2356, + "loss_text": 1.602, + "ppl": 6.2808, + "step": 1015 + }, + { + "epoch": 0.0, + "global_step": 1016, + "learning_rate": 0.0004965943238731218, + "loss": 1.8756, + "loss_base2": 2.7059, + "loss_pixel": 0.2356, + "loss_text": 1.64, + "ppl": 6.5247, + "step": 1016 + }, + { + "epoch": 0.0, + "global_step": 1017, + "learning_rate": 0.0004965901502504173, + "loss": 2.0862, + "loss_base2": 3.0098, + "loss_pixel": 0.2346, + "loss_text": 1.8515, + "ppl": 8.0543, + "step": 1017 + }, + { + "epoch": 0.0, + "global_step": 1018, + "learning_rate": 0.0004965859766277129, + "loss": 2.0537, + "loss_base2": 2.9629, + "loss_pixel": 0.2344, + "loss_text": 1.8193, + "ppl": 7.7967, + "step": 1018 + }, + { + "epoch": 0.0, + "global_step": 1019, + "learning_rate": 0.0004965818030050084, + "loss": 1.8688, + "loss_base2": 2.6961, + "loss_pixel": 0.2359, + "loss_text": 1.6328, + "ppl": 6.4805, + "step": 1019 + }, + { + "epoch": 0.0, + "global_step": 1020, + "learning_rate": 0.0004965776293823039, + "loss": 1.872, + "loss_base2": 2.7007, + "loss_pixel": 0.2352, + "loss_text": 1.6368, + "ppl": 6.5013, + "step": 1020 + }, + { + "epoch": 0.0, + "global_step": 1021, + "learning_rate": 0.0004965734557595994, + "loss": 1.86, + "loss_base2": 2.6834, + "loss_pixel": 0.2361, + "loss_text": 1.6239, + "ppl": 6.4237, + "step": 1021 + }, + { + "epoch": 0.0, + "global_step": 1022, + "learning_rate": 0.0004965692821368949, + "loss": 1.8731, + "loss_base2": 2.7023, + "loss_pixel": 0.2365, + "loss_text": 1.6366, + "ppl": 6.5084, + "step": 1022 + }, + { + "epoch": 0.0, + "global_step": 1023, + "learning_rate": 0.0004965651085141904, + "loss": 1.8393, + "loss_base2": 2.6535, + "loss_pixel": 0.236, + "loss_text": 1.6033, + "ppl": 6.2921, + "step": 1023 + }, + { + "epoch": 0.0, + "global_step": 1024, + "learning_rate": 0.0004965609348914858, + "loss": 1.8488, + "loss_base2": 2.6673, + "loss_pixel": 0.2366, + "loss_text": 1.6122, + "ppl": 6.3522, + "step": 1024 + }, + { + "epoch": 0.0, + "global_step": 1025, + "learning_rate": 0.0004965567612687813, + "loss": 1.8372, + "loss_base2": 2.6505, + "loss_pixel": 0.2344, + "loss_text": 1.6028, + "ppl": 6.2789, + "step": 1025 + }, + { + "epoch": 0.0, + "global_step": 1026, + "learning_rate": 0.0004965525876460768, + "loss": 1.8377, + "loss_base2": 2.6512, + "loss_pixel": 0.2343, + "loss_text": 1.6034, + "ppl": 6.2821, + "step": 1026 + }, + { + "epoch": 0.0, + "global_step": 1027, + "learning_rate": 0.0004965484140233723, + "loss": 1.8426, + "loss_base2": 2.6583, + "loss_pixel": 0.2338, + "loss_text": 1.6088, + "ppl": 6.3129, + "step": 1027 + }, + { + "epoch": 0.0, + "global_step": 1028, + "learning_rate": 0.0004965442404006678, + "loss": 1.8517, + "loss_base2": 2.6714, + "loss_pixel": 0.2365, + "loss_text": 1.6152, + "ppl": 6.3706, + "step": 1028 + }, + { + "epoch": 0.0, + "global_step": 1029, + "learning_rate": 0.0004965400667779632, + "loss": 1.844, + "loss_base2": 2.6603, + "loss_pixel": 0.2409, + "loss_text": 1.6031, + "ppl": 6.3218, + "step": 1029 + }, + { + "epoch": 0.0, + "global_step": 1030, + "learning_rate": 0.0004965358931552587, + "loss": 1.8298, + "loss_base2": 2.6398, + "loss_pixel": 0.2391, + "loss_text": 1.5907, + "ppl": 6.2326, + "step": 1030 + }, + { + "epoch": 0.0, + "global_step": 1031, + "learning_rate": 0.0004965317195325542, + "loss": 1.8335, + "loss_base2": 2.6452, + "loss_pixel": 0.2437, + "loss_text": 1.5897, + "ppl": 6.2557, + "step": 1031 + }, + { + "epoch": 0.0, + "global_step": 1032, + "learning_rate": 0.0004965275459098497, + "loss": 1.8571, + "loss_base2": 2.6792, + "loss_pixel": 0.2416, + "loss_text": 1.6154, + "ppl": 6.4051, + "step": 1032 + }, + { + "epoch": 0.0, + "global_step": 1033, + "learning_rate": 0.0004965233722871452, + "loss": 1.8485, + "loss_base2": 2.6668, + "loss_pixel": 0.2394, + "loss_text": 1.6091, + "ppl": 6.3503, + "step": 1033 + }, + { + "epoch": 0.0, + "global_step": 1034, + "learning_rate": 0.0004965191986644408, + "loss": 1.8144, + "loss_base2": 2.6176, + "loss_pixel": 0.2387, + "loss_text": 1.5757, + "ppl": 6.1374, + "step": 1034 + }, + { + "epoch": 0.0, + "global_step": 1035, + "learning_rate": 0.0004965150250417363, + "loss": 1.9299, + "loss_base2": 2.7843, + "loss_pixel": 0.2375, + "loss_text": 1.6924, + "ppl": 6.8888, + "step": 1035 + }, + { + "epoch": 0.0, + "global_step": 1036, + "learning_rate": 0.0004965108514190318, + "loss": 2.1971, + "loss_base2": 3.1697, + "loss_pixel": 0.2384, + "loss_text": 1.9587, + "ppl": 8.9989, + "step": 1036 + }, + { + "epoch": 0.0, + "global_step": 1037, + "learning_rate": 0.0004965066777963273, + "loss": 2.1724, + "loss_base2": 3.1341, + "loss_pixel": 0.2359, + "loss_text": 1.9365, + "ppl": 8.7793, + "step": 1037 + }, + { + "epoch": 0.0, + "global_step": 1038, + "learning_rate": 0.0004965025041736227, + "loss": 2.162, + "loss_base2": 3.1191, + "loss_pixel": 0.2356, + "loss_text": 1.9264, + "ppl": 8.6885, + "step": 1038 + }, + { + "epoch": 0.0, + "global_step": 1039, + "learning_rate": 0.0004964983305509182, + "loss": 2.1636, + "loss_base2": 3.1214, + "loss_pixel": 0.2339, + "loss_text": 1.9297, + "ppl": 8.7024, + "step": 1039 + }, + { + "epoch": 0.0, + "global_step": 1040, + "learning_rate": 0.0004964941569282137, + "loss": 2.1571, + "loss_base2": 3.112, + "loss_pixel": 0.2351, + "loss_text": 1.922, + "ppl": 8.646, + "step": 1040 + }, + { + "epoch": 0.0, + "global_step": 1041, + "learning_rate": 0.0004964899833055092, + "loss": 2.1471, + "loss_base2": 3.0976, + "loss_pixel": 0.2342, + "loss_text": 1.9129, + "ppl": 8.56, + "step": 1041 + }, + { + "epoch": 0.0, + "global_step": 1042, + "learning_rate": 0.0004964858096828047, + "loss": 2.1288, + "loss_base2": 3.0712, + "loss_pixel": 0.2327, + "loss_text": 1.8962, + "ppl": 8.4048, + "step": 1042 + }, + { + "epoch": 0.0, + "global_step": 1043, + "learning_rate": 0.0004964816360601002, + "loss": 2.1297, + "loss_base2": 3.0725, + "loss_pixel": 0.2327, + "loss_text": 1.897, + "ppl": 8.4123, + "step": 1043 + }, + { + "epoch": 0.0, + "global_step": 1044, + "learning_rate": 0.0004964774624373957, + "loss": 2.141, + "loss_base2": 3.0888, + "loss_pixel": 0.2334, + "loss_text": 1.9076, + "ppl": 8.5079, + "step": 1044 + }, + { + "epoch": 0.0, + "global_step": 1045, + "learning_rate": 0.0004964732888146911, + "loss": 2.1482, + "loss_base2": 3.0992, + "loss_pixel": 0.2332, + "loss_text": 1.9149, + "ppl": 8.5694, + "step": 1045 + }, + { + "epoch": 0.0, + "global_step": 1046, + "learning_rate": 0.0004964691151919866, + "loss": 2.1278, + "loss_base2": 3.0698, + "loss_pixel": 0.2314, + "loss_text": 1.8963, + "ppl": 8.3964, + "step": 1046 + }, + { + "epoch": 0.0, + "global_step": 1047, + "learning_rate": 0.0004964649415692821, + "loss": 2.122, + "loss_base2": 3.0614, + "loss_pixel": 0.2326, + "loss_text": 1.8894, + "ppl": 8.3478, + "step": 1047 + }, + { + "epoch": 0.0, + "global_step": 1048, + "learning_rate": 0.0004964607679465776, + "loss": 2.1225, + "loss_base2": 3.0621, + "loss_pixel": 0.2328, + "loss_text": 1.8897, + "ppl": 8.352, + "step": 1048 + }, + { + "epoch": 0.0, + "global_step": 1049, + "learning_rate": 0.0004964565943238731, + "loss": 2.1327, + "loss_base2": 3.0768, + "loss_pixel": 0.2365, + "loss_text": 1.8961, + "ppl": 8.4376, + "step": 1049 + }, + { + "epoch": 0.0, + "global_step": 1050, + "learning_rate": 0.0004964524207011687, + "loss": 2.1191, + "loss_base2": 3.0572, + "loss_pixel": 0.2349, + "loss_text": 1.8842, + "ppl": 8.3236, + "step": 1050 + }, + { + "epoch": 0.0, + "global_step": 1051, + "learning_rate": 0.0004964482470784642, + "loss": 2.1336, + "loss_base2": 3.0781, + "loss_pixel": 0.2348, + "loss_text": 1.8988, + "ppl": 8.4452, + "step": 1051 + }, + { + "epoch": 0.0, + "global_step": 1052, + "learning_rate": 0.0004964440734557596, + "loss": 2.1238, + "loss_base2": 3.064, + "loss_pixel": 0.2338, + "loss_text": 1.8899, + "ppl": 8.3629, + "step": 1052 + }, + { + "epoch": 0.0, + "global_step": 1053, + "learning_rate": 0.0004964398998330551, + "loss": 2.1251, + "loss_base2": 3.0659, + "loss_pixel": 0.2333, + "loss_text": 1.8918, + "ppl": 8.3737, + "step": 1053 + }, + { + "epoch": 0.0, + "global_step": 1054, + "learning_rate": 0.0004964357262103506, + "loss": 2.125, + "loss_base2": 3.0657, + "loss_pixel": 0.2326, + "loss_text": 1.8924, + "ppl": 8.3729, + "step": 1054 + }, + { + "epoch": 0.0, + "global_step": 1055, + "learning_rate": 0.0004964315525876461, + "loss": 2.0994, + "loss_base2": 3.0288, + "loss_pixel": 0.2312, + "loss_text": 1.8682, + "ppl": 8.1613, + "step": 1055 + }, + { + "epoch": 0.0, + "global_step": 1056, + "learning_rate": 0.0004964273789649416, + "loss": 2.1101, + "loss_base2": 3.0442, + "loss_pixel": 0.2321, + "loss_text": 1.878, + "ppl": 8.2491, + "step": 1056 + }, + { + "epoch": 0.0, + "global_step": 1057, + "learning_rate": 0.0004964232053422371, + "loss": 2.1185, + "loss_base2": 3.0563, + "loss_pixel": 0.2324, + "loss_text": 1.8861, + "ppl": 8.3187, + "step": 1057 + }, + { + "epoch": 0.0, + "global_step": 1058, + "learning_rate": 0.0004964190317195326, + "loss": 2.1196, + "loss_base2": 3.0579, + "loss_pixel": 0.2313, + "loss_text": 1.8884, + "ppl": 8.3278, + "step": 1058 + }, + { + "epoch": 0.0, + "global_step": 1059, + "learning_rate": 0.0004964148580968281, + "loss": 2.1165, + "loss_base2": 3.0535, + "loss_pixel": 0.2314, + "loss_text": 1.8851, + "ppl": 8.302, + "step": 1059 + }, + { + "epoch": 0.0, + "global_step": 1060, + "learning_rate": 0.0004964106844741236, + "loss": 2.0865, + "loss_base2": 3.0102, + "loss_pixel": 0.2299, + "loss_text": 1.8567, + "ppl": 8.0567, + "step": 1060 + }, + { + "epoch": 0.0, + "global_step": 1061, + "learning_rate": 0.000496406510851419, + "loss": 2.1039, + "loss_base2": 3.0353, + "loss_pixel": 0.2298, + "loss_text": 1.8741, + "ppl": 8.1981, + "step": 1061 + }, + { + "epoch": 0.0, + "global_step": 1062, + "learning_rate": 0.0004964023372287145, + "loss": 2.1017, + "loss_base2": 3.0321, + "loss_pixel": 0.2298, + "loss_text": 1.8719, + "ppl": 8.1801, + "step": 1062 + }, + { + "epoch": 0.0, + "global_step": 1063, + "learning_rate": 0.00049639816360601, + "loss": 2.0636, + "loss_base2": 2.9771, + "loss_pixel": 0.2295, + "loss_text": 1.8341, + "ppl": 7.8743, + "step": 1063 + }, + { + "epoch": 0.0, + "global_step": 1064, + "learning_rate": 0.0004963939899833055, + "loss": 2.0831, + "loss_base2": 3.0053, + "loss_pixel": 0.2286, + "loss_text": 1.8545, + "ppl": 8.0293, + "step": 1064 + }, + { + "epoch": 0.0, + "global_step": 1065, + "learning_rate": 0.0004963898163606009, + "loss": 2.0987, + "loss_base2": 3.0278, + "loss_pixel": 0.2294, + "loss_text": 1.8693, + "ppl": 8.1556, + "step": 1065 + }, + { + "epoch": 0.0, + "global_step": 1066, + "learning_rate": 0.0004963856427378964, + "loss": 2.0888, + "loss_base2": 3.0135, + "loss_pixel": 0.2297, + "loss_text": 1.8591, + "ppl": 8.0752, + "step": 1066 + }, + { + "epoch": 0.0, + "global_step": 1067, + "learning_rate": 0.000496381469115192, + "loss": 2.0932, + "loss_base2": 3.0198, + "loss_pixel": 0.2298, + "loss_text": 1.8634, + "ppl": 8.1108, + "step": 1067 + }, + { + "epoch": 0.0, + "global_step": 1068, + "learning_rate": 0.0004963772954924875, + "loss": 2.0959, + "loss_base2": 3.0237, + "loss_pixel": 0.2307, + "loss_text": 1.8651, + "ppl": 8.1328, + "step": 1068 + }, + { + "epoch": 0.0, + "global_step": 1069, + "learning_rate": 0.000496373121869783, + "loss": 2.0839, + "loss_base2": 3.0064, + "loss_pixel": 0.2296, + "loss_text": 1.8543, + "ppl": 8.0357, + "step": 1069 + }, + { + "epoch": 0.0, + "global_step": 1070, + "learning_rate": 0.0004963689482470785, + "loss": 2.0922, + "loss_base2": 3.0184, + "loss_pixel": 0.2282, + "loss_text": 1.864, + "ppl": 8.1027, + "step": 1070 + }, + { + "epoch": 0.0, + "global_step": 1071, + "learning_rate": 0.000496364774624374, + "loss": 2.089, + "loss_base2": 3.0138, + "loss_pixel": 0.2287, + "loss_text": 1.8603, + "ppl": 8.0768, + "step": 1071 + }, + { + "epoch": 0.0, + "global_step": 1072, + "learning_rate": 0.0004963606010016695, + "loss": 2.0842, + "loss_base2": 3.0069, + "loss_pixel": 0.2276, + "loss_text": 1.8566, + "ppl": 8.0382, + "step": 1072 + }, + { + "epoch": 0.0, + "global_step": 1073, + "learning_rate": 0.000496356427378965, + "loss": 2.0581, + "loss_base2": 2.9692, + "loss_pixel": 0.2278, + "loss_text": 1.8303, + "ppl": 7.8311, + "step": 1073 + }, + { + "epoch": 0.0, + "global_step": 1074, + "learning_rate": 0.0004963522537562604, + "loss": 2.0925, + "loss_base2": 3.0188, + "loss_pixel": 0.2283, + "loss_text": 1.8642, + "ppl": 8.1052, + "step": 1074 + }, + { + "epoch": 0.0, + "global_step": 1075, + "learning_rate": 0.0004963480801335559, + "loss": 2.1053, + "loss_base2": 3.0373, + "loss_pixel": 0.2276, + "loss_text": 1.8777, + "ppl": 8.2096, + "step": 1075 + }, + { + "epoch": 0.0, + "global_step": 1076, + "learning_rate": 0.0004963439065108514, + "loss": 2.0673, + "loss_base2": 2.9825, + "loss_pixel": 0.2281, + "loss_text": 1.8392, + "ppl": 7.9035, + "step": 1076 + }, + { + "epoch": 0.0, + "global_step": 1077, + "learning_rate": 0.0004963397328881469, + "loss": 2.0896, + "loss_base2": 3.0147, + "loss_pixel": 0.2278, + "loss_text": 1.8618, + "ppl": 8.0817, + "step": 1077 + }, + { + "epoch": 0.0, + "global_step": 1078, + "learning_rate": 0.0004963355592654424, + "loss": 2.0951, + "loss_base2": 3.0226, + "loss_pixel": 0.2286, + "loss_text": 1.8665, + "ppl": 8.1263, + "step": 1078 + }, + { + "epoch": 0.0, + "global_step": 1079, + "learning_rate": 0.0004963313856427379, + "loss": 2.0929, + "loss_base2": 3.0194, + "loss_pixel": 0.2277, + "loss_text": 1.8652, + "ppl": 8.1084, + "step": 1079 + }, + { + "epoch": 0.0, + "global_step": 1080, + "learning_rate": 0.0004963272120200334, + "loss": 2.0905, + "loss_base2": 3.016, + "loss_pixel": 0.2278, + "loss_text": 1.8627, + "ppl": 8.089, + "step": 1080 + }, + { + "epoch": 0.0, + "global_step": 1081, + "learning_rate": 0.000496323038397329, + "loss": 2.0932, + "loss_base2": 3.0198, + "loss_pixel": 0.228, + "loss_text": 1.8652, + "ppl": 8.1108, + "step": 1081 + }, + { + "epoch": 0.0, + "global_step": 1082, + "learning_rate": 0.0004963188647746245, + "loss": 1.9023, + "loss_base2": 2.7444, + "loss_pixel": 0.2265, + "loss_text": 1.6758, + "ppl": 6.7013, + "step": 1082 + }, + { + "epoch": 0.0, + "global_step": 1083, + "learning_rate": 0.0004963146911519199, + "loss": 1.8427, + "loss_base2": 2.6585, + "loss_pixel": 0.2253, + "loss_text": 1.6174, + "ppl": 6.3136, + "step": 1083 + }, + { + "epoch": 0.0, + "global_step": 1084, + "learning_rate": 0.0004963105175292154, + "loss": 1.8417, + "loss_base2": 2.657, + "loss_pixel": 0.2272, + "loss_text": 1.6145, + "ppl": 6.3073, + "step": 1084 + }, + { + "epoch": 0.0, + "global_step": 1085, + "learning_rate": 0.0004963063439065109, + "loss": 1.8464, + "loss_base2": 2.6638, + "loss_pixel": 0.2269, + "loss_text": 1.6194, + "ppl": 6.337, + "step": 1085 + }, + { + "epoch": 0.0, + "global_step": 1086, + "learning_rate": 0.0004963021702838064, + "loss": 1.8193, + "loss_base2": 2.6247, + "loss_pixel": 0.228, + "loss_text": 1.5913, + "ppl": 6.1675, + "step": 1086 + }, + { + "epoch": 0.0, + "global_step": 1087, + "learning_rate": 0.0004962979966611019, + "loss": 1.852, + "loss_base2": 2.6719, + "loss_pixel": 0.2322, + "loss_text": 1.6199, + "ppl": 6.3726, + "step": 1087 + }, + { + "epoch": 0.0, + "global_step": 1088, + "learning_rate": 0.0004962938230383973, + "loss": 1.864, + "loss_base2": 2.6892, + "loss_pixel": 0.231, + "loss_text": 1.633, + "ppl": 6.4495, + "step": 1088 + }, + { + "epoch": 0.0, + "global_step": 1089, + "learning_rate": 0.0004962896494156928, + "loss": 1.8608, + "loss_base2": 2.6846, + "loss_pixel": 0.2347, + "loss_text": 1.6261, + "ppl": 6.4289, + "step": 1089 + }, + { + "epoch": 0.0, + "global_step": 1090, + "learning_rate": 0.0004962854757929883, + "loss": 1.9432, + "loss_base2": 2.8034, + "loss_pixel": 0.2311, + "loss_text": 1.7121, + "ppl": 6.9811, + "step": 1090 + }, + { + "epoch": 0.0, + "global_step": 1091, + "learning_rate": 0.0004962813021702838, + "loss": 1.9249, + "loss_base2": 2.777, + "loss_pixel": 0.2303, + "loss_text": 1.6946, + "ppl": 6.8545, + "step": 1091 + }, + { + "epoch": 0.0, + "global_step": 1092, + "learning_rate": 0.0004962771285475793, + "loss": 1.8387, + "loss_base2": 2.6527, + "loss_pixel": 0.2299, + "loss_text": 1.6088, + "ppl": 6.2884, + "step": 1092 + }, + { + "epoch": 0.0, + "global_step": 1093, + "learning_rate": 0.0004962729549248748, + "loss": 1.843, + "loss_base2": 2.6589, + "loss_pixel": 0.2294, + "loss_text": 1.6136, + "ppl": 6.3155, + "step": 1093 + }, + { + "epoch": 0.0, + "global_step": 1094, + "learning_rate": 0.0004962687813021703, + "loss": 1.8415, + "loss_base2": 2.6567, + "loss_pixel": 0.2294, + "loss_text": 1.6121, + "ppl": 6.306, + "step": 1094 + }, + { + "epoch": 0.0, + "global_step": 1095, + "learning_rate": 0.0004962646076794658, + "loss": 1.8209, + "loss_base2": 2.627, + "loss_pixel": 0.2289, + "loss_text": 1.592, + "ppl": 6.1774, + "step": 1095 + }, + { + "epoch": 0.0, + "global_step": 1096, + "learning_rate": 0.0004962604340567613, + "loss": 1.8222, + "loss_base2": 2.6289, + "loss_pixel": 0.2273, + "loss_text": 1.5948, + "ppl": 6.1855, + "step": 1096 + }, + { + "epoch": 0.0, + "global_step": 1097, + "learning_rate": 0.0004962562604340567, + "loss": 1.8163, + "loss_base2": 2.6204, + "loss_pixel": 0.2268, + "loss_text": 1.5895, + "ppl": 6.1491, + "step": 1097 + }, + { + "epoch": 0.0, + "global_step": 1098, + "learning_rate": 0.0004962520868113522, + "loss": 1.8128, + "loss_base2": 2.6153, + "loss_pixel": 0.2277, + "loss_text": 1.5851, + "ppl": 6.1276, + "step": 1098 + }, + { + "epoch": 0.0, + "global_step": 1099, + "learning_rate": 0.0004962479131886478, + "loss": 1.8124, + "loss_base2": 2.6147, + "loss_pixel": 0.2281, + "loss_text": 1.5843, + "ppl": 6.1251, + "step": 1099 + }, + { + "epoch": 0.0, + "global_step": 1100, + "learning_rate": 0.0004962437395659433, + "loss": 1.8194, + "loss_base2": 2.6248, + "loss_pixel": 0.2278, + "loss_text": 1.5916, + "ppl": 6.1682, + "step": 1100 + }, + { + "epoch": 0.0, + "global_step": 1101, + "learning_rate": 0.0004962395659432388, + "loss": 1.7947, + "loss_base2": 2.5892, + "loss_pixel": 0.2261, + "loss_text": 1.5685, + "ppl": 6.0177, + "step": 1101 + }, + { + "epoch": 0.0, + "global_step": 1102, + "learning_rate": 0.0004962353923205342, + "loss": 1.8061, + "loss_base2": 2.6057, + "loss_pixel": 0.2253, + "loss_text": 1.5807, + "ppl": 6.0867, + "step": 1102 + }, + { + "epoch": 0.0, + "global_step": 1103, + "learning_rate": 0.0004962312186978297, + "loss": 1.8127, + "loss_base2": 2.6152, + "loss_pixel": 0.2248, + "loss_text": 1.5879, + "ppl": 6.127, + "step": 1103 + }, + { + "epoch": 0.0, + "global_step": 1104, + "learning_rate": 0.0004962270450751252, + "loss": 1.7852, + "loss_base2": 2.5755, + "loss_pixel": 0.2244, + "loss_text": 1.5607, + "ppl": 5.9608, + "step": 1104 + }, + { + "epoch": 0.0, + "global_step": 1105, + "learning_rate": 0.0004962228714524207, + "loss": 1.7903, + "loss_base2": 2.5829, + "loss_pixel": 0.2246, + "loss_text": 1.5657, + "ppl": 5.9912, + "step": 1105 + }, + { + "epoch": 0.0, + "global_step": 1106, + "learning_rate": 0.0004962186978297162, + "loss": 1.8041, + "loss_base2": 2.6028, + "loss_pixel": 0.2241, + "loss_text": 1.5799, + "ppl": 6.0745, + "step": 1106 + }, + { + "epoch": 0.0, + "global_step": 1107, + "learning_rate": 0.0004962145242070117, + "loss": 1.7861, + "loss_base2": 2.5768, + "loss_pixel": 0.2238, + "loss_text": 1.5624, + "ppl": 5.9661, + "step": 1107 + }, + { + "epoch": 0.0, + "global_step": 1108, + "learning_rate": 0.0004962103505843072, + "loss": 1.8034, + "loss_base2": 2.6018, + "loss_pixel": 0.2236, + "loss_text": 1.5798, + "ppl": 6.0703, + "step": 1108 + }, + { + "epoch": 0.0, + "global_step": 1109, + "learning_rate": 0.0004962061769616027, + "loss": 1.7875, + "loss_base2": 2.5788, + "loss_pixel": 0.2236, + "loss_text": 1.5638, + "ppl": 5.9745, + "step": 1109 + }, + { + "epoch": 0.0, + "global_step": 1110, + "learning_rate": 0.0004962020033388982, + "loss": 1.7916, + "loss_base2": 2.5847, + "loss_pixel": 0.224, + "loss_text": 1.5676, + "ppl": 5.999, + "step": 1110 + }, + { + "epoch": 0.0, + "global_step": 1111, + "learning_rate": 0.0004961978297161936, + "loss": 1.7772, + "loss_base2": 2.564, + "loss_pixel": 0.2258, + "loss_text": 1.5514, + "ppl": 5.9133, + "step": 1111 + }, + { + "epoch": 0.0, + "global_step": 1112, + "learning_rate": 0.0004961936560934891, + "loss": 1.7694, + "loss_base2": 2.5527, + "loss_pixel": 0.2285, + "loss_text": 1.5408, + "ppl": 5.8673, + "step": 1112 + }, + { + "epoch": 0.0, + "global_step": 1113, + "learning_rate": 0.0004961894824707846, + "loss": 1.7882, + "loss_base2": 2.5798, + "loss_pixel": 0.2264, + "loss_text": 1.5618, + "ppl": 5.9787, + "step": 1113 + }, + { + "epoch": 0.0, + "global_step": 1114, + "learning_rate": 0.0004961853088480801, + "loss": 1.8011, + "loss_base2": 2.5984, + "loss_pixel": 0.2285, + "loss_text": 1.5726, + "ppl": 6.0563, + "step": 1114 + }, + { + "epoch": 0.0, + "global_step": 1115, + "learning_rate": 0.0004961811352253757, + "loss": 1.7877, + "loss_base2": 2.5791, + "loss_pixel": 0.2273, + "loss_text": 1.5605, + "ppl": 5.9757, + "step": 1115 + }, + { + "epoch": 0.0, + "global_step": 1116, + "learning_rate": 0.0004961769616026712, + "loss": 2.1455, + "loss_base2": 3.0953, + "loss_pixel": 0.2262, + "loss_text": 1.9192, + "ppl": 8.5463, + "step": 1116 + }, + { + "epoch": 0.0, + "global_step": 1117, + "learning_rate": 0.0004961727879799667, + "loss": 2.1324, + "loss_base2": 3.0764, + "loss_pixel": 0.2262, + "loss_text": 1.9062, + "ppl": 8.4351, + "step": 1117 + }, + { + "epoch": 0.0, + "global_step": 1118, + "learning_rate": 0.0004961686143572622, + "loss": 2.1193, + "loss_base2": 3.0575, + "loss_pixel": 0.2253, + "loss_text": 1.894, + "ppl": 8.3253, + "step": 1118 + }, + { + "epoch": 0.0, + "global_step": 1119, + "learning_rate": 0.0004961644407345577, + "loss": 2.1197, + "loss_base2": 3.0581, + "loss_pixel": 0.2242, + "loss_text": 1.8955, + "ppl": 8.3286, + "step": 1119 + }, + { + "epoch": 0.0, + "global_step": 1120, + "learning_rate": 0.0004961602671118531, + "loss": 2.1236, + "loss_base2": 3.0637, + "loss_pixel": 0.2246, + "loss_text": 1.899, + "ppl": 8.3612, + "step": 1120 + }, + { + "epoch": 0.0, + "global_step": 1121, + "learning_rate": 0.0004961560934891486, + "loss": 2.1258, + "loss_base2": 3.0669, + "loss_pixel": 0.2257, + "loss_text": 1.9, + "ppl": 8.3796, + "step": 1121 + }, + { + "epoch": 0.0, + "global_step": 1122, + "learning_rate": 0.0004961519198664441, + "loss": 2.124, + "loss_base2": 3.0643, + "loss_pixel": 0.223, + "loss_text": 1.9011, + "ppl": 8.3645, + "step": 1122 + }, + { + "epoch": 0.0, + "global_step": 1123, + "learning_rate": 0.0004961477462437396, + "loss": 2.1023, + "loss_base2": 3.033, + "loss_pixel": 0.2249, + "loss_text": 1.8775, + "ppl": 8.185, + "step": 1123 + }, + { + "epoch": 0.0, + "global_step": 1124, + "learning_rate": 0.000496143572621035, + "loss": 2.0864, + "loss_base2": 3.01, + "loss_pixel": 0.2223, + "loss_text": 1.8641, + "ppl": 8.0559, + "step": 1124 + }, + { + "epoch": 0.0, + "global_step": 1125, + "learning_rate": 0.0004961393989983305, + "loss": 2.0935, + "loss_base2": 3.0203, + "loss_pixel": 0.2231, + "loss_text": 1.8705, + "ppl": 8.1133, + "step": 1125 + }, + { + "epoch": 0.0, + "global_step": 1126, + "learning_rate": 0.000496135225375626, + "loss": 2.084, + "loss_base2": 3.0066, + "loss_pixel": 0.2219, + "loss_text": 1.8622, + "ppl": 8.0366, + "step": 1126 + }, + { + "epoch": 0.0, + "global_step": 1127, + "learning_rate": 0.0004961310517529215, + "loss": 2.088, + "loss_base2": 3.0123, + "loss_pixel": 0.2212, + "loss_text": 1.8669, + "ppl": 8.0688, + "step": 1127 + }, + { + "epoch": 0.0, + "global_step": 1128, + "learning_rate": 0.000496126878130217, + "loss": 2.0872, + "loss_base2": 3.0112, + "loss_pixel": 0.2226, + "loss_text": 1.8646, + "ppl": 8.0623, + "step": 1128 + }, + { + "epoch": 0.0, + "global_step": 1129, + "learning_rate": 0.0004961227045075125, + "loss": 2.0859, + "loss_base2": 3.0093, + "loss_pixel": 0.2216, + "loss_text": 1.8643, + "ppl": 8.0518, + "step": 1129 + }, + { + "epoch": 0.0, + "global_step": 1130, + "learning_rate": 0.000496118530884808, + "loss": 2.093, + "loss_base2": 3.0196, + "loss_pixel": 0.2209, + "loss_text": 1.8721, + "ppl": 8.1092, + "step": 1130 + }, + { + "epoch": 0.0, + "global_step": 1131, + "learning_rate": 0.0004961143572621036, + "loss": 2.0833, + "loss_base2": 3.0056, + "loss_pixel": 0.2212, + "loss_text": 1.8621, + "ppl": 8.0309, + "step": 1131 + }, + { + "epoch": 0.0, + "global_step": 1132, + "learning_rate": 0.0004961101836393991, + "loss": 2.0978, + "loss_base2": 3.0265, + "loss_pixel": 0.2204, + "loss_text": 1.8774, + "ppl": 8.1482, + "step": 1132 + }, + { + "epoch": 0.0, + "global_step": 1133, + "learning_rate": 0.0004961060100166945, + "loss": 2.1023, + "loss_base2": 3.033, + "loss_pixel": 0.2221, + "loss_text": 1.8802, + "ppl": 8.185, + "step": 1133 + }, + { + "epoch": 0.0, + "global_step": 1134, + "learning_rate": 0.00049610183639399, + "loss": 2.0908, + "loss_base2": 3.0164, + "loss_pixel": 0.2197, + "loss_text": 1.8711, + "ppl": 8.0914, + "step": 1134 + }, + { + "epoch": 0.0, + "global_step": 1135, + "learning_rate": 0.0004960976627712855, + "loss": 2.0896, + "loss_base2": 3.0147, + "loss_pixel": 0.2194, + "loss_text": 1.8702, + "ppl": 8.0817, + "step": 1135 + }, + { + "epoch": 0.0, + "global_step": 1136, + "learning_rate": 0.000496093489148581, + "loss": 2.0595, + "loss_base2": 2.9712, + "loss_pixel": 0.2207, + "loss_text": 1.8389, + "ppl": 7.842, + "step": 1136 + }, + { + "epoch": 0.0, + "global_step": 1137, + "learning_rate": 0.0004960893155258765, + "loss": 2.0772, + "loss_base2": 2.9968, + "loss_pixel": 0.2214, + "loss_text": 1.8558, + "ppl": 7.9821, + "step": 1137 + }, + { + "epoch": 0.0, + "global_step": 1138, + "learning_rate": 0.000496085141903172, + "loss": 2.0764, + "loss_base2": 2.9956, + "loss_pixel": 0.2196, + "loss_text": 1.8567, + "ppl": 7.9757, + "step": 1138 + }, + { + "epoch": 0.0, + "global_step": 1139, + "learning_rate": 0.0004960809682804674, + "loss": 2.0678, + "loss_base2": 2.9832, + "loss_pixel": 0.2195, + "loss_text": 1.8483, + "ppl": 7.9074, + "step": 1139 + }, + { + "epoch": 0.0, + "global_step": 1140, + "learning_rate": 0.0004960767946577629, + "loss": 1.9599, + "loss_base2": 2.8275, + "loss_pixel": 0.2196, + "loss_text": 1.7403, + "ppl": 7.0986, + "step": 1140 + }, + { + "epoch": 0.0, + "global_step": 1141, + "learning_rate": 0.0004960726210350584, + "loss": 1.8229, + "loss_base2": 2.6299, + "loss_pixel": 0.2199, + "loss_text": 1.603, + "ppl": 6.1898, + "step": 1141 + }, + { + "epoch": 0.0, + "global_step": 1142, + "learning_rate": 0.0004960684474123539, + "loss": 1.812, + "loss_base2": 2.6142, + "loss_pixel": 0.2211, + "loss_text": 1.5909, + "ppl": 6.1227, + "step": 1142 + }, + { + "epoch": 0.0, + "global_step": 1143, + "learning_rate": 0.0004960642737896494, + "loss": 1.797, + "loss_base2": 2.5925, + "loss_pixel": 0.2241, + "loss_text": 1.5728, + "ppl": 6.0315, + "step": 1143 + }, + { + "epoch": 0.0, + "global_step": 1144, + "learning_rate": 0.0004960601001669449, + "loss": 1.7992, + "loss_base2": 2.5957, + "loss_pixel": 0.2292, + "loss_text": 1.57, + "ppl": 6.0448, + "step": 1144 + }, + { + "epoch": 0.0, + "global_step": 1145, + "learning_rate": 0.0004960559265442404, + "loss": 1.797, + "loss_base2": 2.5925, + "loss_pixel": 0.227, + "loss_text": 1.57, + "ppl": 6.0315, + "step": 1145 + }, + { + "epoch": 0.0, + "global_step": 1146, + "learning_rate": 0.000496051752921536, + "loss": 1.8033, + "loss_base2": 2.6016, + "loss_pixel": 0.2295, + "loss_text": 1.5738, + "ppl": 6.0696, + "step": 1146 + }, + { + "epoch": 0.0, + "global_step": 1147, + "learning_rate": 0.0004960475792988313, + "loss": 1.765, + "loss_base2": 2.5464, + "loss_pixel": 0.2289, + "loss_text": 1.5361, + "ppl": 5.8416, + "step": 1147 + }, + { + "epoch": 0.0, + "global_step": 1148, + "learning_rate": 0.0004960434056761269, + "loss": 1.9761, + "loss_base2": 2.8509, + "loss_pixel": 0.2296, + "loss_text": 1.7464, + "ppl": 7.2146, + "step": 1148 + }, + { + "epoch": 0.0, + "global_step": 1149, + "learning_rate": 0.0004960392320534224, + "loss": 2.0547, + "loss_base2": 2.9643, + "loss_pixel": 0.2348, + "loss_text": 1.8199, + "ppl": 7.8045, + "step": 1149 + }, + { + "epoch": 0.0, + "global_step": 1150, + "learning_rate": 0.0004960350584307179, + "loss": 2.1038, + "loss_base2": 3.0351, + "loss_pixel": 0.2302, + "loss_text": 1.8737, + "ppl": 8.1973, + "step": 1150 + }, + { + "epoch": 0.0, + "global_step": 1151, + "learning_rate": 0.0004960308848080134, + "loss": 2.1026, + "loss_base2": 3.0334, + "loss_pixel": 0.2305, + "loss_text": 1.872, + "ppl": 8.1874, + "step": 1151 + }, + { + "epoch": 0.0, + "global_step": 1152, + "learning_rate": 0.0004960267111853089, + "loss": 2.1158, + "loss_base2": 3.0525, + "loss_pixel": 0.2277, + "loss_text": 1.8881, + "ppl": 8.2962, + "step": 1152 + }, + { + "epoch": 0.0, + "global_step": 1153, + "learning_rate": 0.0004960225375626044, + "loss": 2.0834, + "loss_base2": 3.0057, + "loss_pixel": 0.2273, + "loss_text": 1.8561, + "ppl": 8.0317, + "step": 1153 + }, + { + "epoch": 0.0, + "global_step": 1154, + "learning_rate": 0.0004960183639398999, + "loss": 2.094, + "loss_base2": 3.021, + "loss_pixel": 0.2275, + "loss_text": 1.8666, + "ppl": 8.1173, + "step": 1154 + }, + { + "epoch": 0.0, + "global_step": 1155, + "learning_rate": 0.0004960141903171954, + "loss": 2.0766, + "loss_base2": 2.9959, + "loss_pixel": 0.2249, + "loss_text": 1.8516, + "ppl": 7.9773, + "step": 1155 + }, + { + "epoch": 0.0, + "global_step": 1156, + "learning_rate": 0.0004960100166944908, + "loss": 2.0817, + "loss_base2": 3.0033, + "loss_pixel": 0.2246, + "loss_text": 1.8571, + "ppl": 8.0181, + "step": 1156 + }, + { + "epoch": 0.0, + "global_step": 1157, + "learning_rate": 0.0004960058430717863, + "loss": 2.0922, + "loss_base2": 3.0184, + "loss_pixel": 0.2245, + "loss_text": 1.8677, + "ppl": 8.1027, + "step": 1157 + }, + { + "epoch": 0.0, + "global_step": 1158, + "learning_rate": 0.0004960016694490818, + "loss": 2.0788, + "loss_base2": 2.9991, + "loss_pixel": 0.2237, + "loss_text": 1.8551, + "ppl": 7.9949, + "step": 1158 + }, + { + "epoch": 0.0, + "global_step": 1159, + "learning_rate": 0.0004959974958263773, + "loss": 2.0897, + "loss_base2": 3.0148, + "loss_pixel": 0.2257, + "loss_text": 1.864, + "ppl": 8.0825, + "step": 1159 + }, + { + "epoch": 0.0, + "global_step": 1160, + "learning_rate": 0.0004959933222036728, + "loss": 2.0706, + "loss_base2": 2.9872, + "loss_pixel": 0.2218, + "loss_text": 1.8488, + "ppl": 7.9296, + "step": 1160 + }, + { + "epoch": 0.0, + "global_step": 1161, + "learning_rate": 0.0004959891485809682, + "loss": 2.0734, + "loss_base2": 2.9913, + "loss_pixel": 0.2227, + "loss_text": 1.8507, + "ppl": 7.9518, + "step": 1161 + }, + { + "epoch": 0.0, + "global_step": 1162, + "learning_rate": 0.0004959849749582637, + "loss": 2.0725, + "loss_base2": 2.99, + "loss_pixel": 0.2214, + "loss_text": 1.8511, + "ppl": 7.9447, + "step": 1162 + }, + { + "epoch": 0.0, + "global_step": 1163, + "learning_rate": 0.0004959808013355592, + "loss": 2.0718, + "loss_base2": 2.989, + "loss_pixel": 0.2211, + "loss_text": 1.8506, + "ppl": 7.9391, + "step": 1163 + }, + { + "epoch": 0.0, + "global_step": 1164, + "learning_rate": 0.0004959766277128548, + "loss": 2.0826, + "loss_base2": 3.0046, + "loss_pixel": 0.22, + "loss_text": 1.8626, + "ppl": 8.0253, + "step": 1164 + }, + { + "epoch": 0.0, + "global_step": 1165, + "learning_rate": 0.0004959724540901503, + "loss": 2.0634, + "loss_base2": 2.9769, + "loss_pixel": 0.2204, + "loss_text": 1.843, + "ppl": 7.8727, + "step": 1165 + }, + { + "epoch": 0.0, + "global_step": 1166, + "learning_rate": 0.0004959682804674458, + "loss": 2.0553, + "loss_base2": 2.9652, + "loss_pixel": 0.22, + "loss_text": 1.8353, + "ppl": 7.8092, + "step": 1166 + }, + { + "epoch": 0.0, + "global_step": 1167, + "learning_rate": 0.0004959641068447413, + "loss": 2.0665, + "loss_base2": 2.9813, + "loss_pixel": 0.2202, + "loss_text": 1.8463, + "ppl": 7.8971, + "step": 1167 + }, + { + "epoch": 0.0, + "global_step": 1168, + "learning_rate": 0.0004959599332220368, + "loss": 2.0607, + "loss_base2": 2.973, + "loss_pixel": 0.219, + "loss_text": 1.8417, + "ppl": 7.8515, + "step": 1168 + }, + { + "epoch": 0.0, + "global_step": 1169, + "learning_rate": 0.0004959557595993323, + "loss": 2.0559, + "loss_base2": 2.966, + "loss_pixel": 0.2195, + "loss_text": 1.8363, + "ppl": 7.8139, + "step": 1169 + }, + { + "epoch": 0.0, + "global_step": 1170, + "learning_rate": 0.0004959515859766277, + "loss": 2.0638, + "loss_base2": 2.9774, + "loss_pixel": 0.2192, + "loss_text": 1.8446, + "ppl": 7.8758, + "step": 1170 + }, + { + "epoch": 0.0, + "global_step": 1171, + "learning_rate": 0.0004959474123539232, + "loss": 2.0505, + "loss_base2": 2.9582, + "loss_pixel": 0.2209, + "loss_text": 1.8296, + "ppl": 7.7718, + "step": 1171 + }, + { + "epoch": 0.0, + "global_step": 1172, + "learning_rate": 0.0004959432387312187, + "loss": 2.0643, + "loss_base2": 2.9782, + "loss_pixel": 0.2205, + "loss_text": 1.8438, + "ppl": 7.8798, + "step": 1172 + }, + { + "epoch": 0.0, + "global_step": 1173, + "learning_rate": 0.0004959390651085142, + "loss": 2.0499, + "loss_base2": 2.9574, + "loss_pixel": 0.2194, + "loss_text": 1.8305, + "ppl": 7.7671, + "step": 1173 + }, + { + "epoch": 0.0, + "global_step": 1174, + "learning_rate": 0.0004959348914858097, + "loss": 2.0531, + "loss_base2": 2.962, + "loss_pixel": 0.2185, + "loss_text": 1.8346, + "ppl": 7.792, + "step": 1174 + }, + { + "epoch": 0.0, + "global_step": 1175, + "learning_rate": 0.0004959307178631052, + "loss": 2.0548, + "loss_base2": 2.9644, + "loss_pixel": 0.2188, + "loss_text": 1.836, + "ppl": 7.8053, + "step": 1175 + }, + { + "epoch": 0.0, + "global_step": 1176, + "learning_rate": 0.0004959265442404006, + "loss": 2.0295, + "loss_base2": 2.9279, + "loss_pixel": 0.2189, + "loss_text": 1.8106, + "ppl": 7.6103, + "step": 1176 + }, + { + "epoch": 0.0, + "global_step": 1177, + "learning_rate": 0.0004959223706176961, + "loss": 2.0526, + "loss_base2": 2.9613, + "loss_pixel": 0.2183, + "loss_text": 1.8343, + "ppl": 7.7881, + "step": 1177 + }, + { + "epoch": 0.0, + "global_step": 1178, + "learning_rate": 0.0004959181969949916, + "loss": 2.0378, + "loss_base2": 2.9399, + "loss_pixel": 0.2185, + "loss_text": 1.8193, + "ppl": 7.6737, + "step": 1178 + }, + { + "epoch": 0.0, + "global_step": 1179, + "learning_rate": 0.0004959140233722871, + "loss": 2.052, + "loss_base2": 2.9604, + "loss_pixel": 0.2162, + "loss_text": 1.8358, + "ppl": 7.7835, + "step": 1179 + }, + { + "epoch": 0.0, + "global_step": 1180, + "learning_rate": 0.0004959098497495827, + "loss": 2.0433, + "loss_base2": 2.9479, + "loss_pixel": 0.2168, + "loss_text": 1.8264, + "ppl": 7.716, + "step": 1180 + }, + { + "epoch": 0.0, + "global_step": 1181, + "learning_rate": 0.0004959056761268782, + "loss": 2.0551, + "loss_base2": 2.9649, + "loss_pixel": 0.2162, + "loss_text": 1.8389, + "ppl": 7.8076, + "step": 1181 + }, + { + "epoch": 0.0, + "global_step": 1182, + "learning_rate": 0.0004959015025041737, + "loss": 2.0609, + "loss_base2": 2.9733, + "loss_pixel": 0.2165, + "loss_text": 1.8443, + "ppl": 7.853, + "step": 1182 + }, + { + "epoch": 0.0, + "global_step": 1183, + "learning_rate": 0.0004958973288814691, + "loss": 2.038, + "loss_base2": 2.9402, + "loss_pixel": 0.217, + "loss_text": 1.821, + "ppl": 7.6752, + "step": 1183 + }, + { + "epoch": 0.0, + "global_step": 1184, + "learning_rate": 0.0004958931552587646, + "loss": 2.0526, + "loss_base2": 2.9613, + "loss_pixel": 0.2173, + "loss_text": 1.8353, + "ppl": 7.7881, + "step": 1184 + }, + { + "epoch": 0.0, + "global_step": 1185, + "learning_rate": 0.0004958889816360601, + "loss": 2.0407, + "loss_base2": 2.9441, + "loss_pixel": 0.217, + "loss_text": 1.8237, + "ppl": 7.696, + "step": 1185 + }, + { + "epoch": 0.0, + "global_step": 1186, + "learning_rate": 0.0004958848080133556, + "loss": 2.041, + "loss_base2": 2.9445, + "loss_pixel": 0.2168, + "loss_text": 1.8242, + "ppl": 7.6983, + "step": 1186 + }, + { + "epoch": 0.0, + "global_step": 1187, + "learning_rate": 0.0004958806343906511, + "loss": 2.0307, + "loss_base2": 2.9297, + "loss_pixel": 0.2159, + "loss_text": 1.8149, + "ppl": 7.6194, + "step": 1187 + }, + { + "epoch": 0.0, + "global_step": 1188, + "learning_rate": 0.0004958764607679466, + "loss": 2.0256, + "loss_base2": 2.9223, + "loss_pixel": 0.2167, + "loss_text": 1.8089, + "ppl": 7.5807, + "step": 1188 + }, + { + "epoch": 0.0, + "global_step": 1189, + "learning_rate": 0.0004958722871452421, + "loss": 2.0327, + "loss_base2": 2.9326, + "loss_pixel": 0.217, + "loss_text": 1.8157, + "ppl": 7.6347, + "step": 1189 + }, + { + "epoch": 0.0, + "global_step": 1190, + "learning_rate": 0.0004958681135225376, + "loss": 2.034, + "loss_base2": 2.9344, + "loss_pixel": 0.2158, + "loss_text": 1.8182, + "ppl": 7.6446, + "step": 1190 + }, + { + "epoch": 0.0, + "global_step": 1191, + "learning_rate": 0.0004958639398998331, + "loss": 2.0438, + "loss_base2": 2.9486, + "loss_pixel": 0.2159, + "loss_text": 1.8279, + "ppl": 7.7199, + "step": 1191 + }, + { + "epoch": 0.0, + "global_step": 1192, + "learning_rate": 0.0004958597662771285, + "loss": 2.0444, + "loss_base2": 2.9494, + "loss_pixel": 0.214, + "loss_text": 1.8304, + "ppl": 7.7245, + "step": 1192 + }, + { + "epoch": 0.0, + "global_step": 1193, + "learning_rate": 0.000495855592654424, + "loss": 2.0472, + "loss_base2": 2.9535, + "loss_pixel": 0.2143, + "loss_text": 1.8329, + "ppl": 7.7462, + "step": 1193 + }, + { + "epoch": 0.0, + "global_step": 1194, + "learning_rate": 0.0004958514190317195, + "loss": 2.0312, + "loss_base2": 2.9304, + "loss_pixel": 0.2135, + "loss_text": 1.8176, + "ppl": 7.6232, + "step": 1194 + }, + { + "epoch": 0.0, + "global_step": 1195, + "learning_rate": 0.000495847245409015, + "loss": 2.0471, + "loss_base2": 2.9533, + "loss_pixel": 0.2143, + "loss_text": 1.8327, + "ppl": 7.7454, + "step": 1195 + }, + { + "epoch": 0.0, + "global_step": 1196, + "learning_rate": 0.0004958430717863106, + "loss": 2.0196, + "loss_base2": 2.9137, + "loss_pixel": 0.2157, + "loss_text": 1.8039, + "ppl": 7.5353, + "step": 1196 + }, + { + "epoch": 0.0, + "global_step": 1197, + "learning_rate": 0.000495838898163606, + "loss": 2.0387, + "loss_base2": 2.9412, + "loss_pixel": 0.216, + "loss_text": 1.8227, + "ppl": 7.6806, + "step": 1197 + }, + { + "epoch": 0.0, + "global_step": 1198, + "learning_rate": 0.0004958347245409015, + "loss": 2.0322, + "loss_base2": 2.9318, + "loss_pixel": 0.2248, + "loss_text": 1.8074, + "ppl": 7.6309, + "step": 1198 + }, + { + "epoch": 0.0, + "global_step": 1199, + "learning_rate": 0.000495830550918197, + "loss": 2.0934, + "loss_base2": 3.0201, + "loss_pixel": 0.2521, + "loss_text": 1.8413, + "ppl": 8.1125, + "step": 1199 + }, + { + "epoch": 0.01, + "global_step": 1200, + "learning_rate": 0.0004958263772954925, + "loss": 2.0913, + "loss_base2": 3.0171, + "loss_pixel": 0.2603, + "loss_text": 1.831, + "ppl": 8.0954, + "step": 1200 + }, + { + "epoch": 0.01, + "global_step": 1201, + "learning_rate": 0.000495822203672788, + "loss": 2.1327, + "loss_base2": 3.0768, + "loss_pixel": 0.3104, + "loss_text": 1.8224, + "ppl": 8.4376, + "step": 1201 + }, + { + "epoch": 0.01, + "global_step": 1202, + "learning_rate": 0.0004958180300500835, + "loss": 2.1571, + "loss_base2": 3.112, + "loss_pixel": 0.3433, + "loss_text": 1.8138, + "ppl": 8.646, + "step": 1202 + }, + { + "epoch": 0.01, + "global_step": 1203, + "learning_rate": 0.000495813856427379, + "loss": 2.1707, + "loss_base2": 3.1317, + "loss_pixel": 0.3414, + "loss_text": 1.8292, + "ppl": 8.7644, + "step": 1203 + }, + { + "epoch": 0.01, + "global_step": 1204, + "learning_rate": 0.0004958096828046745, + "loss": 2.1929, + "loss_base2": 3.1637, + "loss_pixel": 0.3741, + "loss_text": 1.8188, + "ppl": 8.9612, + "step": 1204 + }, + { + "epoch": 0.01, + "global_step": 1205, + "learning_rate": 0.00049580550918197, + "loss": 2.1941, + "loss_base2": 3.1654, + "loss_pixel": 0.3765, + "loss_text": 1.8176, + "ppl": 8.9719, + "step": 1205 + }, + { + "epoch": 0.01, + "global_step": 1206, + "learning_rate": 0.0004958013355592654, + "loss": 2.1822, + "loss_base2": 3.1482, + "loss_pixel": 0.363, + "loss_text": 1.8192, + "ppl": 8.8658, + "step": 1206 + }, + { + "epoch": 0.01, + "global_step": 1207, + "learning_rate": 0.0004957971619365609, + "loss": 2.1569, + "loss_base2": 3.1117, + "loss_pixel": 0.3476, + "loss_text": 1.8093, + "ppl": 8.6443, + "step": 1207 + }, + { + "epoch": 0.01, + "global_step": 1208, + "learning_rate": 0.0004957929883138564, + "loss": 2.1615, + "loss_base2": 3.1184, + "loss_pixel": 0.3442, + "loss_text": 1.8172, + "ppl": 8.6842, + "step": 1208 + }, + { + "epoch": 0.01, + "global_step": 1209, + "learning_rate": 0.0004957888146911519, + "loss": 2.1599, + "loss_base2": 3.1161, + "loss_pixel": 0.3513, + "loss_text": 1.8086, + "ppl": 8.6703, + "step": 1209 + }, + { + "epoch": 0.01, + "global_step": 1210, + "learning_rate": 0.0004957846410684474, + "loss": 2.1558, + "loss_base2": 3.1102, + "loss_pixel": 0.3404, + "loss_text": 1.8154, + "ppl": 8.6348, + "step": 1210 + }, + { + "epoch": 0.01, + "global_step": 1211, + "learning_rate": 0.000495780467445743, + "loss": 2.1394, + "loss_base2": 3.0865, + "loss_pixel": 0.3386, + "loss_text": 1.8008, + "ppl": 8.4943, + "step": 1211 + }, + { + "epoch": 0.01, + "global_step": 1212, + "learning_rate": 0.0004957762938230385, + "loss": 2.1769, + "loss_base2": 3.1406, + "loss_pixel": 0.3428, + "loss_text": 1.8341, + "ppl": 8.8189, + "step": 1212 + }, + { + "epoch": 0.01, + "global_step": 1213, + "learning_rate": 0.000495772120200334, + "loss": 2.1865, + "loss_base2": 3.1545, + "loss_pixel": 0.3499, + "loss_text": 1.8366, + "ppl": 8.904, + "step": 1213 + }, + { + "epoch": 0.01, + "global_step": 1214, + "learning_rate": 0.0004957679465776294, + "loss": 2.1466, + "loss_base2": 3.0969, + "loss_pixel": 0.3303, + "loss_text": 1.8162, + "ppl": 8.5557, + "step": 1214 + }, + { + "epoch": 0.01, + "global_step": 1215, + "learning_rate": 0.0004957637729549249, + "loss": 2.1567, + "loss_base2": 3.1115, + "loss_pixel": 0.3334, + "loss_text": 1.8233, + "ppl": 8.6426, + "step": 1215 + }, + { + "epoch": 0.01, + "global_step": 1216, + "learning_rate": 0.0004957595993322204, + "loss": 2.1389, + "loss_base2": 3.0858, + "loss_pixel": 0.3301, + "loss_text": 1.8088, + "ppl": 8.4901, + "step": 1216 + }, + { + "epoch": 0.01, + "global_step": 1217, + "learning_rate": 0.0004957554257095159, + "loss": 2.1857, + "loss_base2": 3.1533, + "loss_pixel": 0.3394, + "loss_text": 1.8463, + "ppl": 8.8969, + "step": 1217 + }, + { + "epoch": 0.01, + "global_step": 1218, + "learning_rate": 0.0004957512520868114, + "loss": 2.0737, + "loss_base2": 2.9917, + "loss_pixel": 0.3344, + "loss_text": 1.7393, + "ppl": 7.9542, + "step": 1218 + }, + { + "epoch": 0.01, + "global_step": 1219, + "learning_rate": 0.0004957470784641069, + "loss": 1.8969, + "loss_base2": 2.7366, + "loss_pixel": 0.3348, + "loss_text": 1.5622, + "ppl": 6.6652, + "step": 1219 + }, + { + "epoch": 0.01, + "global_step": 1220, + "learning_rate": 0.0004957429048414023, + "loss": 1.917, + "loss_base2": 2.7656, + "loss_pixel": 0.3232, + "loss_text": 1.5938, + "ppl": 6.8005, + "step": 1220 + }, + { + "epoch": 0.01, + "global_step": 1221, + "learning_rate": 0.0004957387312186978, + "loss": 1.9015, + "loss_base2": 2.7433, + "loss_pixel": 0.3207, + "loss_text": 1.5808, + "ppl": 6.6959, + "step": 1221 + }, + { + "epoch": 0.01, + "global_step": 1222, + "learning_rate": 0.0004957345575959933, + "loss": 1.9329, + "loss_base2": 2.7886, + "loss_pixel": 0.3183, + "loss_text": 1.6147, + "ppl": 6.9095, + "step": 1222 + }, + { + "epoch": 0.01, + "global_step": 1223, + "learning_rate": 0.0004957303839732888, + "loss": 1.9124, + "loss_base2": 2.759, + "loss_pixel": 0.3137, + "loss_text": 1.5988, + "ppl": 6.7693, + "step": 1223 + }, + { + "epoch": 0.01, + "global_step": 1224, + "learning_rate": 0.0004957262103505843, + "loss": 1.8937, + "loss_base2": 2.732, + "loss_pixel": 0.3145, + "loss_text": 1.5792, + "ppl": 6.6439, + "step": 1224 + }, + { + "epoch": 0.01, + "global_step": 1225, + "learning_rate": 0.0004957220367278798, + "loss": 1.9018, + "loss_base2": 2.7437, + "loss_pixel": 0.3092, + "loss_text": 1.5926, + "ppl": 6.6979, + "step": 1225 + }, + { + "epoch": 0.01, + "global_step": 1226, + "learning_rate": 0.0004957178631051753, + "loss": 1.9031, + "loss_base2": 2.7456, + "loss_pixel": 0.3055, + "loss_text": 1.5976, + "ppl": 6.7067, + "step": 1226 + }, + { + "epoch": 0.01, + "global_step": 1227, + "learning_rate": 0.0004957136894824708, + "loss": 1.8947, + "loss_base2": 2.7335, + "loss_pixel": 0.3038, + "loss_text": 1.5909, + "ppl": 6.6506, + "step": 1227 + }, + { + "epoch": 0.01, + "global_step": 1228, + "learning_rate": 0.0004957095158597664, + "loss": 1.9153, + "loss_base2": 2.7632, + "loss_pixel": 0.3014, + "loss_text": 1.6139, + "ppl": 6.789, + "step": 1228 + }, + { + "epoch": 0.01, + "global_step": 1229, + "learning_rate": 0.0004957053422370618, + "loss": 1.9131, + "loss_base2": 2.76, + "loss_pixel": 0.298, + "loss_text": 1.6151, + "ppl": 6.7741, + "step": 1229 + }, + { + "epoch": 0.01, + "global_step": 1230, + "learning_rate": 0.0004957011686143573, + "loss": 1.9298, + "loss_base2": 2.7841, + "loss_pixel": 0.2952, + "loss_text": 1.6346, + "ppl": 6.8881, + "step": 1230 + }, + { + "epoch": 0.01, + "global_step": 1231, + "learning_rate": 0.0004956969949916528, + "loss": 1.9406, + "loss_base2": 2.7997, + "loss_pixel": 0.2965, + "loss_text": 1.6441, + "ppl": 6.9629, + "step": 1231 + }, + { + "epoch": 0.01, + "global_step": 1232, + "learning_rate": 0.0004956928213689483, + "loss": 1.9506, + "loss_base2": 2.8141, + "loss_pixel": 0.2934, + "loss_text": 1.6572, + "ppl": 7.0329, + "step": 1232 + }, + { + "epoch": 0.01, + "global_step": 1233, + "learning_rate": 0.0004956886477462437, + "loss": 1.9481, + "loss_base2": 2.8105, + "loss_pixel": 0.2896, + "loss_text": 1.6584, + "ppl": 7.0153, + "step": 1233 + }, + { + "epoch": 0.01, + "global_step": 1234, + "learning_rate": 0.0004956844741235392, + "loss": 1.9525, + "loss_base2": 2.8169, + "loss_pixel": 0.2872, + "loss_text": 1.6652, + "ppl": 7.0463, + "step": 1234 + }, + { + "epoch": 0.01, + "global_step": 1235, + "learning_rate": 0.0004956803005008347, + "loss": 1.9744, + "loss_base2": 2.8485, + "loss_pixel": 0.2847, + "loss_text": 1.6896, + "ppl": 7.2023, + "step": 1235 + }, + { + "epoch": 0.01, + "global_step": 1236, + "learning_rate": 0.0004956761268781302, + "loss": 2.2257, + "loss_base2": 3.211, + "loss_pixel": 0.282, + "loss_text": 1.9437, + "ppl": 9.26, + "step": 1236 + }, + { + "epoch": 0.01, + "global_step": 1237, + "learning_rate": 0.0004956719532554257, + "loss": 2.2495, + "loss_base2": 3.2453, + "loss_pixel": 0.2808, + "loss_text": 1.9687, + "ppl": 9.483, + "step": 1237 + }, + { + "epoch": 0.01, + "global_step": 1238, + "learning_rate": 0.0004956677796327212, + "loss": 2.2924, + "loss_base2": 3.3072, + "loss_pixel": 0.2778, + "loss_text": 2.0146, + "ppl": 9.8987, + "step": 1238 + }, + { + "epoch": 0.01, + "global_step": 1239, + "learning_rate": 0.0004956636060100167, + "loss": 2.2809, + "loss_base2": 3.2906, + "loss_pixel": 0.2765, + "loss_text": 2.0043, + "ppl": 9.7855, + "step": 1239 + }, + { + "epoch": 0.01, + "global_step": 1240, + "learning_rate": 0.0004956594323873122, + "loss": 2.2832, + "loss_base2": 3.294, + "loss_pixel": 0.274, + "loss_text": 2.0092, + "ppl": 9.808, + "step": 1240 + }, + { + "epoch": 0.01, + "global_step": 1241, + "learning_rate": 0.0004956552587646077, + "loss": 2.2531, + "loss_base2": 3.2505, + "loss_pixel": 0.2737, + "loss_text": 1.9794, + "ppl": 9.5172, + "step": 1241 + }, + { + "epoch": 0.01, + "global_step": 1242, + "learning_rate": 0.0004956510851419031, + "loss": 2.2687, + "loss_base2": 3.273, + "loss_pixel": 0.2704, + "loss_text": 1.9984, + "ppl": 9.6668, + "step": 1242 + }, + { + "epoch": 0.01, + "global_step": 1243, + "learning_rate": 0.0004956469115191986, + "loss": 2.285, + "loss_base2": 3.2966, + "loss_pixel": 0.2739, + "loss_text": 2.0111, + "ppl": 9.8257, + "step": 1243 + }, + { + "epoch": 0.01, + "global_step": 1244, + "learning_rate": 0.0004956427378964941, + "loss": 2.2729, + "loss_base2": 3.2791, + "loss_pixel": 0.2702, + "loss_text": 2.0027, + "ppl": 9.7075, + "step": 1244 + }, + { + "epoch": 0.01, + "global_step": 1245, + "learning_rate": 0.0004956385642737897, + "loss": 2.2979, + "loss_base2": 3.3152, + "loss_pixel": 0.2697, + "loss_text": 2.0282, + "ppl": 9.9533, + "step": 1245 + }, + { + "epoch": 0.01, + "global_step": 1246, + "learning_rate": 0.0004956343906510852, + "loss": 2.2538, + "loss_base2": 3.2515, + "loss_pixel": 0.2681, + "loss_text": 1.9857, + "ppl": 9.5239, + "step": 1246 + }, + { + "epoch": 0.01, + "global_step": 1247, + "learning_rate": 0.0004956302170283807, + "loss": 2.2626, + "loss_base2": 3.2642, + "loss_pixel": 0.274, + "loss_text": 1.9886, + "ppl": 9.608, + "step": 1247 + }, + { + "epoch": 0.01, + "global_step": 1248, + "learning_rate": 0.0004956260434056762, + "loss": 2.2497, + "loss_base2": 3.2456, + "loss_pixel": 0.2787, + "loss_text": 1.971, + "ppl": 9.4849, + "step": 1248 + }, + { + "epoch": 0.01, + "global_step": 1249, + "learning_rate": 0.0004956218697829717, + "loss": 2.2302, + "loss_base2": 3.2175, + "loss_pixel": 0.2708, + "loss_text": 1.9594, + "ppl": 9.3017, + "step": 1249 + }, + { + "epoch": 0.01, + "global_step": 1250, + "learning_rate": 0.0004956176961602672, + "loss": 2.2613, + "loss_base2": 3.2624, + "loss_pixel": 0.2728, + "loss_text": 1.9885, + "ppl": 9.5956, + "step": 1250 + }, + { + "epoch": 0.01, + "global_step": 1251, + "learning_rate": 0.0004956135225375626, + "loss": 2.2379, + "loss_base2": 3.2286, + "loss_pixel": 0.2712, + "loss_text": 1.9667, + "ppl": 9.3736, + "step": 1251 + }, + { + "epoch": 0.01, + "global_step": 1252, + "learning_rate": 0.0004956093489148581, + "loss": 2.2096, + "loss_base2": 3.1878, + "loss_pixel": 0.2667, + "loss_text": 1.943, + "ppl": 9.1121, + "step": 1252 + }, + { + "epoch": 0.01, + "global_step": 1253, + "learning_rate": 0.0004956051752921536, + "loss": 2.192, + "loss_base2": 3.1624, + "loss_pixel": 0.2642, + "loss_text": 1.9278, + "ppl": 8.9531, + "step": 1253 + }, + { + "epoch": 0.01, + "global_step": 1254, + "learning_rate": 0.0004956010016694491, + "loss": 2.1937, + "loss_base2": 3.1648, + "loss_pixel": 0.2635, + "loss_text": 1.9302, + "ppl": 8.9683, + "step": 1254 + }, + { + "epoch": 0.01, + "global_step": 1255, + "learning_rate": 0.0004955968280467446, + "loss": 2.1668, + "loss_base2": 3.126, + "loss_pixel": 0.2611, + "loss_text": 1.9057, + "ppl": 8.7303, + "step": 1255 + }, + { + "epoch": 0.01, + "global_step": 1256, + "learning_rate": 0.00049559265442404, + "loss": 2.2559, + "loss_base2": 3.2546, + "loss_pixel": 0.26, + "loss_text": 1.9959, + "ppl": 9.5439, + "step": 1256 + }, + { + "epoch": 0.01, + "global_step": 1257, + "learning_rate": 0.0004955884808013355, + "loss": 2.1631, + "loss_base2": 3.1207, + "loss_pixel": 0.2583, + "loss_text": 1.9048, + "ppl": 8.6981, + "step": 1257 + }, + { + "epoch": 0.01, + "global_step": 1258, + "learning_rate": 0.000495584307178631, + "loss": 2.1715, + "loss_base2": 3.1328, + "loss_pixel": 0.257, + "loss_text": 1.9145, + "ppl": 8.7714, + "step": 1258 + }, + { + "epoch": 0.01, + "global_step": 1259, + "learning_rate": 0.0004955801335559265, + "loss": 2.1621, + "loss_base2": 3.1193, + "loss_pixel": 0.2557, + "loss_text": 1.9063, + "ppl": 8.6894, + "step": 1259 + }, + { + "epoch": 0.01, + "global_step": 1260, + "learning_rate": 0.000495575959933222, + "loss": 2.1408, + "loss_base2": 3.0885, + "loss_pixel": 0.2542, + "loss_text": 1.8867, + "ppl": 8.5062, + "step": 1260 + }, + { + "epoch": 0.01, + "global_step": 1261, + "learning_rate": 0.0004955717863105176, + "loss": 2.1525, + "loss_base2": 3.1054, + "loss_pixel": 0.2548, + "loss_text": 1.8976, + "ppl": 8.6063, + "step": 1261 + }, + { + "epoch": 0.01, + "global_step": 1262, + "learning_rate": 0.0004955676126878131, + "loss": 2.1634, + "loss_base2": 3.1211, + "loss_pixel": 0.2543, + "loss_text": 1.9091, + "ppl": 8.7007, + "step": 1262 + }, + { + "epoch": 0.01, + "global_step": 1263, + "learning_rate": 0.0004955634390651086, + "loss": 2.1537, + "loss_base2": 3.1071, + "loss_pixel": 0.2529, + "loss_text": 1.9008, + "ppl": 8.6167, + "step": 1263 + }, + { + "epoch": 0.01, + "global_step": 1264, + "learning_rate": 0.0004955592654424041, + "loss": 2.1352, + "loss_base2": 3.0804, + "loss_pixel": 0.2516, + "loss_text": 1.8836, + "ppl": 8.4587, + "step": 1264 + }, + { + "epoch": 0.01, + "global_step": 1265, + "learning_rate": 0.0004955550918196995, + "loss": 2.1317, + "loss_base2": 3.0754, + "loss_pixel": 0.2504, + "loss_text": 1.8813, + "ppl": 8.4292, + "step": 1265 + }, + { + "epoch": 0.01, + "global_step": 1266, + "learning_rate": 0.000495550918196995, + "loss": 2.1311, + "loss_base2": 3.0745, + "loss_pixel": 0.2477, + "loss_text": 1.8834, + "ppl": 8.4241, + "step": 1266 + }, + { + "epoch": 0.01, + "global_step": 1267, + "learning_rate": 0.0004955467445742905, + "loss": 2.1141, + "loss_base2": 3.05, + "loss_pixel": 0.2486, + "loss_text": 1.8656, + "ppl": 8.2821, + "step": 1267 + }, + { + "epoch": 0.01, + "global_step": 1268, + "learning_rate": 0.000495542570951586, + "loss": 2.1314, + "loss_base2": 3.075, + "loss_pixel": 0.2464, + "loss_text": 1.885, + "ppl": 8.4267, + "step": 1268 + }, + { + "epoch": 0.01, + "global_step": 1269, + "learning_rate": 0.0004955383973288815, + "loss": 2.1037, + "loss_base2": 3.035, + "loss_pixel": 0.2433, + "loss_text": 1.8604, + "ppl": 8.1964, + "step": 1269 + }, + { + "epoch": 0.01, + "global_step": 1270, + "learning_rate": 0.0004955342237061769, + "loss": 2.1132, + "loss_base2": 3.0487, + "loss_pixel": 0.2455, + "loss_text": 1.8677, + "ppl": 8.2747, + "step": 1270 + }, + { + "epoch": 0.01, + "global_step": 1271, + "learning_rate": 0.0004955300500834724, + "loss": 2.1098, + "loss_base2": 3.0438, + "loss_pixel": 0.2451, + "loss_text": 1.8647, + "ppl": 8.2466, + "step": 1271 + }, + { + "epoch": 0.01, + "global_step": 1272, + "learning_rate": 0.0004955258764607679, + "loss": 2.1003, + "loss_base2": 3.0301, + "loss_pixel": 0.2437, + "loss_text": 1.8567, + "ppl": 8.1686, + "step": 1272 + }, + { + "epoch": 0.01, + "global_step": 1273, + "learning_rate": 0.0004955217028380634, + "loss": 2.105, + "loss_base2": 3.0369, + "loss_pixel": 0.2435, + "loss_text": 1.8615, + "ppl": 8.2071, + "step": 1273 + }, + { + "epoch": 0.01, + "global_step": 1274, + "learning_rate": 0.0004955175292153589, + "loss": 2.1089, + "loss_base2": 3.0425, + "loss_pixel": 0.2403, + "loss_text": 1.8686, + "ppl": 8.2392, + "step": 1274 + }, + { + "epoch": 0.01, + "global_step": 1275, + "learning_rate": 0.0004955133555926544, + "loss": 2.0744, + "loss_base2": 2.9927, + "loss_pixel": 0.2391, + "loss_text": 1.8353, + "ppl": 7.9598, + "step": 1275 + }, + { + "epoch": 0.01, + "global_step": 1276, + "learning_rate": 0.00049550918196995, + "loss": 2.0913, + "loss_base2": 3.0171, + "loss_pixel": 0.2375, + "loss_text": 1.8538, + "ppl": 8.0954, + "step": 1276 + }, + { + "epoch": 0.01, + "global_step": 1277, + "learning_rate": 0.0004955050083472455, + "loss": 2.0732, + "loss_base2": 2.991, + "loss_pixel": 0.2377, + "loss_text": 1.8355, + "ppl": 7.9502, + "step": 1277 + }, + { + "epoch": 0.01, + "global_step": 1278, + "learning_rate": 0.000495500834724541, + "loss": 2.0837, + "loss_base2": 3.0061, + "loss_pixel": 0.2364, + "loss_text": 1.8473, + "ppl": 8.0341, + "step": 1278 + }, + { + "epoch": 0.01, + "global_step": 1279, + "learning_rate": 0.0004954966611018364, + "loss": 2.0976, + "loss_base2": 3.0262, + "loss_pixel": 0.2356, + "loss_text": 1.862, + "ppl": 8.1466, + "step": 1279 + }, + { + "epoch": 0.01, + "global_step": 1280, + "learning_rate": 0.0004954924874791319, + "loss": 2.0914, + "loss_base2": 3.0173, + "loss_pixel": 0.24, + "loss_text": 1.8514, + "ppl": 8.0962, + "step": 1280 + }, + { + "epoch": 0.01, + "global_step": 1281, + "learning_rate": 0.0004954883138564274, + "loss": 2.0865, + "loss_base2": 3.0102, + "loss_pixel": 0.2386, + "loss_text": 1.8479, + "ppl": 8.0567, + "step": 1281 + }, + { + "epoch": 0.01, + "global_step": 1282, + "learning_rate": 0.0004954841402337229, + "loss": 2.0901, + "loss_base2": 3.0154, + "loss_pixel": 0.2365, + "loss_text": 1.8536, + "ppl": 8.0857, + "step": 1282 + }, + { + "epoch": 0.01, + "global_step": 1283, + "learning_rate": 0.0004954799666110184, + "loss": 2.0755, + "loss_base2": 2.9943, + "loss_pixel": 0.2355, + "loss_text": 1.84, + "ppl": 7.9685, + "step": 1283 + }, + { + "epoch": 0.01, + "global_step": 1284, + "learning_rate": 0.0004954757929883139, + "loss": 2.0723, + "loss_base2": 2.9897, + "loss_pixel": 0.2353, + "loss_text": 1.8369, + "ppl": 7.9431, + "step": 1284 + }, + { + "epoch": 0.01, + "global_step": 1285, + "learning_rate": 0.0004954716193656094, + "loss": 2.0791, + "loss_base2": 2.9995, + "loss_pixel": 0.2356, + "loss_text": 1.8436, + "ppl": 7.9973, + "step": 1285 + }, + { + "epoch": 0.01, + "global_step": 1286, + "learning_rate": 0.0004954674457429049, + "loss": 2.0745, + "loss_base2": 2.9929, + "loss_pixel": 0.2341, + "loss_text": 1.8404, + "ppl": 7.9606, + "step": 1286 + }, + { + "epoch": 0.01, + "global_step": 1287, + "learning_rate": 0.0004954632721202004, + "loss": 2.066, + "loss_base2": 2.9806, + "loss_pixel": 0.2351, + "loss_text": 1.831, + "ppl": 7.8932, + "step": 1287 + }, + { + "epoch": 0.01, + "global_step": 1288, + "learning_rate": 0.0004954590984974958, + "loss": 2.0884, + "loss_base2": 3.0129, + "loss_pixel": 0.2331, + "loss_text": 1.8553, + "ppl": 8.072, + "step": 1288 + }, + { + "epoch": 0.01, + "global_step": 1289, + "learning_rate": 0.0004954549248747913, + "loss": 2.0428, + "loss_base2": 2.9471, + "loss_pixel": 0.2319, + "loss_text": 1.8109, + "ppl": 7.7122, + "step": 1289 + }, + { + "epoch": 0.01, + "global_step": 1290, + "learning_rate": 0.0004954507512520868, + "loss": 2.0559, + "loss_base2": 2.966, + "loss_pixel": 0.2318, + "loss_text": 1.824, + "ppl": 7.8139, + "step": 1290 + }, + { + "epoch": 0.01, + "global_step": 1291, + "learning_rate": 0.0004954465776293823, + "loss": 2.0635, + "loss_base2": 2.977, + "loss_pixel": 0.2304, + "loss_text": 1.8331, + "ppl": 7.8735, + "step": 1291 + }, + { + "epoch": 0.01, + "global_step": 1292, + "learning_rate": 0.0004954424040066777, + "loss": 2.054, + "loss_base2": 2.9633, + "loss_pixel": 0.2296, + "loss_text": 1.8243, + "ppl": 7.799, + "step": 1292 + }, + { + "epoch": 0.01, + "global_step": 1293, + "learning_rate": 0.0004954382303839732, + "loss": 2.0583, + "loss_base2": 2.9695, + "loss_pixel": 0.2306, + "loss_text": 1.8278, + "ppl": 7.8326, + "step": 1293 + }, + { + "epoch": 0.01, + "global_step": 1294, + "learning_rate": 0.0004954340567612688, + "loss": 2.0458, + "loss_base2": 2.9515, + "loss_pixel": 0.2285, + "loss_text": 1.8173, + "ppl": 7.7353, + "step": 1294 + }, + { + "epoch": 0.01, + "global_step": 1295, + "learning_rate": 0.0004954298831385643, + "loss": 2.0559, + "loss_base2": 2.966, + "loss_pixel": 0.2272, + "loss_text": 1.8287, + "ppl": 7.8139, + "step": 1295 + }, + { + "epoch": 0.01, + "global_step": 1296, + "learning_rate": 0.0004954257095158598, + "loss": 2.0293, + "loss_base2": 2.9277, + "loss_pixel": 0.2266, + "loss_text": 1.8027, + "ppl": 7.6088, + "step": 1296 + }, + { + "epoch": 0.01, + "global_step": 1297, + "learning_rate": 0.0004954215358931553, + "loss": 2.0583, + "loss_base2": 2.9695, + "loss_pixel": 0.2274, + "loss_text": 1.8309, + "ppl": 7.8326, + "step": 1297 + }, + { + "epoch": 0.01, + "global_step": 1298, + "learning_rate": 0.0004954173622704508, + "loss": 2.0581, + "loss_base2": 2.9692, + "loss_pixel": 0.2254, + "loss_text": 1.8328, + "ppl": 7.8311, + "step": 1298 + }, + { + "epoch": 0.01, + "global_step": 1299, + "learning_rate": 0.0004954131886477463, + "loss": 2.037, + "loss_base2": 2.9388, + "loss_pixel": 0.2257, + "loss_text": 1.8114, + "ppl": 7.6676, + "step": 1299 + }, + { + "epoch": 0.01, + "global_step": 1300, + "learning_rate": 0.0004954090150250418, + "loss": 2.0417, + "loss_base2": 2.9456, + "loss_pixel": 0.2247, + "loss_text": 1.817, + "ppl": 7.7037, + "step": 1300 + }, + { + "epoch": 0.01, + "global_step": 1301, + "learning_rate": 0.0004954048414023372, + "loss": 2.0498, + "loss_base2": 2.9572, + "loss_pixel": 0.2254, + "loss_text": 1.8244, + "ppl": 7.7663, + "step": 1301 + }, + { + "epoch": 0.01, + "global_step": 1302, + "learning_rate": 0.0004954006677796327, + "loss": 1.931, + "loss_base2": 2.7858, + "loss_pixel": 0.2241, + "loss_text": 1.7069, + "ppl": 6.8964, + "step": 1302 + }, + { + "epoch": 0.01, + "global_step": 1303, + "learning_rate": 0.0004953964941569282, + "loss": 1.8228, + "loss_base2": 2.6297, + "loss_pixel": 0.2227, + "loss_text": 1.6001, + "ppl": 6.1892, + "step": 1303 + }, + { + "epoch": 0.01, + "global_step": 1304, + "learning_rate": 0.0004953923205342237, + "loss": 1.8155, + "loss_base2": 2.6192, + "loss_pixel": 0.2223, + "loss_text": 1.5932, + "ppl": 6.1441, + "step": 1304 + }, + { + "epoch": 0.01, + "global_step": 1305, + "learning_rate": 0.0004953881469115192, + "loss": 1.7922, + "loss_base2": 2.5856, + "loss_pixel": 0.2233, + "loss_text": 1.5689, + "ppl": 6.0026, + "step": 1305 + }, + { + "epoch": 0.01, + "global_step": 1306, + "learning_rate": 0.0004953839732888147, + "loss": 1.8102, + "loss_base2": 2.6116, + "loss_pixel": 0.2269, + "loss_text": 1.5833, + "ppl": 6.1117, + "step": 1306 + }, + { + "epoch": 0.01, + "global_step": 1307, + "learning_rate": 0.0004953797996661102, + "loss": 1.8366, + "loss_base2": 2.6497, + "loss_pixel": 0.2336, + "loss_text": 1.603, + "ppl": 6.2752, + "step": 1307 + }, + { + "epoch": 0.01, + "global_step": 1308, + "learning_rate": 0.0004953756260434056, + "loss": 1.8183, + "loss_base2": 2.6233, + "loss_pixel": 0.2462, + "loss_text": 1.5721, + "ppl": 6.1614, + "step": 1308 + }, + { + "epoch": 0.01, + "global_step": 1309, + "learning_rate": 0.0004953714524207011, + "loss": 1.8047, + "loss_base2": 2.6036, + "loss_pixel": 0.2415, + "loss_text": 1.5632, + "ppl": 6.0781, + "step": 1309 + }, + { + "epoch": 0.01, + "global_step": 1310, + "learning_rate": 0.0004953672787979967, + "loss": 1.8107, + "loss_base2": 2.6123, + "loss_pixel": 0.2397, + "loss_text": 1.5709, + "ppl": 6.1147, + "step": 1310 + }, + { + "epoch": 0.01, + "global_step": 1311, + "learning_rate": 0.0004953631051752922, + "loss": 1.8088, + "loss_base2": 2.6095, + "loss_pixel": 0.238, + "loss_text": 1.5708, + "ppl": 6.1031, + "step": 1311 + }, + { + "epoch": 0.01, + "global_step": 1312, + "learning_rate": 0.0004953589315525877, + "loss": 1.7909, + "loss_base2": 2.5837, + "loss_pixel": 0.2349, + "loss_text": 1.556, + "ppl": 5.9948, + "step": 1312 + }, + { + "epoch": 0.01, + "global_step": 1313, + "learning_rate": 0.0004953547579298832, + "loss": 1.8134, + "loss_base2": 2.6162, + "loss_pixel": 0.2334, + "loss_text": 1.58, + "ppl": 6.1313, + "step": 1313 + }, + { + "epoch": 0.01, + "global_step": 1314, + "learning_rate": 0.0004953505843071787, + "loss": 1.816, + "loss_base2": 2.6199, + "loss_pixel": 0.2315, + "loss_text": 1.5846, + "ppl": 6.1472, + "step": 1314 + }, + { + "epoch": 0.01, + "global_step": 1315, + "learning_rate": 0.0004953464106844741, + "loss": 1.7811, + "loss_base2": 2.5696, + "loss_pixel": 0.2305, + "loss_text": 1.5507, + "ppl": 5.9364, + "step": 1315 + }, + { + "epoch": 0.01, + "global_step": 1316, + "learning_rate": 0.0004953422370617696, + "loss": 1.8144, + "loss_base2": 2.6176, + "loss_pixel": 0.2298, + "loss_text": 1.5846, + "ppl": 6.1374, + "step": 1316 + }, + { + "epoch": 0.01, + "global_step": 1317, + "learning_rate": 0.0004953380634390651, + "loss": 1.7655, + "loss_base2": 2.5471, + "loss_pixel": 0.2283, + "loss_text": 1.5372, + "ppl": 5.8445, + "step": 1317 + }, + { + "epoch": 0.01, + "global_step": 1318, + "learning_rate": 0.0004953338898163606, + "loss": 1.8109, + "loss_base2": 2.6126, + "loss_pixel": 0.2292, + "loss_text": 1.5818, + "ppl": 6.1159, + "step": 1318 + }, + { + "epoch": 0.01, + "global_step": 1319, + "learning_rate": 0.0004953297161936561, + "loss": 1.7843, + "loss_base2": 2.5742, + "loss_pixel": 0.2275, + "loss_text": 1.5567, + "ppl": 5.9554, + "step": 1319 + }, + { + "epoch": 0.01, + "global_step": 1320, + "learning_rate": 0.0004953255425709516, + "loss": 1.7584, + "loss_base2": 2.5368, + "loss_pixel": 0.2259, + "loss_text": 1.5324, + "ppl": 5.8031, + "step": 1320 + }, + { + "epoch": 0.01, + "global_step": 1321, + "learning_rate": 0.0004953213689482471, + "loss": 1.7758, + "loss_base2": 2.5619, + "loss_pixel": 0.2255, + "loss_text": 1.5503, + "ppl": 5.905, + "step": 1321 + }, + { + "epoch": 0.01, + "global_step": 1322, + "learning_rate": 0.0004953171953255426, + "loss": 1.7783, + "loss_base2": 2.5655, + "loss_pixel": 0.2258, + "loss_text": 1.5525, + "ppl": 5.9198, + "step": 1322 + }, + { + "epoch": 0.01, + "global_step": 1323, + "learning_rate": 0.0004953130217028381, + "loss": 1.7565, + "loss_base2": 2.5341, + "loss_pixel": 0.2237, + "loss_text": 1.5328, + "ppl": 5.7921, + "step": 1323 + }, + { + "epoch": 0.01, + "global_step": 1324, + "learning_rate": 0.0004953088480801335, + "loss": 1.7605, + "loss_base2": 2.5399, + "loss_pixel": 0.2228, + "loss_text": 1.5377, + "ppl": 5.8153, + "step": 1324 + }, + { + "epoch": 0.01, + "global_step": 1325, + "learning_rate": 0.000495304674457429, + "loss": 1.7642, + "loss_base2": 2.5452, + "loss_pixel": 0.2236, + "loss_text": 1.5406, + "ppl": 5.8369, + "step": 1325 + }, + { + "epoch": 0.01, + "global_step": 1326, + "learning_rate": 0.0004953005008347246, + "loss": 1.7324, + "loss_base2": 2.4993, + "loss_pixel": 0.2227, + "loss_text": 1.5096, + "ppl": 5.6542, + "step": 1326 + }, + { + "epoch": 0.01, + "global_step": 1327, + "learning_rate": 0.0004952963272120201, + "loss": 1.7747, + "loss_base2": 2.5604, + "loss_pixel": 0.2231, + "loss_text": 1.5516, + "ppl": 5.8985, + "step": 1327 + }, + { + "epoch": 0.01, + "global_step": 1328, + "learning_rate": 0.0004952921535893156, + "loss": 1.7495, + "loss_base2": 2.524, + "loss_pixel": 0.2206, + "loss_text": 1.5289, + "ppl": 5.7517, + "step": 1328 + }, + { + "epoch": 0.01, + "global_step": 1329, + "learning_rate": 0.000495287979966611, + "loss": 1.7492, + "loss_base2": 2.5236, + "loss_pixel": 0.2229, + "loss_text": 1.5263, + "ppl": 5.75, + "step": 1329 + }, + { + "epoch": 0.01, + "global_step": 1330, + "learning_rate": 0.0004952838063439065, + "loss": 1.7412, + "loss_base2": 2.512, + "loss_pixel": 0.2218, + "loss_text": 1.5194, + "ppl": 5.7042, + "step": 1330 + }, + { + "epoch": 0.01, + "global_step": 1331, + "learning_rate": 0.000495279632721202, + "loss": 1.7491, + "loss_base2": 2.5234, + "loss_pixel": 0.2207, + "loss_text": 1.5284, + "ppl": 5.7494, + "step": 1331 + }, + { + "epoch": 0.01, + "global_step": 1332, + "learning_rate": 0.0004952754590984975, + "loss": 1.7585, + "loss_base2": 2.537, + "loss_pixel": 0.2209, + "loss_text": 1.5375, + "ppl": 5.8037, + "step": 1332 + }, + { + "epoch": 0.01, + "global_step": 1333, + "learning_rate": 0.000495271285475793, + "loss": 1.773, + "loss_base2": 2.5579, + "loss_pixel": 0.22, + "loss_text": 1.553, + "ppl": 5.8885, + "step": 1333 + }, + { + "epoch": 0.01, + "global_step": 1334, + "learning_rate": 0.0004952671118530885, + "loss": 1.8884, + "loss_base2": 2.7244, + "loss_pixel": 0.2202, + "loss_text": 1.6682, + "ppl": 6.6088, + "step": 1334 + }, + { + "epoch": 0.01, + "global_step": 1335, + "learning_rate": 0.000495262938230384, + "loss": 2.0629, + "loss_base2": 2.9761, + "loss_pixel": 0.2205, + "loss_text": 1.8424, + "ppl": 7.8688, + "step": 1335 + }, + { + "epoch": 0.01, + "global_step": 1336, + "learning_rate": 0.0004952587646076795, + "loss": 2.0605, + "loss_base2": 2.9727, + "loss_pixel": 0.2226, + "loss_text": 1.838, + "ppl": 7.8499, + "step": 1336 + }, + { + "epoch": 0.01, + "global_step": 1337, + "learning_rate": 0.000495254590984975, + "loss": 2.0662, + "loss_base2": 2.9809, + "loss_pixel": 0.2268, + "loss_text": 1.8394, + "ppl": 7.8948, + "step": 1337 + }, + { + "epoch": 0.01, + "global_step": 1338, + "learning_rate": 0.0004952504173622704, + "loss": 2.0611, + "loss_base2": 2.9735, + "loss_pixel": 0.2299, + "loss_text": 1.8312, + "ppl": 7.8546, + "step": 1338 + }, + { + "epoch": 0.01, + "global_step": 1339, + "learning_rate": 0.0004952462437395659, + "loss": 2.0563, + "loss_base2": 2.9666, + "loss_pixel": 0.2265, + "loss_text": 1.8298, + "ppl": 7.817, + "step": 1339 + }, + { + "epoch": 0.01, + "global_step": 1340, + "learning_rate": 0.0004952420701168614, + "loss": 2.0424, + "loss_base2": 2.9466, + "loss_pixel": 0.2227, + "loss_text": 1.8197, + "ppl": 7.7091, + "step": 1340 + }, + { + "epoch": 0.01, + "global_step": 1341, + "learning_rate": 0.000495237896494157, + "loss": 2.0469, + "loss_base2": 2.9531, + "loss_pixel": 0.2237, + "loss_text": 1.8231, + "ppl": 7.7439, + "step": 1341 + }, + { + "epoch": 0.01, + "global_step": 1342, + "learning_rate": 0.0004952337228714525, + "loss": 2.041, + "loss_base2": 2.9445, + "loss_pixel": 0.2246, + "loss_text": 1.8164, + "ppl": 7.6983, + "step": 1342 + }, + { + "epoch": 0.01, + "global_step": 1343, + "learning_rate": 0.000495229549248748, + "loss": 2.066, + "loss_base2": 2.9806, + "loss_pixel": 0.2215, + "loss_text": 1.8445, + "ppl": 7.8932, + "step": 1343 + }, + { + "epoch": 0.01, + "global_step": 1344, + "learning_rate": 0.0004952253756260435, + "loss": 2.0443, + "loss_base2": 2.9493, + "loss_pixel": 0.2218, + "loss_text": 1.8225, + "ppl": 7.7238, + "step": 1344 + }, + { + "epoch": 0.01, + "global_step": 1345, + "learning_rate": 0.0004952212020033389, + "loss": 2.0449, + "loss_base2": 2.9502, + "loss_pixel": 0.2202, + "loss_text": 1.8247, + "ppl": 7.7284, + "step": 1345 + }, + { + "epoch": 0.01, + "global_step": 1346, + "learning_rate": 0.0004952170283806344, + "loss": 2.03, + "loss_base2": 2.9287, + "loss_pixel": 0.2198, + "loss_text": 1.8102, + "ppl": 7.6141, + "step": 1346 + }, + { + "epoch": 0.01, + "global_step": 1347, + "learning_rate": 0.0004952128547579299, + "loss": 2.039, + "loss_base2": 2.9417, + "loss_pixel": 0.2214, + "loss_text": 1.8177, + "ppl": 7.6829, + "step": 1347 + }, + { + "epoch": 0.01, + "global_step": 1348, + "learning_rate": 0.0004952086811352254, + "loss": 2.0386, + "loss_base2": 2.9411, + "loss_pixel": 0.2207, + "loss_text": 1.8179, + "ppl": 7.6798, + "step": 1348 + }, + { + "epoch": 0.01, + "global_step": 1349, + "learning_rate": 0.0004952045075125209, + "loss": 2.0195, + "loss_base2": 2.9135, + "loss_pixel": 0.219, + "loss_text": 1.8005, + "ppl": 7.5346, + "step": 1349 + }, + { + "epoch": 0.01, + "global_step": 1350, + "learning_rate": 0.0004952003338898164, + "loss": 2.0423, + "loss_base2": 2.9464, + "loss_pixel": 0.2191, + "loss_text": 1.8233, + "ppl": 7.7083, + "step": 1350 + }, + { + "epoch": 0.01, + "global_step": 1351, + "learning_rate": 0.0004951961602671118, + "loss": 2.0218, + "loss_base2": 2.9168, + "loss_pixel": 0.2178, + "loss_text": 1.804, + "ppl": 7.5519, + "step": 1351 + }, + { + "epoch": 0.01, + "global_step": 1352, + "learning_rate": 0.0004951919866444073, + "loss": 2.0451, + "loss_base2": 2.9505, + "loss_pixel": 0.2188, + "loss_text": 1.8263, + "ppl": 7.7299, + "step": 1352 + }, + { + "epoch": 0.01, + "global_step": 1353, + "learning_rate": 0.0004951878130217028, + "loss": 2.0257, + "loss_base2": 2.9225, + "loss_pixel": 0.2174, + "loss_text": 1.8083, + "ppl": 7.5814, + "step": 1353 + }, + { + "epoch": 0.01, + "global_step": 1354, + "learning_rate": 0.0004951836393989983, + "loss": 2.0265, + "loss_base2": 2.9236, + "loss_pixel": 0.2173, + "loss_text": 1.8092, + "ppl": 7.5875, + "step": 1354 + }, + { + "epoch": 0.01, + "global_step": 1355, + "learning_rate": 0.0004951794657762938, + "loss": 2.0111, + "loss_base2": 2.9014, + "loss_pixel": 0.217, + "loss_text": 1.794, + "ppl": 7.4715, + "step": 1355 + }, + { + "epoch": 0.01, + "global_step": 1356, + "learning_rate": 0.0004951752921535893, + "loss": 2.0137, + "loss_base2": 2.9052, + "loss_pixel": 0.2162, + "loss_text": 1.7975, + "ppl": 7.491, + "step": 1356 + }, + { + "epoch": 0.01, + "global_step": 1357, + "learning_rate": 0.0004951711185308848, + "loss": 2.031, + "loss_base2": 2.9301, + "loss_pixel": 0.2155, + "loss_text": 1.8156, + "ppl": 7.6217, + "step": 1357 + }, + { + "epoch": 0.01, + "global_step": 1358, + "learning_rate": 0.0004951669449081804, + "loss": 2.0168, + "loss_base2": 2.9096, + "loss_pixel": 0.2174, + "loss_text": 1.7994, + "ppl": 7.5142, + "step": 1358 + }, + { + "epoch": 0.01, + "global_step": 1359, + "learning_rate": 0.0004951627712854759, + "loss": 2.0273, + "loss_base2": 2.9248, + "loss_pixel": 0.2168, + "loss_text": 1.8105, + "ppl": 7.5936, + "step": 1359 + }, + { + "epoch": 0.01, + "global_step": 1360, + "learning_rate": 0.0004951585976627713, + "loss": 1.9997, + "loss_base2": 2.885, + "loss_pixel": 0.2156, + "loss_text": 1.7841, + "ppl": 7.3868, + "step": 1360 + }, + { + "epoch": 0.01, + "global_step": 1361, + "learning_rate": 0.0004951544240400668, + "loss": 2.0214, + "loss_base2": 2.9163, + "loss_pixel": 0.2158, + "loss_text": 1.8056, + "ppl": 7.5489, + "step": 1361 + }, + { + "epoch": 0.01, + "global_step": 1362, + "learning_rate": 0.0004951502504173623, + "loss": 2.0226, + "loss_base2": 2.918, + "loss_pixel": 0.2169, + "loss_text": 1.8057, + "ppl": 7.558, + "step": 1362 + }, + { + "epoch": 0.01, + "global_step": 1363, + "learning_rate": 0.0004951460767946578, + "loss": 2.0108, + "loss_base2": 2.901, + "loss_pixel": 0.2157, + "loss_text": 1.795, + "ppl": 7.4693, + "step": 1363 + }, + { + "epoch": 0.01, + "global_step": 1364, + "learning_rate": 0.0004951419031719533, + "loss": 2.0232, + "loss_base2": 2.9189, + "loss_pixel": 0.2164, + "loss_text": 1.8068, + "ppl": 7.5625, + "step": 1364 + }, + { + "epoch": 0.01, + "global_step": 1365, + "learning_rate": 0.0004951377295492487, + "loss": 2.0095, + "loss_base2": 2.8991, + "loss_pixel": 0.2148, + "loss_text": 1.7947, + "ppl": 7.4596, + "step": 1365 + }, + { + "epoch": 0.01, + "global_step": 1366, + "learning_rate": 0.0004951335559265442, + "loss": 2.0169, + "loss_base2": 2.9098, + "loss_pixel": 0.2155, + "loss_text": 1.8014, + "ppl": 7.515, + "step": 1366 + }, + { + "epoch": 0.01, + "global_step": 1367, + "learning_rate": 0.0004951293823038397, + "loss": 2.0053, + "loss_base2": 2.893, + "loss_pixel": 0.2156, + "loss_text": 1.7898, + "ppl": 7.4283, + "step": 1367 + }, + { + "epoch": 0.01, + "global_step": 1368, + "learning_rate": 0.0004951252086811352, + "loss": 2.0113, + "loss_base2": 2.9017, + "loss_pixel": 0.2146, + "loss_text": 1.7967, + "ppl": 7.473, + "step": 1368 + }, + { + "epoch": 0.01, + "global_step": 1369, + "learning_rate": 0.0004951210350584307, + "loss": 2.0255, + "loss_base2": 2.9222, + "loss_pixel": 0.2158, + "loss_text": 1.8097, + "ppl": 7.5799, + "step": 1369 + }, + { + "epoch": 0.01, + "global_step": 1370, + "learning_rate": 0.0004951168614357262, + "loss": 1.9918, + "loss_base2": 2.8736, + "loss_pixel": 0.2151, + "loss_text": 1.7767, + "ppl": 7.3287, + "step": 1370 + }, + { + "epoch": 0.01, + "global_step": 1371, + "learning_rate": 0.0004951126878130217, + "loss": 1.9884, + "loss_base2": 2.8687, + "loss_pixel": 0.2145, + "loss_text": 1.7739, + "ppl": 7.3038, + "step": 1371 + }, + { + "epoch": 0.01, + "global_step": 1372, + "learning_rate": 0.0004951085141903172, + "loss": 2.0029, + "loss_base2": 2.8896, + "loss_pixel": 0.2147, + "loss_text": 1.7882, + "ppl": 7.4105, + "step": 1372 + }, + { + "epoch": 0.01, + "global_step": 1373, + "learning_rate": 0.0004951043405676127, + "loss": 2.0078, + "loss_base2": 2.8966, + "loss_pixel": 0.2147, + "loss_text": 1.7932, + "ppl": 7.4469, + "step": 1373 + }, + { + "epoch": 0.01, + "global_step": 1374, + "learning_rate": 0.0004951001669449081, + "loss": 2.0013, + "loss_base2": 2.8873, + "loss_pixel": 0.216, + "loss_text": 1.7853, + "ppl": 7.3987, + "step": 1374 + }, + { + "epoch": 0.01, + "global_step": 1375, + "learning_rate": 0.0004950959933222037, + "loss": 1.9738, + "loss_base2": 2.8476, + "loss_pixel": 0.2153, + "loss_text": 1.7585, + "ppl": 7.198, + "step": 1375 + }, + { + "epoch": 0.01, + "global_step": 1376, + "learning_rate": 0.0004950918196994992, + "loss": 2.01, + "loss_base2": 2.8998, + "loss_pixel": 0.2136, + "loss_text": 1.7964, + "ppl": 7.4633, + "step": 1376 + }, + { + "epoch": 0.01, + "global_step": 1377, + "learning_rate": 0.0004950876460767947, + "loss": 1.9943, + "loss_base2": 2.8772, + "loss_pixel": 0.215, + "loss_text": 1.7794, + "ppl": 7.3471, + "step": 1377 + }, + { + "epoch": 0.01, + "global_step": 1378, + "learning_rate": 0.0004950834724540902, + "loss": 2.015, + "loss_base2": 2.907, + "loss_pixel": 0.2163, + "loss_text": 1.7987, + "ppl": 7.5007, + "step": 1378 + }, + { + "epoch": 0.01, + "global_step": 1379, + "learning_rate": 0.0004950792988313857, + "loss": 2.0062, + "loss_base2": 2.8943, + "loss_pixel": 0.2151, + "loss_text": 1.7911, + "ppl": 7.435, + "step": 1379 + }, + { + "epoch": 0.01, + "global_step": 1380, + "learning_rate": 0.0004950751252086812, + "loss": 2.0032, + "loss_base2": 2.89, + "loss_pixel": 0.2122, + "loss_text": 1.791, + "ppl": 7.4127, + "step": 1380 + }, + { + "epoch": 0.01, + "global_step": 1381, + "learning_rate": 0.0004950709515859767, + "loss": 1.9855, + "loss_base2": 2.8645, + "loss_pixel": 0.2138, + "loss_text": 1.7718, + "ppl": 7.2827, + "step": 1381 + }, + { + "epoch": 0.01, + "global_step": 1382, + "learning_rate": 0.0004950667779632722, + "loss": 2.0054, + "loss_base2": 2.8932, + "loss_pixel": 0.2147, + "loss_text": 1.7906, + "ppl": 7.4291, + "step": 1382 + }, + { + "epoch": 0.01, + "global_step": 1383, + "learning_rate": 0.0004950626043405676, + "loss": 2.0108, + "loss_base2": 2.901, + "loss_pixel": 0.2147, + "loss_text": 1.796, + "ppl": 7.4693, + "step": 1383 + }, + { + "epoch": 0.01, + "global_step": 1384, + "learning_rate": 0.0004950584307178631, + "loss": 2.0093, + "loss_base2": 2.8988, + "loss_pixel": 0.2132, + "loss_text": 1.7961, + "ppl": 7.4581, + "step": 1384 + }, + { + "epoch": 0.01, + "global_step": 1385, + "learning_rate": 0.0004950542570951586, + "loss": 1.9926, + "loss_base2": 2.8747, + "loss_pixel": 0.2137, + "loss_text": 1.7789, + "ppl": 7.3346, + "step": 1385 + }, + { + "epoch": 0.01, + "global_step": 1386, + "learning_rate": 0.0004950500834724541, + "loss": 2.0059, + "loss_base2": 2.8939, + "loss_pixel": 0.2142, + "loss_text": 1.7917, + "ppl": 7.4328, + "step": 1386 + }, + { + "epoch": 0.01, + "global_step": 1387, + "learning_rate": 0.0004950459098497496, + "loss": 2.0034, + "loss_base2": 2.8903, + "loss_pixel": 0.2125, + "loss_text": 1.7909, + "ppl": 7.4142, + "step": 1387 + }, + { + "epoch": 0.01, + "global_step": 1388, + "learning_rate": 0.000495041736227045, + "loss": 1.9986, + "loss_base2": 2.8834, + "loss_pixel": 0.2128, + "loss_text": 1.7858, + "ppl": 7.3787, + "step": 1388 + }, + { + "epoch": 0.01, + "global_step": 1389, + "learning_rate": 0.0004950375626043405, + "loss": 1.9768, + "loss_base2": 2.8519, + "loss_pixel": 0.2129, + "loss_text": 1.7639, + "ppl": 7.2196, + "step": 1389 + }, + { + "epoch": 0.01, + "global_step": 1390, + "learning_rate": 0.000495033388981636, + "loss": 1.9855, + "loss_base2": 2.8645, + "loss_pixel": 0.2125, + "loss_text": 1.7729, + "ppl": 7.2827, + "step": 1390 + }, + { + "epoch": 0.01, + "global_step": 1391, + "learning_rate": 0.0004950292153589316, + "loss": 1.9748, + "loss_base2": 2.849, + "loss_pixel": 0.2112, + "loss_text": 1.7636, + "ppl": 7.2052, + "step": 1391 + }, + { + "epoch": 0.01, + "global_step": 1392, + "learning_rate": 0.0004950250417362271, + "loss": 1.9874, + "loss_base2": 2.8672, + "loss_pixel": 0.2125, + "loss_text": 1.7748, + "ppl": 7.2965, + "step": 1392 + }, + { + "epoch": 0.01, + "global_step": 1393, + "learning_rate": 0.0004950208681135226, + "loss": 1.9917, + "loss_base2": 2.8734, + "loss_pixel": 0.2116, + "loss_text": 1.7801, + "ppl": 7.328, + "step": 1393 + }, + { + "epoch": 0.01, + "global_step": 1394, + "learning_rate": 0.0004950166944908181, + "loss": 1.9917, + "loss_base2": 2.8734, + "loss_pixel": 0.2116, + "loss_text": 1.7801, + "ppl": 7.328, + "step": 1394 + }, + { + "epoch": 0.01, + "global_step": 1395, + "learning_rate": 0.0004950125208681136, + "loss": 1.9646, + "loss_base2": 2.8343, + "loss_pixel": 0.2114, + "loss_text": 1.7532, + "ppl": 7.1321, + "step": 1395 + }, + { + "epoch": 0.01, + "global_step": 1396, + "learning_rate": 0.0004950083472454091, + "loss": 1.9928, + "loss_base2": 2.875, + "loss_pixel": 0.2126, + "loss_text": 1.7802, + "ppl": 7.336, + "step": 1396 + }, + { + "epoch": 0.01, + "global_step": 1397, + "learning_rate": 0.0004950041736227045, + "loss": 1.9947, + "loss_base2": 2.8777, + "loss_pixel": 0.2123, + "loss_text": 1.7824, + "ppl": 7.35, + "step": 1397 + }, + { + "epoch": 0.01, + "global_step": 1398, + "learning_rate": 0.000495, + "loss": 2.0052, + "loss_base2": 2.8929, + "loss_pixel": 0.2117, + "loss_text": 1.7936, + "ppl": 7.4276, + "step": 1398 + }, + { + "epoch": 0.01, + "global_step": 1399, + "learning_rate": 0.0004949958263772955, + "loss": 1.9968, + "loss_base2": 2.8808, + "loss_pixel": 0.2106, + "loss_text": 1.7862, + "ppl": 7.3654, + "step": 1399 + }, + { + "epoch": 0.01, + "global_step": 1400, + "learning_rate": 0.000494991652754591, + "loss": 2.0008, + "loss_base2": 2.8865, + "loss_pixel": 0.2118, + "loss_text": 1.789, + "ppl": 7.395, + "step": 1400 + }, + { + "epoch": 0.01, + "global_step": 1401, + "learning_rate": 0.0004949874791318864, + "loss": 2.0073, + "loss_base2": 2.8959, + "loss_pixel": 0.212, + "loss_text": 1.7954, + "ppl": 7.4432, + "step": 1401 + }, + { + "epoch": 0.01, + "global_step": 1402, + "learning_rate": 0.0004949833055091819, + "loss": 1.9759, + "loss_base2": 2.8506, + "loss_pixel": 0.2118, + "loss_text": 1.7641, + "ppl": 7.2131, + "step": 1402 + }, + { + "epoch": 0.01, + "global_step": 1403, + "learning_rate": 0.0004949791318864774, + "loss": 1.9796, + "loss_base2": 2.856, + "loss_pixel": 0.2115, + "loss_text": 1.7681, + "ppl": 7.2398, + "step": 1403 + }, + { + "epoch": 0.01, + "global_step": 1404, + "learning_rate": 0.0004949749582637729, + "loss": 1.985, + "loss_base2": 2.8637, + "loss_pixel": 0.2109, + "loss_text": 1.7741, + "ppl": 7.279, + "step": 1404 + }, + { + "epoch": 0.01, + "global_step": 1405, + "learning_rate": 0.0004949707846410684, + "loss": 1.8802, + "loss_base2": 2.7126, + "loss_pixel": 0.2133, + "loss_text": 1.6669, + "ppl": 6.5548, + "step": 1405 + }, + { + "epoch": 0.01, + "global_step": 1406, + "learning_rate": 0.000494966611018364, + "loss": 1.7979, + "loss_base2": 2.5938, + "loss_pixel": 0.2227, + "loss_text": 1.5752, + "ppl": 6.037, + "step": 1406 + }, + { + "epoch": 0.01, + "global_step": 1407, + "learning_rate": 0.0004949624373956595, + "loss": 1.7553, + "loss_base2": 2.5324, + "loss_pixel": 0.2253, + "loss_text": 1.53, + "ppl": 5.7852, + "step": 1407 + }, + { + "epoch": 0.01, + "global_step": 1408, + "learning_rate": 0.000494958263772955, + "loss": 1.7653, + "loss_base2": 2.5468, + "loss_pixel": 0.226, + "loss_text": 1.5393, + "ppl": 5.8433, + "step": 1408 + }, + { + "epoch": 0.01, + "global_step": 1409, + "learning_rate": 0.0004949540901502505, + "loss": 1.7702, + "loss_base2": 2.5539, + "loss_pixel": 0.2322, + "loss_text": 1.5381, + "ppl": 5.872, + "step": 1409 + }, + { + "epoch": 0.01, + "global_step": 1410, + "learning_rate": 0.0004949499165275459, + "loss": 1.7373, + "loss_base2": 2.5064, + "loss_pixel": 0.2341, + "loss_text": 1.5033, + "ppl": 5.682, + "step": 1410 + }, + { + "epoch": 0.01, + "global_step": 1411, + "learning_rate": 0.0004949457429048414, + "loss": 1.7716, + "loss_base2": 2.5559, + "loss_pixel": 0.2373, + "loss_text": 1.5343, + "ppl": 5.8803, + "step": 1411 + }, + { + "epoch": 0.01, + "global_step": 1412, + "learning_rate": 0.0004949415692821369, + "loss": 1.758, + "loss_base2": 2.5363, + "loss_pixel": 0.2333, + "loss_text": 1.5247, + "ppl": 5.8008, + "step": 1412 + }, + { + "epoch": 0.01, + "global_step": 1413, + "learning_rate": 0.0004949373956594324, + "loss": 1.8586, + "loss_base2": 2.6814, + "loss_pixel": 0.2275, + "loss_text": 1.6312, + "ppl": 6.4147, + "step": 1413 + }, + { + "epoch": 0.01, + "global_step": 1414, + "learning_rate": 0.0004949332220367279, + "loss": 2.0385, + "loss_base2": 2.9409, + "loss_pixel": 0.2251, + "loss_text": 1.8134, + "ppl": 7.6791, + "step": 1414 + }, + { + "epoch": 0.01, + "global_step": 1415, + "learning_rate": 0.0004949290484140234, + "loss": 2.029, + "loss_base2": 2.9272, + "loss_pixel": 0.223, + "loss_text": 1.806, + "ppl": 7.6065, + "step": 1415 + }, + { + "epoch": 0.01, + "global_step": 1416, + "learning_rate": 0.0004949248747913189, + "loss": 2.0037, + "loss_base2": 2.8907, + "loss_pixel": 0.2225, + "loss_text": 1.7812, + "ppl": 7.4164, + "step": 1416 + }, + { + "epoch": 0.01, + "global_step": 1417, + "learning_rate": 0.0004949207011686144, + "loss": 2.0129, + "loss_base2": 2.904, + "loss_pixel": 0.2219, + "loss_text": 1.791, + "ppl": 7.485, + "step": 1417 + }, + { + "epoch": 0.01, + "global_step": 1418, + "learning_rate": 0.0004949165275459099, + "loss": 2.0083, + "loss_base2": 2.8974, + "loss_pixel": 0.2193, + "loss_text": 1.7891, + "ppl": 7.4506, + "step": 1418 + }, + { + "epoch": 0.01, + "global_step": 1419, + "learning_rate": 0.0004949123539232053, + "loss": 2.0198, + "loss_base2": 2.914, + "loss_pixel": 0.22, + "loss_text": 1.7998, + "ppl": 7.5368, + "step": 1419 + }, + { + "epoch": 0.01, + "global_step": 1420, + "learning_rate": 0.0004949081803005008, + "loss": 2.0071, + "loss_base2": 2.8956, + "loss_pixel": 0.2185, + "loss_text": 1.7886, + "ppl": 7.4417, + "step": 1420 + }, + { + "epoch": 0.01, + "global_step": 1421, + "learning_rate": 0.0004949040066777963, + "loss": 1.9998, + "loss_base2": 2.8851, + "loss_pixel": 0.2168, + "loss_text": 1.783, + "ppl": 7.3876, + "step": 1421 + }, + { + "epoch": 0.01, + "global_step": 1422, + "learning_rate": 0.0004948998330550918, + "loss": 2.0141, + "loss_base2": 2.9057, + "loss_pixel": 0.2163, + "loss_text": 1.7978, + "ppl": 7.494, + "step": 1422 + }, + { + "epoch": 0.01, + "global_step": 1423, + "learning_rate": 0.0004948956594323874, + "loss": 1.9998, + "loss_base2": 2.8851, + "loss_pixel": 0.2153, + "loss_text": 1.7844, + "ppl": 7.3876, + "step": 1423 + }, + { + "epoch": 0.01, + "global_step": 1424, + "learning_rate": 0.0004948914858096828, + "loss": 1.9952, + "loss_base2": 2.8785, + "loss_pixel": 0.2151, + "loss_text": 1.7801, + "ppl": 7.3537, + "step": 1424 + }, + { + "epoch": 0.01, + "global_step": 1425, + "learning_rate": 0.0004948873121869783, + "loss": 2.0013, + "loss_base2": 2.8873, + "loss_pixel": 0.2169, + "loss_text": 1.7844, + "ppl": 7.3987, + "step": 1425 + }, + { + "epoch": 0.01, + "global_step": 1426, + "learning_rate": 0.0004948831385642738, + "loss": 1.991, + "loss_base2": 2.8724, + "loss_pixel": 0.2147, + "loss_text": 1.7763, + "ppl": 7.3229, + "step": 1426 + }, + { + "epoch": 0.01, + "global_step": 1427, + "learning_rate": 0.0004948789649415693, + "loss": 2.0049, + "loss_base2": 2.8925, + "loss_pixel": 0.2147, + "loss_text": 1.7902, + "ppl": 7.4254, + "step": 1427 + }, + { + "epoch": 0.01, + "global_step": 1428, + "learning_rate": 0.0004948747913188648, + "loss": 1.987, + "loss_base2": 2.8666, + "loss_pixel": 0.2141, + "loss_text": 1.7729, + "ppl": 7.2936, + "step": 1428 + }, + { + "epoch": 0.01, + "global_step": 1429, + "learning_rate": 0.0004948706176961603, + "loss": 1.9956, + "loss_base2": 2.879, + "loss_pixel": 0.2135, + "loss_text": 1.782, + "ppl": 7.3566, + "step": 1429 + }, + { + "epoch": 0.01, + "global_step": 1430, + "learning_rate": 0.0004948664440734558, + "loss": 1.9823, + "loss_base2": 2.8599, + "loss_pixel": 0.2133, + "loss_text": 1.7689, + "ppl": 7.2594, + "step": 1430 + }, + { + "epoch": 0.01, + "global_step": 1431, + "learning_rate": 0.0004948622704507513, + "loss": 2.002, + "loss_base2": 2.8883, + "loss_pixel": 0.2139, + "loss_text": 1.7881, + "ppl": 7.4038, + "step": 1431 + }, + { + "epoch": 0.01, + "global_step": 1432, + "learning_rate": 0.0004948580968280468, + "loss": 1.9827, + "loss_base2": 2.8604, + "loss_pixel": 0.212, + "loss_text": 1.7706, + "ppl": 7.2623, + "step": 1432 + }, + { + "epoch": 0.01, + "global_step": 1433, + "learning_rate": 0.0004948539232053422, + "loss": 1.9914, + "loss_base2": 2.873, + "loss_pixel": 0.2136, + "loss_text": 1.7777, + "ppl": 7.3258, + "step": 1433 + }, + { + "epoch": 0.01, + "global_step": 1434, + "learning_rate": 0.0004948497495826377, + "loss": 2.005, + "loss_base2": 2.8926, + "loss_pixel": 0.2144, + "loss_text": 1.7906, + "ppl": 7.4261, + "step": 1434 + }, + { + "epoch": 0.01, + "global_step": 1435, + "learning_rate": 0.0004948455759599332, + "loss": 1.9996, + "loss_base2": 2.8848, + "loss_pixel": 0.213, + "loss_text": 1.7866, + "ppl": 7.3861, + "step": 1435 + }, + { + "epoch": 0.01, + "global_step": 1436, + "learning_rate": 0.0004948414023372287, + "loss": 1.998, + "loss_base2": 2.8825, + "loss_pixel": 0.212, + "loss_text": 1.7859, + "ppl": 7.3743, + "step": 1436 + }, + { + "epoch": 0.01, + "global_step": 1437, + "learning_rate": 0.0004948372287145242, + "loss": 1.9865, + "loss_base2": 2.8659, + "loss_pixel": 0.211, + "loss_text": 1.7755, + "ppl": 7.29, + "step": 1437 + }, + { + "epoch": 0.01, + "global_step": 1438, + "learning_rate": 0.0004948330550918197, + "loss": 1.8658, + "loss_base2": 2.6918, + "loss_pixel": 0.2122, + "loss_text": 1.6536, + "ppl": 6.4611, + "step": 1438 + }, + { + "epoch": 0.01, + "global_step": 1439, + "learning_rate": 0.0004948288814691151, + "loss": 1.7704, + "loss_base2": 2.5541, + "loss_pixel": 0.2119, + "loss_text": 1.5585, + "ppl": 5.8732, + "step": 1439 + }, + { + "epoch": 0.01, + "global_step": 1440, + "learning_rate": 0.0004948247078464107, + "loss": 1.7297, + "loss_base2": 2.4954, + "loss_pixel": 0.2115, + "loss_text": 1.5182, + "ppl": 5.639, + "step": 1440 + }, + { + "epoch": 0.01, + "global_step": 1441, + "learning_rate": 0.0004948205342237062, + "loss": 1.7216, + "loss_base2": 2.4837, + "loss_pixel": 0.2121, + "loss_text": 1.5095, + "ppl": 5.5935, + "step": 1441 + }, + { + "epoch": 0.01, + "global_step": 1442, + "learning_rate": 0.0004948163606010017, + "loss": 1.7403, + "loss_base2": 2.5107, + "loss_pixel": 0.2124, + "loss_text": 1.5279, + "ppl": 5.6991, + "step": 1442 + }, + { + "epoch": 0.01, + "global_step": 1443, + "learning_rate": 0.0004948121869782972, + "loss": 1.7348, + "loss_base2": 2.5028, + "loss_pixel": 0.2107, + "loss_text": 1.5241, + "ppl": 5.6678, + "step": 1443 + }, + { + "epoch": 0.01, + "global_step": 1444, + "learning_rate": 0.0004948080133555927, + "loss": 1.7414, + "loss_base2": 2.5123, + "loss_pixel": 0.2095, + "loss_text": 1.5319, + "ppl": 5.7053, + "step": 1444 + }, + { + "epoch": 0.01, + "global_step": 1445, + "learning_rate": 0.0004948038397328882, + "loss": 1.7171, + "loss_base2": 2.4773, + "loss_pixel": 0.2115, + "loss_text": 1.5056, + "ppl": 5.5684, + "step": 1445 + }, + { + "epoch": 0.01, + "global_step": 1446, + "learning_rate": 0.0004947996661101837, + "loss": 1.7031, + "loss_base2": 2.4571, + "loss_pixel": 0.2112, + "loss_text": 1.492, + "ppl": 5.4909, + "step": 1446 + }, + { + "epoch": 0.01, + "global_step": 1447, + "learning_rate": 0.0004947954924874791, + "loss": 1.7272, + "loss_base2": 2.4918, + "loss_pixel": 0.2102, + "loss_text": 1.517, + "ppl": 5.6249, + "step": 1447 + }, + { + "epoch": 0.01, + "global_step": 1448, + "learning_rate": 0.0004947913188647746, + "loss": 1.7351, + "loss_base2": 2.5032, + "loss_pixel": 0.2106, + "loss_text": 1.5245, + "ppl": 5.6695, + "step": 1448 + }, + { + "epoch": 0.01, + "global_step": 1449, + "learning_rate": 0.0004947871452420701, + "loss": 1.7261, + "loss_base2": 2.4902, + "loss_pixel": 0.2117, + "loss_text": 1.5144, + "ppl": 5.6187, + "step": 1449 + }, + { + "epoch": 0.01, + "global_step": 1450, + "learning_rate": 0.0004947829716193656, + "loss": 1.7149, + "loss_base2": 2.4741, + "loss_pixel": 0.2101, + "loss_text": 1.5048, + "ppl": 5.5561, + "step": 1450 + }, + { + "epoch": 0.01, + "global_step": 1451, + "learning_rate": 0.0004947787979966611, + "loss": 1.6967, + "loss_base2": 2.4478, + "loss_pixel": 0.2092, + "loss_text": 1.4875, + "ppl": 5.4559, + "step": 1451 + }, + { + "epoch": 0.01, + "global_step": 1452, + "learning_rate": 0.0004947746243739566, + "loss": 1.7466, + "loss_base2": 2.5198, + "loss_pixel": 0.2097, + "loss_text": 1.5369, + "ppl": 5.7351, + "step": 1452 + }, + { + "epoch": 0.01, + "global_step": 1453, + "learning_rate": 0.0004947704507512521, + "loss": 1.728, + "loss_base2": 2.493, + "loss_pixel": 0.21, + "loss_text": 1.518, + "ppl": 5.6294, + "step": 1453 + }, + { + "epoch": 0.01, + "global_step": 1454, + "learning_rate": 0.0004947662771285476, + "loss": 1.6999, + "loss_base2": 2.4524, + "loss_pixel": 0.2106, + "loss_text": 1.4893, + "ppl": 5.4734, + "step": 1454 + }, + { + "epoch": 0.01, + "global_step": 1455, + "learning_rate": 0.0004947621035058432, + "loss": 1.889, + "loss_base2": 2.7253, + "loss_pixel": 0.2094, + "loss_text": 1.6796, + "ppl": 6.6128, + "step": 1455 + }, + { + "epoch": 0.01, + "global_step": 1456, + "learning_rate": 0.0004947579298831386, + "loss": 2.0117, + "loss_base2": 2.9023, + "loss_pixel": 0.2093, + "loss_text": 1.8024, + "ppl": 7.476, + "step": 1456 + }, + { + "epoch": 0.01, + "global_step": 1457, + "learning_rate": 0.0004947537562604341, + "loss": 2.0036, + "loss_base2": 2.8906, + "loss_pixel": 0.2096, + "loss_text": 1.794, + "ppl": 7.4157, + "step": 1457 + }, + { + "epoch": 0.01, + "global_step": 1458, + "learning_rate": 0.0004947495826377296, + "loss": 1.9886, + "loss_base2": 2.8689, + "loss_pixel": 0.2084, + "loss_text": 1.7801, + "ppl": 7.3053, + "step": 1458 + }, + { + "epoch": 0.01, + "global_step": 1459, + "learning_rate": 0.0004947454090150251, + "loss": 2.011, + "loss_base2": 2.9013, + "loss_pixel": 0.2096, + "loss_text": 1.8014, + "ppl": 7.4708, + "step": 1459 + }, + { + "epoch": 0.01, + "global_step": 1460, + "learning_rate": 0.0004947412353923205, + "loss": 2.0173, + "loss_base2": 2.9103, + "loss_pixel": 0.21, + "loss_text": 1.8072, + "ppl": 7.518, + "step": 1460 + }, + { + "epoch": 0.01, + "global_step": 1461, + "learning_rate": 0.000494737061769616, + "loss": 2.016, + "loss_base2": 2.9085, + "loss_pixel": 0.2106, + "loss_text": 1.8054, + "ppl": 7.5082, + "step": 1461 + }, + { + "epoch": 0.01, + "global_step": 1462, + "learning_rate": 0.0004947328881469115, + "loss": 1.9913, + "loss_base2": 2.8728, + "loss_pixel": 0.2092, + "loss_text": 1.7822, + "ppl": 7.3251, + "step": 1462 + }, + { + "epoch": 0.01, + "global_step": 1463, + "learning_rate": 0.000494728714524207, + "loss": 1.9841, + "loss_base2": 2.8625, + "loss_pixel": 0.2103, + "loss_text": 1.7738, + "ppl": 7.2725, + "step": 1463 + }, + { + "epoch": 0.01, + "global_step": 1464, + "learning_rate": 0.0004947245409015025, + "loss": 1.9882, + "loss_base2": 2.8684, + "loss_pixel": 0.2094, + "loss_text": 1.7787, + "ppl": 7.3024, + "step": 1464 + }, + { + "epoch": 0.01, + "global_step": 1465, + "learning_rate": 0.000494720367278798, + "loss": 1.9943, + "loss_base2": 2.8772, + "loss_pixel": 0.209, + "loss_text": 1.7853, + "ppl": 7.3471, + "step": 1465 + }, + { + "epoch": 0.01, + "global_step": 1466, + "learning_rate": 0.0004947161936560935, + "loss": 1.9812, + "loss_base2": 2.8583, + "loss_pixel": 0.2095, + "loss_text": 1.7718, + "ppl": 7.2514, + "step": 1466 + }, + { + "epoch": 0.01, + "global_step": 1467, + "learning_rate": 0.000494712020033389, + "loss": 1.9821, + "loss_base2": 2.8596, + "loss_pixel": 0.2086, + "loss_text": 1.7735, + "ppl": 7.258, + "step": 1467 + }, + { + "epoch": 0.01, + "global_step": 1468, + "learning_rate": 0.0004947078464106845, + "loss": 1.9852, + "loss_base2": 2.864, + "loss_pixel": 0.209, + "loss_text": 1.7761, + "ppl": 7.2805, + "step": 1468 + }, + { + "epoch": 0.01, + "global_step": 1469, + "learning_rate": 0.0004947036727879799, + "loss": 1.994, + "loss_base2": 2.8767, + "loss_pixel": 0.2088, + "loss_text": 1.7851, + "ppl": 7.3449, + "step": 1469 + }, + { + "epoch": 0.01, + "global_step": 1470, + "learning_rate": 0.0004946994991652754, + "loss": 1.9931, + "loss_base2": 2.8754, + "loss_pixel": 0.2096, + "loss_text": 1.7835, + "ppl": 7.3382, + "step": 1470 + }, + { + "epoch": 0.01, + "global_step": 1471, + "learning_rate": 0.000494695325542571, + "loss": 1.9823, + "loss_base2": 2.8599, + "loss_pixel": 0.2074, + "loss_text": 1.7749, + "ppl": 7.2594, + "step": 1471 + }, + { + "epoch": 0.01, + "global_step": 1472, + "learning_rate": 0.0004946911519198665, + "loss": 1.9852, + "loss_base2": 2.864, + "loss_pixel": 0.2077, + "loss_text": 1.7775, + "ppl": 7.2805, + "step": 1472 + }, + { + "epoch": 0.01, + "global_step": 1473, + "learning_rate": 0.000494686978297162, + "loss": 1.9777, + "loss_base2": 2.8532, + "loss_pixel": 0.2076, + "loss_text": 1.7701, + "ppl": 7.2261, + "step": 1473 + }, + { + "epoch": 0.01, + "global_step": 1474, + "learning_rate": 0.0004946828046744575, + "loss": 1.9683, + "loss_base2": 2.8397, + "loss_pixel": 0.2086, + "loss_text": 1.7597, + "ppl": 7.1585, + "step": 1474 + }, + { + "epoch": 0.01, + "global_step": 1475, + "learning_rate": 0.000494678631051753, + "loss": 1.9765, + "loss_base2": 2.8515, + "loss_pixel": 0.2081, + "loss_text": 1.7684, + "ppl": 7.2174, + "step": 1475 + }, + { + "epoch": 0.01, + "global_step": 1476, + "learning_rate": 0.0004946744574290485, + "loss": 1.9873, + "loss_base2": 2.8671, + "loss_pixel": 0.2086, + "loss_text": 1.7787, + "ppl": 7.2958, + "step": 1476 + }, + { + "epoch": 0.01, + "global_step": 1477, + "learning_rate": 0.0004946702838063439, + "loss": 1.9804, + "loss_base2": 2.8571, + "loss_pixel": 0.2091, + "loss_text": 1.7713, + "ppl": 7.2456, + "step": 1477 + }, + { + "epoch": 0.01, + "global_step": 1478, + "learning_rate": 0.0004946661101836394, + "loss": 1.9725, + "loss_base2": 2.8457, + "loss_pixel": 0.2095, + "loss_text": 1.7631, + "ppl": 7.1886, + "step": 1478 + }, + { + "epoch": 0.01, + "global_step": 1479, + "learning_rate": 0.0004946619365609349, + "loss": 1.8209, + "loss_base2": 2.627, + "loss_pixel": 0.2122, + "loss_text": 1.6087, + "ppl": 6.1774, + "step": 1479 + }, + { + "epoch": 0.01, + "global_step": 1480, + "learning_rate": 0.0004946577629382304, + "loss": 1.7496, + "loss_base2": 2.5241, + "loss_pixel": 0.2146, + "loss_text": 1.5351, + "ppl": 5.7523, + "step": 1480 + }, + { + "epoch": 0.01, + "global_step": 1481, + "learning_rate": 0.0004946535893155259, + "loss": 1.7206, + "loss_base2": 2.4823, + "loss_pixel": 0.2126, + "loss_text": 1.5081, + "ppl": 5.5879, + "step": 1481 + }, + { + "epoch": 0.01, + "global_step": 1482, + "learning_rate": 0.0004946494156928214, + "loss": 1.7258, + "loss_base2": 2.4898, + "loss_pixel": 0.2113, + "loss_text": 1.5145, + "ppl": 5.617, + "step": 1482 + }, + { + "epoch": 0.01, + "global_step": 1483, + "learning_rate": 0.0004946452420701168, + "loss": 1.7304, + "loss_base2": 2.4964, + "loss_pixel": 0.2119, + "loss_text": 1.5185, + "ppl": 5.6429, + "step": 1483 + }, + { + "epoch": 0.01, + "global_step": 1484, + "learning_rate": 0.0004946410684474123, + "loss": 1.735, + "loss_base2": 2.5031, + "loss_pixel": 0.2087, + "loss_text": 1.5262, + "ppl": 5.6689, + "step": 1484 + }, + { + "epoch": 0.01, + "global_step": 1485, + "learning_rate": 0.0004946368948247078, + "loss": 1.7077, + "loss_base2": 2.4637, + "loss_pixel": 0.2082, + "loss_text": 1.4995, + "ppl": 5.5163, + "step": 1485 + }, + { + "epoch": 0.01, + "global_step": 1486, + "learning_rate": 0.0004946327212020033, + "loss": 1.8465, + "loss_base2": 2.6639, + "loss_pixel": 0.2074, + "loss_text": 1.6391, + "ppl": 6.3376, + "step": 1486 + }, + { + "epoch": 0.01, + "global_step": 1487, + "learning_rate": 0.0004946285475792988, + "loss": 2.0142, + "loss_base2": 2.9059, + "loss_pixel": 0.2075, + "loss_text": 1.8067, + "ppl": 7.4947, + "step": 1487 + }, + { + "epoch": 0.01, + "global_step": 1488, + "learning_rate": 0.0004946243739565944, + "loss": 2.0101, + "loss_base2": 2.9, + "loss_pixel": 0.2122, + "loss_text": 1.7979, + "ppl": 7.4641, + "step": 1488 + }, + { + "epoch": 0.01, + "global_step": 1489, + "learning_rate": 0.0004946202003338899, + "loss": 2.0192, + "loss_base2": 2.9131, + "loss_pixel": 0.2103, + "loss_text": 1.8089, + "ppl": 7.5323, + "step": 1489 + }, + { + "epoch": 0.01, + "global_step": 1490, + "learning_rate": 0.0004946160267111854, + "loss": 1.9972, + "loss_base2": 2.8814, + "loss_pixel": 0.2089, + "loss_text": 1.7883, + "ppl": 7.3684, + "step": 1490 + }, + { + "epoch": 0.01, + "global_step": 1491, + "learning_rate": 0.0004946118530884809, + "loss": 1.9854, + "loss_base2": 2.8643, + "loss_pixel": 0.2062, + "loss_text": 1.7792, + "ppl": 7.282, + "step": 1491 + }, + { + "epoch": 0.01, + "global_step": 1492, + "learning_rate": 0.0004946076794657763, + "loss": 1.9809, + "loss_base2": 2.8578, + "loss_pixel": 0.2063, + "loss_text": 1.7746, + "ppl": 7.2493, + "step": 1492 + }, + { + "epoch": 0.01, + "global_step": 1493, + "learning_rate": 0.0004946035058430718, + "loss": 1.9814, + "loss_base2": 2.8586, + "loss_pixel": 0.2072, + "loss_text": 1.7742, + "ppl": 7.2529, + "step": 1493 + }, + { + "epoch": 0.01, + "global_step": 1494, + "learning_rate": 0.0004945993322203673, + "loss": 1.973, + "loss_base2": 2.8464, + "loss_pixel": 0.2081, + "loss_text": 1.7649, + "ppl": 7.1922, + "step": 1494 + }, + { + "epoch": 0.01, + "global_step": 1495, + "learning_rate": 0.0004945951585976628, + "loss": 1.9787, + "loss_base2": 2.8547, + "loss_pixel": 0.2032, + "loss_text": 1.7755, + "ppl": 7.2333, + "step": 1495 + }, + { + "epoch": 0.01, + "global_step": 1496, + "learning_rate": 0.0004945909849749582, + "loss": 1.9794, + "loss_base2": 2.8557, + "loss_pixel": 0.2043, + "loss_text": 1.7751, + "ppl": 7.2384, + "step": 1496 + }, + { + "epoch": 0.01, + "global_step": 1497, + "learning_rate": 0.0004945868113522537, + "loss": 1.9753, + "loss_base2": 2.8498, + "loss_pixel": 0.2135, + "loss_text": 1.7618, + "ppl": 7.2088, + "step": 1497 + }, + { + "epoch": 0.01, + "global_step": 1498, + "learning_rate": 0.0004945826377295492, + "loss": 1.9872, + "loss_base2": 2.8669, + "loss_pixel": 0.2132, + "loss_text": 1.774, + "ppl": 7.2951, + "step": 1498 + }, + { + "epoch": 0.01, + "global_step": 1499, + "learning_rate": 0.0004945784641068447, + "loss": 1.9883, + "loss_base2": 2.8685, + "loss_pixel": 0.2122, + "loss_text": 1.7762, + "ppl": 7.3031, + "step": 1499 + }, + { + "epoch": 0.01, + "global_step": 1500, + "learning_rate": 0.0004945742904841402, + "loss": 1.9853, + "loss_base2": 2.8642, + "loss_pixel": 0.2112, + "loss_text": 1.7742, + "ppl": 7.2812, + "step": 1500 + }, + { + "epoch": 0.01, + "global_step": 1501, + "learning_rate": 0.0004945701168614357, + "loss": 1.9766, + "loss_base2": 2.8516, + "loss_pixel": 0.2112, + "loss_text": 1.7655, + "ppl": 7.2182, + "step": 1501 + }, + { + "epoch": 0.01, + "global_step": 1502, + "learning_rate": 0.0004945659432387312, + "loss": 1.9945, + "loss_base2": 2.8775, + "loss_pixel": 0.2097, + "loss_text": 1.7847, + "ppl": 7.3485, + "step": 1502 + }, + { + "epoch": 0.01, + "global_step": 1503, + "learning_rate": 0.0004945617696160267, + "loss": 1.9768, + "loss_base2": 2.8519, + "loss_pixel": 0.2118, + "loss_text": 1.765, + "ppl": 7.2196, + "step": 1503 + }, + { + "epoch": 0.01, + "global_step": 1504, + "learning_rate": 0.0004945575959933223, + "loss": 1.9832, + "loss_base2": 2.8612, + "loss_pixel": 0.2099, + "loss_text": 1.7733, + "ppl": 7.266, + "step": 1504 + }, + { + "epoch": 0.01, + "global_step": 1505, + "learning_rate": 0.0004945534223706178, + "loss": 1.9867, + "loss_base2": 2.8662, + "loss_pixel": 0.2102, + "loss_text": 1.7765, + "ppl": 7.2914, + "step": 1505 + }, + { + "epoch": 0.01, + "global_step": 1506, + "learning_rate": 0.0004945492487479132, + "loss": 1.969, + "loss_base2": 2.8407, + "loss_pixel": 0.209, + "loss_text": 1.76, + "ppl": 7.1635, + "step": 1506 + }, + { + "epoch": 0.01, + "global_step": 1507, + "learning_rate": 0.0004945450751252087, + "loss": 1.9581, + "loss_base2": 2.8249, + "loss_pixel": 0.2073, + "loss_text": 1.7508, + "ppl": 7.0859, + "step": 1507 + }, + { + "epoch": 0.01, + "global_step": 1508, + "learning_rate": 0.0004945409015025042, + "loss": 1.9805, + "loss_base2": 2.8573, + "loss_pixel": 0.2069, + "loss_text": 1.7736, + "ppl": 7.2464, + "step": 1508 + }, + { + "epoch": 0.01, + "global_step": 1509, + "learning_rate": 0.0004945367278797997, + "loss": 1.9729, + "loss_base2": 2.8463, + "loss_pixel": 0.2079, + "loss_text": 1.765, + "ppl": 7.1915, + "step": 1509 + }, + { + "epoch": 0.01, + "global_step": 1510, + "learning_rate": 0.0004945325542570952, + "loss": 1.9772, + "loss_base2": 2.8525, + "loss_pixel": 0.2065, + "loss_text": 1.7707, + "ppl": 7.2225, + "step": 1510 + }, + { + "epoch": 0.01, + "global_step": 1511, + "learning_rate": 0.0004945283806343907, + "loss": 1.9638, + "loss_base2": 2.8332, + "loss_pixel": 0.2068, + "loss_text": 1.757, + "ppl": 7.1264, + "step": 1511 + }, + { + "epoch": 0.01, + "global_step": 1512, + "learning_rate": 0.0004945242070116862, + "loss": 1.9946, + "loss_base2": 2.8776, + "loss_pixel": 0.2068, + "loss_text": 1.7878, + "ppl": 7.3493, + "step": 1512 + }, + { + "epoch": 0.01, + "global_step": 1513, + "learning_rate": 0.0004945200333889817, + "loss": 1.967, + "loss_base2": 2.8378, + "loss_pixel": 0.2072, + "loss_text": 1.7598, + "ppl": 7.1492, + "step": 1513 + }, + { + "epoch": 0.01, + "global_step": 1514, + "learning_rate": 0.0004945158597662771, + "loss": 1.9616, + "loss_base2": 2.83, + "loss_pixel": 0.206, + "loss_text": 1.7556, + "ppl": 7.1107, + "step": 1514 + }, + { + "epoch": 0.01, + "global_step": 1515, + "learning_rate": 0.0004945116861435726, + "loss": 1.96, + "loss_base2": 2.8277, + "loss_pixel": 0.2069, + "loss_text": 1.7531, + "ppl": 7.0993, + "step": 1515 + }, + { + "epoch": 0.01, + "global_step": 1516, + "learning_rate": 0.0004945075125208681, + "loss": 1.9584, + "loss_base2": 2.8254, + "loss_pixel": 0.2076, + "loss_text": 1.7509, + "ppl": 7.088, + "step": 1516 + }, + { + "epoch": 0.01, + "global_step": 1517, + "learning_rate": 0.0004945033388981636, + "loss": 1.9801, + "loss_base2": 2.8567, + "loss_pixel": 0.2061, + "loss_text": 1.774, + "ppl": 7.2435, + "step": 1517 + }, + { + "epoch": 0.01, + "global_step": 1518, + "learning_rate": 0.0004944991652754591, + "loss": 1.9533, + "loss_base2": 2.818, + "loss_pixel": 0.207, + "loss_text": 1.7463, + "ppl": 7.0519, + "step": 1518 + }, + { + "epoch": 0.01, + "global_step": 1519, + "learning_rate": 0.0004944949916527545, + "loss": 1.9652, + "loss_base2": 2.8352, + "loss_pixel": 0.2062, + "loss_text": 1.759, + "ppl": 7.1363, + "step": 1519 + }, + { + "epoch": 0.01, + "global_step": 1520, + "learning_rate": 0.00049449081803005, + "loss": 1.9612, + "loss_base2": 2.8294, + "loss_pixel": 0.2114, + "loss_text": 1.7498, + "ppl": 7.1079, + "step": 1520 + }, + { + "epoch": 0.01, + "global_step": 1521, + "learning_rate": 0.0004944866444073456, + "loss": 1.9877, + "loss_base2": 2.8676, + "loss_pixel": 0.2244, + "loss_text": 1.7633, + "ppl": 7.2987, + "step": 1521 + }, + { + "epoch": 0.01, + "global_step": 1522, + "learning_rate": 0.0004944824707846411, + "loss": 1.9913, + "loss_base2": 2.8728, + "loss_pixel": 0.2264, + "loss_text": 1.7648, + "ppl": 7.3251, + "step": 1522 + }, + { + "epoch": 0.01, + "global_step": 1523, + "learning_rate": 0.0004944782971619366, + "loss": 1.9762, + "loss_base2": 2.8511, + "loss_pixel": 0.2299, + "loss_text": 1.7463, + "ppl": 7.2153, + "step": 1523 + }, + { + "epoch": 0.01, + "global_step": 1524, + "learning_rate": 0.0004944741235392321, + "loss": 1.9834, + "loss_base2": 2.8614, + "loss_pixel": 0.2267, + "loss_text": 1.7567, + "ppl": 7.2674, + "step": 1524 + }, + { + "epoch": 0.01, + "global_step": 1525, + "learning_rate": 0.0004944699499165276, + "loss": 1.9789, + "loss_base2": 2.8549, + "loss_pixel": 0.2266, + "loss_text": 1.7522, + "ppl": 7.2348, + "step": 1525 + }, + { + "epoch": 0.01, + "global_step": 1526, + "learning_rate": 0.0004944657762938231, + "loss": 1.9836, + "loss_base2": 2.8617, + "loss_pixel": 0.225, + "loss_text": 1.7586, + "ppl": 7.2689, + "step": 1526 + }, + { + "epoch": 0.01, + "global_step": 1527, + "learning_rate": 0.0004944616026711186, + "loss": 1.9812, + "loss_base2": 2.8583, + "loss_pixel": 0.2225, + "loss_text": 1.7587, + "ppl": 7.2514, + "step": 1527 + }, + { + "epoch": 0.01, + "global_step": 1528, + "learning_rate": 0.000494457429048414, + "loss": 1.9664, + "loss_base2": 2.8369, + "loss_pixel": 0.2208, + "loss_text": 1.7457, + "ppl": 7.1449, + "step": 1528 + }, + { + "epoch": 0.01, + "global_step": 1529, + "learning_rate": 0.0004944532554257095, + "loss": 1.9541, + "loss_base2": 2.8192, + "loss_pixel": 0.2187, + "loss_text": 1.7354, + "ppl": 7.0576, + "step": 1529 + }, + { + "epoch": 0.01, + "global_step": 1530, + "learning_rate": 0.000494449081803005, + "loss": 1.9544, + "loss_base2": 2.8196, + "loss_pixel": 0.2186, + "loss_text": 1.7358, + "ppl": 7.0597, + "step": 1530 + }, + { + "epoch": 0.01, + "global_step": 1531, + "learning_rate": 0.0004944449081803005, + "loss": 1.9541, + "loss_base2": 2.8192, + "loss_pixel": 0.2172, + "loss_text": 1.7369, + "ppl": 7.0576, + "step": 1531 + }, + { + "epoch": 0.01, + "global_step": 1532, + "learning_rate": 0.000494440734557596, + "loss": 1.9664, + "loss_base2": 2.8369, + "loss_pixel": 0.2146, + "loss_text": 1.7518, + "ppl": 7.1449, + "step": 1532 + }, + { + "epoch": 0.01, + "global_step": 1533, + "learning_rate": 0.0004944365609348914, + "loss": 1.9491, + "loss_base2": 2.812, + "loss_pixel": 0.2136, + "loss_text": 1.7355, + "ppl": 7.0224, + "step": 1533 + }, + { + "epoch": 0.01, + "global_step": 1534, + "learning_rate": 0.0004944323873121869, + "loss": 1.9526, + "loss_base2": 2.817, + "loss_pixel": 0.2145, + "loss_text": 1.7382, + "ppl": 7.047, + "step": 1534 + }, + { + "epoch": 0.01, + "global_step": 1535, + "learning_rate": 0.0004944282136894824, + "loss": 1.9436, + "loss_base2": 2.804, + "loss_pixel": 0.2133, + "loss_text": 1.7303, + "ppl": 6.9838, + "step": 1535 + }, + { + "epoch": 0.01, + "global_step": 1536, + "learning_rate": 0.000494424040066778, + "loss": 1.8076, + "loss_base2": 2.6078, + "loss_pixel": 0.2127, + "loss_text": 1.5949, + "ppl": 6.0958, + "step": 1536 + }, + { + "epoch": 0.01, + "global_step": 1537, + "learning_rate": 0.0004944198664440735, + "loss": 1.7424, + "loss_base2": 2.5138, + "loss_pixel": 0.212, + "loss_text": 1.5304, + "ppl": 5.711, + "step": 1537 + }, + { + "epoch": 0.01, + "global_step": 1538, + "learning_rate": 0.000494415692821369, + "loss": 1.744, + "loss_base2": 2.5161, + "loss_pixel": 0.2115, + "loss_text": 1.5325, + "ppl": 5.7202, + "step": 1538 + }, + { + "epoch": 0.01, + "global_step": 1539, + "learning_rate": 0.0004944115191986645, + "loss": 1.701, + "loss_base2": 2.454, + "loss_pixel": 0.2107, + "loss_text": 1.4903, + "ppl": 5.4794, + "step": 1539 + }, + { + "epoch": 0.01, + "global_step": 1540, + "learning_rate": 0.00049440734557596, + "loss": 1.7011, + "loss_base2": 2.4542, + "loss_pixel": 0.211, + "loss_text": 1.4902, + "ppl": 5.48, + "step": 1540 + }, + { + "epoch": 0.01, + "global_step": 1541, + "learning_rate": 0.0004944031719532555, + "loss": 1.7211, + "loss_base2": 2.483, + "loss_pixel": 0.2108, + "loss_text": 1.5103, + "ppl": 5.5907, + "step": 1541 + }, + { + "epoch": 0.01, + "global_step": 1542, + "learning_rate": 0.0004943989983305509, + "loss": 1.7138, + "loss_base2": 2.4725, + "loss_pixel": 0.209, + "loss_text": 1.5048, + "ppl": 5.55, + "step": 1542 + }, + { + "epoch": 0.01, + "global_step": 1543, + "learning_rate": 0.0004943948247078464, + "loss": 1.7018, + "loss_base2": 2.4552, + "loss_pixel": 0.2089, + "loss_text": 1.4929, + "ppl": 5.4838, + "step": 1543 + }, + { + "epoch": 0.01, + "global_step": 1544, + "learning_rate": 0.0004943906510851419, + "loss": 1.8408, + "loss_base2": 2.6557, + "loss_pixel": 0.2091, + "loss_text": 1.6317, + "ppl": 6.3016, + "step": 1544 + }, + { + "epoch": 0.01, + "global_step": 1545, + "learning_rate": 0.0004943864774624374, + "loss": 1.931, + "loss_base2": 2.7858, + "loss_pixel": 0.2087, + "loss_text": 1.7222, + "ppl": 6.8964, + "step": 1545 + }, + { + "epoch": 0.01, + "global_step": 1546, + "learning_rate": 0.0004943823038397329, + "loss": 1.7721, + "loss_base2": 2.5566, + "loss_pixel": 0.2091, + "loss_text": 1.5631, + "ppl": 5.8832, + "step": 1546 + }, + { + "epoch": 0.01, + "global_step": 1547, + "learning_rate": 0.0004943781302170284, + "loss": 1.7092, + "loss_base2": 2.4659, + "loss_pixel": 0.2069, + "loss_text": 1.5022, + "ppl": 5.5245, + "step": 1547 + }, + { + "epoch": 0.01, + "global_step": 1548, + "learning_rate": 0.0004943739565943239, + "loss": 1.6993, + "loss_base2": 2.4516, + "loss_pixel": 0.2081, + "loss_text": 1.4912, + "ppl": 5.4701, + "step": 1548 + }, + { + "epoch": 0.01, + "global_step": 1549, + "learning_rate": 0.0004943697829716194, + "loss": 1.7241, + "loss_base2": 2.4874, + "loss_pixel": 0.208, + "loss_text": 1.5161, + "ppl": 5.6075, + "step": 1549 + }, + { + "epoch": 0.01, + "global_step": 1550, + "learning_rate": 0.0004943656093489149, + "loss": 1.718, + "loss_base2": 2.4786, + "loss_pixel": 0.2083, + "loss_text": 1.5098, + "ppl": 5.5734, + "step": 1550 + }, + { + "epoch": 0.01, + "global_step": 1551, + "learning_rate": 0.0004943614357262103, + "loss": 1.6999, + "loss_base2": 2.4524, + "loss_pixel": 0.207, + "loss_text": 1.4929, + "ppl": 5.4734, + "step": 1551 + }, + { + "epoch": 0.01, + "global_step": 1552, + "learning_rate": 0.0004943572621035058, + "loss": 1.6831, + "loss_base2": 2.4282, + "loss_pixel": 0.2069, + "loss_text": 1.4762, + "ppl": 5.3822, + "step": 1552 + }, + { + "epoch": 0.01, + "global_step": 1553, + "learning_rate": 0.0004943530884808014, + "loss": 1.7264, + "loss_base2": 2.4907, + "loss_pixel": 0.2067, + "loss_text": 1.5196, + "ppl": 5.6204, + "step": 1553 + }, + { + "epoch": 0.01, + "global_step": 1554, + "learning_rate": 0.0004943489148580969, + "loss": 1.8633, + "loss_base2": 2.6882, + "loss_pixel": 0.207, + "loss_text": 1.6564, + "ppl": 6.445, + "step": 1554 + }, + { + "epoch": 0.01, + "global_step": 1555, + "learning_rate": 0.0004943447412353923, + "loss": 1.9754, + "loss_base2": 2.8499, + "loss_pixel": 0.2066, + "loss_text": 1.7688, + "ppl": 7.2095, + "step": 1555 + }, + { + "epoch": 0.01, + "global_step": 1556, + "learning_rate": 0.0004943405676126878, + "loss": 2.0064, + "loss_base2": 2.8946, + "loss_pixel": 0.2067, + "loss_text": 1.7996, + "ppl": 7.4365, + "step": 1556 + }, + { + "epoch": 0.01, + "global_step": 1557, + "learning_rate": 0.0004943363939899833, + "loss": 1.9902, + "loss_base2": 2.8713, + "loss_pixel": 0.207, + "loss_text": 1.7832, + "ppl": 7.317, + "step": 1557 + }, + { + "epoch": 0.01, + "global_step": 1558, + "learning_rate": 0.0004943322203672788, + "loss": 1.9953, + "loss_base2": 2.8786, + "loss_pixel": 0.2046, + "loss_text": 1.7907, + "ppl": 7.3544, + "step": 1558 + }, + { + "epoch": 0.01, + "global_step": 1559, + "learning_rate": 0.0004943280467445743, + "loss": 1.9875, + "loss_base2": 2.8674, + "loss_pixel": 0.2056, + "loss_text": 1.7819, + "ppl": 7.2973, + "step": 1559 + }, + { + "epoch": 0.01, + "global_step": 1560, + "learning_rate": 0.0004943238731218698, + "loss": 1.978, + "loss_base2": 2.8537, + "loss_pixel": 0.2046, + "loss_text": 1.7734, + "ppl": 7.2283, + "step": 1560 + }, + { + "epoch": 0.01, + "global_step": 1561, + "learning_rate": 0.0004943196994991653, + "loss": 1.9751, + "loss_base2": 2.8495, + "loss_pixel": 0.2054, + "loss_text": 1.7698, + "ppl": 7.2073, + "step": 1561 + }, + { + "epoch": 0.01, + "global_step": 1562, + "learning_rate": 0.0004943155258764608, + "loss": 1.9678, + "loss_base2": 2.8389, + "loss_pixel": 0.2059, + "loss_text": 1.7619, + "ppl": 7.1549, + "step": 1562 + }, + { + "epoch": 0.01, + "global_step": 1563, + "learning_rate": 0.0004943113522537563, + "loss": 1.9712, + "loss_base2": 2.8438, + "loss_pixel": 0.2057, + "loss_text": 1.7656, + "ppl": 7.1793, + "step": 1563 + }, + { + "epoch": 0.01, + "global_step": 1564, + "learning_rate": 0.0004943071786310518, + "loss": 1.9695, + "loss_base2": 2.8414, + "loss_pixel": 0.2058, + "loss_text": 1.7637, + "ppl": 7.1671, + "step": 1564 + }, + { + "epoch": 0.01, + "global_step": 1565, + "learning_rate": 0.0004943030050083472, + "loss": 1.9716, + "loss_base2": 2.8444, + "loss_pixel": 0.2111, + "loss_text": 1.7605, + "ppl": 7.1822, + "step": 1565 + }, + { + "epoch": 0.01, + "global_step": 1566, + "learning_rate": 0.0004942988313856427, + "loss": 1.9625, + "loss_base2": 2.8313, + "loss_pixel": 0.2101, + "loss_text": 1.7524, + "ppl": 7.1171, + "step": 1566 + }, + { + "epoch": 0.01, + "global_step": 1567, + "learning_rate": 0.0004942946577629382, + "loss": 1.9611, + "loss_base2": 2.8293, + "loss_pixel": 0.2067, + "loss_text": 1.7543, + "ppl": 7.1071, + "step": 1567 + }, + { + "epoch": 0.01, + "global_step": 1568, + "learning_rate": 0.0004942904841402337, + "loss": 1.963, + "loss_base2": 2.832, + "loss_pixel": 0.2056, + "loss_text": 1.7574, + "ppl": 7.1207, + "step": 1568 + }, + { + "epoch": 0.01, + "global_step": 1569, + "learning_rate": 0.0004942863105175293, + "loss": 1.9555, + "loss_base2": 2.8212, + "loss_pixel": 0.206, + "loss_text": 1.7495, + "ppl": 7.0675, + "step": 1569 + }, + { + "epoch": 0.01, + "global_step": 1570, + "learning_rate": 0.0004942821368948247, + "loss": 1.9522, + "loss_base2": 2.8164, + "loss_pixel": 0.2046, + "loss_text": 1.7476, + "ppl": 7.0442, + "step": 1570 + }, + { + "epoch": 0.01, + "global_step": 1571, + "learning_rate": 0.0004942779632721202, + "loss": 1.9747, + "loss_base2": 2.8489, + "loss_pixel": 0.2054, + "loss_text": 1.7693, + "ppl": 7.2045, + "step": 1571 + }, + { + "epoch": 0.01, + "global_step": 1572, + "learning_rate": 0.0004942737896494157, + "loss": 1.9383, + "loss_base2": 2.7964, + "loss_pixel": 0.2013, + "loss_text": 1.737, + "ppl": 6.9469, + "step": 1572 + }, + { + "epoch": 0.01, + "global_step": 1573, + "learning_rate": 0.0004942696160267112, + "loss": 1.963, + "loss_base2": 2.832, + "loss_pixel": 0.2057, + "loss_text": 1.7573, + "ppl": 7.1207, + "step": 1573 + }, + { + "epoch": 0.01, + "global_step": 1574, + "learning_rate": 0.0004942654424040067, + "loss": 1.9602, + "loss_base2": 2.828, + "loss_pixel": 0.2042, + "loss_text": 1.756, + "ppl": 7.1007, + "step": 1574 + }, + { + "epoch": 0.01, + "global_step": 1575, + "learning_rate": 0.0004942612687813022, + "loss": 1.9715, + "loss_base2": 2.8443, + "loss_pixel": 0.2049, + "loss_text": 1.7666, + "ppl": 7.1814, + "step": 1575 + }, + { + "epoch": 0.01, + "global_step": 1576, + "learning_rate": 0.0004942570951585977, + "loss": 1.9463, + "loss_base2": 2.8079, + "loss_pixel": 0.2032, + "loss_text": 1.7431, + "ppl": 7.0027, + "step": 1576 + }, + { + "epoch": 0.01, + "global_step": 1577, + "learning_rate": 0.0004942529215358932, + "loss": 1.9448, + "loss_base2": 2.8058, + "loss_pixel": 0.201, + "loss_text": 1.7438, + "ppl": 6.9922, + "step": 1577 + }, + { + "epoch": 0.01, + "global_step": 1578, + "learning_rate": 0.0004942487479131886, + "loss": 1.9494, + "loss_base2": 2.8124, + "loss_pixel": 0.2018, + "loss_text": 1.7476, + "ppl": 7.0245, + "step": 1578 + }, + { + "epoch": 0.01, + "global_step": 1579, + "learning_rate": 0.0004942445742904841, + "loss": 1.9471, + "loss_base2": 2.8091, + "loss_pixel": 0.201, + "loss_text": 1.7461, + "ppl": 7.0083, + "step": 1579 + }, + { + "epoch": 0.01, + "global_step": 1580, + "learning_rate": 0.0004942404006677796, + "loss": 1.9374, + "loss_base2": 2.7951, + "loss_pixel": 0.1998, + "loss_text": 1.7376, + "ppl": 6.9407, + "step": 1580 + }, + { + "epoch": 0.01, + "global_step": 1581, + "learning_rate": 0.0004942362270450751, + "loss": 1.983, + "loss_base2": 2.8609, + "loss_pixel": 0.202, + "loss_text": 1.781, + "ppl": 7.2645, + "step": 1581 + }, + { + "epoch": 0.01, + "global_step": 1582, + "learning_rate": 0.0004942320534223706, + "loss": 1.9431, + "loss_base2": 2.8033, + "loss_pixel": 0.2018, + "loss_text": 1.7413, + "ppl": 6.9804, + "step": 1582 + }, + { + "epoch": 0.01, + "global_step": 1583, + "learning_rate": 0.0004942278797996661, + "loss": 1.9338, + "loss_base2": 2.7899, + "loss_pixel": 0.2041, + "loss_text": 1.7297, + "ppl": 6.9157, + "step": 1583 + }, + { + "epoch": 0.01, + "global_step": 1584, + "learning_rate": 0.0004942237061769616, + "loss": 1.9482, + "loss_base2": 2.8107, + "loss_pixel": 0.2002, + "loss_text": 1.748, + "ppl": 7.016, + "step": 1584 + }, + { + "epoch": 0.01, + "global_step": 1585, + "learning_rate": 0.0004942195325542572, + "loss": 1.9485, + "loss_base2": 2.8111, + "loss_pixel": 0.2011, + "loss_text": 1.7474, + "ppl": 7.0182, + "step": 1585 + }, + { + "epoch": 0.01, + "global_step": 1586, + "learning_rate": 0.0004942153589315527, + "loss": 1.9488, + "loss_base2": 2.8115, + "loss_pixel": 0.2028, + "loss_text": 1.746, + "ppl": 7.0203, + "step": 1586 + }, + { + "epoch": 0.01, + "global_step": 1587, + "learning_rate": 0.0004942111853088481, + "loss": 1.9376, + "loss_base2": 2.7954, + "loss_pixel": 0.2003, + "loss_text": 1.7373, + "ppl": 6.9421, + "step": 1587 + }, + { + "epoch": 0.01, + "global_step": 1588, + "learning_rate": 0.0004942070116861436, + "loss": 1.9438, + "loss_base2": 2.8043, + "loss_pixel": 0.1983, + "loss_text": 1.7456, + "ppl": 6.9852, + "step": 1588 + }, + { + "epoch": 0.01, + "global_step": 1589, + "learning_rate": 0.0004942028380634391, + "loss": 1.9509, + "loss_base2": 2.8146, + "loss_pixel": 0.2015, + "loss_text": 1.7494, + "ppl": 7.035, + "step": 1589 + }, + { + "epoch": 0.01, + "global_step": 1590, + "learning_rate": 0.0004941986644407346, + "loss": 1.9409, + "loss_base2": 2.8001, + "loss_pixel": 0.201, + "loss_text": 1.7399, + "ppl": 6.965, + "step": 1590 + }, + { + "epoch": 0.01, + "global_step": 1591, + "learning_rate": 0.0004941944908180301, + "loss": 1.9478, + "loss_base2": 2.8101, + "loss_pixel": 0.2003, + "loss_text": 1.7474, + "ppl": 7.0132, + "step": 1591 + }, + { + "epoch": 0.01, + "global_step": 1592, + "learning_rate": 0.0004941903171953255, + "loss": 1.9543, + "loss_base2": 2.8195, + "loss_pixel": 0.2, + "loss_text": 1.7543, + "ppl": 7.059, + "step": 1592 + }, + { + "epoch": 0.01, + "global_step": 1593, + "learning_rate": 0.000494186143572621, + "loss": 1.9419, + "loss_base2": 2.8016, + "loss_pixel": 0.1987, + "loss_text": 1.7432, + "ppl": 6.972, + "step": 1593 + }, + { + "epoch": 0.01, + "global_step": 1594, + "learning_rate": 0.0004941819699499165, + "loss": 1.9462, + "loss_base2": 2.8078, + "loss_pixel": 0.1983, + "loss_text": 1.7479, + "ppl": 7.002, + "step": 1594 + }, + { + "epoch": 0.01, + "global_step": 1595, + "learning_rate": 0.000494177796327212, + "loss": 1.9463, + "loss_base2": 2.8079, + "loss_pixel": 0.2001, + "loss_text": 1.7462, + "ppl": 7.0027, + "step": 1595 + }, + { + "epoch": 0.01, + "global_step": 1596, + "learning_rate": 0.0004941736227045075, + "loss": 1.9523, + "loss_base2": 2.8166, + "loss_pixel": 0.1995, + "loss_text": 1.7528, + "ppl": 7.0449, + "step": 1596 + }, + { + "epoch": 0.01, + "global_step": 1597, + "learning_rate": 0.000494169449081803, + "loss": 1.9386, + "loss_base2": 2.7968, + "loss_pixel": 0.1977, + "loss_text": 1.7409, + "ppl": 6.949, + "step": 1597 + }, + { + "epoch": 0.01, + "global_step": 1598, + "learning_rate": 0.0004941652754590985, + "loss": 1.9404, + "loss_base2": 2.7994, + "loss_pixel": 0.2028, + "loss_text": 1.7375, + "ppl": 6.9615, + "step": 1598 + }, + { + "epoch": 0.01, + "global_step": 1599, + "learning_rate": 0.000494161101836394, + "loss": 1.7528, + "loss_base2": 2.5288, + "loss_pixel": 0.2075, + "loss_text": 1.5453, + "ppl": 5.7707, + "step": 1599 + }, + { + "epoch": 0.01, + "global_step": 1600, + "learning_rate": 0.0004941569282136895, + "loss": 1.699, + "loss_base2": 2.4511, + "loss_pixel": 0.2072, + "loss_text": 1.4918, + "ppl": 5.4685, + "step": 1600 + }, + { + "epoch": 0.01, + "global_step": 1601, + "learning_rate": 0.000494152754590985, + "loss": 1.6977, + "loss_base2": 2.4493, + "loss_pixel": 0.2067, + "loss_text": 1.491, + "ppl": 5.4614, + "step": 1601 + }, + { + "epoch": 0.01, + "global_step": 1602, + "learning_rate": 0.0004941485809682805, + "loss": 1.7162, + "loss_base2": 2.476, + "loss_pixel": 0.2065, + "loss_text": 1.5097, + "ppl": 5.5633, + "step": 1602 + }, + { + "epoch": 0.01, + "global_step": 1603, + "learning_rate": 0.000494144407345576, + "loss": 1.7097, + "loss_base2": 2.4666, + "loss_pixel": 0.2053, + "loss_text": 1.5044, + "ppl": 5.5273, + "step": 1603 + }, + { + "epoch": 0.01, + "global_step": 1604, + "learning_rate": 0.0004941402337228715, + "loss": 1.6942, + "loss_base2": 2.4442, + "loss_pixel": 0.2054, + "loss_text": 1.4887, + "ppl": 5.4423, + "step": 1604 + }, + { + "epoch": 0.01, + "global_step": 1605, + "learning_rate": 0.000494136060100167, + "loss": 1.6923, + "loss_base2": 2.4415, + "loss_pixel": 0.2055, + "loss_text": 1.4868, + "ppl": 5.432, + "step": 1605 + }, + { + "epoch": 0.01, + "global_step": 1606, + "learning_rate": 0.0004941318864774625, + "loss": 1.8613, + "loss_base2": 2.6853, + "loss_pixel": 0.207, + "loss_text": 1.6543, + "ppl": 6.4321, + "step": 1606 + }, + { + "epoch": 0.01, + "global_step": 1607, + "learning_rate": 0.000494127712854758, + "loss": 1.9701, + "loss_base2": 2.8423, + "loss_pixel": 0.2046, + "loss_text": 1.7654, + "ppl": 7.1714, + "step": 1607 + }, + { + "epoch": 0.01, + "global_step": 1608, + "learning_rate": 0.0004941235392320534, + "loss": 1.9486, + "loss_base2": 2.8112, + "loss_pixel": 0.2053, + "loss_text": 1.7433, + "ppl": 7.0189, + "step": 1608 + }, + { + "epoch": 0.01, + "global_step": 1609, + "learning_rate": 0.0004941193656093489, + "loss": 1.9633, + "loss_base2": 2.8324, + "loss_pixel": 0.2047, + "loss_text": 1.7586, + "ppl": 7.1228, + "step": 1609 + }, + { + "epoch": 0.01, + "global_step": 1610, + "learning_rate": 0.0004941151919866444, + "loss": 1.97, + "loss_base2": 2.8421, + "loss_pixel": 0.2066, + "loss_text": 1.7633, + "ppl": 7.1707, + "step": 1610 + }, + { + "epoch": 0.01, + "global_step": 1611, + "learning_rate": 0.0004941110183639399, + "loss": 1.9453, + "loss_base2": 2.8065, + "loss_pixel": 0.207, + "loss_text": 1.7383, + "ppl": 6.9957, + "step": 1611 + }, + { + "epoch": 0.01, + "global_step": 1612, + "learning_rate": 0.0004941068447412354, + "loss": 1.9517, + "loss_base2": 2.8157, + "loss_pixel": 0.2079, + "loss_text": 1.7437, + "ppl": 7.0406, + "step": 1612 + }, + { + "epoch": 0.01, + "global_step": 1613, + "learning_rate": 0.0004941026711185309, + "loss": 1.9609, + "loss_base2": 2.829, + "loss_pixel": 0.2104, + "loss_text": 1.7505, + "ppl": 7.1057, + "step": 1613 + }, + { + "epoch": 0.01, + "global_step": 1614, + "learning_rate": 0.0004940984974958263, + "loss": 1.9598, + "loss_base2": 2.8274, + "loss_pixel": 0.2114, + "loss_text": 1.7484, + "ppl": 7.0979, + "step": 1614 + }, + { + "epoch": 0.01, + "global_step": 1615, + "learning_rate": 0.0004940943238731218, + "loss": 1.9443, + "loss_base2": 2.805, + "loss_pixel": 0.2115, + "loss_text": 1.7328, + "ppl": 6.9887, + "step": 1615 + }, + { + "epoch": 0.01, + "global_step": 1616, + "learning_rate": 0.0004940901502504173, + "loss": 1.9611, + "loss_base2": 2.8293, + "loss_pixel": 0.2104, + "loss_text": 1.7507, + "ppl": 7.1071, + "step": 1616 + }, + { + "epoch": 0.01, + "global_step": 1617, + "learning_rate": 0.0004940859766277128, + "loss": 1.9507, + "loss_base2": 2.8143, + "loss_pixel": 0.2087, + "loss_text": 1.742, + "ppl": 7.0336, + "step": 1617 + }, + { + "epoch": 0.01, + "global_step": 1618, + "learning_rate": 0.0004940818030050084, + "loss": 1.9444, + "loss_base2": 2.8052, + "loss_pixel": 0.2078, + "loss_text": 1.7366, + "ppl": 6.9894, + "step": 1618 + }, + { + "epoch": 0.01, + "global_step": 1619, + "learning_rate": 0.0004940776293823039, + "loss": 1.9546, + "loss_base2": 2.8199, + "loss_pixel": 0.2085, + "loss_text": 1.7461, + "ppl": 7.0611, + "step": 1619 + }, + { + "epoch": 0.01, + "global_step": 1620, + "learning_rate": 0.0004940734557595994, + "loss": 1.9534, + "loss_base2": 2.8182, + "loss_pixel": 0.2083, + "loss_text": 1.7451, + "ppl": 7.0526, + "step": 1620 + }, + { + "epoch": 0.01, + "global_step": 1621, + "learning_rate": 0.0004940692821368949, + "loss": 1.9479, + "loss_base2": 2.8102, + "loss_pixel": 0.2073, + "loss_text": 1.7406, + "ppl": 7.0139, + "step": 1621 + }, + { + "epoch": 0.01, + "global_step": 1622, + "learning_rate": 0.0004940651085141904, + "loss": 1.9543, + "loss_base2": 2.8195, + "loss_pixel": 0.2074, + "loss_text": 1.7469, + "ppl": 7.059, + "step": 1622 + }, + { + "epoch": 0.01, + "global_step": 1623, + "learning_rate": 0.0004940609348914859, + "loss": 1.9396, + "loss_base2": 2.7983, + "loss_pixel": 0.2054, + "loss_text": 1.7341, + "ppl": 6.956, + "step": 1623 + }, + { + "epoch": 0.01, + "global_step": 1624, + "learning_rate": 0.0004940567612687813, + "loss": 1.9528, + "loss_base2": 2.8173, + "loss_pixel": 0.207, + "loss_text": 1.7458, + "ppl": 7.0484, + "step": 1624 + }, + { + "epoch": 0.01, + "global_step": 1625, + "learning_rate": 0.0004940525876460768, + "loss": 1.9455, + "loss_base2": 2.8068, + "loss_pixel": 0.2051, + "loss_text": 1.7404, + "ppl": 6.9971, + "step": 1625 + }, + { + "epoch": 0.01, + "global_step": 1626, + "learning_rate": 0.0004940484140233723, + "loss": 1.9226, + "loss_base2": 2.7737, + "loss_pixel": 0.2054, + "loss_text": 1.7171, + "ppl": 6.8387, + "step": 1626 + }, + { + "epoch": 0.01, + "global_step": 1627, + "learning_rate": 0.0004940442404006678, + "loss": 1.9347, + "loss_base2": 2.7912, + "loss_pixel": 0.2059, + "loss_text": 1.7288, + "ppl": 6.922, + "step": 1627 + }, + { + "epoch": 0.01, + "global_step": 1628, + "learning_rate": 0.0004940400667779632, + "loss": 1.8533, + "loss_base2": 2.6737, + "loss_pixel": 0.2059, + "loss_text": 1.6474, + "ppl": 6.3808, + "step": 1628 + }, + { + "epoch": 0.01, + "global_step": 1629, + "learning_rate": 0.0004940358931552587, + "loss": 1.7135, + "loss_base2": 2.4721, + "loss_pixel": 0.2056, + "loss_text": 1.508, + "ppl": 5.5483, + "step": 1629 + }, + { + "epoch": 0.01, + "global_step": 1630, + "learning_rate": 0.0004940317195325542, + "loss": 1.695, + "loss_base2": 2.4454, + "loss_pixel": 0.2053, + "loss_text": 1.4898, + "ppl": 5.4466, + "step": 1630 + }, + { + "epoch": 0.01, + "global_step": 1631, + "learning_rate": 0.0004940275459098497, + "loss": 1.7075, + "loss_base2": 2.4634, + "loss_pixel": 0.2044, + "loss_text": 1.5031, + "ppl": 5.5152, + "step": 1631 + }, + { + "epoch": 0.01, + "global_step": 1632, + "learning_rate": 0.0004940233722871452, + "loss": 1.7094, + "loss_base2": 2.4661, + "loss_pixel": 0.204, + "loss_text": 1.5054, + "ppl": 5.5256, + "step": 1632 + }, + { + "epoch": 0.01, + "global_step": 1633, + "learning_rate": 0.0004940191986644407, + "loss": 1.6895, + "loss_base2": 2.4374, + "loss_pixel": 0.2038, + "loss_text": 1.4857, + "ppl": 5.4168, + "step": 1633 + }, + { + "epoch": 0.01, + "global_step": 1634, + "learning_rate": 0.0004940150250417363, + "loss": 1.6866, + "loss_base2": 2.4332, + "loss_pixel": 0.2037, + "loss_text": 1.483, + "ppl": 5.4011, + "step": 1634 + }, + { + "epoch": 0.01, + "global_step": 1635, + "learning_rate": 0.0004940108514190318, + "loss": 1.6958, + "loss_base2": 2.4465, + "loss_pixel": 0.2052, + "loss_text": 1.4906, + "ppl": 5.451, + "step": 1635 + }, + { + "epoch": 0.01, + "global_step": 1636, + "learning_rate": 0.0004940066777963273, + "loss": 1.6751, + "loss_base2": 2.4167, + "loss_pixel": 0.2035, + "loss_text": 1.4715, + "ppl": 5.3393, + "step": 1636 + }, + { + "epoch": 0.01, + "global_step": 1637, + "learning_rate": 0.0004940025041736227, + "loss": 1.6735, + "loss_base2": 2.4144, + "loss_pixel": 0.2043, + "loss_text": 1.4692, + "ppl": 5.3308, + "step": 1637 + }, + { + "epoch": 0.01, + "global_step": 1638, + "learning_rate": 0.0004939983305509182, + "loss": 1.6763, + "loss_base2": 2.4184, + "loss_pixel": 0.2029, + "loss_text": 1.4734, + "ppl": 5.3457, + "step": 1638 + }, + { + "epoch": 0.01, + "global_step": 1639, + "learning_rate": 0.0004939941569282137, + "loss": 1.6971, + "loss_base2": 2.4484, + "loss_pixel": 0.2034, + "loss_text": 1.4938, + "ppl": 5.4581, + "step": 1639 + }, + { + "epoch": 0.01, + "global_step": 1640, + "learning_rate": 0.0004939899833055092, + "loss": 1.6677, + "loss_base2": 2.406, + "loss_pixel": 0.2026, + "loss_text": 1.4651, + "ppl": 5.3, + "step": 1640 + }, + { + "epoch": 0.01, + "global_step": 1641, + "learning_rate": 0.0004939858096828047, + "loss": 1.6673, + "loss_base2": 2.4054, + "loss_pixel": 0.203, + "loss_text": 1.4643, + "ppl": 5.2978, + "step": 1641 + }, + { + "epoch": 0.01, + "global_step": 1642, + "learning_rate": 0.0004939816360601002, + "loss": 1.6579, + "loss_base2": 2.3918, + "loss_pixel": 0.203, + "loss_text": 1.4549, + "ppl": 5.2483, + "step": 1642 + }, + { + "epoch": 0.01, + "global_step": 1643, + "learning_rate": 0.0004939774624373957, + "loss": 1.6917, + "loss_base2": 2.4406, + "loss_pixel": 0.2035, + "loss_text": 1.4883, + "ppl": 5.4287, + "step": 1643 + }, + { + "epoch": 0.01, + "global_step": 1644, + "learning_rate": 0.0004939732888146912, + "loss": 1.6835, + "loss_base2": 2.4288, + "loss_pixel": 0.203, + "loss_text": 1.4806, + "ppl": 5.3844, + "step": 1644 + }, + { + "epoch": 0.01, + "global_step": 1645, + "learning_rate": 0.0004939691151919867, + "loss": 1.6699, + "loss_base2": 2.4092, + "loss_pixel": 0.2028, + "loss_text": 1.4672, + "ppl": 5.3116, + "step": 1645 + }, + { + "epoch": 0.01, + "global_step": 1646, + "learning_rate": 0.0004939649415692821, + "loss": 1.6791, + "loss_base2": 2.4224, + "loss_pixel": 0.2014, + "loss_text": 1.4777, + "ppl": 5.3607, + "step": 1646 + }, + { + "epoch": 0.01, + "global_step": 1647, + "learning_rate": 0.0004939607679465776, + "loss": 1.655, + "loss_base2": 2.3877, + "loss_pixel": 0.2015, + "loss_text": 1.4536, + "ppl": 5.2331, + "step": 1647 + }, + { + "epoch": 0.01, + "global_step": 1648, + "learning_rate": 0.0004939565943238731, + "loss": 1.7048, + "loss_base2": 2.4595, + "loss_pixel": 0.203, + "loss_text": 1.5018, + "ppl": 5.5003, + "step": 1648 + }, + { + "epoch": 0.01, + "global_step": 1649, + "learning_rate": 0.0004939524207011686, + "loss": 1.6679, + "loss_base2": 2.4063, + "loss_pixel": 0.203, + "loss_text": 1.4649, + "ppl": 5.301, + "step": 1649 + }, + { + "epoch": 0.01, + "global_step": 1650, + "learning_rate": 0.0004939482470784642, + "loss": 1.6626, + "loss_base2": 2.3986, + "loss_pixel": 0.2026, + "loss_text": 1.4599, + "ppl": 5.273, + "step": 1650 + }, + { + "epoch": 0.01, + "global_step": 1651, + "learning_rate": 0.0004939440734557596, + "loss": 1.6789, + "loss_base2": 2.4221, + "loss_pixel": 0.2023, + "loss_text": 1.4765, + "ppl": 5.3597, + "step": 1651 + }, + { + "epoch": 0.01, + "global_step": 1652, + "learning_rate": 0.0004939398998330551, + "loss": 1.6489, + "loss_base2": 2.3789, + "loss_pixel": 0.2035, + "loss_text": 1.4453, + "ppl": 5.2013, + "step": 1652 + }, + { + "epoch": 0.01, + "global_step": 1653, + "learning_rate": 0.0004939357262103506, + "loss": 1.6628, + "loss_base2": 2.3989, + "loss_pixel": 0.2029, + "loss_text": 1.4599, + "ppl": 5.2741, + "step": 1653 + }, + { + "epoch": 0.01, + "global_step": 1654, + "learning_rate": 0.0004939315525876461, + "loss": 1.6662, + "loss_base2": 2.4038, + "loss_pixel": 0.2031, + "loss_text": 1.4631, + "ppl": 5.292, + "step": 1654 + }, + { + "epoch": 0.01, + "global_step": 1655, + "learning_rate": 0.0004939273789649416, + "loss": 1.6845, + "loss_base2": 2.4302, + "loss_pixel": 0.2026, + "loss_text": 1.482, + "ppl": 5.3898, + "step": 1655 + }, + { + "epoch": 0.01, + "global_step": 1656, + "learning_rate": 0.0004939232053422371, + "loss": 1.663, + "loss_base2": 2.3992, + "loss_pixel": 0.2017, + "loss_text": 1.4612, + "ppl": 5.2751, + "step": 1656 + }, + { + "epoch": 0.01, + "global_step": 1657, + "learning_rate": 0.0004939190317195326, + "loss": 1.67, + "loss_base2": 2.4093, + "loss_pixel": 0.2035, + "loss_text": 1.4664, + "ppl": 5.3122, + "step": 1657 + }, + { + "epoch": 0.01, + "global_step": 1658, + "learning_rate": 0.0004939148580968281, + "loss": 1.6609, + "loss_base2": 2.3962, + "loss_pixel": 0.204, + "loss_text": 1.4569, + "ppl": 5.264, + "step": 1658 + }, + { + "epoch": 0.01, + "global_step": 1659, + "learning_rate": 0.0004939106844741236, + "loss": 1.6711, + "loss_base2": 2.4109, + "loss_pixel": 0.2049, + "loss_text": 1.4662, + "ppl": 5.318, + "step": 1659 + }, + { + "epoch": 0.01, + "global_step": 1660, + "learning_rate": 0.000493906510851419, + "loss": 1.6646, + "loss_base2": 2.4015, + "loss_pixel": 0.204, + "loss_text": 1.4606, + "ppl": 5.2836, + "step": 1660 + }, + { + "epoch": 0.01, + "global_step": 1661, + "learning_rate": 0.0004939023372287145, + "loss": 1.6542, + "loss_base2": 2.3865, + "loss_pixel": 0.2037, + "loss_text": 1.4505, + "ppl": 5.2289, + "step": 1661 + }, + { + "epoch": 0.01, + "global_step": 1662, + "learning_rate": 0.00049389816360601, + "loss": 1.6576, + "loss_base2": 2.3914, + "loss_pixel": 0.2028, + "loss_text": 1.4548, + "ppl": 5.2467, + "step": 1662 + }, + { + "epoch": 0.01, + "global_step": 1663, + "learning_rate": 0.0004938939899833055, + "loss": 1.669, + "loss_base2": 2.4079, + "loss_pixel": 0.2043, + "loss_text": 1.4647, + "ppl": 5.3069, + "step": 1663 + }, + { + "epoch": 0.01, + "global_step": 1664, + "learning_rate": 0.0004938898163606009, + "loss": 1.672, + "loss_base2": 2.4122, + "loss_pixel": 0.2019, + "loss_text": 1.47, + "ppl": 5.3228, + "step": 1664 + }, + { + "epoch": 0.01, + "global_step": 1665, + "learning_rate": 0.0004938856427378964, + "loss": 1.6511, + "loss_base2": 2.382, + "loss_pixel": 0.2033, + "loss_text": 1.4478, + "ppl": 5.2127, + "step": 1665 + }, + { + "epoch": 0.01, + "global_step": 1666, + "learning_rate": 0.000493881469115192, + "loss": 1.6471, + "loss_base2": 2.3763, + "loss_pixel": 0.2016, + "loss_text": 1.4455, + "ppl": 5.1919, + "step": 1666 + }, + { + "epoch": 0.01, + "global_step": 1667, + "learning_rate": 0.0004938772954924875, + "loss": 1.6789, + "loss_base2": 2.4221, + "loss_pixel": 0.2028, + "loss_text": 1.4761, + "ppl": 5.3597, + "step": 1667 + }, + { + "epoch": 0.01, + "global_step": 1668, + "learning_rate": 0.000493873121869783, + "loss": 1.637, + "loss_base2": 2.3617, + "loss_pixel": 0.2021, + "loss_text": 1.4349, + "ppl": 5.1397, + "step": 1668 + }, + { + "epoch": 0.01, + "global_step": 1669, + "learning_rate": 0.0004938689482470785, + "loss": 1.6564, + "loss_base2": 2.3897, + "loss_pixel": 0.202, + "loss_text": 1.4543, + "ppl": 5.2404, + "step": 1669 + }, + { + "epoch": 0.01, + "global_step": 1670, + "learning_rate": 0.000493864774624374, + "loss": 1.8957, + "loss_base2": 2.7349, + "loss_pixel": 0.2013, + "loss_text": 1.6944, + "ppl": 6.6572, + "step": 1670 + }, + { + "epoch": 0.01, + "global_step": 1671, + "learning_rate": 0.0004938606010016695, + "loss": 1.7039, + "loss_base2": 2.4582, + "loss_pixel": 0.2016, + "loss_text": 1.5024, + "ppl": 5.4953, + "step": 1671 + }, + { + "epoch": 0.01, + "global_step": 1672, + "learning_rate": 0.000493856427378965, + "loss": 1.6651, + "loss_base2": 2.4022, + "loss_pixel": 0.2022, + "loss_text": 1.4629, + "ppl": 5.2862, + "step": 1672 + }, + { + "epoch": 0.01, + "global_step": 1673, + "learning_rate": 0.0004938522537562604, + "loss": 1.6533, + "loss_base2": 2.3852, + "loss_pixel": 0.202, + "loss_text": 1.4513, + "ppl": 5.2242, + "step": 1673 + }, + { + "epoch": 0.01, + "global_step": 1674, + "learning_rate": 0.0004938480801335559, + "loss": 1.6674, + "loss_base2": 2.4055, + "loss_pixel": 0.2012, + "loss_text": 1.4662, + "ppl": 5.2984, + "step": 1674 + }, + { + "epoch": 0.01, + "global_step": 1675, + "learning_rate": 0.0004938439065108514, + "loss": 1.6481, + "loss_base2": 2.3777, + "loss_pixel": 0.2014, + "loss_text": 1.4468, + "ppl": 5.1971, + "step": 1675 + }, + { + "epoch": 0.01, + "global_step": 1676, + "learning_rate": 0.0004938397328881469, + "loss": 1.652, + "loss_base2": 2.3833, + "loss_pixel": 0.2009, + "loss_text": 1.4511, + "ppl": 5.2174, + "step": 1676 + }, + { + "epoch": 0.01, + "global_step": 1677, + "learning_rate": 0.0004938355592654424, + "loss": 1.657, + "loss_base2": 2.3905, + "loss_pixel": 0.2008, + "loss_text": 1.4562, + "ppl": 5.2436, + "step": 1677 + }, + { + "epoch": 0.01, + "global_step": 1678, + "learning_rate": 0.0004938313856427379, + "loss": 1.6466, + "loss_base2": 2.3755, + "loss_pixel": 0.2025, + "loss_text": 1.4441, + "ppl": 5.1893, + "step": 1678 + }, + { + "epoch": 0.01, + "global_step": 1679, + "learning_rate": 0.0004938272120200334, + "loss": 1.6725, + "loss_base2": 2.4129, + "loss_pixel": 0.2013, + "loss_text": 1.4712, + "ppl": 5.3255, + "step": 1679 + }, + { + "epoch": 0.01, + "global_step": 1680, + "learning_rate": 0.0004938230383973289, + "loss": 1.8649, + "loss_base2": 2.6905, + "loss_pixel": 0.2012, + "loss_text": 1.6637, + "ppl": 6.4553, + "step": 1680 + }, + { + "epoch": 0.01, + "global_step": 1681, + "learning_rate": 0.0004938188647746244, + "loss": 1.9852, + "loss_base2": 2.864, + "loss_pixel": 0.2004, + "loss_text": 1.7848, + "ppl": 7.2805, + "step": 1681 + }, + { + "epoch": 0.01, + "global_step": 1682, + "learning_rate": 0.00049381469115192, + "loss": 1.9866, + "loss_base2": 2.8661, + "loss_pixel": 0.2021, + "loss_text": 1.7845, + "ppl": 7.2907, + "step": 1682 + }, + { + "epoch": 0.01, + "global_step": 1683, + "learning_rate": 0.0004938105175292154, + "loss": 1.9769, + "loss_base2": 2.8521, + "loss_pixel": 0.2018, + "loss_text": 1.7751, + "ppl": 7.2203, + "step": 1683 + }, + { + "epoch": 0.01, + "global_step": 1684, + "learning_rate": 0.0004938063439065109, + "loss": 1.9556, + "loss_base2": 2.8213, + "loss_pixel": 0.2043, + "loss_text": 1.7512, + "ppl": 7.0682, + "step": 1684 + }, + { + "epoch": 0.01, + "global_step": 1685, + "learning_rate": 0.0004938021702838064, + "loss": 1.9668, + "loss_base2": 2.8375, + "loss_pixel": 0.2002, + "loss_text": 1.7665, + "ppl": 7.1478, + "step": 1685 + }, + { + "epoch": 0.01, + "global_step": 1686, + "learning_rate": 0.0004937979966611019, + "loss": 1.9768, + "loss_base2": 2.8519, + "loss_pixel": 0.2004, + "loss_text": 1.7764, + "ppl": 7.2196, + "step": 1686 + }, + { + "epoch": 0.01, + "global_step": 1687, + "learning_rate": 0.0004937938230383973, + "loss": 1.9248, + "loss_base2": 2.7769, + "loss_pixel": 0.2002, + "loss_text": 1.7246, + "ppl": 6.8538, + "step": 1687 + }, + { + "epoch": 0.01, + "global_step": 1688, + "learning_rate": 0.0004937896494156928, + "loss": 1.9572, + "loss_base2": 2.8236, + "loss_pixel": 0.1999, + "loss_text": 1.7573, + "ppl": 7.0795, + "step": 1688 + }, + { + "epoch": 0.01, + "global_step": 1689, + "learning_rate": 0.0004937854757929883, + "loss": 1.9411, + "loss_base2": 2.8004, + "loss_pixel": 0.2005, + "loss_text": 1.7406, + "ppl": 6.9664, + "step": 1689 + }, + { + "epoch": 0.01, + "global_step": 1690, + "learning_rate": 0.0004937813021702838, + "loss": 1.9521, + "loss_base2": 2.8163, + "loss_pixel": 0.2016, + "loss_text": 1.7505, + "ppl": 7.0435, + "step": 1690 + }, + { + "epoch": 0.01, + "global_step": 1691, + "learning_rate": 0.0004937771285475793, + "loss": 1.9458, + "loss_base2": 2.8072, + "loss_pixel": 0.2, + "loss_text": 1.7458, + "ppl": 6.9992, + "step": 1691 + }, + { + "epoch": 0.01, + "global_step": 1692, + "learning_rate": 0.0004937729549248748, + "loss": 1.9557, + "loss_base2": 2.8215, + "loss_pixel": 0.1997, + "loss_text": 1.756, + "ppl": 7.0689, + "step": 1692 + }, + { + "epoch": 0.01, + "global_step": 1693, + "learning_rate": 0.0004937687813021703, + "loss": 1.9299, + "loss_base2": 2.7843, + "loss_pixel": 0.2, + "loss_text": 1.7298, + "ppl": 6.8888, + "step": 1693 + }, + { + "epoch": 0.01, + "global_step": 1694, + "learning_rate": 0.0004937646076794658, + "loss": 1.9441, + "loss_base2": 2.8047, + "loss_pixel": 0.202, + "loss_text": 1.7421, + "ppl": 6.9873, + "step": 1694 + }, + { + "epoch": 0.01, + "global_step": 1695, + "learning_rate": 0.0004937604340567613, + "loss": 1.953, + "loss_base2": 2.8176, + "loss_pixel": 0.2029, + "loss_text": 1.75, + "ppl": 7.0498, + "step": 1695 + }, + { + "epoch": 0.01, + "global_step": 1696, + "learning_rate": 0.0004937562604340567, + "loss": 1.9646, + "loss_base2": 2.8343, + "loss_pixel": 0.2053, + "loss_text": 1.7593, + "ppl": 7.1321, + "step": 1696 + }, + { + "epoch": 0.01, + "global_step": 1697, + "learning_rate": 0.0004937520868113522, + "loss": 1.9312, + "loss_base2": 2.7861, + "loss_pixel": 0.2057, + "loss_text": 1.7255, + "ppl": 6.8978, + "step": 1697 + }, + { + "epoch": 0.01, + "global_step": 1698, + "learning_rate": 0.0004937479131886477, + "loss": 1.9248, + "loss_base2": 2.7769, + "loss_pixel": 0.2039, + "loss_text": 1.7209, + "ppl": 6.8538, + "step": 1698 + }, + { + "epoch": 0.01, + "global_step": 1699, + "learning_rate": 0.0004937437395659433, + "loss": 1.9432, + "loss_base2": 2.8034, + "loss_pixel": 0.2028, + "loss_text": 1.7404, + "ppl": 6.9811, + "step": 1699 + }, + { + "epoch": 0.01, + "global_step": 1700, + "learning_rate": 0.0004937395659432388, + "loss": 1.9382, + "loss_base2": 2.7962, + "loss_pixel": 0.2029, + "loss_text": 1.7353, + "ppl": 6.9462, + "step": 1700 + }, + { + "epoch": 0.01, + "global_step": 1701, + "learning_rate": 0.0004937353923205343, + "loss": 1.9454, + "loss_base2": 2.8066, + "loss_pixel": 0.2038, + "loss_text": 1.7417, + "ppl": 6.9964, + "step": 1701 + }, + { + "epoch": 0.01, + "global_step": 1702, + "learning_rate": 0.0004937312186978297, + "loss": 1.944, + "loss_base2": 2.8046, + "loss_pixel": 0.2027, + "loss_text": 1.7414, + "ppl": 6.9866, + "step": 1702 + }, + { + "epoch": 0.01, + "global_step": 1703, + "learning_rate": 0.0004937270450751252, + "loss": 1.9395, + "loss_base2": 2.7981, + "loss_pixel": 0.2014, + "loss_text": 1.7381, + "ppl": 6.9553, + "step": 1703 + }, + { + "epoch": 0.01, + "global_step": 1704, + "learning_rate": 0.0004937228714524207, + "loss": 1.9481, + "loss_base2": 2.8105, + "loss_pixel": 0.2034, + "loss_text": 1.7447, + "ppl": 7.0153, + "step": 1704 + }, + { + "epoch": 0.01, + "global_step": 1705, + "learning_rate": 0.0004937186978297162, + "loss": 1.919, + "loss_base2": 2.7685, + "loss_pixel": 0.203, + "loss_text": 1.716, + "ppl": 6.8141, + "step": 1705 + }, + { + "epoch": 0.01, + "global_step": 1706, + "learning_rate": 0.0004937145242070117, + "loss": 1.9345, + "loss_base2": 2.7909, + "loss_pixel": 0.201, + "loss_text": 1.7335, + "ppl": 6.9206, + "step": 1706 + }, + { + "epoch": 0.01, + "global_step": 1707, + "learning_rate": 0.0004937103505843072, + "loss": 1.9291, + "loss_base2": 2.7831, + "loss_pixel": 0.2014, + "loss_text": 1.7278, + "ppl": 6.8833, + "step": 1707 + }, + { + "epoch": 0.01, + "global_step": 1708, + "learning_rate": 0.0004937061769616027, + "loss": 1.9242, + "loss_base2": 2.776, + "loss_pixel": 0.201, + "loss_text": 1.7232, + "ppl": 6.8497, + "step": 1708 + }, + { + "epoch": 0.01, + "global_step": 1709, + "learning_rate": 0.0004937020033388982, + "loss": 1.9251, + "loss_base2": 2.7773, + "loss_pixel": 0.2, + "loss_text": 1.7251, + "ppl": 6.8558, + "step": 1709 + }, + { + "epoch": 0.01, + "global_step": 1710, + "learning_rate": 0.0004936978297161936, + "loss": 1.9219, + "loss_base2": 2.7727, + "loss_pixel": 0.1999, + "loss_text": 1.7221, + "ppl": 6.8339, + "step": 1710 + }, + { + "epoch": 0.01, + "global_step": 1711, + "learning_rate": 0.0004936936560934891, + "loss": 1.9383, + "loss_base2": 2.7964, + "loss_pixel": 0.2015, + "loss_text": 1.7368, + "ppl": 6.9469, + "step": 1711 + }, + { + "epoch": 0.01, + "global_step": 1712, + "learning_rate": 0.0004936894824707846, + "loss": 1.9287, + "loss_base2": 2.7825, + "loss_pixel": 0.2012, + "loss_text": 1.7274, + "ppl": 6.8806, + "step": 1712 + }, + { + "epoch": 0.01, + "global_step": 1713, + "learning_rate": 0.0004936853088480801, + "loss": 1.9292, + "loss_base2": 2.7832, + "loss_pixel": 0.201, + "loss_text": 1.7283, + "ppl": 6.884, + "step": 1713 + }, + { + "epoch": 0.01, + "global_step": 1714, + "learning_rate": 0.0004936811352253756, + "loss": 1.9093, + "loss_base2": 2.7545, + "loss_pixel": 0.2008, + "loss_text": 1.7085, + "ppl": 6.7484, + "step": 1714 + }, + { + "epoch": 0.01, + "global_step": 1715, + "learning_rate": 0.0004936769616026712, + "loss": 1.9257, + "loss_base2": 2.7782, + "loss_pixel": 0.1988, + "loss_text": 1.7268, + "ppl": 6.8599, + "step": 1715 + }, + { + "epoch": 0.01, + "global_step": 1716, + "learning_rate": 0.0004936727879799667, + "loss": 1.909, + "loss_base2": 2.7541, + "loss_pixel": 0.1996, + "loss_text": 1.7093, + "ppl": 6.7463, + "step": 1716 + }, + { + "epoch": 0.01, + "global_step": 1717, + "learning_rate": 0.0004936686143572622, + "loss": 1.9343, + "loss_base2": 2.7906, + "loss_pixel": 0.2, + "loss_text": 1.7343, + "ppl": 6.9192, + "step": 1717 + }, + { + "epoch": 0.01, + "global_step": 1718, + "learning_rate": 0.0004936644407345577, + "loss": 1.9245, + "loss_base2": 2.7765, + "loss_pixel": 0.2011, + "loss_text": 1.7234, + "ppl": 6.8517, + "step": 1718 + }, + { + "epoch": 0.01, + "global_step": 1719, + "learning_rate": 0.0004936602671118531, + "loss": 1.9246, + "loss_base2": 2.7766, + "loss_pixel": 0.2001, + "loss_text": 1.7244, + "ppl": 6.8524, + "step": 1719 + }, + { + "epoch": 0.01, + "global_step": 1720, + "learning_rate": 0.0004936560934891486, + "loss": 1.915, + "loss_base2": 2.7628, + "loss_pixel": 0.1986, + "loss_text": 1.7164, + "ppl": 6.7869, + "step": 1720 + }, + { + "epoch": 0.01, + "global_step": 1721, + "learning_rate": 0.0004936519198664441, + "loss": 1.9157, + "loss_base2": 2.7638, + "loss_pixel": 0.1998, + "loss_text": 1.716, + "ppl": 6.7917, + "step": 1721 + }, + { + "epoch": 0.01, + "global_step": 1722, + "learning_rate": 0.0004936477462437396, + "loss": 1.9177, + "loss_base2": 2.7667, + "loss_pixel": 0.2061, + "loss_text": 1.7116, + "ppl": 6.8053, + "step": 1722 + }, + { + "epoch": 0.01, + "global_step": 1723, + "learning_rate": 0.000493643572621035, + "loss": 1.9272, + "loss_base2": 2.7804, + "loss_pixel": 0.2084, + "loss_text": 1.7188, + "ppl": 6.8702, + "step": 1723 + }, + { + "epoch": 0.01, + "global_step": 1724, + "learning_rate": 0.0004936393989983305, + "loss": 1.9402, + "loss_base2": 2.7991, + "loss_pixel": 0.2078, + "loss_text": 1.7324, + "ppl": 6.9601, + "step": 1724 + }, + { + "epoch": 0.01, + "global_step": 1725, + "learning_rate": 0.000493635225375626, + "loss": 1.9311, + "loss_base2": 2.786, + "loss_pixel": 0.2009, + "loss_text": 1.7302, + "ppl": 6.8971, + "step": 1725 + }, + { + "epoch": 0.01, + "global_step": 1726, + "learning_rate": 0.0004936310517529215, + "loss": 1.9125, + "loss_base2": 2.7592, + "loss_pixel": 0.2019, + "loss_text": 1.7106, + "ppl": 6.77, + "step": 1726 + }, + { + "epoch": 0.01, + "global_step": 1727, + "learning_rate": 0.000493626878130217, + "loss": 1.8909, + "loss_base2": 2.728, + "loss_pixel": 0.2011, + "loss_text": 1.6898, + "ppl": 6.6253, + "step": 1727 + }, + { + "epoch": 0.01, + "global_step": 1728, + "learning_rate": 0.0004936227045075125, + "loss": 1.7829, + "loss_base2": 2.5722, + "loss_pixel": 0.2021, + "loss_text": 1.5807, + "ppl": 5.9471, + "step": 1728 + }, + { + "epoch": 0.01, + "global_step": 1729, + "learning_rate": 0.000493618530884808, + "loss": 1.6612, + "loss_base2": 2.3966, + "loss_pixel": 0.1987, + "loss_text": 1.4625, + "ppl": 5.2656, + "step": 1729 + }, + { + "epoch": 0.01, + "global_step": 1730, + "learning_rate": 0.0004936143572621035, + "loss": 1.6467, + "loss_base2": 2.3757, + "loss_pixel": 0.2002, + "loss_text": 1.4465, + "ppl": 5.1898, + "step": 1730 + }, + { + "epoch": 0.01, + "global_step": 1731, + "learning_rate": 0.0004936101836393991, + "loss": 1.6578, + "loss_base2": 2.3917, + "loss_pixel": 0.1979, + "loss_text": 1.4598, + "ppl": 5.2478, + "step": 1731 + }, + { + "epoch": 0.01, + "global_step": 1732, + "learning_rate": 0.0004936060100166945, + "loss": 1.6462, + "loss_base2": 2.375, + "loss_pixel": 0.1992, + "loss_text": 1.447, + "ppl": 5.1872, + "step": 1732 + }, + { + "epoch": 0.01, + "global_step": 1733, + "learning_rate": 0.00049360183639399, + "loss": 1.6556, + "loss_base2": 2.3885, + "loss_pixel": 0.1993, + "loss_text": 1.4563, + "ppl": 5.2362, + "step": 1733 + }, + { + "epoch": 0.01, + "global_step": 1734, + "learning_rate": 0.0004935976627712855, + "loss": 1.6629, + "loss_base2": 2.3991, + "loss_pixel": 0.1967, + "loss_text": 1.4662, + "ppl": 5.2746, + "step": 1734 + }, + { + "epoch": 0.01, + "global_step": 1735, + "learning_rate": 0.000493593489148581, + "loss": 1.6479, + "loss_base2": 2.3774, + "loss_pixel": 0.1995, + "loss_text": 1.4484, + "ppl": 5.1961, + "step": 1735 + }, + { + "epoch": 0.01, + "global_step": 1736, + "learning_rate": 0.0004935893155258765, + "loss": 1.6387, + "loss_base2": 2.3641, + "loss_pixel": 0.1974, + "loss_text": 1.4412, + "ppl": 5.1485, + "step": 1736 + }, + { + "epoch": 0.01, + "global_step": 1737, + "learning_rate": 0.000493585141903172, + "loss": 1.6464, + "loss_base2": 2.3753, + "loss_pixel": 0.1956, + "loss_text": 1.4508, + "ppl": 5.1883, + "step": 1737 + }, + { + "epoch": 0.01, + "global_step": 1738, + "learning_rate": 0.0004935809682804675, + "loss": 1.6411, + "loss_base2": 2.3676, + "loss_pixel": 0.1968, + "loss_text": 1.4443, + "ppl": 5.1608, + "step": 1738 + }, + { + "epoch": 0.01, + "global_step": 1739, + "learning_rate": 0.0004935767946577629, + "loss": 1.6365, + "loss_base2": 2.361, + "loss_pixel": 0.1949, + "loss_text": 1.4416, + "ppl": 5.1372, + "step": 1739 + }, + { + "epoch": 0.01, + "global_step": 1740, + "learning_rate": 0.0004935726210350584, + "loss": 1.654, + "loss_base2": 2.3862, + "loss_pixel": 0.1967, + "loss_text": 1.4573, + "ppl": 5.2278, + "step": 1740 + }, + { + "epoch": 0.01, + "global_step": 1741, + "learning_rate": 0.0004935684474123539, + "loss": 1.6485, + "loss_base2": 2.3783, + "loss_pixel": 0.196, + "loss_text": 1.4525, + "ppl": 5.1992, + "step": 1741 + }, + { + "epoch": 0.01, + "global_step": 1742, + "learning_rate": 0.0004935642737896494, + "loss": 1.664, + "loss_base2": 2.4006, + "loss_pixel": 0.2075, + "loss_text": 1.4565, + "ppl": 5.2804, + "step": 1742 + }, + { + "epoch": 0.01, + "global_step": 1743, + "learning_rate": 0.0004935601001669449, + "loss": 1.7426, + "loss_base2": 2.514, + "loss_pixel": 0.2116, + "loss_text": 1.531, + "ppl": 5.7122, + "step": 1743 + }, + { + "epoch": 0.01, + "global_step": 1744, + "learning_rate": 0.0004935559265442404, + "loss": 1.8725, + "loss_base2": 2.7014, + "loss_pixel": 0.2089, + "loss_text": 1.6636, + "ppl": 6.5045, + "step": 1744 + }, + { + "epoch": 0.01, + "global_step": 1745, + "learning_rate": 0.0004935517529215359, + "loss": 1.8657, + "loss_base2": 2.6916, + "loss_pixel": 0.2046, + "loss_text": 1.6611, + "ppl": 6.4605, + "step": 1745 + }, + { + "epoch": 0.01, + "global_step": 1746, + "learning_rate": 0.0004935475792988313, + "loss": 1.7757, + "loss_base2": 2.5618, + "loss_pixel": 0.2031, + "loss_text": 1.5726, + "ppl": 5.9044, + "step": 1746 + }, + { + "epoch": 0.01, + "global_step": 1747, + "learning_rate": 0.0004935434056761268, + "loss": 1.6795, + "loss_base2": 2.423, + "loss_pixel": 0.2028, + "loss_text": 1.4767, + "ppl": 5.3629, + "step": 1747 + }, + { + "epoch": 0.01, + "global_step": 1748, + "learning_rate": 0.0004935392320534224, + "loss": 1.6433, + "loss_base2": 2.3708, + "loss_pixel": 0.2028, + "loss_text": 1.4405, + "ppl": 5.1722, + "step": 1748 + }, + { + "epoch": 0.01, + "global_step": 1749, + "learning_rate": 0.0004935350584307179, + "loss": 1.6744, + "loss_base2": 2.4156, + "loss_pixel": 0.2026, + "loss_text": 1.4718, + "ppl": 5.3356, + "step": 1749 + }, + { + "epoch": 0.01, + "global_step": 1750, + "learning_rate": 0.0004935308848080134, + "loss": 1.6527, + "loss_base2": 2.3843, + "loss_pixel": 0.2018, + "loss_text": 1.4508, + "ppl": 5.2211, + "step": 1750 + }, + { + "epoch": 0.01, + "global_step": 1751, + "learning_rate": 0.0004935267111853089, + "loss": 1.6574, + "loss_base2": 2.3911, + "loss_pixel": 0.2017, + "loss_text": 1.4557, + "ppl": 5.2457, + "step": 1751 + }, + { + "epoch": 0.01, + "global_step": 1752, + "learning_rate": 0.0004935225375626044, + "loss": 1.6592, + "loss_base2": 2.3937, + "loss_pixel": 0.2008, + "loss_text": 1.4585, + "ppl": 5.2551, + "step": 1752 + }, + { + "epoch": 0.01, + "global_step": 1753, + "learning_rate": 0.0004935183639398999, + "loss": 1.7047, + "loss_base2": 2.4594, + "loss_pixel": 0.2004, + "loss_text": 1.5043, + "ppl": 5.4997, + "step": 1753 + }, + { + "epoch": 0.01, + "global_step": 1754, + "learning_rate": 0.0004935141903171954, + "loss": 1.9606, + "loss_base2": 2.8285, + "loss_pixel": 0.2015, + "loss_text": 1.7591, + "ppl": 7.1036, + "step": 1754 + }, + { + "epoch": 0.01, + "global_step": 1755, + "learning_rate": 0.0004935100166944908, + "loss": 1.9749, + "loss_base2": 2.8492, + "loss_pixel": 0.2008, + "loss_text": 1.7741, + "ppl": 7.2059, + "step": 1755 + }, + { + "epoch": 0.01, + "global_step": 1756, + "learning_rate": 0.0004935058430717863, + "loss": 1.9532, + "loss_base2": 2.8179, + "loss_pixel": 0.1997, + "loss_text": 1.7535, + "ppl": 7.0512, + "step": 1756 + }, + { + "epoch": 0.01, + "global_step": 1757, + "learning_rate": 0.0004935016694490818, + "loss": 1.9574, + "loss_base2": 2.8239, + "loss_pixel": 0.2005, + "loss_text": 1.7569, + "ppl": 7.0809, + "step": 1757 + }, + { + "epoch": 0.01, + "global_step": 1758, + "learning_rate": 0.0004934974958263773, + "loss": 1.9487, + "loss_base2": 2.8114, + "loss_pixel": 0.201, + "loss_text": 1.7478, + "ppl": 7.0196, + "step": 1758 + }, + { + "epoch": 0.01, + "global_step": 1759, + "learning_rate": 0.0004934933222036728, + "loss": 1.9598, + "loss_base2": 2.8274, + "loss_pixel": 0.1998, + "loss_text": 1.7601, + "ppl": 7.0979, + "step": 1759 + }, + { + "epoch": 0.01, + "global_step": 1760, + "learning_rate": 0.0004934891485809682, + "loss": 1.9349, + "loss_base2": 2.7915, + "loss_pixel": 0.2004, + "loss_text": 1.7345, + "ppl": 6.9234, + "step": 1760 + }, + { + "epoch": 0.01, + "global_step": 1761, + "learning_rate": 0.0004934849749582637, + "loss": 1.9449, + "loss_base2": 2.8059, + "loss_pixel": 0.1997, + "loss_text": 1.7452, + "ppl": 6.9929, + "step": 1761 + }, + { + "epoch": 0.01, + "global_step": 1762, + "learning_rate": 0.0004934808013355592, + "loss": 1.9395, + "loss_base2": 2.7981, + "loss_pixel": 0.1998, + "loss_text": 1.7397, + "ppl": 6.9553, + "step": 1762 + }, + { + "epoch": 0.01, + "global_step": 1763, + "learning_rate": 0.0004934766277128547, + "loss": 1.9273, + "loss_base2": 2.7805, + "loss_pixel": 0.1987, + "loss_text": 1.7285, + "ppl": 6.8709, + "step": 1763 + }, + { + "epoch": 0.01, + "global_step": 1764, + "learning_rate": 0.0004934724540901503, + "loss": 1.938, + "loss_base2": 2.7959, + "loss_pixel": 0.1992, + "loss_text": 1.7388, + "ppl": 6.9448, + "step": 1764 + }, + { + "epoch": 0.01, + "global_step": 1765, + "learning_rate": 0.0004934682804674458, + "loss": 1.9189, + "loss_base2": 2.7684, + "loss_pixel": 0.1984, + "loss_text": 1.7205, + "ppl": 6.8135, + "step": 1765 + }, + { + "epoch": 0.01, + "global_step": 1766, + "learning_rate": 0.0004934641068447413, + "loss": 1.9314, + "loss_base2": 2.7864, + "loss_pixel": 0.1981, + "loss_text": 1.7332, + "ppl": 6.8992, + "step": 1766 + }, + { + "epoch": 0.01, + "global_step": 1767, + "learning_rate": 0.0004934599332220368, + "loss": 1.9408, + "loss_base2": 2.8, + "loss_pixel": 0.1988, + "loss_text": 1.742, + "ppl": 6.9643, + "step": 1767 + }, + { + "epoch": 0.01, + "global_step": 1768, + "learning_rate": 0.0004934557595993323, + "loss": 1.9244, + "loss_base2": 2.7763, + "loss_pixel": 0.1989, + "loss_text": 1.7255, + "ppl": 6.851, + "step": 1768 + }, + { + "epoch": 0.01, + "global_step": 1769, + "learning_rate": 0.0004934515859766277, + "loss": 1.9848, + "loss_base2": 2.8635, + "loss_pixel": 0.1994, + "loss_text": 1.7854, + "ppl": 7.2776, + "step": 1769 + }, + { + "epoch": 0.01, + "global_step": 1770, + "learning_rate": 0.0004934474123539232, + "loss": 1.9402, + "loss_base2": 2.7991, + "loss_pixel": 0.1987, + "loss_text": 1.7416, + "ppl": 6.9601, + "step": 1770 + }, + { + "epoch": 0.01, + "global_step": 1771, + "learning_rate": 0.0004934432387312187, + "loss": 1.9265, + "loss_base2": 2.7794, + "loss_pixel": 0.1988, + "loss_text": 1.7277, + "ppl": 6.8654, + "step": 1771 + }, + { + "epoch": 0.01, + "global_step": 1772, + "learning_rate": 0.0004934390651085142, + "loss": 1.9101, + "loss_base2": 2.7557, + "loss_pixel": 0.1988, + "loss_text": 1.7113, + "ppl": 6.7538, + "step": 1772 + }, + { + "epoch": 0.01, + "global_step": 1773, + "learning_rate": 0.0004934348914858097, + "loss": 1.9309, + "loss_base2": 2.7857, + "loss_pixel": 0.1987, + "loss_text": 1.7322, + "ppl": 6.8957, + "step": 1773 + }, + { + "epoch": 0.01, + "global_step": 1774, + "learning_rate": 0.0004934307178631052, + "loss": 1.9135, + "loss_base2": 2.7606, + "loss_pixel": 0.1984, + "loss_text": 1.7152, + "ppl": 6.7768, + "step": 1774 + }, + { + "epoch": 0.01, + "global_step": 1775, + "learning_rate": 0.0004934265442404007, + "loss": 1.9232, + "loss_base2": 2.7746, + "loss_pixel": 0.1987, + "loss_text": 1.7245, + "ppl": 6.8428, + "step": 1775 + }, + { + "epoch": 0.01, + "global_step": 1776, + "learning_rate": 0.0004934223706176962, + "loss": 1.9189, + "loss_base2": 2.7684, + "loss_pixel": 0.1991, + "loss_text": 1.7197, + "ppl": 6.8135, + "step": 1776 + }, + { + "epoch": 0.01, + "global_step": 1777, + "learning_rate": 0.0004934181969949916, + "loss": 1.9131, + "loss_base2": 2.76, + "loss_pixel": 0.1979, + "loss_text": 1.7153, + "ppl": 6.7741, + "step": 1777 + }, + { + "epoch": 0.01, + "global_step": 1778, + "learning_rate": 0.0004934140233722871, + "loss": 1.9178, + "loss_base2": 2.7668, + "loss_pixel": 0.2014, + "loss_text": 1.7164, + "ppl": 6.806, + "step": 1778 + }, + { + "epoch": 0.01, + "global_step": 1779, + "learning_rate": 0.0004934098497495826, + "loss": 1.9241, + "loss_base2": 2.7759, + "loss_pixel": 0.2009, + "loss_text": 1.7232, + "ppl": 6.849, + "step": 1779 + }, + { + "epoch": 0.01, + "global_step": 1780, + "learning_rate": 0.0004934056761268782, + "loss": 1.9182, + "loss_base2": 2.7674, + "loss_pixel": 0.2063, + "loss_text": 1.7119, + "ppl": 6.8087, + "step": 1780 + }, + { + "epoch": 0.01, + "global_step": 1781, + "learning_rate": 0.0004934015025041737, + "loss": 1.9454, + "loss_base2": 2.8066, + "loss_pixel": 0.2182, + "loss_text": 1.7272, + "ppl": 6.9964, + "step": 1781 + }, + { + "epoch": 0.01, + "global_step": 1782, + "learning_rate": 0.0004933973288814691, + "loss": 1.9358, + "loss_base2": 2.7928, + "loss_pixel": 0.2147, + "loss_text": 1.7211, + "ppl": 6.9296, + "step": 1782 + }, + { + "epoch": 0.01, + "global_step": 1783, + "learning_rate": 0.0004933931552587646, + "loss": 1.9391, + "loss_base2": 2.7975, + "loss_pixel": 0.2135, + "loss_text": 1.7257, + "ppl": 6.9525, + "step": 1783 + }, + { + "epoch": 0.01, + "global_step": 1784, + "learning_rate": 0.0004933889816360601, + "loss": 1.926, + "loss_base2": 2.7786, + "loss_pixel": 0.2151, + "loss_text": 1.7109, + "ppl": 6.862, + "step": 1784 + }, + { + "epoch": 0.01, + "global_step": 1785, + "learning_rate": 0.0004933848080133556, + "loss": 1.9503, + "loss_base2": 2.8137, + "loss_pixel": 0.2113, + "loss_text": 1.739, + "ppl": 7.0308, + "step": 1785 + }, + { + "epoch": 0.01, + "global_step": 1786, + "learning_rate": 0.0004933806343906511, + "loss": 1.9449, + "loss_base2": 2.8059, + "loss_pixel": 0.2122, + "loss_text": 1.7326, + "ppl": 6.9929, + "step": 1786 + }, + { + "epoch": 0.01, + "global_step": 1787, + "learning_rate": 0.0004933764607679466, + "loss": 1.9142, + "loss_base2": 2.7616, + "loss_pixel": 0.2098, + "loss_text": 1.7044, + "ppl": 6.7815, + "step": 1787 + }, + { + "epoch": 0.01, + "global_step": 1788, + "learning_rate": 0.0004933722871452421, + "loss": 1.9108, + "loss_base2": 2.7567, + "loss_pixel": 0.2092, + "loss_text": 1.7016, + "ppl": 6.7585, + "step": 1788 + }, + { + "epoch": 0.01, + "global_step": 1789, + "learning_rate": 0.0004933681135225376, + "loss": 1.9167, + "loss_base2": 2.7652, + "loss_pixel": 0.2118, + "loss_text": 1.7048, + "ppl": 6.7985, + "step": 1789 + }, + { + "epoch": 0.01, + "global_step": 1790, + "learning_rate": 0.0004933639398998331, + "loss": 1.919, + "loss_base2": 2.7685, + "loss_pixel": 0.2088, + "loss_text": 1.7101, + "ppl": 6.8141, + "step": 1790 + }, + { + "epoch": 0.01, + "global_step": 1791, + "learning_rate": 0.0004933597662771286, + "loss": 1.9268, + "loss_base2": 2.7798, + "loss_pixel": 0.2085, + "loss_text": 1.7183, + "ppl": 6.8675, + "step": 1791 + }, + { + "epoch": 0.01, + "global_step": 1792, + "learning_rate": 0.000493355592654424, + "loss": 1.9314, + "loss_base2": 2.7864, + "loss_pixel": 0.2075, + "loss_text": 1.7239, + "ppl": 6.8992, + "step": 1792 + }, + { + "epoch": 0.01, + "global_step": 1793, + "learning_rate": 0.0004933514190317195, + "loss": 1.9154, + "loss_base2": 2.7633, + "loss_pixel": 0.2063, + "loss_text": 1.7091, + "ppl": 6.7897, + "step": 1793 + }, + { + "epoch": 0.01, + "global_step": 1794, + "learning_rate": 0.000493347245409015, + "loss": 1.9264, + "loss_base2": 2.7792, + "loss_pixel": 0.205, + "loss_text": 1.7213, + "ppl": 6.8648, + "step": 1794 + }, + { + "epoch": 0.01, + "global_step": 1795, + "learning_rate": 0.0004933430717863105, + "loss": 1.9231, + "loss_base2": 2.7744, + "loss_pixel": 0.2057, + "loss_text": 1.7173, + "ppl": 6.8421, + "step": 1795 + }, + { + "epoch": 0.01, + "global_step": 1796, + "learning_rate": 0.000493338898163606, + "loss": 1.927, + "loss_base2": 2.7801, + "loss_pixel": 0.2033, + "loss_text": 1.7237, + "ppl": 6.8689, + "step": 1796 + }, + { + "epoch": 0.01, + "global_step": 1797, + "learning_rate": 0.0004933347245409015, + "loss": 1.9335, + "loss_base2": 2.7895, + "loss_pixel": 0.2033, + "loss_text": 1.7302, + "ppl": 6.9137, + "step": 1797 + }, + { + "epoch": 0.01, + "global_step": 1798, + "learning_rate": 0.000493330550918197, + "loss": 1.9167, + "loss_base2": 2.7652, + "loss_pixel": 0.2021, + "loss_text": 1.7146, + "ppl": 6.7985, + "step": 1798 + }, + { + "epoch": 0.01, + "global_step": 1799, + "learning_rate": 0.0004933263772954925, + "loss": 1.908, + "loss_base2": 2.7527, + "loss_pixel": 0.2029, + "loss_text": 1.705, + "ppl": 6.7396, + "step": 1799 + }, + { + "epoch": 0.01, + "global_step": 1800, + "learning_rate": 0.000493322203672788, + "loss": 1.9047, + "loss_base2": 2.7479, + "loss_pixel": 0.2014, + "loss_text": 1.7033, + "ppl": 6.7174, + "step": 1800 + }, + { + "epoch": 0.01, + "global_step": 1801, + "learning_rate": 0.0004933180300500835, + "loss": 1.8963, + "loss_base2": 2.7358, + "loss_pixel": 0.2021, + "loss_text": 1.6942, + "ppl": 6.6612, + "step": 1801 + }, + { + "epoch": 0.01, + "global_step": 1802, + "learning_rate": 0.000493313856427379, + "loss": 1.9144, + "loss_base2": 2.7619, + "loss_pixel": 0.2025, + "loss_text": 1.7119, + "ppl": 6.7829, + "step": 1802 + }, + { + "epoch": 0.01, + "global_step": 1803, + "learning_rate": 0.0004933096828046745, + "loss": 1.9008, + "loss_base2": 2.7423, + "loss_pixel": 0.2002, + "loss_text": 1.7006, + "ppl": 6.6912, + "step": 1803 + }, + { + "epoch": 0.01, + "global_step": 1804, + "learning_rate": 0.00049330550918197, + "loss": 1.6706, + "loss_base2": 2.4102, + "loss_pixel": 0.2013, + "loss_text": 1.4693, + "ppl": 5.3154, + "step": 1804 + }, + { + "epoch": 0.01, + "global_step": 1805, + "learning_rate": 0.0004933013355592654, + "loss": 1.6612, + "loss_base2": 2.3966, + "loss_pixel": 0.2004, + "loss_text": 1.4608, + "ppl": 5.2656, + "step": 1805 + }, + { + "epoch": 0.01, + "global_step": 1806, + "learning_rate": 0.0004932971619365609, + "loss": 1.6745, + "loss_base2": 2.4158, + "loss_pixel": 0.2018, + "loss_text": 1.4728, + "ppl": 5.3361, + "step": 1806 + }, + { + "epoch": 0.01, + "global_step": 1807, + "learning_rate": 0.0004932929883138564, + "loss": 1.6559, + "loss_base2": 2.389, + "loss_pixel": 0.1995, + "loss_text": 1.4564, + "ppl": 5.2378, + "step": 1807 + }, + { + "epoch": 0.01, + "global_step": 1808, + "learning_rate": 0.0004932888146911519, + "loss": 1.6321, + "loss_base2": 2.3546, + "loss_pixel": 0.2001, + "loss_text": 1.432, + "ppl": 5.1146, + "step": 1808 + }, + { + "epoch": 0.01, + "global_step": 1809, + "learning_rate": 0.0004932846410684474, + "loss": 1.6492, + "loss_base2": 2.3793, + "loss_pixel": 0.201, + "loss_text": 1.4482, + "ppl": 5.2028, + "step": 1809 + }, + { + "epoch": 0.01, + "global_step": 1810, + "learning_rate": 0.0004932804674457429, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1985, + "loss_text": 1.4274, + "ppl": 5.0835, + "step": 1810 + }, + { + "epoch": 0.01, + "global_step": 1811, + "learning_rate": 0.0004932762938230384, + "loss": 1.8257, + "loss_base2": 2.6339, + "loss_pixel": 0.1992, + "loss_text": 1.6265, + "ppl": 6.2071, + "step": 1811 + }, + { + "epoch": 0.01, + "global_step": 1812, + "learning_rate": 0.000493272120200334, + "loss": 1.9303, + "loss_base2": 2.7848, + "loss_pixel": 0.1991, + "loss_text": 1.7312, + "ppl": 6.8916, + "step": 1812 + }, + { + "epoch": 0.01, + "global_step": 1813, + "learning_rate": 0.0004932679465776295, + "loss": 1.9323, + "loss_base2": 2.7877, + "loss_pixel": 0.1983, + "loss_text": 1.734, + "ppl": 6.9054, + "step": 1813 + }, + { + "epoch": 0.01, + "global_step": 1814, + "learning_rate": 0.0004932637729549249, + "loss": 1.9068, + "loss_base2": 2.7509, + "loss_pixel": 0.1997, + "loss_text": 1.7071, + "ppl": 6.7315, + "step": 1814 + }, + { + "epoch": 0.01, + "global_step": 1815, + "learning_rate": 0.0004932595993322204, + "loss": 1.9144, + "loss_base2": 2.7619, + "loss_pixel": 0.1999, + "loss_text": 1.7144, + "ppl": 6.7829, + "step": 1815 + }, + { + "epoch": 0.01, + "global_step": 1816, + "learning_rate": 0.0004932554257095159, + "loss": 1.906, + "loss_base2": 2.7498, + "loss_pixel": 0.1985, + "loss_text": 1.7075, + "ppl": 6.7261, + "step": 1816 + }, + { + "epoch": 0.01, + "global_step": 1817, + "learning_rate": 0.0004932512520868114, + "loss": 1.9181, + "loss_base2": 2.7672, + "loss_pixel": 0.1973, + "loss_text": 1.7208, + "ppl": 6.808, + "step": 1817 + }, + { + "epoch": 0.01, + "global_step": 1818, + "learning_rate": 0.0004932470784641069, + "loss": 1.9421, + "loss_base2": 2.8019, + "loss_pixel": 0.1976, + "loss_text": 1.7445, + "ppl": 6.9734, + "step": 1818 + }, + { + "epoch": 0.01, + "global_step": 1819, + "learning_rate": 0.0004932429048414023, + "loss": 1.9237, + "loss_base2": 2.7753, + "loss_pixel": 0.1986, + "loss_text": 1.725, + "ppl": 6.8462, + "step": 1819 + }, + { + "epoch": 0.01, + "global_step": 1820, + "learning_rate": 0.0004932387312186978, + "loss": 1.9032, + "loss_base2": 2.7457, + "loss_pixel": 0.1969, + "loss_text": 1.7063, + "ppl": 6.7073, + "step": 1820 + }, + { + "epoch": 0.01, + "global_step": 1821, + "learning_rate": 0.0004932345575959933, + "loss": 1.9215, + "loss_base2": 2.7721, + "loss_pixel": 0.198, + "loss_text": 1.7236, + "ppl": 6.8312, + "step": 1821 + }, + { + "epoch": 0.01, + "global_step": 1822, + "learning_rate": 0.0004932303839732888, + "loss": 1.8967, + "loss_base2": 2.7364, + "loss_pixel": 0.1978, + "loss_text": 1.6989, + "ppl": 6.6639, + "step": 1822 + }, + { + "epoch": 0.01, + "global_step": 1823, + "learning_rate": 0.0004932262103505843, + "loss": 1.9015, + "loss_base2": 2.7433, + "loss_pixel": 0.198, + "loss_text": 1.7035, + "ppl": 6.6959, + "step": 1823 + }, + { + "epoch": 0.01, + "global_step": 1824, + "learning_rate": 0.0004932220367278798, + "loss": 1.9058, + "loss_base2": 2.7495, + "loss_pixel": 0.1978, + "loss_text": 1.708, + "ppl": 6.7248, + "step": 1824 + }, + { + "epoch": 0.01, + "global_step": 1825, + "learning_rate": 0.0004932178631051753, + "loss": 1.904, + "loss_base2": 2.7469, + "loss_pixel": 0.1994, + "loss_text": 1.7046, + "ppl": 6.7127, + "step": 1825 + }, + { + "epoch": 0.01, + "global_step": 1826, + "learning_rate": 0.0004932136894824708, + "loss": 1.9017, + "loss_base2": 2.7436, + "loss_pixel": 0.1984, + "loss_text": 1.7033, + "ppl": 6.6973, + "step": 1826 + }, + { + "epoch": 0.01, + "global_step": 1827, + "learning_rate": 0.0004932095158597663, + "loss": 1.9139, + "loss_base2": 2.7612, + "loss_pixel": 0.1983, + "loss_text": 1.7156, + "ppl": 6.7795, + "step": 1827 + }, + { + "epoch": 0.01, + "global_step": 1828, + "learning_rate": 0.0004932053422370617, + "loss": 1.904, + "loss_base2": 2.7469, + "loss_pixel": 0.1976, + "loss_text": 1.7064, + "ppl": 6.7127, + "step": 1828 + }, + { + "epoch": 0.01, + "global_step": 1829, + "learning_rate": 0.0004932011686143573, + "loss": 1.9154, + "loss_base2": 2.7633, + "loss_pixel": 0.1979, + "loss_text": 1.7175, + "ppl": 6.7897, + "step": 1829 + }, + { + "epoch": 0.01, + "global_step": 1830, + "learning_rate": 0.0004931969949916528, + "loss": 1.9029, + "loss_base2": 2.7453, + "loss_pixel": 0.197, + "loss_text": 1.7059, + "ppl": 6.7053, + "step": 1830 + }, + { + "epoch": 0.01, + "global_step": 1831, + "learning_rate": 0.0004931928213689483, + "loss": 1.8998, + "loss_base2": 2.7408, + "loss_pixel": 0.1985, + "loss_text": 1.7013, + "ppl": 6.6846, + "step": 1831 + }, + { + "epoch": 0.01, + "global_step": 1832, + "learning_rate": 0.0004931886477462438, + "loss": 1.8929, + "loss_base2": 2.7309, + "loss_pixel": 0.1979, + "loss_text": 1.695, + "ppl": 6.6386, + "step": 1832 + }, + { + "epoch": 0.01, + "global_step": 1833, + "learning_rate": 0.0004931844741235392, + "loss": 1.8587, + "loss_base2": 2.6815, + "loss_pixel": 0.1979, + "loss_text": 1.6608, + "ppl": 6.4154, + "step": 1833 + }, + { + "epoch": 0.01, + "global_step": 1834, + "learning_rate": 0.0004931803005008347, + "loss": 1.9084, + "loss_base2": 2.7532, + "loss_pixel": 0.1973, + "loss_text": 1.7111, + "ppl": 6.7423, + "step": 1834 + }, + { + "epoch": 0.01, + "global_step": 1835, + "learning_rate": 0.0004931761268781302, + "loss": 1.92, + "loss_base2": 2.77, + "loss_pixel": 0.198, + "loss_text": 1.722, + "ppl": 6.821, + "step": 1835 + }, + { + "epoch": 0.01, + "global_step": 1836, + "learning_rate": 0.0004931719532554257, + "loss": 1.8989, + "loss_base2": 2.7395, + "loss_pixel": 0.1975, + "loss_text": 1.7014, + "ppl": 6.6785, + "step": 1836 + }, + { + "epoch": 0.01, + "global_step": 1837, + "learning_rate": 0.0004931677796327212, + "loss": 1.8879, + "loss_base2": 2.7237, + "loss_pixel": 0.1965, + "loss_text": 1.6914, + "ppl": 6.6055, + "step": 1837 + }, + { + "epoch": 0.01, + "global_step": 1838, + "learning_rate": 0.0004931636060100167, + "loss": 1.9276, + "loss_base2": 2.7809, + "loss_pixel": 0.1976, + "loss_text": 1.73, + "ppl": 6.873, + "step": 1838 + }, + { + "epoch": 0.01, + "global_step": 1839, + "learning_rate": 0.0004931594323873122, + "loss": 1.9122, + "loss_base2": 2.7587, + "loss_pixel": 0.1968, + "loss_text": 1.7153, + "ppl": 6.768, + "step": 1839 + }, + { + "epoch": 0.01, + "global_step": 1840, + "learning_rate": 0.0004931552587646077, + "loss": 1.9026, + "loss_base2": 2.7449, + "loss_pixel": 0.198, + "loss_text": 1.7046, + "ppl": 6.7033, + "step": 1840 + }, + { + "epoch": 0.01, + "global_step": 1841, + "learning_rate": 0.0004931510851419031, + "loss": 1.8958, + "loss_base2": 2.7351, + "loss_pixel": 0.1973, + "loss_text": 1.6985, + "ppl": 6.6579, + "step": 1841 + }, + { + "epoch": 0.01, + "global_step": 1842, + "learning_rate": 0.0004931469115191986, + "loss": 1.8904, + "loss_base2": 2.7273, + "loss_pixel": 0.1974, + "loss_text": 1.693, + "ppl": 6.622, + "step": 1842 + }, + { + "epoch": 0.01, + "global_step": 1843, + "learning_rate": 0.0004931427378964941, + "loss": 1.899, + "loss_base2": 2.7397, + "loss_pixel": 0.1972, + "loss_text": 1.7018, + "ppl": 6.6792, + "step": 1843 + }, + { + "epoch": 0.01, + "global_step": 1844, + "learning_rate": 0.0004931385642737896, + "loss": 1.9077, + "loss_base2": 2.7522, + "loss_pixel": 0.1975, + "loss_text": 1.7102, + "ppl": 6.7376, + "step": 1844 + }, + { + "epoch": 0.01, + "global_step": 1845, + "learning_rate": 0.0004931343906510852, + "loss": 1.8991, + "loss_base2": 2.7398, + "loss_pixel": 0.1963, + "loss_text": 1.7027, + "ppl": 6.6799, + "step": 1845 + }, + { + "epoch": 0.01, + "global_step": 1846, + "learning_rate": 0.0004931302170283807, + "loss": 1.9094, + "loss_base2": 2.7547, + "loss_pixel": 0.1977, + "loss_text": 1.7117, + "ppl": 6.749, + "step": 1846 + }, + { + "epoch": 0.01, + "global_step": 1847, + "learning_rate": 0.0004931260434056762, + "loss": 1.907, + "loss_base2": 2.7512, + "loss_pixel": 0.198, + "loss_text": 1.709, + "ppl": 6.7329, + "step": 1847 + }, + { + "epoch": 0.01, + "global_step": 1848, + "learning_rate": 0.0004931218697829717, + "loss": 1.906, + "loss_base2": 2.7498, + "loss_pixel": 0.1961, + "loss_text": 1.7098, + "ppl": 6.7261, + "step": 1848 + }, + { + "epoch": 0.01, + "global_step": 1849, + "learning_rate": 0.0004931176961602672, + "loss": 1.8957, + "loss_base2": 2.7349, + "loss_pixel": 0.1973, + "loss_text": 1.6984, + "ppl": 6.6572, + "step": 1849 + }, + { + "epoch": 0.01, + "global_step": 1850, + "learning_rate": 0.0004931135225375627, + "loss": 1.8878, + "loss_base2": 2.7235, + "loss_pixel": 0.1965, + "loss_text": 1.6913, + "ppl": 6.6048, + "step": 1850 + }, + { + "epoch": 0.01, + "global_step": 1851, + "learning_rate": 0.0004931093489148581, + "loss": 1.9033, + "loss_base2": 2.7459, + "loss_pixel": 0.1977, + "loss_text": 1.7056, + "ppl": 6.708, + "step": 1851 + }, + { + "epoch": 0.01, + "global_step": 1852, + "learning_rate": 0.0004931051752921536, + "loss": 1.8686, + "loss_base2": 2.6958, + "loss_pixel": 0.1973, + "loss_text": 1.6713, + "ppl": 6.4792, + "step": 1852 + }, + { + "epoch": 0.01, + "global_step": 1853, + "learning_rate": 0.0004931010016694491, + "loss": 1.9053, + "loss_base2": 2.7488, + "loss_pixel": 0.1964, + "loss_text": 1.7089, + "ppl": 6.7214, + "step": 1853 + }, + { + "epoch": 0.01, + "global_step": 1854, + "learning_rate": 0.0004930968280467446, + "loss": 1.9134, + "loss_base2": 2.7605, + "loss_pixel": 0.1997, + "loss_text": 1.7137, + "ppl": 6.7761, + "step": 1854 + }, + { + "epoch": 0.01, + "global_step": 1855, + "learning_rate": 0.00049309265442404, + "loss": 1.8737, + "loss_base2": 2.7032, + "loss_pixel": 0.1969, + "loss_text": 1.6768, + "ppl": 6.5123, + "step": 1855 + }, + { + "epoch": 0.01, + "global_step": 1856, + "learning_rate": 0.0004930884808013355, + "loss": 1.9096, + "loss_base2": 2.755, + "loss_pixel": 0.1974, + "loss_text": 1.7122, + "ppl": 6.7504, + "step": 1856 + }, + { + "epoch": 0.01, + "global_step": 1857, + "learning_rate": 0.000493084307178631, + "loss": 1.9022, + "loss_base2": 2.7443, + "loss_pixel": 0.1972, + "loss_text": 1.705, + "ppl": 6.7006, + "step": 1857 + }, + { + "epoch": 0.01, + "global_step": 1858, + "learning_rate": 0.0004930801335559265, + "loss": 1.8828, + "loss_base2": 2.7163, + "loss_pixel": 0.1962, + "loss_text": 1.6866, + "ppl": 6.5719, + "step": 1858 + }, + { + "epoch": 0.01, + "global_step": 1859, + "learning_rate": 0.000493075959933222, + "loss": 1.9, + "loss_base2": 2.7411, + "loss_pixel": 0.1953, + "loss_text": 1.7046, + "ppl": 6.6859, + "step": 1859 + }, + { + "epoch": 0.01, + "global_step": 1860, + "learning_rate": 0.0004930717863105175, + "loss": 1.8918, + "loss_base2": 2.7293, + "loss_pixel": 0.196, + "loss_text": 1.6958, + "ppl": 6.6313, + "step": 1860 + }, + { + "epoch": 0.01, + "global_step": 1861, + "learning_rate": 0.0004930676126878131, + "loss": 1.8973, + "loss_base2": 2.7372, + "loss_pixel": 0.1973, + "loss_text": 1.7, + "ppl": 6.6679, + "step": 1861 + }, + { + "epoch": 0.01, + "global_step": 1862, + "learning_rate": 0.0004930634390651086, + "loss": 1.8821, + "loss_base2": 2.7153, + "loss_pixel": 0.1985, + "loss_text": 1.6835, + "ppl": 6.5673, + "step": 1862 + }, + { + "epoch": 0.01, + "global_step": 1863, + "learning_rate": 0.0004930592654424041, + "loss": 1.885, + "loss_base2": 2.7195, + "loss_pixel": 0.1961, + "loss_text": 1.6889, + "ppl": 6.5864, + "step": 1863 + }, + { + "epoch": 0.01, + "global_step": 1864, + "learning_rate": 0.0004930550918196995, + "loss": 1.8939, + "loss_base2": 2.7323, + "loss_pixel": 0.1957, + "loss_text": 1.6982, + "ppl": 6.6452, + "step": 1864 + }, + { + "epoch": 0.01, + "global_step": 1865, + "learning_rate": 0.000493050918196995, + "loss": 1.8871, + "loss_base2": 2.7225, + "loss_pixel": 0.1974, + "loss_text": 1.6896, + "ppl": 6.6002, + "step": 1865 + }, + { + "epoch": 0.01, + "global_step": 1866, + "learning_rate": 0.0004930467445742905, + "loss": 1.9104, + "loss_base2": 2.7561, + "loss_pixel": 0.1967, + "loss_text": 1.7137, + "ppl": 6.7558, + "step": 1866 + }, + { + "epoch": 0.01, + "global_step": 1867, + "learning_rate": 0.000493042570951586, + "loss": 1.8926, + "loss_base2": 2.7304, + "loss_pixel": 0.1965, + "loss_text": 1.696, + "ppl": 6.6366, + "step": 1867 + }, + { + "epoch": 0.01, + "global_step": 1868, + "learning_rate": 0.0004930383973288815, + "loss": 1.9003, + "loss_base2": 2.7416, + "loss_pixel": 0.1967, + "loss_text": 1.7036, + "ppl": 6.6879, + "step": 1868 + }, + { + "epoch": 0.01, + "global_step": 1869, + "learning_rate": 0.000493034223706177, + "loss": 1.8809, + "loss_base2": 2.7136, + "loss_pixel": 0.1967, + "loss_text": 1.6842, + "ppl": 6.5594, + "step": 1869 + }, + { + "epoch": 0.01, + "global_step": 1870, + "learning_rate": 0.0004930300500834725, + "loss": 1.898, + "loss_base2": 2.7382, + "loss_pixel": 0.1961, + "loss_text": 1.7019, + "ppl": 6.6725, + "step": 1870 + }, + { + "epoch": 0.01, + "global_step": 1871, + "learning_rate": 0.0004930258764607679, + "loss": 1.9041, + "loss_base2": 2.747, + "loss_pixel": 0.1962, + "loss_text": 1.7079, + "ppl": 6.7134, + "step": 1871 + }, + { + "epoch": 0.01, + "global_step": 1872, + "learning_rate": 0.0004930217028380634, + "loss": 1.9039, + "loss_base2": 2.7467, + "loss_pixel": 0.196, + "loss_text": 1.7078, + "ppl": 6.712, + "step": 1872 + }, + { + "epoch": 0.01, + "global_step": 1873, + "learning_rate": 0.0004930175292153589, + "loss": 1.882, + "loss_base2": 2.7152, + "loss_pixel": 0.1961, + "loss_text": 1.6859, + "ppl": 6.5666, + "step": 1873 + }, + { + "epoch": 0.01, + "global_step": 1874, + "learning_rate": 0.0004930133555926544, + "loss": 1.8829, + "loss_base2": 2.7165, + "loss_pixel": 0.1957, + "loss_text": 1.6873, + "ppl": 6.5725, + "step": 1874 + }, + { + "epoch": 0.01, + "global_step": 1875, + "learning_rate": 0.0004930091819699499, + "loss": 1.8978, + "loss_base2": 2.7379, + "loss_pixel": 0.196, + "loss_text": 1.7019, + "ppl": 6.6712, + "step": 1875 + }, + { + "epoch": 0.01, + "global_step": 1876, + "learning_rate": 0.0004930050083472454, + "loss": 1.8935, + "loss_base2": 2.7317, + "loss_pixel": 0.1975, + "loss_text": 1.6959, + "ppl": 6.6426, + "step": 1876 + }, + { + "epoch": 0.01, + "global_step": 1877, + "learning_rate": 0.000493000834724541, + "loss": 1.8899, + "loss_base2": 2.7265, + "loss_pixel": 0.1964, + "loss_text": 1.6934, + "ppl": 6.6187, + "step": 1877 + }, + { + "epoch": 0.01, + "global_step": 1878, + "learning_rate": 0.0004929966611018364, + "loss": 1.8919, + "loss_base2": 2.7294, + "loss_pixel": 0.1978, + "loss_text": 1.6941, + "ppl": 6.632, + "step": 1878 + }, + { + "epoch": 0.01, + "global_step": 1879, + "learning_rate": 0.0004929924874791319, + "loss": 1.9016, + "loss_base2": 2.7434, + "loss_pixel": 0.1952, + "loss_text": 1.7064, + "ppl": 6.6966, + "step": 1879 + }, + { + "epoch": 0.01, + "global_step": 1880, + "learning_rate": 0.0004929883138564274, + "loss": 1.8757, + "loss_base2": 2.7061, + "loss_pixel": 0.1954, + "loss_text": 1.6802, + "ppl": 6.5254, + "step": 1880 + }, + { + "epoch": 0.01, + "global_step": 1881, + "learning_rate": 0.0004929841402337229, + "loss": 1.8895, + "loss_base2": 2.726, + "loss_pixel": 0.1955, + "loss_text": 1.6941, + "ppl": 6.6161, + "step": 1881 + }, + { + "epoch": 0.01, + "global_step": 1882, + "learning_rate": 0.0004929799666110184, + "loss": 1.8957, + "loss_base2": 2.7349, + "loss_pixel": 0.1954, + "loss_text": 1.7003, + "ppl": 6.6572, + "step": 1882 + }, + { + "epoch": 0.01, + "global_step": 1883, + "learning_rate": 0.0004929757929883139, + "loss": 1.9048, + "loss_base2": 2.748, + "loss_pixel": 0.2053, + "loss_text": 1.6995, + "ppl": 6.7181, + "step": 1883 + }, + { + "epoch": 0.01, + "global_step": 1884, + "learning_rate": 0.0004929716193656094, + "loss": 1.9024, + "loss_base2": 2.7446, + "loss_pixel": 0.2073, + "loss_text": 1.6951, + "ppl": 6.702, + "step": 1884 + }, + { + "epoch": 0.01, + "global_step": 1885, + "learning_rate": 0.0004929674457429049, + "loss": 1.8938, + "loss_base2": 2.7322, + "loss_pixel": 0.2052, + "loss_text": 1.6885, + "ppl": 6.6446, + "step": 1885 + }, + { + "epoch": 0.01, + "global_step": 1886, + "learning_rate": 0.0004929632721202004, + "loss": 1.9003, + "loss_base2": 2.7416, + "loss_pixel": 0.2043, + "loss_text": 1.696, + "ppl": 6.6879, + "step": 1886 + }, + { + "epoch": 0.01, + "global_step": 1887, + "learning_rate": 0.0004929590984974958, + "loss": 1.8937, + "loss_base2": 2.732, + "loss_pixel": 0.2035, + "loss_text": 1.6902, + "ppl": 6.6439, + "step": 1887 + }, + { + "epoch": 0.01, + "global_step": 1888, + "learning_rate": 0.0004929549248747913, + "loss": 1.889, + "loss_base2": 2.7253, + "loss_pixel": 0.1998, + "loss_text": 1.6892, + "ppl": 6.6128, + "step": 1888 + }, + { + "epoch": 0.01, + "global_step": 1889, + "learning_rate": 0.0004929507512520868, + "loss": 1.9018, + "loss_base2": 2.7437, + "loss_pixel": 0.1976, + "loss_text": 1.7041, + "ppl": 6.6979, + "step": 1889 + }, + { + "epoch": 0.01, + "global_step": 1890, + "learning_rate": 0.0004929465776293823, + "loss": 1.8822, + "loss_base2": 2.7154, + "loss_pixel": 0.1987, + "loss_text": 1.6835, + "ppl": 6.5679, + "step": 1890 + }, + { + "epoch": 0.01, + "global_step": 1891, + "learning_rate": 0.0004929424040066777, + "loss": 1.8841, + "loss_base2": 2.7182, + "loss_pixel": 0.197, + "loss_text": 1.6871, + "ppl": 6.5804, + "step": 1891 + }, + { + "epoch": 0.01, + "global_step": 1892, + "learning_rate": 0.0004929382303839732, + "loss": 1.8651, + "loss_base2": 2.6908, + "loss_pixel": 0.1973, + "loss_text": 1.6678, + "ppl": 6.4566, + "step": 1892 + }, + { + "epoch": 0.01, + "global_step": 1893, + "learning_rate": 0.0004929340567612687, + "loss": 1.8823, + "loss_base2": 2.7156, + "loss_pixel": 0.198, + "loss_text": 1.6843, + "ppl": 6.5686, + "step": 1893 + }, + { + "epoch": 0.01, + "global_step": 1894, + "learning_rate": 0.0004929298831385643, + "loss": 1.8737, + "loss_base2": 2.7032, + "loss_pixel": 0.1971, + "loss_text": 1.6766, + "ppl": 6.5123, + "step": 1894 + }, + { + "epoch": 0.01, + "global_step": 1895, + "learning_rate": 0.0004929257095158598, + "loss": 1.8781, + "loss_base2": 2.7095, + "loss_pixel": 0.196, + "loss_text": 1.6821, + "ppl": 6.5411, + "step": 1895 + }, + { + "epoch": 0.01, + "global_step": 1896, + "learning_rate": 0.0004929215358931553, + "loss": 1.882, + "loss_base2": 2.7152, + "loss_pixel": 0.1953, + "loss_text": 1.6868, + "ppl": 6.5666, + "step": 1896 + }, + { + "epoch": 0.01, + "global_step": 1897, + "learning_rate": 0.0004929173622704508, + "loss": 1.8712, + "loss_base2": 2.6996, + "loss_pixel": 0.1944, + "loss_text": 1.6768, + "ppl": 6.4961, + "step": 1897 + }, + { + "epoch": 0.01, + "global_step": 1898, + "learning_rate": 0.0004929131886477463, + "loss": 1.8772, + "loss_base2": 2.7082, + "loss_pixel": 0.1954, + "loss_text": 1.6819, + "ppl": 6.5352, + "step": 1898 + }, + { + "epoch": 0.01, + "global_step": 1899, + "learning_rate": 0.0004929090150250418, + "loss": 1.8772, + "loss_base2": 2.7082, + "loss_pixel": 0.1962, + "loss_text": 1.681, + "ppl": 6.5352, + "step": 1899 + }, + { + "epoch": 0.01, + "global_step": 1900, + "learning_rate": 0.0004929048414023372, + "loss": 1.8337, + "loss_base2": 2.6455, + "loss_pixel": 0.1974, + "loss_text": 1.6364, + "ppl": 6.257, + "step": 1900 + }, + { + "epoch": 0.01, + "global_step": 1901, + "learning_rate": 0.0004929006677796327, + "loss": 1.8536, + "loss_base2": 2.6742, + "loss_pixel": 0.1954, + "loss_text": 1.6583, + "ppl": 6.3828, + "step": 1901 + }, + { + "epoch": 0.01, + "global_step": 1902, + "learning_rate": 0.0004928964941569282, + "loss": 1.8902, + "loss_base2": 2.727, + "loss_pixel": 0.1951, + "loss_text": 1.6951, + "ppl": 6.6207, + "step": 1902 + }, + { + "epoch": 0.01, + "global_step": 1903, + "learning_rate": 0.0004928923205342237, + "loss": 1.8815, + "loss_base2": 2.7144, + "loss_pixel": 0.1964, + "loss_text": 1.6852, + "ppl": 6.5633, + "step": 1903 + }, + { + "epoch": 0.01, + "global_step": 1904, + "learning_rate": 0.0004928881469115192, + "loss": 1.9189, + "loss_base2": 2.7684, + "loss_pixel": 0.1946, + "loss_text": 1.7244, + "ppl": 6.8135, + "step": 1904 + }, + { + "epoch": 0.01, + "global_step": 1905, + "learning_rate": 0.0004928839732888147, + "loss": 1.9012, + "loss_base2": 2.7429, + "loss_pixel": 0.1948, + "loss_text": 1.7063, + "ppl": 6.6939, + "step": 1905 + }, + { + "epoch": 0.01, + "global_step": 1906, + "learning_rate": 0.0004928797996661102, + "loss": 1.8925, + "loss_base2": 2.7303, + "loss_pixel": 0.1948, + "loss_text": 1.6977, + "ppl": 6.6359, + "step": 1906 + }, + { + "epoch": 0.01, + "global_step": 1907, + "learning_rate": 0.0004928756260434057, + "loss": 1.8932, + "loss_base2": 2.7313, + "loss_pixel": 0.1976, + "loss_text": 1.6956, + "ppl": 6.6406, + "step": 1907 + }, + { + "epoch": 0.01, + "global_step": 1908, + "learning_rate": 0.0004928714524207011, + "loss": 1.902, + "loss_base2": 2.744, + "loss_pixel": 0.1977, + "loss_text": 1.7043, + "ppl": 6.6993, + "step": 1908 + }, + { + "epoch": 0.01, + "global_step": 1909, + "learning_rate": 0.0004928672787979966, + "loss": 1.9011, + "loss_base2": 2.7427, + "loss_pixel": 0.1984, + "loss_text": 1.7028, + "ppl": 6.6933, + "step": 1909 + }, + { + "epoch": 0.01, + "global_step": 1910, + "learning_rate": 0.0004928631051752922, + "loss": 1.8974, + "loss_base2": 2.7374, + "loss_pixel": 0.1976, + "loss_text": 1.6999, + "ppl": 6.6685, + "step": 1910 + }, + { + "epoch": 0.01, + "global_step": 1911, + "learning_rate": 0.0004928589315525877, + "loss": 1.8916, + "loss_base2": 2.729, + "loss_pixel": 0.1967, + "loss_text": 1.6949, + "ppl": 6.63, + "step": 1911 + }, + { + "epoch": 0.01, + "global_step": 1912, + "learning_rate": 0.0004928547579298832, + "loss": 1.8984, + "loss_base2": 2.7388, + "loss_pixel": 0.1963, + "loss_text": 1.7021, + "ppl": 6.6752, + "step": 1912 + }, + { + "epoch": 0.01, + "global_step": 1913, + "learning_rate": 0.0004928505843071787, + "loss": 1.8985, + "loss_base2": 2.739, + "loss_pixel": 0.1958, + "loss_text": 1.7027, + "ppl": 6.6759, + "step": 1913 + }, + { + "epoch": 0.01, + "global_step": 1914, + "learning_rate": 0.0004928464106844741, + "loss": 1.8714, + "loss_base2": 2.6999, + "loss_pixel": 0.1966, + "loss_text": 1.6748, + "ppl": 6.4974, + "step": 1914 + }, + { + "epoch": 0.01, + "global_step": 1915, + "learning_rate": 0.0004928422370617696, + "loss": 1.892, + "loss_base2": 2.7296, + "loss_pixel": 0.1969, + "loss_text": 1.6951, + "ppl": 6.6326, + "step": 1915 + }, + { + "epoch": 0.01, + "global_step": 1916, + "learning_rate": 0.0004928380634390651, + "loss": 1.8753, + "loss_base2": 2.7055, + "loss_pixel": 0.1951, + "loss_text": 1.6802, + "ppl": 6.5228, + "step": 1916 + }, + { + "epoch": 0.01, + "global_step": 1917, + "learning_rate": 0.0004928338898163606, + "loss": 1.8849, + "loss_base2": 2.7193, + "loss_pixel": 0.1953, + "loss_text": 1.6896, + "ppl": 6.5857, + "step": 1917 + }, + { + "epoch": 0.01, + "global_step": 1918, + "learning_rate": 0.0004928297161936561, + "loss": 1.8674, + "loss_base2": 2.6941, + "loss_pixel": 0.1966, + "loss_text": 1.6708, + "ppl": 6.4714, + "step": 1918 + }, + { + "epoch": 0.01, + "global_step": 1919, + "learning_rate": 0.0004928255425709516, + "loss": 1.8889, + "loss_base2": 2.7251, + "loss_pixel": 0.196, + "loss_text": 1.6929, + "ppl": 6.6121, + "step": 1919 + }, + { + "epoch": 0.01, + "global_step": 1920, + "learning_rate": 0.0004928213689482471, + "loss": 1.8908, + "loss_base2": 2.7278, + "loss_pixel": 0.195, + "loss_text": 1.6958, + "ppl": 6.6247, + "step": 1920 + }, + { + "epoch": 0.01, + "global_step": 1921, + "learning_rate": 0.0004928171953255426, + "loss": 1.8818, + "loss_base2": 2.7149, + "loss_pixel": 0.1985, + "loss_text": 1.6833, + "ppl": 6.5653, + "step": 1921 + }, + { + "epoch": 0.01, + "global_step": 1922, + "learning_rate": 0.0004928130217028381, + "loss": 1.8975, + "loss_base2": 2.7375, + "loss_pixel": 0.195, + "loss_text": 1.7024, + "ppl": 6.6692, + "step": 1922 + }, + { + "epoch": 0.01, + "global_step": 1923, + "learning_rate": 0.0004928088480801335, + "loss": 1.8768, + "loss_base2": 2.7077, + "loss_pixel": 0.1955, + "loss_text": 1.6813, + "ppl": 6.5326, + "step": 1923 + }, + { + "epoch": 0.01, + "global_step": 1924, + "learning_rate": 0.000492804674457429, + "loss": 1.8361, + "loss_base2": 2.6489, + "loss_pixel": 0.1952, + "loss_text": 1.6409, + "ppl": 6.272, + "step": 1924 + }, + { + "epoch": 0.01, + "global_step": 1925, + "learning_rate": 0.0004928005008347245, + "loss": 1.7548, + "loss_base2": 2.5316, + "loss_pixel": 0.1945, + "loss_text": 1.5603, + "ppl": 5.7823, + "step": 1925 + }, + { + "epoch": 0.01, + "global_step": 1926, + "learning_rate": 0.0004927963272120201, + "loss": 1.6597, + "loss_base2": 2.3944, + "loss_pixel": 0.1953, + "loss_text": 1.4644, + "ppl": 5.2577, + "step": 1926 + }, + { + "epoch": 0.01, + "global_step": 1927, + "learning_rate": 0.0004927921535893156, + "loss": 1.6545, + "loss_base2": 2.3869, + "loss_pixel": 0.1943, + "loss_text": 1.4602, + "ppl": 5.2305, + "step": 1927 + }, + { + "epoch": 0.01, + "global_step": 1928, + "learning_rate": 0.000492787979966611, + "loss": 1.6481, + "loss_base2": 2.3777, + "loss_pixel": 0.1944, + "loss_text": 1.4536, + "ppl": 5.1971, + "step": 1928 + }, + { + "epoch": 0.01, + "global_step": 1929, + "learning_rate": 0.0004927838063439065, + "loss": 1.6526, + "loss_base2": 2.3842, + "loss_pixel": 0.1943, + "loss_text": 1.4583, + "ppl": 5.2205, + "step": 1929 + }, + { + "epoch": 0.01, + "global_step": 1930, + "learning_rate": 0.000492779632721202, + "loss": 1.6656, + "loss_base2": 2.403, + "loss_pixel": 0.1951, + "loss_text": 1.4705, + "ppl": 5.2888, + "step": 1930 + }, + { + "epoch": 0.01, + "global_step": 1931, + "learning_rate": 0.0004927754590984975, + "loss": 1.6653, + "loss_base2": 2.4025, + "loss_pixel": 0.1968, + "loss_text": 1.4685, + "ppl": 5.2873, + "step": 1931 + }, + { + "epoch": 0.01, + "global_step": 1932, + "learning_rate": 0.000492771285475793, + "loss": 1.6551, + "loss_base2": 2.3878, + "loss_pixel": 0.1946, + "loss_text": 1.4604, + "ppl": 5.2336, + "step": 1932 + }, + { + "epoch": 0.01, + "global_step": 1933, + "learning_rate": 0.0004927671118530885, + "loss": 1.6566, + "loss_base2": 2.39, + "loss_pixel": 0.1949, + "loss_text": 1.4617, + "ppl": 5.2415, + "step": 1933 + }, + { + "epoch": 0.01, + "global_step": 1934, + "learning_rate": 0.000492762938230384, + "loss": 1.8779, + "loss_base2": 2.7092, + "loss_pixel": 0.1949, + "loss_text": 1.6831, + "ppl": 6.5398, + "step": 1934 + }, + { + "epoch": 0.01, + "global_step": 1935, + "learning_rate": 0.0004927587646076795, + "loss": 1.9319, + "loss_base2": 2.7871, + "loss_pixel": 0.2015, + "loss_text": 1.7305, + "ppl": 6.9026, + "step": 1935 + }, + { + "epoch": 0.01, + "global_step": 1936, + "learning_rate": 0.000492754590984975, + "loss": 1.9146, + "loss_base2": 2.7622, + "loss_pixel": 0.1985, + "loss_text": 1.7161, + "ppl": 6.7842, + "step": 1936 + }, + { + "epoch": 0.01, + "global_step": 1937, + "learning_rate": 0.0004927504173622704, + "loss": 1.9151, + "loss_base2": 2.7629, + "loss_pixel": 0.1999, + "loss_text": 1.7151, + "ppl": 6.7876, + "step": 1937 + }, + { + "epoch": 0.01, + "global_step": 1938, + "learning_rate": 0.0004927462437395659, + "loss": 1.901, + "loss_base2": 2.7426, + "loss_pixel": 0.2013, + "loss_text": 1.6997, + "ppl": 6.6926, + "step": 1938 + }, + { + "epoch": 0.01, + "global_step": 1939, + "learning_rate": 0.0004927420701168614, + "loss": 1.9207, + "loss_base2": 2.771, + "loss_pixel": 0.211, + "loss_text": 1.7097, + "ppl": 6.8257, + "step": 1939 + }, + { + "epoch": 0.01, + "global_step": 1940, + "learning_rate": 0.0004927378964941569, + "loss": 1.9181, + "loss_base2": 2.7672, + "loss_pixel": 0.2086, + "loss_text": 1.7094, + "ppl": 6.808, + "step": 1940 + }, + { + "epoch": 0.01, + "global_step": 1941, + "learning_rate": 0.0004927337228714524, + "loss": 1.9106, + "loss_base2": 2.7564, + "loss_pixel": 0.211, + "loss_text": 1.6995, + "ppl": 6.7571, + "step": 1941 + }, + { + "epoch": 0.01, + "global_step": 1942, + "learning_rate": 0.000492729549248748, + "loss": 1.9277, + "loss_base2": 2.7811, + "loss_pixel": 0.2187, + "loss_text": 1.709, + "ppl": 6.8737, + "step": 1942 + }, + { + "epoch": 0.01, + "global_step": 1943, + "learning_rate": 0.0004927253756260435, + "loss": 1.9191, + "loss_base2": 2.7687, + "loss_pixel": 0.2226, + "loss_text": 1.6966, + "ppl": 6.8148, + "step": 1943 + }, + { + "epoch": 0.01, + "global_step": 1944, + "learning_rate": 0.000492721202003339, + "loss": 1.9246, + "loss_base2": 2.7766, + "loss_pixel": 0.2178, + "loss_text": 1.7068, + "ppl": 6.8524, + "step": 1944 + }, + { + "epoch": 0.01, + "global_step": 1945, + "learning_rate": 0.0004927170283806345, + "loss": 1.909, + "loss_base2": 2.7541, + "loss_pixel": 0.2135, + "loss_text": 1.6955, + "ppl": 6.7463, + "step": 1945 + }, + { + "epoch": 0.01, + "global_step": 1946, + "learning_rate": 0.0004927128547579299, + "loss": 1.918, + "loss_base2": 2.7671, + "loss_pixel": 0.2121, + "loss_text": 1.7059, + "ppl": 6.8073, + "step": 1946 + }, + { + "epoch": 0.01, + "global_step": 1947, + "learning_rate": 0.0004927086811352254, + "loss": 1.8996, + "loss_base2": 2.7405, + "loss_pixel": 0.2069, + "loss_text": 1.6927, + "ppl": 6.6832, + "step": 1947 + }, + { + "epoch": 0.01, + "global_step": 1948, + "learning_rate": 0.0004927045075125209, + "loss": 1.8974, + "loss_base2": 2.7374, + "loss_pixel": 0.2064, + "loss_text": 1.691, + "ppl": 6.6685, + "step": 1948 + }, + { + "epoch": 0.01, + "global_step": 1949, + "learning_rate": 0.0004927003338898164, + "loss": 1.9075, + "loss_base2": 2.7519, + "loss_pixel": 0.2046, + "loss_text": 1.7029, + "ppl": 6.7362, + "step": 1949 + }, + { + "epoch": 0.01, + "global_step": 1950, + "learning_rate": 0.0004926961602671118, + "loss": 1.9, + "loss_base2": 2.7411, + "loss_pixel": 0.2049, + "loss_text": 1.6951, + "ppl": 6.6859, + "step": 1950 + }, + { + "epoch": 0.01, + "global_step": 1951, + "learning_rate": 0.0004926919866444073, + "loss": 1.9134, + "loss_base2": 2.7605, + "loss_pixel": 0.2042, + "loss_text": 1.7091, + "ppl": 6.7761, + "step": 1951 + }, + { + "epoch": 0.01, + "global_step": 1952, + "learning_rate": 0.0004926878130217028, + "loss": 1.8812, + "loss_base2": 2.714, + "loss_pixel": 0.2027, + "loss_text": 1.6785, + "ppl": 6.5614, + "step": 1952 + }, + { + "epoch": 0.01, + "global_step": 1953, + "learning_rate": 0.0004926836393989983, + "loss": 1.8964, + "loss_base2": 2.7359, + "loss_pixel": 0.2013, + "loss_text": 1.6951, + "ppl": 6.6619, + "step": 1953 + }, + { + "epoch": 0.01, + "global_step": 1954, + "learning_rate": 0.0004926794657762938, + "loss": 1.8984, + "loss_base2": 2.7388, + "loss_pixel": 0.203, + "loss_text": 1.6955, + "ppl": 6.6752, + "step": 1954 + }, + { + "epoch": 0.01, + "global_step": 1955, + "learning_rate": 0.0004926752921535893, + "loss": 1.8872, + "loss_base2": 2.7227, + "loss_pixel": 0.2002, + "loss_text": 1.6869, + "ppl": 6.6009, + "step": 1955 + }, + { + "epoch": 0.01, + "global_step": 1956, + "learning_rate": 0.0004926711185308848, + "loss": 1.9065, + "loss_base2": 2.7505, + "loss_pixel": 0.2004, + "loss_text": 1.7061, + "ppl": 6.7295, + "step": 1956 + }, + { + "epoch": 0.01, + "global_step": 1957, + "learning_rate": 0.0004926669449081803, + "loss": 1.7859, + "loss_base2": 2.5765, + "loss_pixel": 0.2004, + "loss_text": 1.5856, + "ppl": 5.9649, + "step": 1957 + }, + { + "epoch": 0.01, + "global_step": 1958, + "learning_rate": 0.0004926627712854759, + "loss": 1.6791, + "loss_base2": 2.4224, + "loss_pixel": 0.1981, + "loss_text": 1.481, + "ppl": 5.3607, + "step": 1958 + }, + { + "epoch": 0.01, + "global_step": 1959, + "learning_rate": 0.0004926585976627713, + "loss": 1.6808, + "loss_base2": 2.4249, + "loss_pixel": 0.1997, + "loss_text": 1.481, + "ppl": 5.3699, + "step": 1959 + }, + { + "epoch": 0.01, + "global_step": 1960, + "learning_rate": 0.0004926544240400668, + "loss": 1.6499, + "loss_base2": 2.3803, + "loss_pixel": 0.1989, + "loss_text": 1.4511, + "ppl": 5.2065, + "step": 1960 + }, + { + "epoch": 0.01, + "global_step": 1961, + "learning_rate": 0.0004926502504173623, + "loss": 1.6424, + "loss_base2": 2.3695, + "loss_pixel": 0.1987, + "loss_text": 1.4437, + "ppl": 5.1676, + "step": 1961 + }, + { + "epoch": 0.01, + "global_step": 1962, + "learning_rate": 0.0004926460767946578, + "loss": 1.6583, + "loss_base2": 2.3924, + "loss_pixel": 0.1984, + "loss_text": 1.4599, + "ppl": 5.2504, + "step": 1962 + }, + { + "epoch": 0.01, + "global_step": 1963, + "learning_rate": 0.0004926419031719533, + "loss": 1.6401, + "loss_base2": 2.3662, + "loss_pixel": 0.1974, + "loss_text": 1.4427, + "ppl": 5.1557, + "step": 1963 + }, + { + "epoch": 0.01, + "global_step": 1964, + "learning_rate": 0.0004926377295492487, + "loss": 1.656, + "loss_base2": 2.3891, + "loss_pixel": 0.1964, + "loss_text": 1.4597, + "ppl": 5.2383, + "step": 1964 + }, + { + "epoch": 0.01, + "global_step": 1965, + "learning_rate": 0.0004926335559265442, + "loss": 1.6745, + "loss_base2": 2.4158, + "loss_pixel": 0.1971, + "loss_text": 1.4774, + "ppl": 5.3361, + "step": 1965 + }, + { + "epoch": 0.01, + "global_step": 1966, + "learning_rate": 0.0004926293823038397, + "loss": 1.9248, + "loss_base2": 2.7769, + "loss_pixel": 0.1958, + "loss_text": 1.729, + "ppl": 6.8538, + "step": 1966 + }, + { + "epoch": 0.01, + "global_step": 1967, + "learning_rate": 0.0004926252086811352, + "loss": 1.9187, + "loss_base2": 2.7681, + "loss_pixel": 0.1959, + "loss_text": 1.7228, + "ppl": 6.8121, + "step": 1967 + }, + { + "epoch": 0.01, + "global_step": 1968, + "learning_rate": 0.0004926210350584307, + "loss": 1.8989, + "loss_base2": 2.7395, + "loss_pixel": 0.1972, + "loss_text": 1.7017, + "ppl": 6.6785, + "step": 1968 + }, + { + "epoch": 0.01, + "global_step": 1969, + "learning_rate": 0.0004926168614357262, + "loss": 1.9006, + "loss_base2": 2.742, + "loss_pixel": 0.1971, + "loss_text": 1.7035, + "ppl": 6.6899, + "step": 1969 + }, + { + "epoch": 0.01, + "global_step": 1970, + "learning_rate": 0.0004926126878130217, + "loss": 1.9055, + "loss_base2": 2.7491, + "loss_pixel": 0.196, + "loss_text": 1.7096, + "ppl": 6.7228, + "step": 1970 + }, + { + "epoch": 0.01, + "global_step": 1971, + "learning_rate": 0.0004926085141903172, + "loss": 1.9238, + "loss_base2": 2.7755, + "loss_pixel": 0.1959, + "loss_text": 1.7279, + "ppl": 6.8469, + "step": 1971 + }, + { + "epoch": 0.01, + "global_step": 1972, + "learning_rate": 0.0004926043405676127, + "loss": 1.8836, + "loss_base2": 2.7175, + "loss_pixel": 0.1964, + "loss_text": 1.6873, + "ppl": 6.5771, + "step": 1972 + }, + { + "epoch": 0.01, + "global_step": 1973, + "learning_rate": 0.0004926001669449081, + "loss": 1.8912, + "loss_base2": 2.7284, + "loss_pixel": 0.1963, + "loss_text": 1.6948, + "ppl": 6.6273, + "step": 1973 + }, + { + "epoch": 0.01, + "global_step": 1974, + "learning_rate": 0.0004925959933222036, + "loss": 1.8817, + "loss_base2": 2.7147, + "loss_pixel": 0.196, + "loss_text": 1.6857, + "ppl": 6.5647, + "step": 1974 + }, + { + "epoch": 0.01, + "global_step": 1975, + "learning_rate": 0.0004925918196994992, + "loss": 1.8941, + "loss_base2": 2.7326, + "loss_pixel": 0.1953, + "loss_text": 1.6989, + "ppl": 6.6466, + "step": 1975 + }, + { + "epoch": 0.01, + "global_step": 1976, + "learning_rate": 0.0004925876460767947, + "loss": 1.8849, + "loss_base2": 2.7193, + "loss_pixel": 0.1966, + "loss_text": 1.6882, + "ppl": 6.5857, + "step": 1976 + }, + { + "epoch": 0.01, + "global_step": 1977, + "learning_rate": 0.0004925834724540902, + "loss": 1.8937, + "loss_base2": 2.732, + "loss_pixel": 0.197, + "loss_text": 1.6967, + "ppl": 6.6439, + "step": 1977 + }, + { + "epoch": 0.01, + "global_step": 1978, + "learning_rate": 0.0004925792988313857, + "loss": 1.8779, + "loss_base2": 2.7092, + "loss_pixel": 0.1956, + "loss_text": 1.6823, + "ppl": 6.5398, + "step": 1978 + }, + { + "epoch": 0.01, + "global_step": 1979, + "learning_rate": 0.0004925751252086812, + "loss": 1.8941, + "loss_base2": 2.7326, + "loss_pixel": 0.196, + "loss_text": 1.6982, + "ppl": 6.6466, + "step": 1979 + }, + { + "epoch": 0.01, + "global_step": 1980, + "learning_rate": 0.0004925709515859767, + "loss": 1.8842, + "loss_base2": 2.7183, + "loss_pixel": 0.1949, + "loss_text": 1.6893, + "ppl": 6.5811, + "step": 1980 + }, + { + "epoch": 0.01, + "global_step": 1981, + "learning_rate": 0.0004925667779632722, + "loss": 1.9029, + "loss_base2": 2.7453, + "loss_pixel": 0.1954, + "loss_text": 1.7075, + "ppl": 6.7053, + "step": 1981 + }, + { + "epoch": 0.01, + "global_step": 1982, + "learning_rate": 0.0004925626043405676, + "loss": 1.887, + "loss_base2": 2.7224, + "loss_pixel": 0.1952, + "loss_text": 1.6918, + "ppl": 6.5995, + "step": 1982 + }, + { + "epoch": 0.01, + "global_step": 1983, + "learning_rate": 0.0004925584307178631, + "loss": 1.8628, + "loss_base2": 2.6875, + "loss_pixel": 0.1978, + "loss_text": 1.665, + "ppl": 6.4417, + "step": 1983 + }, + { + "epoch": 0.01, + "global_step": 1984, + "learning_rate": 0.0004925542570951586, + "loss": 1.8905, + "loss_base2": 2.7274, + "loss_pixel": 0.1943, + "loss_text": 1.6963, + "ppl": 6.6227, + "step": 1984 + }, + { + "epoch": 0.01, + "global_step": 1985, + "learning_rate": 0.0004925500834724541, + "loss": 1.8846, + "loss_base2": 2.7189, + "loss_pixel": 0.195, + "loss_text": 1.6896, + "ppl": 6.5837, + "step": 1985 + }, + { + "epoch": 0.01, + "global_step": 1986, + "learning_rate": 0.0004925459098497496, + "loss": 1.8816, + "loss_base2": 2.7146, + "loss_pixel": 0.1949, + "loss_text": 1.6867, + "ppl": 6.564, + "step": 1986 + }, + { + "epoch": 0.01, + "global_step": 1987, + "learning_rate": 0.000492541736227045, + "loss": 1.7109, + "loss_base2": 2.4683, + "loss_pixel": 0.1944, + "loss_text": 1.5164, + "ppl": 5.5339, + "step": 1987 + }, + { + "epoch": 0.01, + "global_step": 1988, + "learning_rate": 0.0004925375626043405, + "loss": 1.6825, + "loss_base2": 2.4273, + "loss_pixel": 0.1949, + "loss_text": 1.4876, + "ppl": 5.379, + "step": 1988 + }, + { + "epoch": 0.01, + "global_step": 1989, + "learning_rate": 0.000492533388981636, + "loss": 1.6574, + "loss_base2": 2.3911, + "loss_pixel": 0.1953, + "loss_text": 1.4621, + "ppl": 5.2457, + "step": 1989 + }, + { + "epoch": 0.01, + "global_step": 1990, + "learning_rate": 0.0004925292153589315, + "loss": 1.6544, + "loss_base2": 2.3868, + "loss_pixel": 0.1948, + "loss_text": 1.4597, + "ppl": 5.2299, + "step": 1990 + }, + { + "epoch": 0.01, + "global_step": 1991, + "learning_rate": 0.0004925250417362271, + "loss": 1.6113, + "loss_base2": 2.3246, + "loss_pixel": 0.1941, + "loss_text": 1.4172, + "ppl": 5.0093, + "step": 1991 + }, + { + "epoch": 0.01, + "global_step": 1992, + "learning_rate": 0.0004925208681135226, + "loss": 1.6152, + "loss_base2": 2.3302, + "loss_pixel": 0.1937, + "loss_text": 1.4214, + "ppl": 5.0289, + "step": 1992 + }, + { + "epoch": 0.01, + "global_step": 1993, + "learning_rate": 0.0004925166944908181, + "loss": 1.6182, + "loss_base2": 2.3346, + "loss_pixel": 0.1933, + "loss_text": 1.425, + "ppl": 5.044, + "step": 1993 + }, + { + "epoch": 0.01, + "global_step": 1994, + "learning_rate": 0.0004925125208681136, + "loss": 1.731, + "loss_base2": 2.4973, + "loss_pixel": 0.1938, + "loss_text": 1.5373, + "ppl": 5.6463, + "step": 1994 + }, + { + "epoch": 0.01, + "global_step": 1995, + "learning_rate": 0.0004925083472454091, + "loss": 1.9169, + "loss_base2": 2.7655, + "loss_pixel": 0.1952, + "loss_text": 1.7218, + "ppl": 6.7998, + "step": 1995 + }, + { + "epoch": 0.01, + "global_step": 1996, + "learning_rate": 0.0004925041736227045, + "loss": 1.8993, + "loss_base2": 2.7401, + "loss_pixel": 0.195, + "loss_text": 1.7043, + "ppl": 6.6812, + "step": 1996 + }, + { + "epoch": 0.01, + "global_step": 1997, + "learning_rate": 0.0004925, + "loss": 1.8998, + "loss_base2": 2.7408, + "loss_pixel": 0.1952, + "loss_text": 1.7046, + "ppl": 6.6846, + "step": 1997 + }, + { + "epoch": 0.01, + "global_step": 1998, + "learning_rate": 0.0004924958263772955, + "loss": 1.9108, + "loss_base2": 2.7567, + "loss_pixel": 0.1941, + "loss_text": 1.7167, + "ppl": 6.7585, + "step": 1998 + }, + { + "epoch": 0.01, + "global_step": 1999, + "learning_rate": 0.000492491652754591, + "loss": 1.8961, + "loss_base2": 2.7355, + "loss_pixel": 0.1944, + "loss_text": 1.7017, + "ppl": 6.6599, + "step": 1999 + }, + { + "epoch": 0.01, + "global_step": 2000, + "learning_rate": 0.0004924874791318865, + "loss": 1.8852, + "loss_base2": 2.7198, + "loss_pixel": 0.1939, + "loss_text": 1.6913, + "ppl": 6.5877, + "step": 2000 + }, + { + "epoch": 0.01, + "global_step": 2001, + "learning_rate": 0.000492483305509182, + "loss": 1.8728, + "loss_base2": 2.7019, + "loss_pixel": 0.1953, + "loss_text": 1.6775, + "ppl": 6.5065, + "step": 2001 + }, + { + "epoch": 0.01, + "global_step": 2002, + "learning_rate": 0.0004924791318864774, + "loss": 1.8912, + "loss_base2": 2.7284, + "loss_pixel": 0.1945, + "loss_text": 1.6967, + "ppl": 6.6273, + "step": 2002 + }, + { + "epoch": 0.01, + "global_step": 2003, + "learning_rate": 0.0004924749582637729, + "loss": 1.8866, + "loss_base2": 2.7218, + "loss_pixel": 0.1942, + "loss_text": 1.6924, + "ppl": 6.5969, + "step": 2003 + }, + { + "epoch": 0.01, + "global_step": 2004, + "learning_rate": 0.0004924707846410684, + "loss": 1.8869, + "loss_base2": 2.7222, + "loss_pixel": 0.1942, + "loss_text": 1.6927, + "ppl": 6.5989, + "step": 2004 + }, + { + "epoch": 0.01, + "global_step": 2005, + "learning_rate": 0.0004924666110183639, + "loss": 1.8904, + "loss_base2": 2.7273, + "loss_pixel": 0.1939, + "loss_text": 1.6965, + "ppl": 6.622, + "step": 2005 + }, + { + "epoch": 0.01, + "global_step": 2006, + "learning_rate": 0.0004924624373956594, + "loss": 1.8734, + "loss_base2": 2.7027, + "loss_pixel": 0.1943, + "loss_text": 1.679, + "ppl": 6.5104, + "step": 2006 + }, + { + "epoch": 0.01, + "global_step": 2007, + "learning_rate": 0.000492458263772955, + "loss": 1.8961, + "loss_base2": 2.7355, + "loss_pixel": 0.1945, + "loss_text": 1.7015, + "ppl": 6.6599, + "step": 2007 + }, + { + "epoch": 0.01, + "global_step": 2008, + "learning_rate": 0.0004924540901502505, + "loss": 1.872, + "loss_base2": 2.7007, + "loss_pixel": 0.1936, + "loss_text": 1.6784, + "ppl": 6.5013, + "step": 2008 + }, + { + "epoch": 0.01, + "global_step": 2009, + "learning_rate": 0.0004924499165275459, + "loss": 1.8783, + "loss_base2": 2.7098, + "loss_pixel": 0.194, + "loss_text": 1.6843, + "ppl": 6.5424, + "step": 2009 + }, + { + "epoch": 0.01, + "global_step": 2010, + "learning_rate": 0.0004924457429048414, + "loss": 1.8622, + "loss_base2": 2.6866, + "loss_pixel": 0.1933, + "loss_text": 1.6689, + "ppl": 6.4379, + "step": 2010 + }, + { + "epoch": 0.01, + "global_step": 2011, + "learning_rate": 0.0004924415692821369, + "loss": 1.8681, + "loss_base2": 2.6951, + "loss_pixel": 0.1925, + "loss_text": 1.6756, + "ppl": 6.476, + "step": 2011 + }, + { + "epoch": 0.01, + "global_step": 2012, + "learning_rate": 0.0004924373956594324, + "loss": 1.891, + "loss_base2": 2.7281, + "loss_pixel": 0.193, + "loss_text": 1.698, + "ppl": 6.626, + "step": 2012 + }, + { + "epoch": 0.01, + "global_step": 2013, + "learning_rate": 0.0004924332220367279, + "loss": 1.8704, + "loss_base2": 2.6984, + "loss_pixel": 0.1931, + "loss_text": 1.6772, + "ppl": 6.4909, + "step": 2013 + }, + { + "epoch": 0.01, + "global_step": 2014, + "learning_rate": 0.0004924290484140234, + "loss": 1.8679, + "loss_base2": 2.6948, + "loss_pixel": 0.1925, + "loss_text": 1.6754, + "ppl": 6.4747, + "step": 2014 + }, + { + "epoch": 0.01, + "global_step": 2015, + "learning_rate": 0.0004924248747913189, + "loss": 1.9045, + "loss_base2": 2.7476, + "loss_pixel": 0.1928, + "loss_text": 1.7117, + "ppl": 6.716, + "step": 2015 + }, + { + "epoch": 0.01, + "global_step": 2016, + "learning_rate": 0.0004924207011686144, + "loss": 1.8745, + "loss_base2": 2.7043, + "loss_pixel": 0.1933, + "loss_text": 1.6812, + "ppl": 6.5176, + "step": 2016 + }, + { + "epoch": 0.01, + "global_step": 2017, + "learning_rate": 0.0004924165275459099, + "loss": 1.8572, + "loss_base2": 2.6794, + "loss_pixel": 0.1933, + "loss_text": 1.664, + "ppl": 6.4058, + "step": 2017 + }, + { + "epoch": 0.01, + "global_step": 2018, + "learning_rate": 0.0004924123539232053, + "loss": 1.8728, + "loss_base2": 2.7019, + "loss_pixel": 0.1928, + "loss_text": 1.68, + "ppl": 6.5065, + "step": 2018 + }, + { + "epoch": 0.01, + "global_step": 2019, + "learning_rate": 0.0004924081803005008, + "loss": 1.8748, + "loss_base2": 2.7048, + "loss_pixel": 0.1938, + "loss_text": 1.681, + "ppl": 6.5195, + "step": 2019 + }, + { + "epoch": 0.01, + "global_step": 2020, + "learning_rate": 0.0004924040066777963, + "loss": 1.8879, + "loss_base2": 2.7237, + "loss_pixel": 0.1939, + "loss_text": 1.694, + "ppl": 6.6055, + "step": 2020 + }, + { + "epoch": 0.01, + "global_step": 2021, + "learning_rate": 0.0004923998330550918, + "loss": 1.8735, + "loss_base2": 2.7029, + "loss_pixel": 0.1992, + "loss_text": 1.6743, + "ppl": 6.511, + "step": 2021 + }, + { + "epoch": 0.01, + "global_step": 2022, + "learning_rate": 0.0004923956594323873, + "loss": 1.8668, + "loss_base2": 2.6932, + "loss_pixel": 0.1963, + "loss_text": 1.6705, + "ppl": 6.4676, + "step": 2022 + }, + { + "epoch": 0.01, + "global_step": 2023, + "learning_rate": 0.0004923914858096827, + "loss": 1.8747, + "loss_base2": 2.7046, + "loss_pixel": 0.1946, + "loss_text": 1.68, + "ppl": 6.5189, + "step": 2023 + }, + { + "epoch": 0.01, + "global_step": 2024, + "learning_rate": 0.0004923873121869783, + "loss": 1.8692, + "loss_base2": 2.6967, + "loss_pixel": 0.1931, + "loss_text": 1.6761, + "ppl": 6.4831, + "step": 2024 + }, + { + "epoch": 0.01, + "global_step": 2025, + "learning_rate": 0.0004923831385642738, + "loss": 1.8522, + "loss_base2": 2.6722, + "loss_pixel": 0.1958, + "loss_text": 1.6564, + "ppl": 6.3738, + "step": 2025 + }, + { + "epoch": 0.01, + "global_step": 2026, + "learning_rate": 0.0004923789649415693, + "loss": 1.8668, + "loss_base2": 2.6932, + "loss_pixel": 0.1938, + "loss_text": 1.673, + "ppl": 6.4676, + "step": 2026 + }, + { + "epoch": 0.01, + "global_step": 2027, + "learning_rate": 0.0004923747913188648, + "loss": 1.8613, + "loss_base2": 2.6853, + "loss_pixel": 0.1935, + "loss_text": 1.6678, + "ppl": 6.4321, + "step": 2027 + }, + { + "epoch": 0.01, + "global_step": 2028, + "learning_rate": 0.0004923706176961603, + "loss": 1.8629, + "loss_base2": 2.6876, + "loss_pixel": 0.1912, + "loss_text": 1.6717, + "ppl": 6.4424, + "step": 2028 + }, + { + "epoch": 0.01, + "global_step": 2029, + "learning_rate": 0.0004923664440734558, + "loss": 1.8568, + "loss_base2": 2.6788, + "loss_pixel": 0.1936, + "loss_text": 1.6632, + "ppl": 6.4032, + "step": 2029 + }, + { + "epoch": 0.01, + "global_step": 2030, + "learning_rate": 0.0004923622704507513, + "loss": 1.8652, + "loss_base2": 2.6909, + "loss_pixel": 0.1917, + "loss_text": 1.6734, + "ppl": 6.4572, + "step": 2030 + }, + { + "epoch": 0.01, + "global_step": 2031, + "learning_rate": 0.0004923580968280468, + "loss": 1.8661, + "loss_base2": 2.6922, + "loss_pixel": 0.1931, + "loss_text": 1.6729, + "ppl": 6.463, + "step": 2031 + }, + { + "epoch": 0.01, + "global_step": 2032, + "learning_rate": 0.0004923539232053422, + "loss": 1.8537, + "loss_base2": 2.6743, + "loss_pixel": 0.1933, + "loss_text": 1.6604, + "ppl": 6.3834, + "step": 2032 + }, + { + "epoch": 0.01, + "global_step": 2033, + "learning_rate": 0.0004923497495826377, + "loss": 1.8588, + "loss_base2": 2.6817, + "loss_pixel": 0.1923, + "loss_text": 1.6665, + "ppl": 6.416, + "step": 2033 + }, + { + "epoch": 0.01, + "global_step": 2034, + "learning_rate": 0.0004923455759599332, + "loss": 1.872, + "loss_base2": 2.7007, + "loss_pixel": 0.1927, + "loss_text": 1.6793, + "ppl": 6.5013, + "step": 2034 + }, + { + "epoch": 0.01, + "global_step": 2035, + "learning_rate": 0.0004923414023372287, + "loss": 1.8829, + "loss_base2": 2.7165, + "loss_pixel": 0.1939, + "loss_text": 1.6891, + "ppl": 6.5725, + "step": 2035 + }, + { + "epoch": 0.01, + "global_step": 2036, + "learning_rate": 0.0004923372287145242, + "loss": 1.8501, + "loss_base2": 2.6691, + "loss_pixel": 0.1909, + "loss_text": 1.6593, + "ppl": 6.3605, + "step": 2036 + }, + { + "epoch": 0.01, + "global_step": 2037, + "learning_rate": 0.0004923330550918197, + "loss": 1.8335, + "loss_base2": 2.6452, + "loss_pixel": 0.1924, + "loss_text": 1.6411, + "ppl": 6.2557, + "step": 2037 + }, + { + "epoch": 0.01, + "global_step": 2038, + "learning_rate": 0.0004923288814691152, + "loss": 1.8709, + "loss_base2": 2.6991, + "loss_pixel": 0.1942, + "loss_text": 1.6767, + "ppl": 6.4941, + "step": 2038 + }, + { + "epoch": 0.01, + "global_step": 2039, + "learning_rate": 0.0004923247078464108, + "loss": 1.8618, + "loss_base2": 2.686, + "loss_pixel": 0.197, + "loss_text": 1.6648, + "ppl": 6.4353, + "step": 2039 + }, + { + "epoch": 0.01, + "global_step": 2040, + "learning_rate": 0.0004923205342237062, + "loss": 1.8863, + "loss_base2": 2.7214, + "loss_pixel": 0.1996, + "loss_text": 1.6867, + "ppl": 6.5949, + "step": 2040 + }, + { + "epoch": 0.01, + "global_step": 2041, + "learning_rate": 0.0004923163606010017, + "loss": 1.8549, + "loss_base2": 2.6761, + "loss_pixel": 0.1982, + "loss_text": 1.6567, + "ppl": 6.3911, + "step": 2041 + }, + { + "epoch": 0.01, + "global_step": 2042, + "learning_rate": 0.0004923121869782972, + "loss": 1.8565, + "loss_base2": 2.6784, + "loss_pixel": 0.1965, + "loss_text": 1.66, + "ppl": 6.4013, + "step": 2042 + }, + { + "epoch": 0.01, + "global_step": 2043, + "learning_rate": 0.0004923080133555927, + "loss": 1.8638, + "loss_base2": 2.6889, + "loss_pixel": 0.1981, + "loss_text": 1.6657, + "ppl": 6.4482, + "step": 2043 + }, + { + "epoch": 0.01, + "global_step": 2044, + "learning_rate": 0.0004923038397328882, + "loss": 1.8762, + "loss_base2": 2.7068, + "loss_pixel": 0.1968, + "loss_text": 1.6794, + "ppl": 6.5286, + "step": 2044 + }, + { + "epoch": 0.01, + "global_step": 2045, + "learning_rate": 0.0004922996661101837, + "loss": 1.8619, + "loss_base2": 2.6862, + "loss_pixel": 0.1955, + "loss_text": 1.6664, + "ppl": 6.436, + "step": 2045 + }, + { + "epoch": 0.01, + "global_step": 2046, + "learning_rate": 0.0004922954924874791, + "loss": 1.8515, + "loss_base2": 2.6711, + "loss_pixel": 0.195, + "loss_text": 1.6565, + "ppl": 6.3694, + "step": 2046 + }, + { + "epoch": 0.01, + "global_step": 2047, + "learning_rate": 0.0004922913188647746, + "loss": 1.8772, + "loss_base2": 2.7082, + "loss_pixel": 0.1935, + "loss_text": 1.6837, + "ppl": 6.5352, + "step": 2047 + }, + { + "epoch": 0.01, + "global_step": 2048, + "learning_rate": 0.0004922871452420701, + "loss": 1.8812, + "loss_base2": 2.714, + "loss_pixel": 0.1943, + "loss_text": 1.6869, + "ppl": 6.5614, + "step": 2048 + }, + { + "epoch": 0.01, + "global_step": 2049, + "learning_rate": 0.0004922829716193656, + "loss": 1.8629, + "loss_base2": 2.6876, + "loss_pixel": 0.1956, + "loss_text": 1.6673, + "ppl": 6.4424, + "step": 2049 + }, + { + "epoch": 0.01, + "global_step": 2050, + "learning_rate": 0.0004922787979966611, + "loss": 1.8692, + "loss_base2": 2.6967, + "loss_pixel": 0.1953, + "loss_text": 1.6739, + "ppl": 6.4831, + "step": 2050 + }, + { + "epoch": 0.01, + "global_step": 2051, + "learning_rate": 0.0004922746243739566, + "loss": 1.8613, + "loss_base2": 2.6853, + "loss_pixel": 0.1949, + "loss_text": 1.6664, + "ppl": 6.4321, + "step": 2051 + }, + { + "epoch": 0.01, + "global_step": 2052, + "learning_rate": 0.0004922704507512521, + "loss": 1.8892, + "loss_base2": 2.7255, + "loss_pixel": 0.1939, + "loss_text": 1.6952, + "ppl": 6.6141, + "step": 2052 + }, + { + "epoch": 0.01, + "global_step": 2053, + "learning_rate": 0.0004922662771285476, + "loss": 1.8564, + "loss_base2": 2.6782, + "loss_pixel": 0.1975, + "loss_text": 1.6589, + "ppl": 6.4007, + "step": 2053 + }, + { + "epoch": 0.01, + "global_step": 2054, + "learning_rate": 0.0004922621035058431, + "loss": 1.8617, + "loss_base2": 2.6859, + "loss_pixel": 0.1935, + "loss_text": 1.6682, + "ppl": 6.4347, + "step": 2054 + }, + { + "epoch": 0.01, + "global_step": 2055, + "learning_rate": 0.0004922579298831385, + "loss": 1.8702, + "loss_base2": 2.6981, + "loss_pixel": 0.1953, + "loss_text": 1.6749, + "ppl": 6.4896, + "step": 2055 + }, + { + "epoch": 0.01, + "global_step": 2056, + "learning_rate": 0.0004922537562604341, + "loss": 1.8628, + "loss_base2": 2.6875, + "loss_pixel": 0.1943, + "loss_text": 1.6685, + "ppl": 6.4417, + "step": 2056 + }, + { + "epoch": 0.01, + "global_step": 2057, + "learning_rate": 0.0004922495826377296, + "loss": 1.8559, + "loss_base2": 2.6775, + "loss_pixel": 0.1946, + "loss_text": 1.6613, + "ppl": 6.3975, + "step": 2057 + }, + { + "epoch": 0.01, + "global_step": 2058, + "learning_rate": 0.0004922454090150251, + "loss": 1.8725, + "loss_base2": 2.7014, + "loss_pixel": 0.1941, + "loss_text": 1.6784, + "ppl": 6.5045, + "step": 2058 + }, + { + "epoch": 0.01, + "global_step": 2059, + "learning_rate": 0.0004922412353923205, + "loss": 1.871, + "loss_base2": 2.6993, + "loss_pixel": 0.1948, + "loss_text": 1.6762, + "ppl": 6.4948, + "step": 2059 + }, + { + "epoch": 0.01, + "global_step": 2060, + "learning_rate": 0.000492237061769616, + "loss": 1.8545, + "loss_base2": 2.6755, + "loss_pixel": 0.194, + "loss_text": 1.6605, + "ppl": 6.3885, + "step": 2060 + }, + { + "epoch": 0.01, + "global_step": 2061, + "learning_rate": 0.0004922328881469115, + "loss": 1.8585, + "loss_base2": 2.6812, + "loss_pixel": 0.1931, + "loss_text": 1.6654, + "ppl": 6.4141, + "step": 2061 + }, + { + "epoch": 0.01, + "global_step": 2062, + "learning_rate": 0.000492228714524207, + "loss": 1.8511, + "loss_base2": 2.6706, + "loss_pixel": 0.1944, + "loss_text": 1.6567, + "ppl": 6.3668, + "step": 2062 + }, + { + "epoch": 0.01, + "global_step": 2063, + "learning_rate": 0.0004922245409015025, + "loss": 1.8729, + "loss_base2": 2.702, + "loss_pixel": 0.1948, + "loss_text": 1.678, + "ppl": 6.5071, + "step": 2063 + }, + { + "epoch": 0.01, + "global_step": 2064, + "learning_rate": 0.000492220367278798, + "loss": 1.8798, + "loss_base2": 2.712, + "loss_pixel": 0.1946, + "loss_text": 1.6851, + "ppl": 6.5522, + "step": 2064 + }, + { + "epoch": 0.01, + "global_step": 2065, + "learning_rate": 0.0004922161936560935, + "loss": 1.8546, + "loss_base2": 2.6756, + "loss_pixel": 0.1933, + "loss_text": 1.6613, + "ppl": 6.3891, + "step": 2065 + }, + { + "epoch": 0.01, + "global_step": 2066, + "learning_rate": 0.000492212020033389, + "loss": 1.8577, + "loss_base2": 2.6801, + "loss_pixel": 0.1935, + "loss_text": 1.6642, + "ppl": 6.409, + "step": 2066 + }, + { + "epoch": 0.01, + "global_step": 2067, + "learning_rate": 0.0004922078464106845, + "loss": 1.8602, + "loss_base2": 2.6837, + "loss_pixel": 0.1927, + "loss_text": 1.6675, + "ppl": 6.425, + "step": 2067 + }, + { + "epoch": 0.01, + "global_step": 2068, + "learning_rate": 0.0004922036727879799, + "loss": 1.8454, + "loss_base2": 2.6623, + "loss_pixel": 0.1936, + "loss_text": 1.6518, + "ppl": 6.3306, + "step": 2068 + }, + { + "epoch": 0.01, + "global_step": 2069, + "learning_rate": 0.0004921994991652754, + "loss": 1.8664, + "loss_base2": 2.6926, + "loss_pixel": 0.1912, + "loss_text": 1.6753, + "ppl": 6.465, + "step": 2069 + }, + { + "epoch": 0.01, + "global_step": 2070, + "learning_rate": 0.0004921953255425709, + "loss": 1.8237, + "loss_base2": 2.631, + "loss_pixel": 0.1926, + "loss_text": 1.6311, + "ppl": 6.1947, + "step": 2070 + }, + { + "epoch": 0.01, + "global_step": 2071, + "learning_rate": 0.0004921911519198664, + "loss": 1.852, + "loss_base2": 2.6719, + "loss_pixel": 0.1936, + "loss_text": 1.6584, + "ppl": 6.3726, + "step": 2071 + }, + { + "epoch": 0.01, + "global_step": 2072, + "learning_rate": 0.000492186978297162, + "loss": 1.8647, + "loss_base2": 2.6902, + "loss_pixel": 0.1926, + "loss_text": 1.672, + "ppl": 6.454, + "step": 2072 + }, + { + "epoch": 0.01, + "global_step": 2073, + "learning_rate": 0.0004921828046744575, + "loss": 1.8659, + "loss_base2": 2.6919, + "loss_pixel": 0.1921, + "loss_text": 1.6738, + "ppl": 6.4617, + "step": 2073 + }, + { + "epoch": 0.01, + "global_step": 2074, + "learning_rate": 0.000492178631051753, + "loss": 1.8479, + "loss_base2": 2.666, + "loss_pixel": 0.192, + "loss_text": 1.6558, + "ppl": 6.3465, + "step": 2074 + }, + { + "epoch": 0.01, + "global_step": 2075, + "learning_rate": 0.0004921744574290485, + "loss": 1.8386, + "loss_base2": 2.6525, + "loss_pixel": 0.1932, + "loss_text": 1.6455, + "ppl": 6.2877, + "step": 2075 + }, + { + "epoch": 0.01, + "global_step": 2076, + "learning_rate": 0.000492170283806344, + "loss": 1.8562, + "loss_base2": 2.6779, + "loss_pixel": 0.192, + "loss_text": 1.6641, + "ppl": 6.3994, + "step": 2076 + }, + { + "epoch": 0.01, + "global_step": 2077, + "learning_rate": 0.0004921661101836394, + "loss": 1.8509, + "loss_base2": 2.6703, + "loss_pixel": 0.1925, + "loss_text": 1.6584, + "ppl": 6.3655, + "step": 2077 + }, + { + "epoch": 0.01, + "global_step": 2078, + "learning_rate": 0.0004921619365609349, + "loss": 1.8421, + "loss_base2": 2.6576, + "loss_pixel": 0.1925, + "loss_text": 1.6496, + "ppl": 6.3098, + "step": 2078 + }, + { + "epoch": 0.01, + "global_step": 2079, + "learning_rate": 0.0004921577629382304, + "loss": 1.8397, + "loss_base2": 2.6541, + "loss_pixel": 0.1938, + "loss_text": 1.646, + "ppl": 6.2946, + "step": 2079 + }, + { + "epoch": 0.01, + "global_step": 2080, + "learning_rate": 0.0004921535893155259, + "loss": 1.8602, + "loss_base2": 2.6837, + "loss_pixel": 0.1934, + "loss_text": 1.6668, + "ppl": 6.425, + "step": 2080 + }, + { + "epoch": 0.01, + "global_step": 2081, + "learning_rate": 0.0004921494156928214, + "loss": 1.8644, + "loss_base2": 2.6898, + "loss_pixel": 0.1921, + "loss_text": 1.6723, + "ppl": 6.4521, + "step": 2081 + }, + { + "epoch": 0.01, + "global_step": 2082, + "learning_rate": 0.0004921452420701168, + "loss": 1.8746, + "loss_base2": 2.7045, + "loss_pixel": 0.1931, + "loss_text": 1.6815, + "ppl": 6.5182, + "step": 2082 + }, + { + "epoch": 0.01, + "global_step": 2083, + "learning_rate": 0.0004921410684474123, + "loss": 1.8462, + "loss_base2": 2.6635, + "loss_pixel": 0.1924, + "loss_text": 1.6539, + "ppl": 6.3357, + "step": 2083 + }, + { + "epoch": 0.01, + "global_step": 2084, + "learning_rate": 0.0004921368948247078, + "loss": 1.8176, + "loss_base2": 2.6222, + "loss_pixel": 0.1917, + "loss_text": 1.6259, + "ppl": 6.1571, + "step": 2084 + }, + { + "epoch": 0.01, + "global_step": 2085, + "learning_rate": 0.0004921327212020033, + "loss": 1.8616, + "loss_base2": 2.6857, + "loss_pixel": 0.1922, + "loss_text": 1.6694, + "ppl": 6.434, + "step": 2085 + }, + { + "epoch": 0.01, + "global_step": 2086, + "learning_rate": 0.0004921285475792988, + "loss": 1.8569, + "loss_base2": 2.6789, + "loss_pixel": 0.1926, + "loss_text": 1.6643, + "ppl": 6.4039, + "step": 2086 + }, + { + "epoch": 0.01, + "global_step": 2087, + "learning_rate": 0.0004921243739565943, + "loss": 1.8658, + "loss_base2": 2.6918, + "loss_pixel": 0.193, + "loss_text": 1.6728, + "ppl": 6.4611, + "step": 2087 + }, + { + "epoch": 0.01, + "global_step": 2088, + "learning_rate": 0.0004921202003338899, + "loss": 1.8596, + "loss_base2": 2.6828, + "loss_pixel": 0.1934, + "loss_text": 1.6662, + "ppl": 6.4212, + "step": 2088 + }, + { + "epoch": 0.01, + "global_step": 2089, + "learning_rate": 0.0004921160267111854, + "loss": 1.8516, + "loss_base2": 2.6713, + "loss_pixel": 0.1939, + "loss_text": 1.6577, + "ppl": 6.37, + "step": 2089 + }, + { + "epoch": 0.01, + "global_step": 2090, + "learning_rate": 0.0004921118530884809, + "loss": 1.8607, + "loss_base2": 2.6844, + "loss_pixel": 0.1948, + "loss_text": 1.6659, + "ppl": 6.4282, + "step": 2090 + }, + { + "epoch": 0.01, + "global_step": 2091, + "learning_rate": 0.0004921076794657763, + "loss": 1.8755, + "loss_base2": 2.7058, + "loss_pixel": 0.1936, + "loss_text": 1.6819, + "ppl": 6.5241, + "step": 2091 + }, + { + "epoch": 0.01, + "global_step": 2092, + "learning_rate": 0.0004921035058430718, + "loss": 1.8764, + "loss_base2": 2.7071, + "loss_pixel": 0.1926, + "loss_text": 1.6838, + "ppl": 6.53, + "step": 2092 + }, + { + "epoch": 0.01, + "global_step": 2093, + "learning_rate": 0.0004920993322203673, + "loss": 1.8498, + "loss_base2": 2.6687, + "loss_pixel": 0.1924, + "loss_text": 1.6574, + "ppl": 6.3585, + "step": 2093 + }, + { + "epoch": 0.01, + "global_step": 2094, + "learning_rate": 0.0004920951585976628, + "loss": 1.8494, + "loss_base2": 2.6681, + "loss_pixel": 0.1927, + "loss_text": 1.6566, + "ppl": 6.356, + "step": 2094 + }, + { + "epoch": 0.01, + "global_step": 2095, + "learning_rate": 0.0004920909849749583, + "loss": 1.8399, + "loss_base2": 2.6544, + "loss_pixel": 0.1936, + "loss_text": 1.6464, + "ppl": 6.2959, + "step": 2095 + }, + { + "epoch": 0.01, + "global_step": 2096, + "learning_rate": 0.0004920868113522537, + "loss": 1.8534, + "loss_base2": 2.6739, + "loss_pixel": 0.1942, + "loss_text": 1.6592, + "ppl": 6.3815, + "step": 2096 + }, + { + "epoch": 0.01, + "global_step": 2097, + "learning_rate": 0.0004920826377295492, + "loss": 1.8409, + "loss_base2": 2.6559, + "loss_pixel": 0.1932, + "loss_text": 1.6477, + "ppl": 6.3022, + "step": 2097 + }, + { + "epoch": 0.01, + "global_step": 2098, + "learning_rate": 0.0004920784641068447, + "loss": 1.8453, + "loss_base2": 2.6622, + "loss_pixel": 0.1935, + "loss_text": 1.6518, + "ppl": 6.33, + "step": 2098 + }, + { + "epoch": 0.01, + "global_step": 2099, + "learning_rate": 0.0004920742904841402, + "loss": 1.8383, + "loss_base2": 2.6521, + "loss_pixel": 0.1922, + "loss_text": 1.6461, + "ppl": 6.2858, + "step": 2099 + }, + { + "epoch": 0.01, + "global_step": 2100, + "learning_rate": 0.0004920701168614357, + "loss": 1.8501, + "loss_base2": 2.6691, + "loss_pixel": 0.1923, + "loss_text": 1.6578, + "ppl": 6.3605, + "step": 2100 + }, + { + "epoch": 0.01, + "global_step": 2101, + "learning_rate": 0.0004920659432387312, + "loss": 1.845, + "loss_base2": 2.6618, + "loss_pixel": 0.1939, + "loss_text": 1.6511, + "ppl": 6.3281, + "step": 2101 + }, + { + "epoch": 0.01, + "global_step": 2102, + "learning_rate": 0.0004920617696160267, + "loss": 1.8454, + "loss_base2": 2.6623, + "loss_pixel": 0.1916, + "loss_text": 1.6537, + "ppl": 6.3306, + "step": 2102 + }, + { + "epoch": 0.01, + "global_step": 2103, + "learning_rate": 0.0004920575959933222, + "loss": 1.8396, + "loss_base2": 2.654, + "loss_pixel": 0.1916, + "loss_text": 1.648, + "ppl": 6.294, + "step": 2103 + }, + { + "epoch": 0.01, + "global_step": 2104, + "learning_rate": 0.0004920534223706178, + "loss": 1.8554, + "loss_base2": 2.6768, + "loss_pixel": 0.1934, + "loss_text": 1.662, + "ppl": 6.3943, + "step": 2104 + }, + { + "epoch": 0.01, + "global_step": 2105, + "learning_rate": 0.0004920492487479132, + "loss": 1.8689, + "loss_base2": 2.6963, + "loss_pixel": 0.203, + "loss_text": 1.6659, + "ppl": 6.4812, + "step": 2105 + }, + { + "epoch": 0.01, + "global_step": 2106, + "learning_rate": 0.0004920450751252087, + "loss": 1.8641, + "loss_base2": 2.6893, + "loss_pixel": 0.2008, + "loss_text": 1.6633, + "ppl": 6.4501, + "step": 2106 + }, + { + "epoch": 0.01, + "global_step": 2107, + "learning_rate": 0.0004920409015025042, + "loss": 1.8542, + "loss_base2": 2.675, + "loss_pixel": 0.1973, + "loss_text": 1.6569, + "ppl": 6.3866, + "step": 2107 + }, + { + "epoch": 0.01, + "global_step": 2108, + "learning_rate": 0.0004920367278797997, + "loss": 1.8543, + "loss_base2": 2.6752, + "loss_pixel": 0.1921, + "loss_text": 1.6621, + "ppl": 6.3872, + "step": 2108 + }, + { + "epoch": 0.01, + "global_step": 2109, + "learning_rate": 0.0004920325542570952, + "loss": 1.8643, + "loss_base2": 2.6896, + "loss_pixel": 0.193, + "loss_text": 1.6713, + "ppl": 6.4514, + "step": 2109 + }, + { + "epoch": 0.01, + "global_step": 2110, + "learning_rate": 0.0004920283806343907, + "loss": 1.8638, + "loss_base2": 2.6889, + "loss_pixel": 0.1918, + "loss_text": 1.672, + "ppl": 6.4482, + "step": 2110 + }, + { + "epoch": 0.01, + "global_step": 2111, + "learning_rate": 0.0004920242070116862, + "loss": 1.8593, + "loss_base2": 2.6824, + "loss_pixel": 0.1931, + "loss_text": 1.6662, + "ppl": 6.4192, + "step": 2111 + }, + { + "epoch": 0.01, + "global_step": 2112, + "learning_rate": 0.0004920200333889817, + "loss": 1.8726, + "loss_base2": 2.7016, + "loss_pixel": 0.1916, + "loss_text": 1.6811, + "ppl": 6.5052, + "step": 2112 + }, + { + "epoch": 0.01, + "global_step": 2113, + "learning_rate": 0.0004920158597662772, + "loss": 1.8186, + "loss_base2": 2.6237, + "loss_pixel": 0.1929, + "loss_text": 1.6257, + "ppl": 6.1632, + "step": 2113 + }, + { + "epoch": 0.01, + "global_step": 2114, + "learning_rate": 0.0004920116861435726, + "loss": 1.8752, + "loss_base2": 2.7053, + "loss_pixel": 0.193, + "loss_text": 1.6822, + "ppl": 6.5221, + "step": 2114 + }, + { + "epoch": 0.01, + "global_step": 2115, + "learning_rate": 0.0004920075125208681, + "loss": 1.8436, + "loss_base2": 2.6598, + "loss_pixel": 0.1916, + "loss_text": 1.652, + "ppl": 6.3192, + "step": 2115 + }, + { + "epoch": 0.01, + "global_step": 2116, + "learning_rate": 0.0004920033388981636, + "loss": 1.8539, + "loss_base2": 2.6746, + "loss_pixel": 0.1921, + "loss_text": 1.6618, + "ppl": 6.3847, + "step": 2116 + }, + { + "epoch": 0.01, + "global_step": 2117, + "learning_rate": 0.0004919991652754591, + "loss": 1.8563, + "loss_base2": 2.6781, + "loss_pixel": 0.1929, + "loss_text": 1.6634, + "ppl": 6.4, + "step": 2117 + }, + { + "epoch": 0.01, + "global_step": 2118, + "learning_rate": 0.0004919949916527545, + "loss": 1.8187, + "loss_base2": 2.6238, + "loss_pixel": 0.1922, + "loss_text": 1.6265, + "ppl": 6.1638, + "step": 2118 + }, + { + "epoch": 0.01, + "global_step": 2119, + "learning_rate": 0.00049199081803005, + "loss": 1.8548, + "loss_base2": 2.6759, + "loss_pixel": 0.192, + "loss_text": 1.6627, + "ppl": 6.3904, + "step": 2119 + }, + { + "epoch": 0.01, + "global_step": 2120, + "learning_rate": 0.0004919866444073455, + "loss": 1.828, + "loss_base2": 2.6372, + "loss_pixel": 0.1922, + "loss_text": 1.6359, + "ppl": 6.2214, + "step": 2120 + }, + { + "epoch": 0.01, + "global_step": 2121, + "learning_rate": 0.0004919824707846411, + "loss": 1.8441, + "loss_base2": 2.6605, + "loss_pixel": 0.1917, + "loss_text": 1.6525, + "ppl": 6.3224, + "step": 2121 + }, + { + "epoch": 0.01, + "global_step": 2122, + "learning_rate": 0.0004919782971619366, + "loss": 1.8506, + "loss_base2": 2.6699, + "loss_pixel": 0.1923, + "loss_text": 1.6583, + "ppl": 6.3636, + "step": 2122 + }, + { + "epoch": 0.01, + "global_step": 2123, + "learning_rate": 0.0004919741235392321, + "loss": 1.8428, + "loss_base2": 2.6586, + "loss_pixel": 0.1909, + "loss_text": 1.6519, + "ppl": 6.3142, + "step": 2123 + }, + { + "epoch": 0.01, + "global_step": 2124, + "learning_rate": 0.0004919699499165276, + "loss": 1.8447, + "loss_base2": 2.6613, + "loss_pixel": 0.1919, + "loss_text": 1.6528, + "ppl": 6.3262, + "step": 2124 + }, + { + "epoch": 0.01, + "global_step": 2125, + "learning_rate": 0.0004919657762938231, + "loss": 1.8705, + "loss_base2": 2.6986, + "loss_pixel": 0.1923, + "loss_text": 1.6782, + "ppl": 6.4915, + "step": 2125 + }, + { + "epoch": 0.01, + "global_step": 2126, + "learning_rate": 0.0004919616026711186, + "loss": 1.865, + "loss_base2": 2.6906, + "loss_pixel": 0.1911, + "loss_text": 1.6738, + "ppl": 6.4559, + "step": 2126 + }, + { + "epoch": 0.01, + "global_step": 2127, + "learning_rate": 0.000491957429048414, + "loss": 1.8656, + "loss_base2": 2.6915, + "loss_pixel": 0.1927, + "loss_text": 1.6729, + "ppl": 6.4598, + "step": 2127 + }, + { + "epoch": 0.01, + "global_step": 2128, + "learning_rate": 0.0004919532554257095, + "loss": 1.8311, + "loss_base2": 2.6417, + "loss_pixel": 0.1917, + "loss_text": 1.6394, + "ppl": 6.2407, + "step": 2128 + }, + { + "epoch": 0.01, + "global_step": 2129, + "learning_rate": 0.000491949081803005, + "loss": 1.8539, + "loss_base2": 2.6746, + "loss_pixel": 0.1921, + "loss_text": 1.6618, + "ppl": 6.3847, + "step": 2129 + }, + { + "epoch": 0.01, + "global_step": 2130, + "learning_rate": 0.0004919449081803005, + "loss": 1.8318, + "loss_base2": 2.6427, + "loss_pixel": 0.192, + "loss_text": 1.6398, + "ppl": 6.2451, + "step": 2130 + }, + { + "epoch": 0.01, + "global_step": 2131, + "learning_rate": 0.000491940734557596, + "loss": 1.8483, + "loss_base2": 2.6665, + "loss_pixel": 0.1912, + "loss_text": 1.6572, + "ppl": 6.349, + "step": 2131 + }, + { + "epoch": 0.01, + "global_step": 2132, + "learning_rate": 0.0004919365609348915, + "loss": 1.8393, + "loss_base2": 2.6535, + "loss_pixel": 0.1909, + "loss_text": 1.6483, + "ppl": 6.2921, + "step": 2132 + }, + { + "epoch": 0.01, + "global_step": 2133, + "learning_rate": 0.0004919323873121869, + "loss": 1.8582, + "loss_base2": 2.6808, + "loss_pixel": 0.1915, + "loss_text": 1.6667, + "ppl": 6.4122, + "step": 2133 + }, + { + "epoch": 0.01, + "global_step": 2134, + "learning_rate": 0.0004919282136894824, + "loss": 1.8654, + "loss_base2": 2.6912, + "loss_pixel": 0.1912, + "loss_text": 1.6742, + "ppl": 6.4585, + "step": 2134 + }, + { + "epoch": 0.01, + "global_step": 2135, + "learning_rate": 0.0004919240400667779, + "loss": 1.8567, + "loss_base2": 2.6787, + "loss_pixel": 0.1937, + "loss_text": 1.663, + "ppl": 6.4026, + "step": 2135 + }, + { + "epoch": 0.01, + "global_step": 2136, + "learning_rate": 0.0004919198664440734, + "loss": 1.8493, + "loss_base2": 2.668, + "loss_pixel": 0.1912, + "loss_text": 1.658, + "ppl": 6.3554, + "step": 2136 + }, + { + "epoch": 0.01, + "global_step": 2137, + "learning_rate": 0.000491915692821369, + "loss": 1.8408, + "loss_base2": 2.6557, + "loss_pixel": 0.1907, + "loss_text": 1.6502, + "ppl": 6.3016, + "step": 2137 + }, + { + "epoch": 0.01, + "global_step": 2138, + "learning_rate": 0.0004919115191986645, + "loss": 1.8627, + "loss_base2": 2.6873, + "loss_pixel": 0.1908, + "loss_text": 1.6718, + "ppl": 6.4411, + "step": 2138 + }, + { + "epoch": 0.01, + "global_step": 2139, + "learning_rate": 0.00049190734557596, + "loss": 1.8454, + "loss_base2": 2.6623, + "loss_pixel": 0.1913, + "loss_text": 1.6541, + "ppl": 6.3306, + "step": 2139 + }, + { + "epoch": 0.01, + "global_step": 2140, + "learning_rate": 0.0004919031719532555, + "loss": 1.866, + "loss_base2": 2.6921, + "loss_pixel": 0.1922, + "loss_text": 1.6738, + "ppl": 6.4624, + "step": 2140 + }, + { + "epoch": 0.01, + "global_step": 2141, + "learning_rate": 0.0004918989983305509, + "loss": 1.8244, + "loss_base2": 2.6321, + "loss_pixel": 0.1902, + "loss_text": 1.6342, + "ppl": 6.1991, + "step": 2141 + }, + { + "epoch": 0.01, + "global_step": 2142, + "learning_rate": 0.0004918948247078464, + "loss": 1.82, + "loss_base2": 2.6257, + "loss_pixel": 0.1911, + "loss_text": 1.6288, + "ppl": 6.1719, + "step": 2142 + }, + { + "epoch": 0.01, + "global_step": 2143, + "learning_rate": 0.0004918906510851419, + "loss": 1.8493, + "loss_base2": 2.668, + "loss_pixel": 0.1896, + "loss_text": 1.6597, + "ppl": 6.3554, + "step": 2143 + }, + { + "epoch": 0.01, + "global_step": 2144, + "learning_rate": 0.0004918864774624374, + "loss": 1.8474, + "loss_base2": 2.6652, + "loss_pixel": 0.191, + "loss_text": 1.6564, + "ppl": 6.3433, + "step": 2144 + }, + { + "epoch": 0.01, + "global_step": 2145, + "learning_rate": 0.0004918823038397329, + "loss": 1.8594, + "loss_base2": 2.6825, + "loss_pixel": 0.1909, + "loss_text": 1.6685, + "ppl": 6.4199, + "step": 2145 + }, + { + "epoch": 0.01, + "global_step": 2146, + "learning_rate": 0.0004918781302170284, + "loss": 1.8376, + "loss_base2": 2.6511, + "loss_pixel": 0.1905, + "loss_text": 1.6472, + "ppl": 6.2814, + "step": 2146 + }, + { + "epoch": 0.01, + "global_step": 2147, + "learning_rate": 0.0004918739565943239, + "loss": 1.8497, + "loss_base2": 2.6686, + "loss_pixel": 0.1926, + "loss_text": 1.6571, + "ppl": 6.3579, + "step": 2147 + }, + { + "epoch": 0.01, + "global_step": 2148, + "learning_rate": 0.0004918697829716194, + "loss": 1.8494, + "loss_base2": 2.6681, + "loss_pixel": 0.191, + "loss_text": 1.6584, + "ppl": 6.356, + "step": 2148 + }, + { + "epoch": 0.01, + "global_step": 2149, + "learning_rate": 0.0004918656093489149, + "loss": 1.6507, + "loss_base2": 2.3815, + "loss_pixel": 0.191, + "loss_text": 1.4598, + "ppl": 5.2106, + "step": 2149 + }, + { + "epoch": 0.01, + "global_step": 2150, + "learning_rate": 0.0004918614357262103, + "loss": 1.6326, + "loss_base2": 2.3553, + "loss_pixel": 0.1907, + "loss_text": 1.4418, + "ppl": 5.1172, + "step": 2150 + }, + { + "epoch": 0.01, + "global_step": 2151, + "learning_rate": 0.0004918572621035058, + "loss": 1.6653, + "loss_base2": 2.4025, + "loss_pixel": 0.1915, + "loss_text": 1.4738, + "ppl": 5.2873, + "step": 2151 + }, + { + "epoch": 0.01, + "global_step": 2152, + "learning_rate": 0.0004918530884808013, + "loss": 1.6536, + "loss_base2": 2.3856, + "loss_pixel": 0.1932, + "loss_text": 1.4604, + "ppl": 5.2258, + "step": 2152 + }, + { + "epoch": 0.01, + "global_step": 2153, + "learning_rate": 0.0004918489148580969, + "loss": 1.6839, + "loss_base2": 2.4294, + "loss_pixel": 0.1909, + "loss_text": 1.493, + "ppl": 5.3865, + "step": 2153 + }, + { + "epoch": 0.01, + "global_step": 2154, + "learning_rate": 0.0004918447412353924, + "loss": 1.6655, + "loss_base2": 2.4028, + "loss_pixel": 0.1925, + "loss_text": 1.473, + "ppl": 5.2883, + "step": 2154 + }, + { + "epoch": 0.01, + "global_step": 2155, + "learning_rate": 0.0004918405676126878, + "loss": 1.6687, + "loss_base2": 2.4074, + "loss_pixel": 0.1922, + "loss_text": 1.4765, + "ppl": 5.3053, + "step": 2155 + }, + { + "epoch": 0.01, + "global_step": 2156, + "learning_rate": 0.0004918363939899833, + "loss": 1.6606, + "loss_base2": 2.3957, + "loss_pixel": 0.1906, + "loss_text": 1.47, + "ppl": 5.2625, + "step": 2156 + }, + { + "epoch": 0.01, + "global_step": 2157, + "learning_rate": 0.0004918322203672788, + "loss": 1.6603, + "loss_base2": 2.3953, + "loss_pixel": 0.1926, + "loss_text": 1.4677, + "ppl": 5.2609, + "step": 2157 + }, + { + "epoch": 0.01, + "global_step": 2158, + "learning_rate": 0.0004918280467445743, + "loss": 1.6738, + "loss_base2": 2.4148, + "loss_pixel": 0.1912, + "loss_text": 1.4826, + "ppl": 5.3324, + "step": 2158 + }, + { + "epoch": 0.01, + "global_step": 2159, + "learning_rate": 0.0004918238731218698, + "loss": 1.6655, + "loss_base2": 2.4028, + "loss_pixel": 0.1929, + "loss_text": 1.4726, + "ppl": 5.2883, + "step": 2159 + }, + { + "epoch": 0.01, + "global_step": 2160, + "learning_rate": 0.0004918196994991653, + "loss": 1.6633, + "loss_base2": 2.3996, + "loss_pixel": 0.1964, + "loss_text": 1.467, + "ppl": 5.2767, + "step": 2160 + }, + { + "epoch": 0.01, + "global_step": 2161, + "learning_rate": 0.0004918155258764608, + "loss": 1.6565, + "loss_base2": 2.3898, + "loss_pixel": 0.1949, + "loss_text": 1.4616, + "ppl": 5.2409, + "step": 2161 + }, + { + "epoch": 0.01, + "global_step": 2162, + "learning_rate": 0.0004918113522537563, + "loss": 1.675, + "loss_base2": 2.4165, + "loss_pixel": 0.1954, + "loss_text": 1.4796, + "ppl": 5.3388, + "step": 2162 + }, + { + "epoch": 0.01, + "global_step": 2163, + "learning_rate": 0.0004918071786310518, + "loss": 1.6344, + "loss_base2": 2.3579, + "loss_pixel": 0.1933, + "loss_text": 1.441, + "ppl": 5.1264, + "step": 2163 + }, + { + "epoch": 0.01, + "global_step": 2164, + "learning_rate": 0.0004918030050083472, + "loss": 1.8056, + "loss_base2": 2.6049, + "loss_pixel": 0.1942, + "loss_text": 1.6114, + "ppl": 6.0836, + "step": 2164 + }, + { + "epoch": 0.01, + "global_step": 2165, + "learning_rate": 0.0004917988313856427, + "loss": 1.8908, + "loss_base2": 2.7278, + "loss_pixel": 0.1938, + "loss_text": 1.697, + "ppl": 6.6247, + "step": 2165 + }, + { + "epoch": 0.01, + "global_step": 2166, + "learning_rate": 0.0004917946577629382, + "loss": 1.8738, + "loss_base2": 2.7033, + "loss_pixel": 0.1923, + "loss_text": 1.6815, + "ppl": 6.513, + "step": 2166 + }, + { + "epoch": 0.01, + "global_step": 2167, + "learning_rate": 0.0004917904841402337, + "loss": 1.8827, + "loss_base2": 2.7162, + "loss_pixel": 0.1944, + "loss_text": 1.6883, + "ppl": 6.5712, + "step": 2167 + }, + { + "epoch": 0.01, + "global_step": 2168, + "learning_rate": 0.0004917863105175292, + "loss": 1.8859, + "loss_base2": 2.7208, + "loss_pixel": 0.193, + "loss_text": 1.6929, + "ppl": 6.5923, + "step": 2168 + }, + { + "epoch": 0.01, + "global_step": 2169, + "learning_rate": 0.0004917821368948248, + "loss": 1.8759, + "loss_base2": 2.7064, + "loss_pixel": 0.1922, + "loss_text": 1.6837, + "ppl": 6.5267, + "step": 2169 + }, + { + "epoch": 0.01, + "global_step": 2170, + "learning_rate": 0.0004917779632721203, + "loss": 1.8864, + "loss_base2": 2.7215, + "loss_pixel": 0.1919, + "loss_text": 1.6945, + "ppl": 6.5956, + "step": 2170 + }, + { + "epoch": 0.01, + "global_step": 2171, + "learning_rate": 0.0004917737896494157, + "loss": 1.8781, + "loss_base2": 2.7095, + "loss_pixel": 0.1927, + "loss_text": 1.6854, + "ppl": 6.5411, + "step": 2171 + }, + { + "epoch": 0.01, + "global_step": 2172, + "learning_rate": 0.0004917696160267112, + "loss": 1.8748, + "loss_base2": 2.7048, + "loss_pixel": 0.1963, + "loss_text": 1.6785, + "ppl": 6.5195, + "step": 2172 + }, + { + "epoch": 0.01, + "global_step": 2173, + "learning_rate": 0.0004917654424040067, + "loss": 1.8902, + "loss_base2": 2.727, + "loss_pixel": 0.2009, + "loss_text": 1.6893, + "ppl": 6.6207, + "step": 2173 + }, + { + "epoch": 0.01, + "global_step": 2174, + "learning_rate": 0.0004917612687813022, + "loss": 1.8719, + "loss_base2": 2.7006, + "loss_pixel": 0.2011, + "loss_text": 1.6708, + "ppl": 6.5006, + "step": 2174 + }, + { + "epoch": 0.01, + "global_step": 2175, + "learning_rate": 0.0004917570951585977, + "loss": 1.8838, + "loss_base2": 2.7177, + "loss_pixel": 0.2003, + "loss_text": 1.6835, + "ppl": 6.5785, + "step": 2175 + }, + { + "epoch": 0.01, + "global_step": 2176, + "learning_rate": 0.0004917529215358932, + "loss": 1.8761, + "loss_base2": 2.7066, + "loss_pixel": 0.1997, + "loss_text": 1.6765, + "ppl": 6.528, + "step": 2176 + }, + { + "epoch": 0.01, + "global_step": 2177, + "learning_rate": 0.0004917487479131886, + "loss": 1.8872, + "loss_base2": 2.7227, + "loss_pixel": 0.1997, + "loss_text": 1.6875, + "ppl": 6.6009, + "step": 2177 + }, + { + "epoch": 0.01, + "global_step": 2178, + "learning_rate": 0.0004917445742904841, + "loss": 1.8871, + "loss_base2": 2.7225, + "loss_pixel": 0.2005, + "loss_text": 1.6866, + "ppl": 6.6002, + "step": 2178 + }, + { + "epoch": 0.01, + "global_step": 2179, + "learning_rate": 0.0004917404006677796, + "loss": 1.8652, + "loss_base2": 2.6909, + "loss_pixel": 0.2019, + "loss_text": 1.6633, + "ppl": 6.4572, + "step": 2179 + }, + { + "epoch": 0.01, + "global_step": 2180, + "learning_rate": 0.0004917362270450751, + "loss": 1.864, + "loss_base2": 2.6892, + "loss_pixel": 0.1979, + "loss_text": 1.6662, + "ppl": 6.4495, + "step": 2180 + }, + { + "epoch": 0.01, + "global_step": 2181, + "learning_rate": 0.0004917320534223706, + "loss": 1.8702, + "loss_base2": 2.6981, + "loss_pixel": 0.196, + "loss_text": 1.6742, + "ppl": 6.4896, + "step": 2181 + }, + { + "epoch": 0.01, + "global_step": 2182, + "learning_rate": 0.0004917278797996661, + "loss": 1.8441, + "loss_base2": 2.6605, + "loss_pixel": 0.1983, + "loss_text": 1.6458, + "ppl": 6.3224, + "step": 2182 + }, + { + "epoch": 0.01, + "global_step": 2183, + "learning_rate": 0.0004917237061769616, + "loss": 1.8528, + "loss_base2": 2.673, + "loss_pixel": 0.1954, + "loss_text": 1.6573, + "ppl": 6.3777, + "step": 2183 + }, + { + "epoch": 0.01, + "global_step": 2184, + "learning_rate": 0.0004917195325542571, + "loss": 1.8599, + "loss_base2": 2.6833, + "loss_pixel": 0.1947, + "loss_text": 1.6651, + "ppl": 6.4231, + "step": 2184 + }, + { + "epoch": 0.01, + "global_step": 2185, + "learning_rate": 0.0004917153589315527, + "loss": 1.8611, + "loss_base2": 2.685, + "loss_pixel": 0.1951, + "loss_text": 1.666, + "ppl": 6.4308, + "step": 2185 + }, + { + "epoch": 0.01, + "global_step": 2186, + "learning_rate": 0.0004917111853088481, + "loss": 1.6943, + "loss_base2": 2.4444, + "loss_pixel": 0.1954, + "loss_text": 1.4989, + "ppl": 5.4428, + "step": 2186 + }, + { + "epoch": 0.01, + "global_step": 2187, + "learning_rate": 0.0004917070116861436, + "loss": 1.6456, + "loss_base2": 2.3741, + "loss_pixel": 0.1954, + "loss_text": 1.4502, + "ppl": 5.1841, + "step": 2187 + }, + { + "epoch": 0.01, + "global_step": 2188, + "learning_rate": 0.0004917028380634391, + "loss": 1.6421, + "loss_base2": 2.369, + "loss_pixel": 0.1944, + "loss_text": 1.4477, + "ppl": 5.166, + "step": 2188 + }, + { + "epoch": 0.01, + "global_step": 2189, + "learning_rate": 0.0004916986644407346, + "loss": 1.6463, + "loss_base2": 2.3751, + "loss_pixel": 0.1931, + "loss_text": 1.4532, + "ppl": 5.1877, + "step": 2189 + }, + { + "epoch": 0.01, + "global_step": 2190, + "learning_rate": 0.0004916944908180301, + "loss": 1.6115, + "loss_base2": 2.3249, + "loss_pixel": 0.1939, + "loss_text": 1.4176, + "ppl": 5.0103, + "step": 2190 + }, + { + "epoch": 0.01, + "global_step": 2191, + "learning_rate": 0.0004916903171953255, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.1961, + "loss_text": 1.4368, + "ppl": 5.1187, + "step": 2191 + }, + { + "epoch": 0.01, + "global_step": 2192, + "learning_rate": 0.000491686143572621, + "loss": 1.6316, + "loss_base2": 2.3539, + "loss_pixel": 0.1976, + "loss_text": 1.434, + "ppl": 5.112, + "step": 2192 + }, + { + "epoch": 0.01, + "global_step": 2193, + "learning_rate": 0.0004916819699499165, + "loss": 1.6219, + "loss_base2": 2.3399, + "loss_pixel": 0.2002, + "loss_text": 1.4216, + "ppl": 5.0627, + "step": 2193 + }, + { + "epoch": 0.01, + "global_step": 2194, + "learning_rate": 0.000491677796327212, + "loss": 1.6241, + "loss_base2": 2.3431, + "loss_pixel": 0.2012, + "loss_text": 1.4229, + "ppl": 5.0739, + "step": 2194 + }, + { + "epoch": 0.01, + "global_step": 2195, + "learning_rate": 0.0004916736227045075, + "loss": 1.6542, + "loss_base2": 2.3865, + "loss_pixel": 0.2038, + "loss_text": 1.4503, + "ppl": 5.2289, + "step": 2195 + }, + { + "epoch": 0.01, + "global_step": 2196, + "learning_rate": 0.000491669449081803, + "loss": 1.6246, + "loss_base2": 2.3438, + "loss_pixel": 0.201, + "loss_text": 1.4235, + "ppl": 5.0764, + "step": 2196 + }, + { + "epoch": 0.01, + "global_step": 2197, + "learning_rate": 0.0004916652754590985, + "loss": 1.6271, + "loss_base2": 2.3474, + "loss_pixel": 0.203, + "loss_text": 1.4242, + "ppl": 5.0891, + "step": 2197 + }, + { + "epoch": 0.01, + "global_step": 2198, + "learning_rate": 0.000491661101836394, + "loss": 1.6121, + "loss_base2": 2.3258, + "loss_pixel": 0.1996, + "loss_text": 1.4125, + "ppl": 5.0133, + "step": 2198 + }, + { + "epoch": 0.01, + "global_step": 2199, + "learning_rate": 0.0004916569282136895, + "loss": 1.6352, + "loss_base2": 2.3591, + "loss_pixel": 0.1975, + "loss_text": 1.4377, + "ppl": 5.1305, + "step": 2199 + }, + { + "epoch": 0.01, + "global_step": 2200, + "learning_rate": 0.0004916527545909849, + "loss": 1.6077, + "loss_base2": 2.3194, + "loss_pixel": 0.1965, + "loss_text": 1.4112, + "ppl": 4.9913, + "step": 2200 + }, + { + "epoch": 0.01, + "global_step": 2201, + "learning_rate": 0.0004916485809682804, + "loss": 1.6294, + "loss_base2": 2.3507, + "loss_pixel": 0.1969, + "loss_text": 1.4325, + "ppl": 5.1008, + "step": 2201 + }, + { + "epoch": 0.01, + "global_step": 2202, + "learning_rate": 0.000491644407345576, + "loss": 1.8823, + "loss_base2": 2.7156, + "loss_pixel": 0.1956, + "loss_text": 1.6867, + "ppl": 6.5686, + "step": 2202 + }, + { + "epoch": 0.01, + "global_step": 2203, + "learning_rate": 0.0004916402337228715, + "loss": 1.8828, + "loss_base2": 2.7163, + "loss_pixel": 0.1978, + "loss_text": 1.6849, + "ppl": 6.5719, + "step": 2203 + }, + { + "epoch": 0.01, + "global_step": 2204, + "learning_rate": 0.000491636060100167, + "loss": 1.8885, + "loss_base2": 2.7245, + "loss_pixel": 0.1949, + "loss_text": 1.6936, + "ppl": 6.6094, + "step": 2204 + }, + { + "epoch": 0.01, + "global_step": 2205, + "learning_rate": 0.0004916318864774625, + "loss": 1.8495, + "loss_base2": 2.6683, + "loss_pixel": 0.1936, + "loss_text": 1.6559, + "ppl": 6.3566, + "step": 2205 + }, + { + "epoch": 0.01, + "global_step": 2206, + "learning_rate": 0.000491627712854758, + "loss": 1.8669, + "loss_base2": 2.6934, + "loss_pixel": 0.1942, + "loss_text": 1.6727, + "ppl": 6.4682, + "step": 2206 + }, + { + "epoch": 0.01, + "global_step": 2207, + "learning_rate": 0.0004916235392320535, + "loss": 1.8657, + "loss_base2": 2.6916, + "loss_pixel": 0.1931, + "loss_text": 1.6726, + "ppl": 6.4605, + "step": 2207 + }, + { + "epoch": 0.01, + "global_step": 2208, + "learning_rate": 0.000491619365609349, + "loss": 1.8663, + "loss_base2": 2.6925, + "loss_pixel": 0.1935, + "loss_text": 1.6727, + "ppl": 6.4643, + "step": 2208 + }, + { + "epoch": 0.01, + "global_step": 2209, + "learning_rate": 0.0004916151919866444, + "loss": 1.8712, + "loss_base2": 2.6996, + "loss_pixel": 0.1929, + "loss_text": 1.6783, + "ppl": 6.4961, + "step": 2209 + }, + { + "epoch": 0.01, + "global_step": 2210, + "learning_rate": 0.0004916110183639399, + "loss": 1.8756, + "loss_base2": 2.7059, + "loss_pixel": 0.1938, + "loss_text": 1.6817, + "ppl": 6.5247, + "step": 2210 + }, + { + "epoch": 0.01, + "global_step": 2211, + "learning_rate": 0.0004916068447412354, + "loss": 1.8424, + "loss_base2": 2.658, + "loss_pixel": 0.195, + "loss_text": 1.6475, + "ppl": 6.3117, + "step": 2211 + }, + { + "epoch": 0.01, + "global_step": 2212, + "learning_rate": 0.0004916026711185309, + "loss": 1.864, + "loss_base2": 2.6892, + "loss_pixel": 0.1926, + "loss_text": 1.6714, + "ppl": 6.4495, + "step": 2212 + }, + { + "epoch": 0.01, + "global_step": 2213, + "learning_rate": 0.0004915984974958264, + "loss": 1.8624, + "loss_base2": 2.6869, + "loss_pixel": 0.1921, + "loss_text": 1.6703, + "ppl": 6.4392, + "step": 2213 + }, + { + "epoch": 0.01, + "global_step": 2214, + "learning_rate": 0.0004915943238731218, + "loss": 1.831, + "loss_base2": 2.6416, + "loss_pixel": 0.1925, + "loss_text": 1.6385, + "ppl": 6.2401, + "step": 2214 + }, + { + "epoch": 0.01, + "global_step": 2215, + "learning_rate": 0.0004915901502504173, + "loss": 1.8472, + "loss_base2": 2.6649, + "loss_pixel": 0.1923, + "loss_text": 1.6549, + "ppl": 6.342, + "step": 2215 + }, + { + "epoch": 0.01, + "global_step": 2216, + "learning_rate": 0.0004915859766277128, + "loss": 1.8568, + "loss_base2": 2.6788, + "loss_pixel": 0.193, + "loss_text": 1.6638, + "ppl": 6.4032, + "step": 2216 + }, + { + "epoch": 0.01, + "global_step": 2217, + "learning_rate": 0.0004915818030050083, + "loss": 1.856, + "loss_base2": 2.6776, + "loss_pixel": 0.1923, + "loss_text": 1.6637, + "ppl": 6.3981, + "step": 2217 + }, + { + "epoch": 0.01, + "global_step": 2218, + "learning_rate": 0.0004915776293823039, + "loss": 1.8505, + "loss_base2": 2.6697, + "loss_pixel": 0.1902, + "loss_text": 1.6603, + "ppl": 6.363, + "step": 2218 + }, + { + "epoch": 0.01, + "global_step": 2219, + "learning_rate": 0.0004915734557595994, + "loss": 1.8623, + "loss_base2": 2.6867, + "loss_pixel": 0.1915, + "loss_text": 1.6708, + "ppl": 6.4385, + "step": 2219 + }, + { + "epoch": 0.01, + "global_step": 2220, + "learning_rate": 0.0004915692821368949, + "loss": 1.8576, + "loss_base2": 2.68, + "loss_pixel": 0.1918, + "loss_text": 1.6658, + "ppl": 6.4083, + "step": 2220 + }, + { + "epoch": 0.01, + "global_step": 2221, + "learning_rate": 0.0004915651085141904, + "loss": 1.8512, + "loss_base2": 2.6707, + "loss_pixel": 0.1919, + "loss_text": 1.6594, + "ppl": 6.3675, + "step": 2221 + }, + { + "epoch": 0.01, + "global_step": 2222, + "learning_rate": 0.0004915609348914859, + "loss": 1.8481, + "loss_base2": 2.6662, + "loss_pixel": 0.1913, + "loss_text": 1.6568, + "ppl": 6.3477, + "step": 2222 + }, + { + "epoch": 0.01, + "global_step": 2223, + "learning_rate": 0.0004915567612687813, + "loss": 1.8569, + "loss_base2": 2.6789, + "loss_pixel": 0.1914, + "loss_text": 1.6655, + "ppl": 6.4039, + "step": 2223 + }, + { + "epoch": 0.01, + "global_step": 2224, + "learning_rate": 0.0004915525876460768, + "loss": 1.8683, + "loss_base2": 2.6954, + "loss_pixel": 0.1911, + "loss_text": 1.6772, + "ppl": 6.4773, + "step": 2224 + }, + { + "epoch": 0.01, + "global_step": 2225, + "learning_rate": 0.0004915484140233723, + "loss": 1.8455, + "loss_base2": 2.6625, + "loss_pixel": 0.1898, + "loss_text": 1.6557, + "ppl": 6.3313, + "step": 2225 + }, + { + "epoch": 0.01, + "global_step": 2226, + "learning_rate": 0.0004915442404006678, + "loss": 1.8092, + "loss_base2": 2.6101, + "loss_pixel": 0.1911, + "loss_text": 1.6181, + "ppl": 6.1056, + "step": 2226 + }, + { + "epoch": 0.01, + "global_step": 2227, + "learning_rate": 0.0004915400667779632, + "loss": 1.6475, + "loss_base2": 2.3768, + "loss_pixel": 0.1913, + "loss_text": 1.4563, + "ppl": 5.194, + "step": 2227 + }, + { + "epoch": 0.01, + "global_step": 2228, + "learning_rate": 0.0004915358931552587, + "loss": 1.6187, + "loss_base2": 2.3353, + "loss_pixel": 0.1924, + "loss_text": 1.4263, + "ppl": 5.0465, + "step": 2228 + }, + { + "epoch": 0.01, + "global_step": 2229, + "learning_rate": 0.0004915317195325542, + "loss": 1.6144, + "loss_base2": 2.3291, + "loss_pixel": 0.1914, + "loss_text": 1.423, + "ppl": 5.0249, + "step": 2229 + }, + { + "epoch": 0.01, + "global_step": 2230, + "learning_rate": 0.0004915275459098497, + "loss": 1.6096, + "loss_base2": 2.3222, + "loss_pixel": 0.191, + "loss_text": 1.4186, + "ppl": 5.0008, + "step": 2230 + }, + { + "epoch": 0.01, + "global_step": 2231, + "learning_rate": 0.0004915233722871452, + "loss": 1.6009, + "loss_base2": 2.3096, + "loss_pixel": 0.1934, + "loss_text": 1.4075, + "ppl": 4.9575, + "step": 2231 + }, + { + "epoch": 0.01, + "global_step": 2232, + "learning_rate": 0.0004915191986644407, + "loss": 1.6103, + "loss_base2": 2.3232, + "loss_pixel": 0.192, + "loss_text": 1.4184, + "ppl": 5.0043, + "step": 2232 + }, + { + "epoch": 0.01, + "global_step": 2233, + "learning_rate": 0.0004915150250417362, + "loss": 1.5966, + "loss_base2": 2.3034, + "loss_pixel": 0.1915, + "loss_text": 1.4051, + "ppl": 4.9362, + "step": 2233 + }, + { + "epoch": 0.01, + "global_step": 2234, + "learning_rate": 0.0004915108514190318, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1945, + "loss_text": 1.4206, + "ppl": 5.0284, + "step": 2234 + }, + { + "epoch": 0.01, + "global_step": 2235, + "learning_rate": 0.0004915066777963273, + "loss": 1.62, + "loss_base2": 2.3372, + "loss_pixel": 0.1928, + "loss_text": 1.4271, + "ppl": 5.0531, + "step": 2235 + }, + { + "epoch": 0.01, + "global_step": 2236, + "learning_rate": 0.0004915025041736227, + "loss": 1.5974, + "loss_base2": 2.3046, + "loss_pixel": 0.1905, + "loss_text": 1.4069, + "ppl": 4.9402, + "step": 2236 + }, + { + "epoch": 0.01, + "global_step": 2237, + "learning_rate": 0.0004914983305509182, + "loss": 1.6146, + "loss_base2": 2.3294, + "loss_pixel": 0.1925, + "loss_text": 1.4222, + "ppl": 5.0259, + "step": 2237 + }, + { + "epoch": 0.01, + "global_step": 2238, + "learning_rate": 0.0004914941569282137, + "loss": 1.6042, + "loss_base2": 2.3144, + "loss_pixel": 0.1926, + "loss_text": 1.4115, + "ppl": 4.9739, + "step": 2238 + }, + { + "epoch": 0.01, + "global_step": 2239, + "learning_rate": 0.0004914899833055092, + "loss": 1.6033, + "loss_base2": 2.3131, + "loss_pixel": 0.1914, + "loss_text": 1.412, + "ppl": 4.9694, + "step": 2239 + }, + { + "epoch": 0.01, + "global_step": 2240, + "learning_rate": 0.0004914858096828047, + "loss": 1.6153, + "loss_base2": 2.3304, + "loss_pixel": 0.1922, + "loss_text": 1.423, + "ppl": 5.0294, + "step": 2240 + }, + { + "epoch": 0.01, + "global_step": 2241, + "learning_rate": 0.0004914816360601002, + "loss": 1.6174, + "loss_base2": 2.3334, + "loss_pixel": 0.1902, + "loss_text": 1.4272, + "ppl": 5.04, + "step": 2241 + }, + { + "epoch": 0.01, + "global_step": 2242, + "learning_rate": 0.0004914774624373957, + "loss": 1.6209, + "loss_base2": 2.3385, + "loss_pixel": 0.1912, + "loss_text": 1.4297, + "ppl": 5.0576, + "step": 2242 + }, + { + "epoch": 0.01, + "global_step": 2243, + "learning_rate": 0.0004914732888146912, + "loss": 1.6041, + "loss_base2": 2.3142, + "loss_pixel": 0.1915, + "loss_text": 1.4126, + "ppl": 4.9734, + "step": 2243 + }, + { + "epoch": 0.01, + "global_step": 2244, + "learning_rate": 0.0004914691151919867, + "loss": 1.6, + "loss_base2": 2.3083, + "loss_pixel": 0.192, + "loss_text": 1.408, + "ppl": 4.953, + "step": 2244 + }, + { + "epoch": 0.01, + "global_step": 2245, + "learning_rate": 0.0004914649415692821, + "loss": 1.5989, + "loss_base2": 2.3067, + "loss_pixel": 0.1905, + "loss_text": 1.4085, + "ppl": 4.9476, + "step": 2245 + }, + { + "epoch": 0.01, + "global_step": 2246, + "learning_rate": 0.0004914607679465776, + "loss": 1.6079, + "loss_base2": 2.3197, + "loss_pixel": 0.192, + "loss_text": 1.416, + "ppl": 4.9923, + "step": 2246 + }, + { + "epoch": 0.01, + "global_step": 2247, + "learning_rate": 0.0004914565943238731, + "loss": 1.5869, + "loss_base2": 2.2894, + "loss_pixel": 0.1905, + "loss_text": 1.3964, + "ppl": 4.8886, + "step": 2247 + }, + { + "epoch": 0.01, + "global_step": 2248, + "learning_rate": 0.0004914524207011686, + "loss": 1.5955, + "loss_base2": 2.3018, + "loss_pixel": 0.1904, + "loss_text": 1.405, + "ppl": 4.9308, + "step": 2248 + }, + { + "epoch": 0.01, + "global_step": 2249, + "learning_rate": 0.0004914482470784641, + "loss": 1.5961, + "loss_base2": 2.3027, + "loss_pixel": 0.1909, + "loss_text": 1.4052, + "ppl": 4.9338, + "step": 2249 + }, + { + "epoch": 0.01, + "global_step": 2250, + "learning_rate": 0.0004914440734557595, + "loss": 1.599, + "loss_base2": 2.3069, + "loss_pixel": 0.191, + "loss_text": 1.408, + "ppl": 4.9481, + "step": 2250 + }, + { + "epoch": 0.01, + "global_step": 2251, + "learning_rate": 0.0004914398998330551, + "loss": 1.8971, + "loss_base2": 2.7369, + "loss_pixel": 0.191, + "loss_text": 1.7061, + "ppl": 6.6665, + "step": 2251 + }, + { + "epoch": 0.01, + "global_step": 2252, + "learning_rate": 0.0004914357262103506, + "loss": 1.8775, + "loss_base2": 2.7087, + "loss_pixel": 0.1907, + "loss_text": 1.6868, + "ppl": 6.5371, + "step": 2252 + }, + { + "epoch": 0.01, + "global_step": 2253, + "learning_rate": 0.0004914315525876461, + "loss": 1.8842, + "loss_base2": 2.7183, + "loss_pixel": 0.1906, + "loss_text": 1.6935, + "ppl": 6.5811, + "step": 2253 + }, + { + "epoch": 0.01, + "global_step": 2254, + "learning_rate": 0.0004914273789649416, + "loss": 1.8615, + "loss_base2": 2.6856, + "loss_pixel": 0.1907, + "loss_text": 1.6708, + "ppl": 6.4334, + "step": 2254 + }, + { + "epoch": 0.01, + "global_step": 2255, + "learning_rate": 0.0004914232053422371, + "loss": 1.8674, + "loss_base2": 2.6941, + "loss_pixel": 0.1891, + "loss_text": 1.6783, + "ppl": 6.4714, + "step": 2255 + }, + { + "epoch": 0.01, + "global_step": 2256, + "learning_rate": 0.0004914190317195326, + "loss": 1.8627, + "loss_base2": 2.6873, + "loss_pixel": 0.1903, + "loss_text": 1.6724, + "ppl": 6.4411, + "step": 2256 + }, + { + "epoch": 0.01, + "global_step": 2257, + "learning_rate": 0.0004914148580968281, + "loss": 1.8647, + "loss_base2": 2.6902, + "loss_pixel": 0.1903, + "loss_text": 1.6744, + "ppl": 6.454, + "step": 2257 + }, + { + "epoch": 0.01, + "global_step": 2258, + "learning_rate": 0.0004914106844741236, + "loss": 1.8618, + "loss_base2": 2.686, + "loss_pixel": 0.1905, + "loss_text": 1.6713, + "ppl": 6.4353, + "step": 2258 + }, + { + "epoch": 0.01, + "global_step": 2259, + "learning_rate": 0.000491406510851419, + "loss": 1.8598, + "loss_base2": 2.6831, + "loss_pixel": 0.19, + "loss_text": 1.6699, + "ppl": 6.4225, + "step": 2259 + }, + { + "epoch": 0.01, + "global_step": 2260, + "learning_rate": 0.0004914023372287145, + "loss": 1.85, + "loss_base2": 2.669, + "loss_pixel": 0.1907, + "loss_text": 1.6593, + "ppl": 6.3598, + "step": 2260 + }, + { + "epoch": 0.01, + "global_step": 2261, + "learning_rate": 0.00049139816360601, + "loss": 1.8429, + "loss_base2": 2.6587, + "loss_pixel": 0.1897, + "loss_text": 1.6532, + "ppl": 6.3148, + "step": 2261 + }, + { + "epoch": 0.01, + "global_step": 2262, + "learning_rate": 0.0004913939899833055, + "loss": 1.8615, + "loss_base2": 2.6856, + "loss_pixel": 0.1919, + "loss_text": 1.6696, + "ppl": 6.4334, + "step": 2262 + }, + { + "epoch": 0.01, + "global_step": 2263, + "learning_rate": 0.000491389816360601, + "loss": 1.8542, + "loss_base2": 2.675, + "loss_pixel": 0.1907, + "loss_text": 1.6635, + "ppl": 6.3866, + "step": 2263 + }, + { + "epoch": 0.01, + "global_step": 2264, + "learning_rate": 0.0004913856427378965, + "loss": 1.8495, + "loss_base2": 2.6683, + "loss_pixel": 0.1922, + "loss_text": 1.6573, + "ppl": 6.3566, + "step": 2264 + }, + { + "epoch": 0.01, + "global_step": 2265, + "learning_rate": 0.0004913814691151919, + "loss": 1.8572, + "loss_base2": 2.6794, + "loss_pixel": 0.1912, + "loss_text": 1.666, + "ppl": 6.4058, + "step": 2265 + }, + { + "epoch": 0.01, + "global_step": 2266, + "learning_rate": 0.0004913772954924874, + "loss": 1.866, + "loss_base2": 2.6921, + "loss_pixel": 0.1896, + "loss_text": 1.6764, + "ppl": 6.4624, + "step": 2266 + }, + { + "epoch": 0.01, + "global_step": 2267, + "learning_rate": 0.000491373121869783, + "loss": 1.8506, + "loss_base2": 2.6699, + "loss_pixel": 0.1908, + "loss_text": 1.6597, + "ppl": 6.3636, + "step": 2267 + }, + { + "epoch": 0.01, + "global_step": 2268, + "learning_rate": 0.0004913689482470785, + "loss": 1.8469, + "loss_base2": 2.6645, + "loss_pixel": 0.1897, + "loss_text": 1.6571, + "ppl": 6.3401, + "step": 2268 + }, + { + "epoch": 0.01, + "global_step": 2269, + "learning_rate": 0.000491364774624374, + "loss": 1.8501, + "loss_base2": 2.6691, + "loss_pixel": 0.189, + "loss_text": 1.6611, + "ppl": 6.3605, + "step": 2269 + }, + { + "epoch": 0.01, + "global_step": 2270, + "learning_rate": 0.0004913606010016695, + "loss": 1.8479, + "loss_base2": 2.666, + "loss_pixel": 0.1893, + "loss_text": 1.6586, + "ppl": 6.3465, + "step": 2270 + }, + { + "epoch": 0.01, + "global_step": 2271, + "learning_rate": 0.000491356427378965, + "loss": 1.8475, + "loss_base2": 2.6654, + "loss_pixel": 0.1886, + "loss_text": 1.659, + "ppl": 6.3439, + "step": 2271 + }, + { + "epoch": 0.01, + "global_step": 2272, + "learning_rate": 0.0004913522537562605, + "loss": 1.8255, + "loss_base2": 2.6336, + "loss_pixel": 0.1893, + "loss_text": 1.6362, + "ppl": 6.2059, + "step": 2272 + }, + { + "epoch": 0.01, + "global_step": 2273, + "learning_rate": 0.0004913480801335559, + "loss": 1.8536, + "loss_base2": 2.6742, + "loss_pixel": 0.1893, + "loss_text": 1.6643, + "ppl": 6.3828, + "step": 2273 + }, + { + "epoch": 0.01, + "global_step": 2274, + "learning_rate": 0.0004913439065108514, + "loss": 1.8421, + "loss_base2": 2.6576, + "loss_pixel": 0.1897, + "loss_text": 1.6524, + "ppl": 6.3098, + "step": 2274 + }, + { + "epoch": 0.01, + "global_step": 2275, + "learning_rate": 0.0004913397328881469, + "loss": 1.8622, + "loss_base2": 2.6866, + "loss_pixel": 0.1904, + "loss_text": 1.6718, + "ppl": 6.4379, + "step": 2275 + }, + { + "epoch": 0.01, + "global_step": 2276, + "learning_rate": 0.0004913355592654424, + "loss": 1.8551, + "loss_base2": 2.6763, + "loss_pixel": 0.1908, + "loss_text": 1.6643, + "ppl": 6.3923, + "step": 2276 + }, + { + "epoch": 0.01, + "global_step": 2277, + "learning_rate": 0.0004913313856427379, + "loss": 1.8514, + "loss_base2": 2.671, + "loss_pixel": 0.1889, + "loss_text": 1.6625, + "ppl": 6.3687, + "step": 2277 + }, + { + "epoch": 0.01, + "global_step": 2278, + "learning_rate": 0.0004913272120200334, + "loss": 1.8633, + "loss_base2": 2.6882, + "loss_pixel": 0.1899, + "loss_text": 1.6734, + "ppl": 6.445, + "step": 2278 + }, + { + "epoch": 0.01, + "global_step": 2279, + "learning_rate": 0.0004913230383973289, + "loss": 1.8591, + "loss_base2": 2.6821, + "loss_pixel": 0.189, + "loss_text": 1.6701, + "ppl": 6.418, + "step": 2279 + }, + { + "epoch": 0.01, + "global_step": 2280, + "learning_rate": 0.0004913188647746244, + "loss": 1.842, + "loss_base2": 2.6574, + "loss_pixel": 0.1897, + "loss_text": 1.6523, + "ppl": 6.3091, + "step": 2280 + }, + { + "epoch": 0.01, + "global_step": 2281, + "learning_rate": 0.00049131469115192, + "loss": 1.8411, + "loss_base2": 2.6561, + "loss_pixel": 0.1896, + "loss_text": 1.6514, + "ppl": 6.3035, + "step": 2281 + }, + { + "epoch": 0.01, + "global_step": 2282, + "learning_rate": 0.0004913105175292153, + "loss": 1.8419, + "loss_base2": 2.6573, + "loss_pixel": 0.1885, + "loss_text": 1.6534, + "ppl": 6.3085, + "step": 2282 + }, + { + "epoch": 0.01, + "global_step": 2283, + "learning_rate": 0.0004913063439065109, + "loss": 1.8491, + "loss_base2": 2.6677, + "loss_pixel": 0.1894, + "loss_text": 1.6597, + "ppl": 6.3541, + "step": 2283 + }, + { + "epoch": 0.01, + "global_step": 2284, + "learning_rate": 0.0004913021702838064, + "loss": 1.836, + "loss_base2": 2.6488, + "loss_pixel": 0.1894, + "loss_text": 1.6466, + "ppl": 6.2714, + "step": 2284 + }, + { + "epoch": 0.01, + "global_step": 2285, + "learning_rate": 0.0004912979966611019, + "loss": 1.8308, + "loss_base2": 2.6413, + "loss_pixel": 0.1896, + "loss_text": 1.6412, + "ppl": 6.2389, + "step": 2285 + }, + { + "epoch": 0.01, + "global_step": 2286, + "learning_rate": 0.0004912938230383973, + "loss": 1.841, + "loss_base2": 2.656, + "loss_pixel": 0.1902, + "loss_text": 1.6509, + "ppl": 6.3028, + "step": 2286 + }, + { + "epoch": 0.01, + "global_step": 2287, + "learning_rate": 0.0004912896494156928, + "loss": 1.8315, + "loss_base2": 2.6423, + "loss_pixel": 0.1889, + "loss_text": 1.6426, + "ppl": 6.2432, + "step": 2287 + }, + { + "epoch": 0.01, + "global_step": 2288, + "learning_rate": 0.0004912854757929883, + "loss": 1.852, + "loss_base2": 2.6719, + "loss_pixel": 0.1898, + "loss_text": 1.6622, + "ppl": 6.3726, + "step": 2288 + }, + { + "epoch": 0.01, + "global_step": 2289, + "learning_rate": 0.0004912813021702838, + "loss": 1.8278, + "loss_base2": 2.637, + "loss_pixel": 0.1886, + "loss_text": 1.6392, + "ppl": 6.2202, + "step": 2289 + }, + { + "epoch": 0.01, + "global_step": 2290, + "learning_rate": 0.0004912771285475793, + "loss": 1.8436, + "loss_base2": 2.6598, + "loss_pixel": 0.1895, + "loss_text": 1.6541, + "ppl": 6.3192, + "step": 2290 + }, + { + "epoch": 0.01, + "global_step": 2291, + "learning_rate": 0.0004912729549248748, + "loss": 1.8314, + "loss_base2": 2.6422, + "loss_pixel": 0.1894, + "loss_text": 1.6419, + "ppl": 6.2426, + "step": 2291 + }, + { + "epoch": 0.01, + "global_step": 2292, + "learning_rate": 0.0004912687813021703, + "loss": 1.8421, + "loss_base2": 2.6576, + "loss_pixel": 0.1878, + "loss_text": 1.6542, + "ppl": 6.3098, + "step": 2292 + }, + { + "epoch": 0.01, + "global_step": 2293, + "learning_rate": 0.0004912646076794658, + "loss": 1.8435, + "loss_base2": 2.6596, + "loss_pixel": 0.1887, + "loss_text": 1.6548, + "ppl": 6.3186, + "step": 2293 + }, + { + "epoch": 0.01, + "global_step": 2294, + "learning_rate": 0.0004912604340567613, + "loss": 1.8376, + "loss_base2": 2.6511, + "loss_pixel": 0.1879, + "loss_text": 1.6498, + "ppl": 6.2814, + "step": 2294 + }, + { + "epoch": 0.01, + "global_step": 2295, + "learning_rate": 0.0004912562604340567, + "loss": 1.8313, + "loss_base2": 2.642, + "loss_pixel": 0.189, + "loss_text": 1.6423, + "ppl": 6.242, + "step": 2295 + }, + { + "epoch": 0.01, + "global_step": 2296, + "learning_rate": 0.0004912520868113522, + "loss": 1.8358, + "loss_base2": 2.6485, + "loss_pixel": 0.1903, + "loss_text": 1.6456, + "ppl": 6.2701, + "step": 2296 + }, + { + "epoch": 0.01, + "global_step": 2297, + "learning_rate": 0.0004912479131886477, + "loss": 1.8424, + "loss_base2": 2.658, + "loss_pixel": 0.1882, + "loss_text": 1.6542, + "ppl": 6.3117, + "step": 2297 + }, + { + "epoch": 0.01, + "global_step": 2298, + "learning_rate": 0.0004912437395659432, + "loss": 1.8371, + "loss_base2": 2.6504, + "loss_pixel": 0.1913, + "loss_text": 1.6458, + "ppl": 6.2783, + "step": 2298 + }, + { + "epoch": 0.01, + "global_step": 2299, + "learning_rate": 0.0004912395659432388, + "loss": 1.8343, + "loss_base2": 2.6463, + "loss_pixel": 0.1888, + "loss_text": 1.6455, + "ppl": 6.2608, + "step": 2299 + }, + { + "epoch": 0.01, + "global_step": 2300, + "learning_rate": 0.0004912353923205343, + "loss": 1.8329, + "loss_base2": 2.6443, + "loss_pixel": 0.1906, + "loss_text": 1.6422, + "ppl": 6.252, + "step": 2300 + }, + { + "epoch": 0.01, + "global_step": 2301, + "learning_rate": 0.0004912312186978298, + "loss": 1.8266, + "loss_base2": 2.6352, + "loss_pixel": 0.1885, + "loss_text": 1.6381, + "ppl": 6.2127, + "step": 2301 + }, + { + "epoch": 0.01, + "global_step": 2302, + "learning_rate": 0.0004912270450751252, + "loss": 1.841, + "loss_base2": 2.656, + "loss_pixel": 0.1897, + "loss_text": 1.6514, + "ppl": 6.3028, + "step": 2302 + }, + { + "epoch": 0.01, + "global_step": 2303, + "learning_rate": 0.0004912228714524207, + "loss": 1.8221, + "loss_base2": 2.6287, + "loss_pixel": 0.1884, + "loss_text": 1.6337, + "ppl": 6.1848, + "step": 2303 + }, + { + "epoch": 0.01, + "global_step": 2304, + "learning_rate": 0.0004912186978297162, + "loss": 1.854, + "loss_base2": 2.6748, + "loss_pixel": 0.1905, + "loss_text": 1.6635, + "ppl": 6.3853, + "step": 2304 + }, + { + "epoch": 0.01, + "global_step": 2305, + "learning_rate": 0.0004912145242070117, + "loss": 1.8326, + "loss_base2": 2.6439, + "loss_pixel": 0.1898, + "loss_text": 1.6428, + "ppl": 6.2501, + "step": 2305 + }, + { + "epoch": 0.01, + "global_step": 2306, + "learning_rate": 0.0004912103505843072, + "loss": 1.8406, + "loss_base2": 2.6554, + "loss_pixel": 0.1887, + "loss_text": 1.6519, + "ppl": 6.3003, + "step": 2306 + }, + { + "epoch": 0.01, + "global_step": 2307, + "learning_rate": 0.0004912061769616027, + "loss": 1.8291, + "loss_base2": 2.6388, + "loss_pixel": 0.1896, + "loss_text": 1.6395, + "ppl": 6.2283, + "step": 2307 + }, + { + "epoch": 0.01, + "global_step": 2308, + "learning_rate": 0.0004912020033388982, + "loss": 1.8316, + "loss_base2": 2.6424, + "loss_pixel": 0.1892, + "loss_text": 1.6424, + "ppl": 6.2439, + "step": 2308 + }, + { + "epoch": 0.01, + "global_step": 2309, + "learning_rate": 0.0004911978297161936, + "loss": 1.8313, + "loss_base2": 2.642, + "loss_pixel": 0.1884, + "loss_text": 1.6429, + "ppl": 6.242, + "step": 2309 + }, + { + "epoch": 0.01, + "global_step": 2310, + "learning_rate": 0.0004911936560934891, + "loss": 1.8307, + "loss_base2": 2.6411, + "loss_pixel": 0.1882, + "loss_text": 1.6425, + "ppl": 6.2383, + "step": 2310 + }, + { + "epoch": 0.01, + "global_step": 2311, + "learning_rate": 0.0004911894824707846, + "loss": 1.8618, + "loss_base2": 2.686, + "loss_pixel": 0.1914, + "loss_text": 1.6704, + "ppl": 6.4353, + "step": 2311 + }, + { + "epoch": 0.01, + "global_step": 2312, + "learning_rate": 0.0004911853088480801, + "loss": 1.8336, + "loss_base2": 2.6453, + "loss_pixel": 0.1896, + "loss_text": 1.6441, + "ppl": 6.2564, + "step": 2312 + }, + { + "epoch": 0.01, + "global_step": 2313, + "learning_rate": 0.0004911811352253756, + "loss": 1.8317, + "loss_base2": 2.6426, + "loss_pixel": 0.1935, + "loss_text": 1.6382, + "ppl": 6.2445, + "step": 2313 + }, + { + "epoch": 0.01, + "global_step": 2314, + "learning_rate": 0.0004911769616026711, + "loss": 1.8259, + "loss_base2": 2.6342, + "loss_pixel": 0.1903, + "loss_text": 1.6356, + "ppl": 6.2084, + "step": 2314 + }, + { + "epoch": 0.01, + "global_step": 2315, + "learning_rate": 0.0004911727879799667, + "loss": 1.8375, + "loss_base2": 2.651, + "loss_pixel": 0.1886, + "loss_text": 1.6489, + "ppl": 6.2808, + "step": 2315 + }, + { + "epoch": 0.01, + "global_step": 2316, + "learning_rate": 0.0004911686143572622, + "loss": 1.8376, + "loss_base2": 2.6511, + "loss_pixel": 0.191, + "loss_text": 1.6467, + "ppl": 6.2814, + "step": 2316 + }, + { + "epoch": 0.01, + "global_step": 2317, + "learning_rate": 0.0004911644407345577, + "loss": 1.8412, + "loss_base2": 2.6563, + "loss_pixel": 0.19, + "loss_text": 1.6513, + "ppl": 6.3041, + "step": 2317 + }, + { + "epoch": 0.01, + "global_step": 2318, + "learning_rate": 0.0004911602671118531, + "loss": 1.8398, + "loss_base2": 2.6543, + "loss_pixel": 0.1882, + "loss_text": 1.6517, + "ppl": 6.2953, + "step": 2318 + }, + { + "epoch": 0.01, + "global_step": 2319, + "learning_rate": 0.0004911560934891486, + "loss": 1.8372, + "loss_base2": 2.6505, + "loss_pixel": 0.1884, + "loss_text": 1.6488, + "ppl": 6.2789, + "step": 2319 + }, + { + "epoch": 0.01, + "global_step": 2320, + "learning_rate": 0.0004911519198664441, + "loss": 1.841, + "loss_base2": 2.656, + "loss_pixel": 0.1859, + "loss_text": 1.6552, + "ppl": 6.3028, + "step": 2320 + }, + { + "epoch": 0.01, + "global_step": 2321, + "learning_rate": 0.0004911477462437396, + "loss": 1.8359, + "loss_base2": 2.6486, + "loss_pixel": 0.1934, + "loss_text": 1.6425, + "ppl": 6.2708, + "step": 2321 + }, + { + "epoch": 0.01, + "global_step": 2322, + "learning_rate": 0.0004911435726210351, + "loss": 1.819, + "loss_base2": 2.6243, + "loss_pixel": 0.1883, + "loss_text": 1.6307, + "ppl": 6.1657, + "step": 2322 + }, + { + "epoch": 0.01, + "global_step": 2323, + "learning_rate": 0.0004911393989983305, + "loss": 1.8289, + "loss_base2": 2.6385, + "loss_pixel": 0.1882, + "loss_text": 1.6407, + "ppl": 6.227, + "step": 2323 + }, + { + "epoch": 0.01, + "global_step": 2324, + "learning_rate": 0.000491135225375626, + "loss": 1.8414, + "loss_base2": 2.6566, + "loss_pixel": 0.1896, + "loss_text": 1.6518, + "ppl": 6.3054, + "step": 2324 + }, + { + "epoch": 0.01, + "global_step": 2325, + "learning_rate": 0.0004911310517529215, + "loss": 1.8348, + "loss_base2": 2.6471, + "loss_pixel": 0.1869, + "loss_text": 1.648, + "ppl": 6.2639, + "step": 2325 + }, + { + "epoch": 0.01, + "global_step": 2326, + "learning_rate": 0.000491126878130217, + "loss": 1.8292, + "loss_base2": 2.639, + "loss_pixel": 0.1873, + "loss_text": 1.6419, + "ppl": 6.2289, + "step": 2326 + }, + { + "epoch": 0.01, + "global_step": 2327, + "learning_rate": 0.0004911227045075125, + "loss": 1.8246, + "loss_base2": 2.6323, + "loss_pixel": 0.1858, + "loss_text": 1.6388, + "ppl": 6.2003, + "step": 2327 + }, + { + "epoch": 0.01, + "global_step": 2328, + "learning_rate": 0.000491118530884808, + "loss": 1.814, + "loss_base2": 2.617, + "loss_pixel": 0.1858, + "loss_text": 1.6282, + "ppl": 6.1349, + "step": 2328 + }, + { + "epoch": 0.01, + "global_step": 2329, + "learning_rate": 0.0004911143572621035, + "loss": 1.8365, + "loss_base2": 2.6495, + "loss_pixel": 0.1858, + "loss_text": 1.6507, + "ppl": 6.2745, + "step": 2329 + }, + { + "epoch": 0.01, + "global_step": 2330, + "learning_rate": 0.000491110183639399, + "loss": 1.8152, + "loss_base2": 2.6188, + "loss_pixel": 0.1867, + "loss_text": 1.6285, + "ppl": 6.1423, + "step": 2330 + }, + { + "epoch": 0.01, + "global_step": 2331, + "learning_rate": 0.0004911060100166946, + "loss": 1.8037, + "loss_base2": 2.6022, + "loss_pixel": 0.185, + "loss_text": 1.6187, + "ppl": 6.0721, + "step": 2331 + }, + { + "epoch": 0.01, + "global_step": 2332, + "learning_rate": 0.00049110183639399, + "loss": 1.8187, + "loss_base2": 2.6238, + "loss_pixel": 0.1872, + "loss_text": 1.6315, + "ppl": 6.1638, + "step": 2332 + }, + { + "epoch": 0.01, + "global_step": 2333, + "learning_rate": 0.0004910976627712855, + "loss": 1.828, + "loss_base2": 2.6372, + "loss_pixel": 0.1841, + "loss_text": 1.6439, + "ppl": 6.2214, + "step": 2333 + }, + { + "epoch": 0.01, + "global_step": 2334, + "learning_rate": 0.000491093489148581, + "loss": 1.8269, + "loss_base2": 2.6357, + "loss_pixel": 0.1856, + "loss_text": 1.6413, + "ppl": 6.2146, + "step": 2334 + }, + { + "epoch": 0.01, + "global_step": 2335, + "learning_rate": 0.0004910893155258765, + "loss": 1.8402, + "loss_base2": 2.6548, + "loss_pixel": 0.1832, + "loss_text": 1.6569, + "ppl": 6.2978, + "step": 2335 + }, + { + "epoch": 0.01, + "global_step": 2336, + "learning_rate": 0.000491085141903172, + "loss": 1.8233, + "loss_base2": 2.6305, + "loss_pixel": 0.1841, + "loss_text": 1.6392, + "ppl": 6.1923, + "step": 2336 + }, + { + "epoch": 0.01, + "global_step": 2337, + "learning_rate": 0.0004910809682804675, + "loss": 1.819, + "loss_base2": 2.6243, + "loss_pixel": 0.1853, + "loss_text": 1.6336, + "ppl": 6.1657, + "step": 2337 + }, + { + "epoch": 0.01, + "global_step": 2338, + "learning_rate": 0.000491076794657763, + "loss": 1.8392, + "loss_base2": 2.6534, + "loss_pixel": 0.1866, + "loss_text": 1.6526, + "ppl": 6.2915, + "step": 2338 + }, + { + "epoch": 0.01, + "global_step": 2339, + "learning_rate": 0.0004910726210350585, + "loss": 1.8212, + "loss_base2": 2.6274, + "loss_pixel": 0.1866, + "loss_text": 1.6345, + "ppl": 6.1793, + "step": 2339 + }, + { + "epoch": 0.01, + "global_step": 2340, + "learning_rate": 0.0004910684474123539, + "loss": 1.6984, + "loss_base2": 2.4503, + "loss_pixel": 0.1852, + "loss_text": 1.5132, + "ppl": 5.4652, + "step": 2340 + }, + { + "epoch": 0.01, + "global_step": 2341, + "learning_rate": 0.0004910642737896494, + "loss": 1.6174, + "loss_base2": 2.3334, + "loss_pixel": 0.184, + "loss_text": 1.4334, + "ppl": 5.04, + "step": 2341 + }, + { + "epoch": 0.01, + "global_step": 2342, + "learning_rate": 0.0004910601001669449, + "loss": 1.6069, + "loss_base2": 2.3183, + "loss_pixel": 0.1833, + "loss_text": 1.4237, + "ppl": 4.9873, + "step": 2342 + }, + { + "epoch": 0.01, + "global_step": 2343, + "learning_rate": 0.0004910559265442404, + "loss": 1.6017, + "loss_base2": 2.3108, + "loss_pixel": 0.184, + "loss_text": 1.4177, + "ppl": 4.9615, + "step": 2343 + }, + { + "epoch": 0.01, + "global_step": 2344, + "learning_rate": 0.0004910517529215359, + "loss": 1.6046, + "loss_base2": 2.3149, + "loss_pixel": 0.1833, + "loss_text": 1.4213, + "ppl": 4.9759, + "step": 2344 + }, + { + "epoch": 0.01, + "global_step": 2345, + "learning_rate": 0.0004910475792988313, + "loss": 1.6165, + "loss_base2": 2.3321, + "loss_pixel": 0.1845, + "loss_text": 1.432, + "ppl": 5.0354, + "step": 2345 + }, + { + "epoch": 0.01, + "global_step": 2346, + "learning_rate": 0.0004910434056761268, + "loss": 1.6049, + "loss_base2": 2.3154, + "loss_pixel": 0.2043, + "loss_text": 1.4007, + "ppl": 4.9774, + "step": 2346 + }, + { + "epoch": 0.01, + "global_step": 2347, + "learning_rate": 0.0004910392320534223, + "loss": 1.6056, + "loss_base2": 2.3164, + "loss_pixel": 0.2026, + "loss_text": 1.403, + "ppl": 4.9808, + "step": 2347 + }, + { + "epoch": 0.01, + "global_step": 2348, + "learning_rate": 0.0004910350584307179, + "loss": 1.6112, + "loss_base2": 2.3245, + "loss_pixel": 0.2014, + "loss_text": 1.4098, + "ppl": 5.0088, + "step": 2348 + }, + { + "epoch": 0.01, + "global_step": 2349, + "learning_rate": 0.0004910308848080134, + "loss": 1.5943, + "loss_base2": 2.3001, + "loss_pixel": 0.2009, + "loss_text": 1.3935, + "ppl": 4.9249, + "step": 2349 + }, + { + "epoch": 0.01, + "global_step": 2350, + "learning_rate": 0.0004910267111853089, + "loss": 1.5941, + "loss_base2": 2.2998, + "loss_pixel": 0.2005, + "loss_text": 1.3936, + "ppl": 4.9239, + "step": 2350 + }, + { + "epoch": 0.01, + "global_step": 2351, + "learning_rate": 0.0004910225375626044, + "loss": 1.5898, + "loss_base2": 2.2936, + "loss_pixel": 0.1947, + "loss_text": 1.3951, + "ppl": 4.9028, + "step": 2351 + }, + { + "epoch": 0.01, + "global_step": 2352, + "learning_rate": 0.0004910183639398999, + "loss": 1.6167, + "loss_base2": 2.3324, + "loss_pixel": 0.195, + "loss_text": 1.4217, + "ppl": 5.0364, + "step": 2352 + }, + { + "epoch": 0.01, + "global_step": 2353, + "learning_rate": 0.0004910141903171954, + "loss": 1.5985, + "loss_base2": 2.3061, + "loss_pixel": 0.1928, + "loss_text": 1.4058, + "ppl": 4.9456, + "step": 2353 + }, + { + "epoch": 0.01, + "global_step": 2354, + "learning_rate": 0.0004910100166944908, + "loss": 1.6074, + "loss_base2": 2.319, + "loss_pixel": 0.1963, + "loss_text": 1.4111, + "ppl": 4.9898, + "step": 2354 + }, + { + "epoch": 0.01, + "global_step": 2355, + "learning_rate": 0.0004910058430717863, + "loss": 1.5931, + "loss_base2": 2.2984, + "loss_pixel": 0.1932, + "loss_text": 1.3999, + "ppl": 4.919, + "step": 2355 + }, + { + "epoch": 0.01, + "global_step": 2356, + "learning_rate": 0.0004910016694490818, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1918, + "loss_text": 1.4319, + "ppl": 5.0718, + "step": 2356 + }, + { + "epoch": 0.01, + "global_step": 2357, + "learning_rate": 0.0004909974958263773, + "loss": 1.5848, + "loss_base2": 2.2864, + "loss_pixel": 0.1925, + "loss_text": 1.3923, + "ppl": 4.8783, + "step": 2357 + }, + { + "epoch": 0.01, + "global_step": 2358, + "learning_rate": 0.0004909933222036728, + "loss": 1.5811, + "loss_base2": 2.281, + "loss_pixel": 0.1909, + "loss_text": 1.3902, + "ppl": 4.8603, + "step": 2358 + }, + { + "epoch": 0.01, + "global_step": 2359, + "learning_rate": 0.0004909891485809682, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1921, + "loss_text": 1.4339, + "ppl": 5.0835, + "step": 2359 + }, + { + "epoch": 0.01, + "global_step": 2360, + "learning_rate": 0.0004909849749582637, + "loss": 1.5888, + "loss_base2": 2.2922, + "loss_pixel": 0.1923, + "loss_text": 1.3965, + "ppl": 4.8979, + "step": 2360 + }, + { + "epoch": 0.01, + "global_step": 2361, + "learning_rate": 0.0004909808013355592, + "loss": 1.5861, + "loss_base2": 2.2883, + "loss_pixel": 0.1903, + "loss_text": 1.3958, + "ppl": 4.8847, + "step": 2361 + }, + { + "epoch": 0.01, + "global_step": 2362, + "learning_rate": 0.0004909766277128547, + "loss": 1.5985, + "loss_base2": 2.3061, + "loss_pixel": 0.1919, + "loss_text": 1.4066, + "ppl": 4.9456, + "step": 2362 + }, + { + "epoch": 0.01, + "global_step": 2363, + "learning_rate": 0.0004909724540901502, + "loss": 1.5846, + "loss_base2": 2.2861, + "loss_pixel": 0.1905, + "loss_text": 1.3941, + "ppl": 4.8773, + "step": 2363 + }, + { + "epoch": 0.01, + "global_step": 2364, + "learning_rate": 0.0004909682804674458, + "loss": 1.5954, + "loss_base2": 2.3017, + "loss_pixel": 0.1898, + "loss_text": 1.4055, + "ppl": 4.9303, + "step": 2364 + }, + { + "epoch": 0.01, + "global_step": 2365, + "learning_rate": 0.0004909641068447413, + "loss": 1.782, + "loss_base2": 2.5709, + "loss_pixel": 0.1899, + "loss_text": 1.5921, + "ppl": 5.9417, + "step": 2365 + }, + { + "epoch": 0.01, + "global_step": 2366, + "learning_rate": 0.0004909599332220368, + "loss": 1.5977, + "loss_base2": 2.305, + "loss_pixel": 0.1899, + "loss_text": 1.4078, + "ppl": 4.9417, + "step": 2366 + }, + { + "epoch": 0.01, + "global_step": 2367, + "learning_rate": 0.0004909557595993323, + "loss": 1.596, + "loss_base2": 2.3025, + "loss_pixel": 0.1899, + "loss_text": 1.4061, + "ppl": 4.9333, + "step": 2367 + }, + { + "epoch": 0.01, + "global_step": 2368, + "learning_rate": 0.0004909515859766277, + "loss": 1.5783, + "loss_base2": 2.277, + "loss_pixel": 0.1884, + "loss_text": 1.3899, + "ppl": 4.8467, + "step": 2368 + }, + { + "epoch": 0.01, + "global_step": 2369, + "learning_rate": 0.0004909474123539232, + "loss": 1.5748, + "loss_base2": 2.272, + "loss_pixel": 0.1904, + "loss_text": 1.3844, + "ppl": 4.8298, + "step": 2369 + }, + { + "epoch": 0.01, + "global_step": 2370, + "learning_rate": 0.0004909432387312187, + "loss": 1.6061, + "loss_base2": 2.3171, + "loss_pixel": 0.1897, + "loss_text": 1.4164, + "ppl": 4.9833, + "step": 2370 + }, + { + "epoch": 0.01, + "global_step": 2371, + "learning_rate": 0.0004909390651085142, + "loss": 1.5873, + "loss_base2": 2.29, + "loss_pixel": 0.1888, + "loss_text": 1.3985, + "ppl": 4.8905, + "step": 2371 + }, + { + "epoch": 0.01, + "global_step": 2372, + "learning_rate": 0.0004909348914858097, + "loss": 1.5932, + "loss_base2": 2.2985, + "loss_pixel": 0.1892, + "loss_text": 1.404, + "ppl": 4.9195, + "step": 2372 + }, + { + "epoch": 0.01, + "global_step": 2373, + "learning_rate": 0.0004909307178631052, + "loss": 1.597, + "loss_base2": 2.304, + "loss_pixel": 0.1893, + "loss_text": 1.4077, + "ppl": 4.9382, + "step": 2373 + }, + { + "epoch": 0.01, + "global_step": 2374, + "learning_rate": 0.0004909265442404007, + "loss": 1.7299, + "loss_base2": 2.4957, + "loss_pixel": 0.1889, + "loss_text": 1.541, + "ppl": 5.6401, + "step": 2374 + }, + { + "epoch": 0.01, + "global_step": 2375, + "learning_rate": 0.0004909223706176962, + "loss": 1.7106, + "loss_base2": 2.4679, + "loss_pixel": 0.1893, + "loss_text": 1.5213, + "ppl": 5.5323, + "step": 2375 + }, + { + "epoch": 0.01, + "global_step": 2376, + "learning_rate": 0.0004909181969949917, + "loss": 1.5876, + "loss_base2": 2.2904, + "loss_pixel": 0.1889, + "loss_text": 1.3988, + "ppl": 4.892, + "step": 2376 + }, + { + "epoch": 0.01, + "global_step": 2377, + "learning_rate": 0.0004909140233722871, + "loss": 1.5788, + "loss_base2": 2.2777, + "loss_pixel": 0.1885, + "loss_text": 1.3903, + "ppl": 4.8491, + "step": 2377 + }, + { + "epoch": 0.01, + "global_step": 2378, + "learning_rate": 0.0004909098497495826, + "loss": 1.5991, + "loss_base2": 2.307, + "loss_pixel": 0.1897, + "loss_text": 1.4093, + "ppl": 4.9486, + "step": 2378 + }, + { + "epoch": 0.01, + "global_step": 2379, + "learning_rate": 0.0004909056761268781, + "loss": 1.6066, + "loss_base2": 2.3178, + "loss_pixel": 0.1894, + "loss_text": 1.4173, + "ppl": 4.9858, + "step": 2379 + }, + { + "epoch": 0.01, + "global_step": 2380, + "learning_rate": 0.0004909015025041737, + "loss": 1.597, + "loss_base2": 2.304, + "loss_pixel": 0.1887, + "loss_text": 1.4083, + "ppl": 4.9382, + "step": 2380 + }, + { + "epoch": 0.01, + "global_step": 2381, + "learning_rate": 0.0004908973288814692, + "loss": 1.5986, + "loss_base2": 2.3063, + "loss_pixel": 0.1897, + "loss_text": 1.4089, + "ppl": 4.9461, + "step": 2381 + }, + { + "epoch": 0.01, + "global_step": 2382, + "learning_rate": 0.0004908931552587646, + "loss": 1.6014, + "loss_base2": 2.3103, + "loss_pixel": 0.1888, + "loss_text": 1.4126, + "ppl": 4.96, + "step": 2382 + }, + { + "epoch": 0.01, + "global_step": 2383, + "learning_rate": 0.0004908889816360601, + "loss": 1.6663, + "loss_base2": 2.404, + "loss_pixel": 0.1888, + "loss_text": 1.4775, + "ppl": 5.2925, + "step": 2383 + }, + { + "epoch": 0.01, + "global_step": 2384, + "learning_rate": 0.0004908848080133556, + "loss": 1.9, + "loss_base2": 2.7411, + "loss_pixel": 0.1881, + "loss_text": 1.7119, + "ppl": 6.6859, + "step": 2384 + }, + { + "epoch": 0.01, + "global_step": 2385, + "learning_rate": 0.0004908806343906511, + "loss": 1.8971, + "loss_base2": 2.7369, + "loss_pixel": 0.1892, + "loss_text": 1.7079, + "ppl": 6.6665, + "step": 2385 + }, + { + "epoch": 0.01, + "global_step": 2386, + "learning_rate": 0.0004908764607679466, + "loss": 1.8948, + "loss_base2": 2.7336, + "loss_pixel": 0.1894, + "loss_text": 1.7055, + "ppl": 6.6512, + "step": 2386 + }, + { + "epoch": 0.01, + "global_step": 2387, + "learning_rate": 0.0004908722871452421, + "loss": 1.8713, + "loss_base2": 2.6997, + "loss_pixel": 0.1881, + "loss_text": 1.6831, + "ppl": 6.4967, + "step": 2387 + }, + { + "epoch": 0.01, + "global_step": 2388, + "learning_rate": 0.0004908681135225376, + "loss": 1.8637, + "loss_base2": 2.6888, + "loss_pixel": 0.1879, + "loss_text": 1.6758, + "ppl": 6.4475, + "step": 2388 + }, + { + "epoch": 0.01, + "global_step": 2389, + "learning_rate": 0.0004908639398998331, + "loss": 1.8781, + "loss_base2": 2.7095, + "loss_pixel": 0.1885, + "loss_text": 1.6896, + "ppl": 6.5411, + "step": 2389 + }, + { + "epoch": 0.01, + "global_step": 2390, + "learning_rate": 0.0004908597662771286, + "loss": 1.8867, + "loss_base2": 2.7219, + "loss_pixel": 0.1882, + "loss_text": 1.6985, + "ppl": 6.5976, + "step": 2390 + }, + { + "epoch": 0.01, + "global_step": 2391, + "learning_rate": 0.000490855592654424, + "loss": 1.8704, + "loss_base2": 2.6984, + "loss_pixel": 0.1893, + "loss_text": 1.681, + "ppl": 6.4909, + "step": 2391 + }, + { + "epoch": 0.01, + "global_step": 2392, + "learning_rate": 0.0004908514190317195, + "loss": 1.8653, + "loss_base2": 2.6911, + "loss_pixel": 0.1892, + "loss_text": 1.6761, + "ppl": 6.4579, + "step": 2392 + }, + { + "epoch": 0.01, + "global_step": 2393, + "learning_rate": 0.000490847245409015, + "loss": 1.8855, + "loss_base2": 2.7202, + "loss_pixel": 0.1903, + "loss_text": 1.6952, + "ppl": 6.5896, + "step": 2393 + }, + { + "epoch": 0.01, + "global_step": 2394, + "learning_rate": 0.0004908430717863105, + "loss": 1.8664, + "loss_base2": 2.6926, + "loss_pixel": 0.191, + "loss_text": 1.6754, + "ppl": 6.465, + "step": 2394 + }, + { + "epoch": 0.01, + "global_step": 2395, + "learning_rate": 0.000490838898163606, + "loss": 1.8521, + "loss_base2": 2.672, + "loss_pixel": 0.191, + "loss_text": 1.6611, + "ppl": 6.3732, + "step": 2395 + }, + { + "epoch": 0.01, + "global_step": 2396, + "learning_rate": 0.0004908347245409014, + "loss": 1.8568, + "loss_base2": 2.6788, + "loss_pixel": 0.1927, + "loss_text": 1.6641, + "ppl": 6.4032, + "step": 2396 + }, + { + "epoch": 0.01, + "global_step": 2397, + "learning_rate": 0.000490830550918197, + "loss": 1.8606, + "loss_base2": 2.6843, + "loss_pixel": 0.2004, + "loss_text": 1.6602, + "ppl": 6.4276, + "step": 2397 + }, + { + "epoch": 0.01, + "global_step": 2398, + "learning_rate": 0.0004908263772954925, + "loss": 1.8564, + "loss_base2": 2.6782, + "loss_pixel": 0.1975, + "loss_text": 1.6589, + "ppl": 6.4007, + "step": 2398 + }, + { + "epoch": 0.01, + "global_step": 2399, + "learning_rate": 0.000490822203672788, + "loss": 1.8606, + "loss_base2": 2.6843, + "loss_pixel": 0.1979, + "loss_text": 1.6626, + "ppl": 6.4276, + "step": 2399 + }, + { + "epoch": 0.01, + "global_step": 2400, + "learning_rate": 0.0004908180300500835, + "loss": 1.8454, + "loss_base2": 2.6623, + "loss_pixel": 0.1977, + "loss_text": 1.6477, + "ppl": 6.3306, + "step": 2400 + }, + { + "epoch": 0.01, + "global_step": 2401, + "learning_rate": 0.000490813856427379, + "loss": 1.8634, + "loss_base2": 2.6883, + "loss_pixel": 0.1987, + "loss_text": 1.6647, + "ppl": 6.4456, + "step": 2401 + }, + { + "epoch": 0.01, + "global_step": 2402, + "learning_rate": 0.0004908096828046745, + "loss": 1.8666, + "loss_base2": 2.6929, + "loss_pixel": 0.2049, + "loss_text": 1.6617, + "ppl": 6.4663, + "step": 2402 + }, + { + "epoch": 0.01, + "global_step": 2403, + "learning_rate": 0.00049080550918197, + "loss": 1.8802, + "loss_base2": 2.7126, + "loss_pixel": 0.2112, + "loss_text": 1.669, + "ppl": 6.5548, + "step": 2403 + }, + { + "epoch": 0.01, + "global_step": 2404, + "learning_rate": 0.0004908013355592654, + "loss": 1.8882, + "loss_base2": 2.7241, + "loss_pixel": 0.2156, + "loss_text": 1.6726, + "ppl": 6.6075, + "step": 2404 + }, + { + "epoch": 0.01, + "global_step": 2405, + "learning_rate": 0.0004907971619365609, + "loss": 1.8942, + "loss_base2": 2.7328, + "loss_pixel": 0.2345, + "loss_text": 1.6597, + "ppl": 6.6472, + "step": 2405 + }, + { + "epoch": 0.01, + "global_step": 2406, + "learning_rate": 0.0004907929883138564, + "loss": 1.9115, + "loss_base2": 2.7577, + "loss_pixel": 0.2404, + "loss_text": 1.6712, + "ppl": 6.7632, + "step": 2406 + }, + { + "epoch": 0.01, + "global_step": 2407, + "learning_rate": 0.0004907888146911519, + "loss": 1.8982, + "loss_base2": 2.7385, + "loss_pixel": 0.2493, + "loss_text": 1.6489, + "ppl": 6.6739, + "step": 2407 + }, + { + "epoch": 0.01, + "global_step": 2408, + "learning_rate": 0.0004907846410684474, + "loss": 1.9065, + "loss_base2": 2.7505, + "loss_pixel": 0.2483, + "loss_text": 1.6582, + "ppl": 6.7295, + "step": 2408 + }, + { + "epoch": 0.01, + "global_step": 2409, + "learning_rate": 0.0004907804674457429, + "loss": 1.8913, + "loss_base2": 2.7286, + "loss_pixel": 0.2536, + "loss_text": 1.6377, + "ppl": 6.628, + "step": 2409 + }, + { + "epoch": 0.01, + "global_step": 2410, + "learning_rate": 0.0004907762938230384, + "loss": 1.9066, + "loss_base2": 2.7506, + "loss_pixel": 0.2491, + "loss_text": 1.6575, + "ppl": 6.7302, + "step": 2410 + }, + { + "epoch": 0.01, + "global_step": 2411, + "learning_rate": 0.000490772120200334, + "loss": 1.8963, + "loss_base2": 2.7358, + "loss_pixel": 0.2415, + "loss_text": 1.6548, + "ppl": 6.6612, + "step": 2411 + }, + { + "epoch": 0.01, + "global_step": 2412, + "learning_rate": 0.0004907679465776295, + "loss": 1.887, + "loss_base2": 2.7224, + "loss_pixel": 0.2416, + "loss_text": 1.6454, + "ppl": 6.5995, + "step": 2412 + }, + { + "epoch": 0.01, + "global_step": 2413, + "learning_rate": 0.0004907637729549249, + "loss": 1.8978, + "loss_base2": 2.7379, + "loss_pixel": 0.248, + "loss_text": 1.6498, + "ppl": 6.6712, + "step": 2413 + }, + { + "epoch": 0.01, + "global_step": 2414, + "learning_rate": 0.0004907595993322204, + "loss": 1.8916, + "loss_base2": 2.729, + "loss_pixel": 0.2413, + "loss_text": 1.6503, + "ppl": 6.63, + "step": 2414 + }, + { + "epoch": 0.01, + "global_step": 2415, + "learning_rate": 0.0004907554257095159, + "loss": 1.8802, + "loss_base2": 2.7126, + "loss_pixel": 0.2363, + "loss_text": 1.6439, + "ppl": 6.5548, + "step": 2415 + }, + { + "epoch": 0.01, + "global_step": 2416, + "learning_rate": 0.0004907512520868114, + "loss": 1.8745, + "loss_base2": 2.7043, + "loss_pixel": 0.2313, + "loss_text": 1.6432, + "ppl": 6.5176, + "step": 2416 + }, + { + "epoch": 0.01, + "global_step": 2417, + "learning_rate": 0.0004907470784641069, + "loss": 1.8912, + "loss_base2": 2.7284, + "loss_pixel": 0.228, + "loss_text": 1.6632, + "ppl": 6.6273, + "step": 2417 + }, + { + "epoch": 0.01, + "global_step": 2418, + "learning_rate": 0.0004907429048414023, + "loss": 1.878, + "loss_base2": 2.7094, + "loss_pixel": 0.2226, + "loss_text": 1.6554, + "ppl": 6.5404, + "step": 2418 + }, + { + "epoch": 0.01, + "global_step": 2419, + "learning_rate": 0.0004907387312186978, + "loss": 1.8608, + "loss_base2": 2.6846, + "loss_pixel": 0.2214, + "loss_text": 1.6395, + "ppl": 6.4289, + "step": 2419 + }, + { + "epoch": 0.01, + "global_step": 2420, + "learning_rate": 0.0004907345575959933, + "loss": 1.8634, + "loss_base2": 2.6883, + "loss_pixel": 0.2177, + "loss_text": 1.6457, + "ppl": 6.4456, + "step": 2420 + }, + { + "epoch": 0.01, + "global_step": 2421, + "learning_rate": 0.0004907303839732888, + "loss": 1.8695, + "loss_base2": 2.6971, + "loss_pixel": 0.2184, + "loss_text": 1.6512, + "ppl": 6.4851, + "step": 2421 + }, + { + "epoch": 0.01, + "global_step": 2422, + "learning_rate": 0.0004907262103505843, + "loss": 1.8556, + "loss_base2": 2.6771, + "loss_pixel": 0.217, + "loss_text": 1.6386, + "ppl": 6.3955, + "step": 2422 + }, + { + "epoch": 0.01, + "global_step": 2423, + "learning_rate": 0.0004907220367278798, + "loss": 1.8736, + "loss_base2": 2.703, + "loss_pixel": 0.2164, + "loss_text": 1.6572, + "ppl": 6.5117, + "step": 2423 + }, + { + "epoch": 0.01, + "global_step": 2424, + "learning_rate": 0.0004907178631051753, + "loss": 1.8526, + "loss_base2": 2.6727, + "loss_pixel": 0.2125, + "loss_text": 1.6401, + "ppl": 6.3764, + "step": 2424 + }, + { + "epoch": 0.01, + "global_step": 2425, + "learning_rate": 0.0004907136894824708, + "loss": 1.8929, + "loss_base2": 2.7309, + "loss_pixel": 0.2102, + "loss_text": 1.6827, + "ppl": 6.6386, + "step": 2425 + }, + { + "epoch": 0.01, + "global_step": 2426, + "learning_rate": 0.0004907095158597663, + "loss": 1.8546, + "loss_base2": 2.6756, + "loss_pixel": 0.2045, + "loss_text": 1.6501, + "ppl": 6.3891, + "step": 2426 + }, + { + "epoch": 0.01, + "global_step": 2427, + "learning_rate": 0.0004907053422370617, + "loss": 1.8366, + "loss_base2": 2.6497, + "loss_pixel": 0.2047, + "loss_text": 1.6319, + "ppl": 6.2752, + "step": 2427 + }, + { + "epoch": 0.01, + "global_step": 2428, + "learning_rate": 0.0004907011686143572, + "loss": 1.8397, + "loss_base2": 2.6541, + "loss_pixel": 0.2057, + "loss_text": 1.634, + "ppl": 6.2946, + "step": 2428 + }, + { + "epoch": 0.01, + "global_step": 2429, + "learning_rate": 0.0004906969949916528, + "loss": 1.6561, + "loss_base2": 2.3892, + "loss_pixel": 0.1999, + "loss_text": 1.4561, + "ppl": 5.2388, + "step": 2429 + }, + { + "epoch": 0.01, + "global_step": 2430, + "learning_rate": 0.0004906928213689483, + "loss": 1.6219, + "loss_base2": 2.3399, + "loss_pixel": 0.2022, + "loss_text": 1.4197, + "ppl": 5.0627, + "step": 2430 + }, + { + "epoch": 0.01, + "global_step": 2431, + "learning_rate": 0.0004906886477462438, + "loss": 1.5997, + "loss_base2": 2.3079, + "loss_pixel": 0.1982, + "loss_text": 1.4014, + "ppl": 4.9515, + "step": 2431 + }, + { + "epoch": 0.01, + "global_step": 2432, + "learning_rate": 0.0004906844741235393, + "loss": 1.5794, + "loss_base2": 2.2786, + "loss_pixel": 0.1981, + "loss_text": 1.3813, + "ppl": 4.852, + "step": 2432 + }, + { + "epoch": 0.01, + "global_step": 2433, + "learning_rate": 0.0004906803005008348, + "loss": 1.5856, + "loss_base2": 2.2875, + "loss_pixel": 0.1993, + "loss_text": 1.3863, + "ppl": 4.8822, + "step": 2433 + }, + { + "epoch": 0.01, + "global_step": 2434, + "learning_rate": 0.0004906761268781302, + "loss": 1.5912, + "loss_base2": 2.2956, + "loss_pixel": 0.1987, + "loss_text": 1.3925, + "ppl": 4.9096, + "step": 2434 + }, + { + "epoch": 0.01, + "global_step": 2435, + "learning_rate": 0.0004906719532554257, + "loss": 1.5869, + "loss_base2": 2.2894, + "loss_pixel": 0.199, + "loss_text": 1.3879, + "ppl": 4.8886, + "step": 2435 + }, + { + "epoch": 0.01, + "global_step": 2436, + "learning_rate": 0.0004906677796327212, + "loss": 1.6774, + "loss_base2": 2.42, + "loss_pixel": 0.1952, + "loss_text": 1.4822, + "ppl": 5.3516, + "step": 2436 + }, + { + "epoch": 0.01, + "global_step": 2437, + "learning_rate": 0.0004906636060100167, + "loss": 1.8646, + "loss_base2": 2.69, + "loss_pixel": 0.1945, + "loss_text": 1.6701, + "ppl": 6.4534, + "step": 2437 + }, + { + "epoch": 0.01, + "global_step": 2438, + "learning_rate": 0.0004906594323873122, + "loss": 1.8581, + "loss_base2": 2.6807, + "loss_pixel": 0.1925, + "loss_text": 1.6656, + "ppl": 6.4115, + "step": 2438 + }, + { + "epoch": 0.01, + "global_step": 2439, + "learning_rate": 0.0004906552587646077, + "loss": 1.86, + "loss_base2": 2.6834, + "loss_pixel": 0.1926, + "loss_text": 1.6674, + "ppl": 6.4237, + "step": 2439 + }, + { + "epoch": 0.01, + "global_step": 2440, + "learning_rate": 0.0004906510851419032, + "loss": 1.8135, + "loss_base2": 2.6163, + "loss_pixel": 0.1931, + "loss_text": 1.6203, + "ppl": 6.1319, + "step": 2440 + }, + { + "epoch": 0.01, + "global_step": 2441, + "learning_rate": 0.0004906469115191986, + "loss": 1.8328, + "loss_base2": 2.6442, + "loss_pixel": 0.1923, + "loss_text": 1.6405, + "ppl": 6.2514, + "step": 2441 + }, + { + "epoch": 0.01, + "global_step": 2442, + "learning_rate": 0.0004906427378964941, + "loss": 1.8207, + "loss_base2": 2.6267, + "loss_pixel": 0.191, + "loss_text": 1.6297, + "ppl": 6.1762, + "step": 2442 + }, + { + "epoch": 0.01, + "global_step": 2443, + "learning_rate": 0.0004906385642737896, + "loss": 1.8521, + "loss_base2": 2.672, + "loss_pixel": 0.1891, + "loss_text": 1.663, + "ppl": 6.3732, + "step": 2443 + }, + { + "epoch": 0.01, + "global_step": 2444, + "learning_rate": 0.0004906343906510851, + "loss": 1.8526, + "loss_base2": 2.6727, + "loss_pixel": 0.1918, + "loss_text": 1.6609, + "ppl": 6.3764, + "step": 2444 + }, + { + "epoch": 0.01, + "global_step": 2445, + "learning_rate": 0.0004906302170283807, + "loss": 1.8268, + "loss_base2": 2.6355, + "loss_pixel": 0.1895, + "loss_text": 1.6373, + "ppl": 6.214, + "step": 2445 + }, + { + "epoch": 0.01, + "global_step": 2446, + "learning_rate": 0.0004906260434056762, + "loss": 1.8332, + "loss_base2": 2.6447, + "loss_pixel": 0.19, + "loss_text": 1.6431, + "ppl": 6.2539, + "step": 2446 + }, + { + "epoch": 0.01, + "global_step": 2447, + "learning_rate": 0.0004906218697829717, + "loss": 1.8494, + "loss_base2": 2.6681, + "loss_pixel": 0.1904, + "loss_text": 1.6589, + "ppl": 6.356, + "step": 2447 + }, + { + "epoch": 0.01, + "global_step": 2448, + "learning_rate": 0.0004906176961602672, + "loss": 1.8261, + "loss_base2": 2.6345, + "loss_pixel": 0.1885, + "loss_text": 1.6376, + "ppl": 6.2096, + "step": 2448 + }, + { + "epoch": 0.01, + "global_step": 2449, + "learning_rate": 0.0004906135225375627, + "loss": 1.8254, + "loss_base2": 2.6335, + "loss_pixel": 0.1888, + "loss_text": 1.6366, + "ppl": 6.2053, + "step": 2449 + }, + { + "epoch": 0.01, + "global_step": 2450, + "learning_rate": 0.0004906093489148581, + "loss": 1.8339, + "loss_base2": 2.6458, + "loss_pixel": 0.188, + "loss_text": 1.6459, + "ppl": 6.2582, + "step": 2450 + }, + { + "epoch": 0.01, + "global_step": 2451, + "learning_rate": 0.0004906051752921536, + "loss": 1.8034, + "loss_base2": 2.6018, + "loss_pixel": 0.188, + "loss_text": 1.6153, + "ppl": 6.0703, + "step": 2451 + }, + { + "epoch": 0.01, + "global_step": 2452, + "learning_rate": 0.0004906010016694491, + "loss": 1.8288, + "loss_base2": 2.6384, + "loss_pixel": 0.1868, + "loss_text": 1.642, + "ppl": 6.2264, + "step": 2452 + }, + { + "epoch": 0.01, + "global_step": 2453, + "learning_rate": 0.0004905968280467446, + "loss": 1.8454, + "loss_base2": 2.6623, + "loss_pixel": 0.2074, + "loss_text": 1.6381, + "ppl": 6.3306, + "step": 2453 + }, + { + "epoch": 0.01, + "global_step": 2454, + "learning_rate": 0.00049059265442404, + "loss": 1.82, + "loss_base2": 2.6257, + "loss_pixel": 0.2072, + "loss_text": 1.6128, + "ppl": 6.1719, + "step": 2454 + }, + { + "epoch": 0.01, + "global_step": 2455, + "learning_rate": 0.0004905884808013355, + "loss": 1.8581, + "loss_base2": 2.6807, + "loss_pixel": 0.209, + "loss_text": 1.6491, + "ppl": 6.4115, + "step": 2455 + }, + { + "epoch": 0.01, + "global_step": 2456, + "learning_rate": 0.000490584307178631, + "loss": 1.8366, + "loss_base2": 2.6497, + "loss_pixel": 0.2065, + "loss_text": 1.6301, + "ppl": 6.2752, + "step": 2456 + }, + { + "epoch": 0.01, + "global_step": 2457, + "learning_rate": 0.0004905801335559265, + "loss": 1.8675, + "loss_base2": 2.6942, + "loss_pixel": 0.2023, + "loss_text": 1.6653, + "ppl": 6.4721, + "step": 2457 + }, + { + "epoch": 0.01, + "global_step": 2458, + "learning_rate": 0.000490575959933222, + "loss": 1.8179, + "loss_base2": 2.6227, + "loss_pixel": 0.1902, + "loss_text": 1.6277, + "ppl": 6.1589, + "step": 2458 + }, + { + "epoch": 0.01, + "global_step": 2459, + "learning_rate": 0.0004905717863105175, + "loss": 1.8192, + "loss_base2": 2.6246, + "loss_pixel": 0.1904, + "loss_text": 1.6288, + "ppl": 6.1669, + "step": 2459 + }, + { + "epoch": 0.01, + "global_step": 2460, + "learning_rate": 0.000490567612687813, + "loss": 1.843, + "loss_base2": 2.6589, + "loss_pixel": 0.19, + "loss_text": 1.653, + "ppl": 6.3155, + "step": 2460 + }, + { + "epoch": 0.01, + "global_step": 2461, + "learning_rate": 0.0004905634390651086, + "loss": 1.6771, + "loss_base2": 2.4195, + "loss_pixel": 0.1893, + "loss_text": 1.4878, + "ppl": 5.35, + "step": 2461 + }, + { + "epoch": 0.01, + "global_step": 2462, + "learning_rate": 0.0004905592654424041, + "loss": 1.5795, + "loss_base2": 2.2787, + "loss_pixel": 0.1861, + "loss_text": 1.3935, + "ppl": 4.8525, + "step": 2462 + }, + { + "epoch": 0.01, + "global_step": 2463, + "learning_rate": 0.0004905550918196995, + "loss": 1.5688, + "loss_base2": 2.2633, + "loss_pixel": 0.1869, + "loss_text": 1.3819, + "ppl": 4.8009, + "step": 2463 + }, + { + "epoch": 0.01, + "global_step": 2464, + "learning_rate": 0.000490550918196995, + "loss": 1.5947, + "loss_base2": 2.3007, + "loss_pixel": 0.1881, + "loss_text": 1.4067, + "ppl": 4.9269, + "step": 2464 + }, + { + "epoch": 0.01, + "global_step": 2465, + "learning_rate": 0.0004905467445742905, + "loss": 1.5783, + "loss_base2": 2.277, + "loss_pixel": 0.1871, + "loss_text": 1.3912, + "ppl": 4.8467, + "step": 2465 + }, + { + "epoch": 0.01, + "global_step": 2466, + "learning_rate": 0.000490542570951586, + "loss": 1.5957, + "loss_base2": 2.3021, + "loss_pixel": 0.188, + "loss_text": 1.4077, + "ppl": 4.9318, + "step": 2466 + }, + { + "epoch": 0.01, + "global_step": 2467, + "learning_rate": 0.0004905383973288815, + "loss": 1.5971, + "loss_base2": 2.3041, + "loss_pixel": 0.1849, + "loss_text": 1.4121, + "ppl": 4.9387, + "step": 2467 + }, + { + "epoch": 0.01, + "global_step": 2468, + "learning_rate": 0.000490534223706177, + "loss": 1.7137, + "loss_base2": 2.4723, + "loss_pixel": 0.1865, + "loss_text": 1.5272, + "ppl": 5.5495, + "step": 2468 + }, + { + "epoch": 0.01, + "global_step": 2469, + "learning_rate": 0.0004905300500834725, + "loss": 1.8362, + "loss_base2": 2.6491, + "loss_pixel": 0.1851, + "loss_text": 1.6511, + "ppl": 6.2727, + "step": 2469 + }, + { + "epoch": 0.01, + "global_step": 2470, + "learning_rate": 0.000490525876460768, + "loss": 1.8484, + "loss_base2": 2.6667, + "loss_pixel": 0.1855, + "loss_text": 1.663, + "ppl": 6.3497, + "step": 2470 + }, + { + "epoch": 0.01, + "global_step": 2471, + "learning_rate": 0.0004905217028380634, + "loss": 1.827, + "loss_base2": 2.6358, + "loss_pixel": 0.1853, + "loss_text": 1.6417, + "ppl": 6.2152, + "step": 2471 + }, + { + "epoch": 0.01, + "global_step": 2472, + "learning_rate": 0.0004905175292153589, + "loss": 1.8504, + "loss_base2": 2.6696, + "loss_pixel": 0.1902, + "loss_text": 1.6602, + "ppl": 6.3624, + "step": 2472 + }, + { + "epoch": 0.01, + "global_step": 2473, + "learning_rate": 0.0004905133555926544, + "loss": 1.8508, + "loss_base2": 2.6701, + "loss_pixel": 0.2033, + "loss_text": 1.6475, + "ppl": 6.3649, + "step": 2473 + }, + { + "epoch": 0.01, + "global_step": 2474, + "learning_rate": 0.0004905091819699499, + "loss": 1.8556, + "loss_base2": 2.6771, + "loss_pixel": 0.2032, + "loss_text": 1.6524, + "ppl": 6.3955, + "step": 2474 + }, + { + "epoch": 0.01, + "global_step": 2475, + "learning_rate": 0.0004905050083472454, + "loss": 1.8449, + "loss_base2": 2.6616, + "loss_pixel": 0.1925, + "loss_text": 1.6523, + "ppl": 6.3275, + "step": 2475 + }, + { + "epoch": 0.01, + "global_step": 2476, + "learning_rate": 0.000490500834724541, + "loss": 1.8466, + "loss_base2": 2.6641, + "loss_pixel": 0.188, + "loss_text": 1.6586, + "ppl": 6.3382, + "step": 2476 + }, + { + "epoch": 0.01, + "global_step": 2477, + "learning_rate": 0.0004904966611018363, + "loss": 1.8354, + "loss_base2": 2.6479, + "loss_pixel": 0.1846, + "loss_text": 1.6509, + "ppl": 6.2676, + "step": 2477 + }, + { + "epoch": 0.01, + "global_step": 2478, + "learning_rate": 0.0004904924874791319, + "loss": 1.8286, + "loss_base2": 2.6381, + "loss_pixel": 0.1868, + "loss_text": 1.6418, + "ppl": 6.2252, + "step": 2478 + }, + { + "epoch": 0.01, + "global_step": 2479, + "learning_rate": 0.0004904883138564274, + "loss": 1.8102, + "loss_base2": 2.6116, + "loss_pixel": 0.1858, + "loss_text": 1.6244, + "ppl": 6.1117, + "step": 2479 + }, + { + "epoch": 0.01, + "global_step": 2480, + "learning_rate": 0.0004904841402337229, + "loss": 1.8298, + "loss_base2": 2.6398, + "loss_pixel": 0.1849, + "loss_text": 1.6449, + "ppl": 6.2326, + "step": 2480 + }, + { + "epoch": 0.01, + "global_step": 2481, + "learning_rate": 0.0004904799666110184, + "loss": 1.8336, + "loss_base2": 2.6453, + "loss_pixel": 0.1836, + "loss_text": 1.6501, + "ppl": 6.2564, + "step": 2481 + }, + { + "epoch": 0.01, + "global_step": 2482, + "learning_rate": 0.0004904757929883139, + "loss": 1.8446, + "loss_base2": 2.6612, + "loss_pixel": 0.1887, + "loss_text": 1.6559, + "ppl": 6.3256, + "step": 2482 + }, + { + "epoch": 0.01, + "global_step": 2483, + "learning_rate": 0.0004904716193656094, + "loss": 1.8137, + "loss_base2": 2.6166, + "loss_pixel": 0.185, + "loss_text": 1.6287, + "ppl": 6.1331, + "step": 2483 + }, + { + "epoch": 0.01, + "global_step": 2484, + "learning_rate": 0.0004904674457429049, + "loss": 1.8287, + "loss_base2": 2.6383, + "loss_pixel": 0.1855, + "loss_text": 1.6432, + "ppl": 6.2258, + "step": 2484 + }, + { + "epoch": 0.01, + "global_step": 2485, + "learning_rate": 0.0004904632721202004, + "loss": 1.8106, + "loss_base2": 2.6121, + "loss_pixel": 0.1871, + "loss_text": 1.6235, + "ppl": 6.1141, + "step": 2485 + }, + { + "epoch": 0.01, + "global_step": 2486, + "learning_rate": 0.0004904590984974958, + "loss": 1.8145, + "loss_base2": 2.6178, + "loss_pixel": 0.1848, + "loss_text": 1.6297, + "ppl": 6.138, + "step": 2486 + }, + { + "epoch": 0.01, + "global_step": 2487, + "learning_rate": 0.0004904549248747913, + "loss": 1.8331, + "loss_base2": 2.6446, + "loss_pixel": 0.1839, + "loss_text": 1.6492, + "ppl": 6.2532, + "step": 2487 + }, + { + "epoch": 0.01, + "global_step": 2488, + "learning_rate": 0.0004904507512520868, + "loss": 1.8192, + "loss_base2": 2.6246, + "loss_pixel": 0.1843, + "loss_text": 1.6348, + "ppl": 6.1669, + "step": 2488 + }, + { + "epoch": 0.01, + "global_step": 2489, + "learning_rate": 0.0004904465776293823, + "loss": 1.8279, + "loss_base2": 2.6371, + "loss_pixel": 0.1845, + "loss_text": 1.6434, + "ppl": 6.2208, + "step": 2489 + }, + { + "epoch": 0.01, + "global_step": 2490, + "learning_rate": 0.0004904424040066778, + "loss": 1.631, + "loss_base2": 2.353, + "loss_pixel": 0.1834, + "loss_text": 1.4477, + "ppl": 5.109, + "step": 2490 + }, + { + "epoch": 0.01, + "global_step": 2491, + "learning_rate": 0.0004904382303839732, + "loss": 1.5897, + "loss_base2": 2.2935, + "loss_pixel": 0.1973, + "loss_text": 1.3924, + "ppl": 4.9023, + "step": 2491 + }, + { + "epoch": 0.01, + "global_step": 2492, + "learning_rate": 0.0004904340567612687, + "loss": 1.5908, + "loss_base2": 2.295, + "loss_pixel": 0.2042, + "loss_text": 1.3866, + "ppl": 4.9077, + "step": 2492 + }, + { + "epoch": 0.01, + "global_step": 2493, + "learning_rate": 0.0004904298831385642, + "loss": 1.5921, + "loss_base2": 2.2969, + "loss_pixel": 0.1984, + "loss_text": 1.3938, + "ppl": 4.9141, + "step": 2493 + }, + { + "epoch": 0.01, + "global_step": 2494, + "learning_rate": 0.0004904257095158598, + "loss": 1.5611, + "loss_base2": 2.2522, + "loss_pixel": 0.1847, + "loss_text": 1.3764, + "ppl": 4.7641, + "step": 2494 + }, + { + "epoch": 0.01, + "global_step": 2495, + "learning_rate": 0.0004904215358931553, + "loss": 1.5934, + "loss_base2": 2.2988, + "loss_pixel": 0.1844, + "loss_text": 1.4089, + "ppl": 4.9205, + "step": 2495 + }, + { + "epoch": 0.01, + "global_step": 2496, + "learning_rate": 0.0004904173622704508, + "loss": 1.5766, + "loss_base2": 2.2746, + "loss_pixel": 0.1832, + "loss_text": 1.3934, + "ppl": 4.8385, + "step": 2496 + }, + { + "epoch": 0.01, + "global_step": 2497, + "learning_rate": 0.0004904131886477463, + "loss": 1.5832, + "loss_base2": 2.2841, + "loss_pixel": 0.1831, + "loss_text": 1.4002, + "ppl": 4.8705, + "step": 2497 + }, + { + "epoch": 0.01, + "global_step": 2498, + "learning_rate": 0.0004904090150250418, + "loss": 1.8409, + "loss_base2": 2.6559, + "loss_pixel": 0.1842, + "loss_text": 1.6566, + "ppl": 6.3022, + "step": 2498 + }, + { + "epoch": 0.01, + "global_step": 2499, + "learning_rate": 0.0004904048414023373, + "loss": 1.8468, + "loss_base2": 2.6644, + "loss_pixel": 0.183, + "loss_text": 1.6638, + "ppl": 6.3395, + "step": 2499 + }, + { + "epoch": 0.01, + "global_step": 2500, + "learning_rate": 0.0004904006677796327, + "loss": 1.8557, + "loss_base2": 2.6772, + "loss_pixel": 0.1818, + "loss_text": 1.6738, + "ppl": 6.3962, + "step": 2500 + }, + { + "epoch": 0.01, + "global_step": 2501, + "learning_rate": 0.0004903964941569282, + "loss": 1.82, + "loss_base2": 2.6257, + "loss_pixel": 0.1836, + "loss_text": 1.6364, + "ppl": 6.1719, + "step": 2501 + }, + { + "epoch": 0.01, + "global_step": 2502, + "learning_rate": 0.0004903923205342237, + "loss": 1.831, + "loss_base2": 2.6416, + "loss_pixel": 0.1803, + "loss_text": 1.6508, + "ppl": 6.2401, + "step": 2502 + }, + { + "epoch": 0.01, + "global_step": 2503, + "learning_rate": 0.0004903881469115192, + "loss": 1.8316, + "loss_base2": 2.6424, + "loss_pixel": 0.1838, + "loss_text": 1.6478, + "ppl": 6.2439, + "step": 2503 + }, + { + "epoch": 0.01, + "global_step": 2504, + "learning_rate": 0.0004903839732888147, + "loss": 1.8284, + "loss_base2": 2.6378, + "loss_pixel": 0.1825, + "loss_text": 1.6459, + "ppl": 6.2239, + "step": 2504 + }, + { + "epoch": 0.01, + "global_step": 2505, + "learning_rate": 0.0004903797996661102, + "loss": 1.8386, + "loss_base2": 2.6525, + "loss_pixel": 0.1821, + "loss_text": 1.6566, + "ppl": 6.2877, + "step": 2505 + }, + { + "epoch": 0.01, + "global_step": 2506, + "learning_rate": 0.0004903756260434057, + "loss": 1.849, + "loss_base2": 2.6675, + "loss_pixel": 0.185, + "loss_text": 1.664, + "ppl": 6.3535, + "step": 2506 + }, + { + "epoch": 0.01, + "global_step": 2507, + "learning_rate": 0.0004903714524207012, + "loss": 1.8361, + "loss_base2": 2.6489, + "loss_pixel": 0.1816, + "loss_text": 1.6545, + "ppl": 6.272, + "step": 2507 + }, + { + "epoch": 0.01, + "global_step": 2508, + "learning_rate": 0.0004903672787979967, + "loss": 1.834, + "loss_base2": 2.6459, + "loss_pixel": 0.1836, + "loss_text": 1.6504, + "ppl": 6.2589, + "step": 2508 + }, + { + "epoch": 0.01, + "global_step": 2509, + "learning_rate": 0.0004903631051752921, + "loss": 1.832, + "loss_base2": 2.643, + "loss_pixel": 0.1832, + "loss_text": 1.6488, + "ppl": 6.2464, + "step": 2509 + }, + { + "epoch": 0.01, + "global_step": 2510, + "learning_rate": 0.0004903589315525877, + "loss": 1.8149, + "loss_base2": 2.6183, + "loss_pixel": 0.1816, + "loss_text": 1.6333, + "ppl": 6.1405, + "step": 2510 + }, + { + "epoch": 0.01, + "global_step": 2511, + "learning_rate": 0.0004903547579298832, + "loss": 1.8227, + "loss_base2": 2.6296, + "loss_pixel": 0.1836, + "loss_text": 1.6391, + "ppl": 6.1885, + "step": 2511 + }, + { + "epoch": 0.01, + "global_step": 2512, + "learning_rate": 0.0004903505843071787, + "loss": 1.8281, + "loss_base2": 2.6374, + "loss_pixel": 0.1833, + "loss_text": 1.6448, + "ppl": 6.2221, + "step": 2512 + }, + { + "epoch": 0.01, + "global_step": 2513, + "learning_rate": 0.0004903464106844741, + "loss": 1.8203, + "loss_base2": 2.6261, + "loss_pixel": 0.1812, + "loss_text": 1.6391, + "ppl": 6.1737, + "step": 2513 + }, + { + "epoch": 0.01, + "global_step": 2514, + "learning_rate": 0.0004903422370617696, + "loss": 1.8301, + "loss_base2": 2.6403, + "loss_pixel": 0.1833, + "loss_text": 1.6468, + "ppl": 6.2345, + "step": 2514 + }, + { + "epoch": 0.01, + "global_step": 2515, + "learning_rate": 0.0004903380634390651, + "loss": 1.8232, + "loss_base2": 2.6303, + "loss_pixel": 0.1819, + "loss_text": 1.6413, + "ppl": 6.1916, + "step": 2515 + }, + { + "epoch": 0.01, + "global_step": 2516, + "learning_rate": 0.0004903338898163606, + "loss": 1.8173, + "loss_base2": 2.6218, + "loss_pixel": 0.182, + "loss_text": 1.6353, + "ppl": 6.1552, + "step": 2516 + }, + { + "epoch": 0.01, + "global_step": 2517, + "learning_rate": 0.0004903297161936561, + "loss": 1.8164, + "loss_base2": 2.6205, + "loss_pixel": 0.1809, + "loss_text": 1.6354, + "ppl": 6.1497, + "step": 2517 + }, + { + "epoch": 0.01, + "global_step": 2518, + "learning_rate": 0.0004903255425709516, + "loss": 1.8206, + "loss_base2": 2.6266, + "loss_pixel": 0.1811, + "loss_text": 1.6395, + "ppl": 6.1756, + "step": 2518 + }, + { + "epoch": 0.01, + "global_step": 2519, + "learning_rate": 0.0004903213689482471, + "loss": 1.8025, + "loss_base2": 2.6005, + "loss_pixel": 0.1834, + "loss_text": 1.6191, + "ppl": 6.0648, + "step": 2519 + }, + { + "epoch": 0.01, + "global_step": 2520, + "learning_rate": 0.0004903171953255426, + "loss": 1.799, + "loss_base2": 2.5954, + "loss_pixel": 0.1804, + "loss_text": 1.6187, + "ppl": 6.0436, + "step": 2520 + }, + { + "epoch": 0.01, + "global_step": 2521, + "learning_rate": 0.0004903130217028381, + "loss": 1.7145, + "loss_base2": 2.4735, + "loss_pixel": 0.1839, + "loss_text": 1.5306, + "ppl": 5.5539, + "step": 2521 + }, + { + "epoch": 0.01, + "global_step": 2522, + "learning_rate": 0.0004903088480801335, + "loss": 1.5975, + "loss_base2": 2.3047, + "loss_pixel": 0.1801, + "loss_text": 1.4173, + "ppl": 4.9407, + "step": 2522 + }, + { + "epoch": 0.01, + "global_step": 2523, + "learning_rate": 0.000490304674457429, + "loss": 1.593, + "loss_base2": 2.2982, + "loss_pixel": 0.1802, + "loss_text": 1.4128, + "ppl": 4.9185, + "step": 2523 + }, + { + "epoch": 0.01, + "global_step": 2524, + "learning_rate": 0.0004903005008347245, + "loss": 1.5808, + "loss_base2": 2.2806, + "loss_pixel": 0.1822, + "loss_text": 1.3986, + "ppl": 4.8588, + "step": 2524 + }, + { + "epoch": 0.01, + "global_step": 2525, + "learning_rate": 0.00049029632721202, + "loss": 1.5871, + "loss_base2": 2.2897, + "loss_pixel": 0.1791, + "loss_text": 1.4079, + "ppl": 4.8895, + "step": 2525 + }, + { + "epoch": 0.01, + "global_step": 2526, + "learning_rate": 0.0004902921535893156, + "loss": 1.5638, + "loss_base2": 2.2561, + "loss_pixel": 0.1826, + "loss_text": 1.3812, + "ppl": 4.7769, + "step": 2526 + }, + { + "epoch": 0.01, + "global_step": 2527, + "learning_rate": 0.000490287979966611, + "loss": 1.5936, + "loss_base2": 2.2991, + "loss_pixel": 0.1805, + "loss_text": 1.4132, + "ppl": 4.9214, + "step": 2527 + }, + { + "epoch": 0.01, + "global_step": 2528, + "learning_rate": 0.0004902838063439065, + "loss": 1.5753, + "loss_base2": 2.2727, + "loss_pixel": 0.1821, + "loss_text": 1.3933, + "ppl": 4.8322, + "step": 2528 + }, + { + "epoch": 0.01, + "global_step": 2529, + "learning_rate": 0.000490279632721202, + "loss": 1.6619, + "loss_base2": 2.3976, + "loss_pixel": 0.181, + "loss_text": 1.481, + "ppl": 5.2693, + "step": 2529 + }, + { + "epoch": 0.01, + "global_step": 2530, + "learning_rate": 0.0004902754590984975, + "loss": 1.8068, + "loss_base2": 2.6067, + "loss_pixel": 0.1803, + "loss_text": 1.6265, + "ppl": 6.0909, + "step": 2530 + }, + { + "epoch": 0.01, + "global_step": 2531, + "learning_rate": 0.000490271285475793, + "loss": 1.8106, + "loss_base2": 2.6121, + "loss_pixel": 0.1796, + "loss_text": 1.6311, + "ppl": 6.1141, + "step": 2531 + }, + { + "epoch": 0.01, + "global_step": 2532, + "learning_rate": 0.0004902671118530885, + "loss": 1.8296, + "loss_base2": 2.6396, + "loss_pixel": 0.1804, + "loss_text": 1.6492, + "ppl": 6.2314, + "step": 2532 + }, + { + "epoch": 0.01, + "global_step": 2533, + "learning_rate": 0.000490262938230384, + "loss": 1.8357, + "loss_base2": 2.6484, + "loss_pixel": 0.1819, + "loss_text": 1.6538, + "ppl": 6.2695, + "step": 2533 + }, + { + "epoch": 0.01, + "global_step": 2534, + "learning_rate": 0.0004902587646076795, + "loss": 1.8234, + "loss_base2": 2.6306, + "loss_pixel": 0.1814, + "loss_text": 1.642, + "ppl": 6.1929, + "step": 2534 + }, + { + "epoch": 0.01, + "global_step": 2535, + "learning_rate": 0.000490254590984975, + "loss": 1.8281, + "loss_base2": 2.6374, + "loss_pixel": 0.1802, + "loss_text": 1.6479, + "ppl": 6.2221, + "step": 2535 + }, + { + "epoch": 0.01, + "global_step": 2536, + "learning_rate": 0.0004902504173622704, + "loss": 1.8092, + "loss_base2": 2.6101, + "loss_pixel": 0.1789, + "loss_text": 1.6303, + "ppl": 6.1056, + "step": 2536 + }, + { + "epoch": 0.01, + "global_step": 2537, + "learning_rate": 0.0004902462437395659, + "loss": 1.8036, + "loss_base2": 2.602, + "loss_pixel": 0.1815, + "loss_text": 1.6221, + "ppl": 6.0715, + "step": 2537 + }, + { + "epoch": 0.01, + "global_step": 2538, + "learning_rate": 0.0004902420701168614, + "loss": 1.8268, + "loss_base2": 2.6355, + "loss_pixel": 0.1806, + "loss_text": 1.6462, + "ppl": 6.214, + "step": 2538 + }, + { + "epoch": 0.01, + "global_step": 2539, + "learning_rate": 0.0004902378964941569, + "loss": 1.8116, + "loss_base2": 2.6136, + "loss_pixel": 0.1796, + "loss_text": 1.632, + "ppl": 6.1202, + "step": 2539 + }, + { + "epoch": 0.01, + "global_step": 2540, + "learning_rate": 0.0004902337228714524, + "loss": 1.8231, + "loss_base2": 2.6302, + "loss_pixel": 0.1797, + "loss_text": 1.6434, + "ppl": 6.191, + "step": 2540 + }, + { + "epoch": 0.01, + "global_step": 2541, + "learning_rate": 0.000490229549248748, + "loss": 1.8125, + "loss_base2": 2.6149, + "loss_pixel": 0.1804, + "loss_text": 1.632, + "ppl": 6.1257, + "step": 2541 + }, + { + "epoch": 0.01, + "global_step": 2542, + "learning_rate": 0.0004902253756260435, + "loss": 1.8178, + "loss_base2": 2.6225, + "loss_pixel": 0.1785, + "loss_text": 1.6394, + "ppl": 6.1583, + "step": 2542 + }, + { + "epoch": 0.01, + "global_step": 2543, + "learning_rate": 0.000490221202003339, + "loss": 1.8396, + "loss_base2": 2.654, + "loss_pixel": 0.1887, + "loss_text": 1.6509, + "ppl": 6.294, + "step": 2543 + }, + { + "epoch": 0.01, + "global_step": 2544, + "learning_rate": 0.0004902170283806345, + "loss": 1.8379, + "loss_base2": 2.6515, + "loss_pixel": 0.1945, + "loss_text": 1.6434, + "ppl": 6.2833, + "step": 2544 + }, + { + "epoch": 0.01, + "global_step": 2545, + "learning_rate": 0.0004902128547579299, + "loss": 1.8234, + "loss_base2": 2.6306, + "loss_pixel": 0.1948, + "loss_text": 1.6286, + "ppl": 6.1929, + "step": 2545 + }, + { + "epoch": 0.01, + "global_step": 2546, + "learning_rate": 0.0004902086811352254, + "loss": 1.8281, + "loss_base2": 2.6374, + "loss_pixel": 0.1939, + "loss_text": 1.6342, + "ppl": 6.2221, + "step": 2546 + }, + { + "epoch": 0.01, + "global_step": 2547, + "learning_rate": 0.0004902045075125209, + "loss": 1.8122, + "loss_base2": 2.6145, + "loss_pixel": 0.1932, + "loss_text": 1.619, + "ppl": 6.1239, + "step": 2547 + }, + { + "epoch": 0.01, + "global_step": 2548, + "learning_rate": 0.0004902003338898164, + "loss": 1.8333, + "loss_base2": 2.6449, + "loss_pixel": 0.1932, + "loss_text": 1.6401, + "ppl": 6.2545, + "step": 2548 + }, + { + "epoch": 0.01, + "global_step": 2549, + "learning_rate": 0.0004901961602671119, + "loss": 1.8281, + "loss_base2": 2.6374, + "loss_pixel": 0.1941, + "loss_text": 1.634, + "ppl": 6.2221, + "step": 2549 + }, + { + "epoch": 0.01, + "global_step": 2550, + "learning_rate": 0.0004901919866444073, + "loss": 1.8426, + "loss_base2": 2.6583, + "loss_pixel": 0.1939, + "loss_text": 1.6487, + "ppl": 6.3129, + "step": 2550 + }, + { + "epoch": 0.01, + "global_step": 2551, + "learning_rate": 0.0004901878130217028, + "loss": 1.8372, + "loss_base2": 2.6505, + "loss_pixel": 0.1914, + "loss_text": 1.6458, + "ppl": 6.2789, + "step": 2551 + }, + { + "epoch": 0.01, + "global_step": 2552, + "learning_rate": 0.0004901836393989983, + "loss": 1.8256, + "loss_base2": 2.6338, + "loss_pixel": 0.1919, + "loss_text": 1.6336, + "ppl": 6.2065, + "step": 2552 + }, + { + "epoch": 0.01, + "global_step": 2553, + "learning_rate": 0.0004901794657762938, + "loss": 1.833, + "loss_base2": 2.6445, + "loss_pixel": 0.1929, + "loss_text": 1.6401, + "ppl": 6.2526, + "step": 2553 + }, + { + "epoch": 0.01, + "global_step": 2554, + "learning_rate": 0.0004901752921535893, + "loss": 1.8091, + "loss_base2": 2.61, + "loss_pixel": 0.1919, + "loss_text": 1.6171, + "ppl": 6.105, + "step": 2554 + }, + { + "epoch": 0.01, + "global_step": 2555, + "learning_rate": 0.0004901711185308848, + "loss": 1.8089, + "loss_base2": 2.6097, + "loss_pixel": 0.1932, + "loss_text": 1.6158, + "ppl": 6.1037, + "step": 2555 + }, + { + "epoch": 0.01, + "global_step": 2556, + "learning_rate": 0.0004901669449081803, + "loss": 1.8335, + "loss_base2": 2.6452, + "loss_pixel": 0.1926, + "loss_text": 1.6409, + "ppl": 6.2557, + "step": 2556 + }, + { + "epoch": 0.01, + "global_step": 2557, + "learning_rate": 0.0004901627712854758, + "loss": 1.7971, + "loss_base2": 2.5927, + "loss_pixel": 0.1924, + "loss_text": 1.6048, + "ppl": 6.0321, + "step": 2557 + }, + { + "epoch": 0.01, + "global_step": 2558, + "learning_rate": 0.0004901585976627714, + "loss": 1.8163, + "loss_base2": 2.6204, + "loss_pixel": 0.1926, + "loss_text": 1.6236, + "ppl": 6.1491, + "step": 2558 + }, + { + "epoch": 0.01, + "global_step": 2559, + "learning_rate": 0.0004901544240400668, + "loss": 1.8391, + "loss_base2": 2.6533, + "loss_pixel": 0.1917, + "loss_text": 1.6474, + "ppl": 6.2909, + "step": 2559 + }, + { + "epoch": 0.01, + "global_step": 2560, + "learning_rate": 0.0004901502504173623, + "loss": 1.8346, + "loss_base2": 2.6468, + "loss_pixel": 0.1907, + "loss_text": 1.6439, + "ppl": 6.2626, + "step": 2560 + }, + { + "epoch": 0.01, + "global_step": 2561, + "learning_rate": 0.0004901460767946578, + "loss": 1.8258, + "loss_base2": 2.6341, + "loss_pixel": 0.1913, + "loss_text": 1.6345, + "ppl": 6.2078, + "step": 2561 + }, + { + "epoch": 0.01, + "global_step": 2562, + "learning_rate": 0.0004901419031719533, + "loss": 1.8293, + "loss_base2": 2.6391, + "loss_pixel": 0.1917, + "loss_text": 1.6376, + "ppl": 6.2295, + "step": 2562 + }, + { + "epoch": 0.01, + "global_step": 2563, + "learning_rate": 0.0004901377295492488, + "loss": 1.8329, + "loss_base2": 2.6443, + "loss_pixel": 0.1921, + "loss_text": 1.6408, + "ppl": 6.252, + "step": 2563 + }, + { + "epoch": 0.01, + "global_step": 2564, + "learning_rate": 0.0004901335559265443, + "loss": 1.8078, + "loss_base2": 2.6081, + "loss_pixel": 0.19, + "loss_text": 1.6178, + "ppl": 6.097, + "step": 2564 + }, + { + "epoch": 0.01, + "global_step": 2565, + "learning_rate": 0.0004901293823038397, + "loss": 1.8117, + "loss_base2": 2.6137, + "loss_pixel": 0.1901, + "loss_text": 1.6217, + "ppl": 6.1208, + "step": 2565 + }, + { + "epoch": 0.01, + "global_step": 2566, + "learning_rate": 0.0004901252086811352, + "loss": 1.8306, + "loss_base2": 2.641, + "loss_pixel": 0.1904, + "loss_text": 1.6402, + "ppl": 6.2376, + "step": 2566 + }, + { + "epoch": 0.01, + "global_step": 2567, + "learning_rate": 0.0004901210350584307, + "loss": 1.8157, + "loss_base2": 2.6195, + "loss_pixel": 0.1901, + "loss_text": 1.6256, + "ppl": 6.1454, + "step": 2567 + }, + { + "epoch": 0.01, + "global_step": 2568, + "learning_rate": 0.0004901168614357262, + "loss": 1.81, + "loss_base2": 2.6113, + "loss_pixel": 0.1901, + "loss_text": 1.6199, + "ppl": 6.1104, + "step": 2568 + }, + { + "epoch": 0.01, + "global_step": 2569, + "learning_rate": 0.0004901126878130217, + "loss": 1.7986, + "loss_base2": 2.5948, + "loss_pixel": 0.1898, + "loss_text": 1.6089, + "ppl": 6.0412, + "step": 2569 + }, + { + "epoch": 0.01, + "global_step": 2570, + "learning_rate": 0.0004901085141903172, + "loss": 1.8268, + "loss_base2": 2.6355, + "loss_pixel": 0.1892, + "loss_text": 1.6376, + "ppl": 6.214, + "step": 2570 + }, + { + "epoch": 0.01, + "global_step": 2571, + "learning_rate": 0.0004901043405676127, + "loss": 1.807, + "loss_base2": 2.6069, + "loss_pixel": 0.1901, + "loss_text": 1.617, + "ppl": 6.0921, + "step": 2571 + }, + { + "epoch": 0.01, + "global_step": 2572, + "learning_rate": 0.0004901001669449081, + "loss": 1.8173, + "loss_base2": 2.6218, + "loss_pixel": 0.1902, + "loss_text": 1.6271, + "ppl": 6.1552, + "step": 2572 + }, + { + "epoch": 0.01, + "global_step": 2573, + "learning_rate": 0.0004900959933222036, + "loss": 1.8076, + "loss_base2": 2.6078, + "loss_pixel": 0.191, + "loss_text": 1.6166, + "ppl": 6.0958, + "step": 2573 + }, + { + "epoch": 0.01, + "global_step": 2574, + "learning_rate": 0.0004900918196994991, + "loss": 1.8267, + "loss_base2": 2.6354, + "loss_pixel": 0.19, + "loss_text": 1.6367, + "ppl": 6.2133, + "step": 2574 + }, + { + "epoch": 0.01, + "global_step": 2575, + "learning_rate": 0.0004900876460767947, + "loss": 1.8237, + "loss_base2": 2.631, + "loss_pixel": 0.1902, + "loss_text": 1.6335, + "ppl": 6.1947, + "step": 2575 + }, + { + "epoch": 0.01, + "global_step": 2576, + "learning_rate": 0.0004900834724540902, + "loss": 1.8093, + "loss_base2": 2.6103, + "loss_pixel": 0.1903, + "loss_text": 1.6189, + "ppl": 6.1062, + "step": 2576 + }, + { + "epoch": 0.01, + "global_step": 2577, + "learning_rate": 0.0004900792988313857, + "loss": 1.8016, + "loss_base2": 2.5992, + "loss_pixel": 0.1898, + "loss_text": 1.6117, + "ppl": 6.0593, + "step": 2577 + }, + { + "epoch": 0.01, + "global_step": 2578, + "learning_rate": 0.0004900751252086812, + "loss": 1.6429, + "loss_base2": 2.3702, + "loss_pixel": 0.1895, + "loss_text": 1.4534, + "ppl": 5.1701, + "step": 2578 + }, + { + "epoch": 0.01, + "global_step": 2579, + "learning_rate": 0.0004900709515859767, + "loss": 1.594, + "loss_base2": 2.2997, + "loss_pixel": 0.1889, + "loss_text": 1.4051, + "ppl": 4.9234, + "step": 2579 + }, + { + "epoch": 0.01, + "global_step": 2580, + "learning_rate": 0.0004900667779632722, + "loss": 1.585, + "loss_base2": 2.2867, + "loss_pixel": 0.1893, + "loss_text": 1.3958, + "ppl": 4.8793, + "step": 2580 + }, + { + "epoch": 0.01, + "global_step": 2581, + "learning_rate": 0.0004900626043405676, + "loss": 1.5711, + "loss_base2": 2.2666, + "loss_pixel": 0.1896, + "loss_text": 1.3815, + "ppl": 4.8119, + "step": 2581 + }, + { + "epoch": 0.01, + "global_step": 2582, + "learning_rate": 0.0004900584307178631, + "loss": 1.5861, + "loss_base2": 2.2883, + "loss_pixel": 0.1883, + "loss_text": 1.3979, + "ppl": 4.8847, + "step": 2582 + }, + { + "epoch": 0.01, + "global_step": 2583, + "learning_rate": 0.0004900542570951586, + "loss": 1.5763, + "loss_base2": 2.2741, + "loss_pixel": 0.1893, + "loss_text": 1.387, + "ppl": 4.837, + "step": 2583 + }, + { + "epoch": 0.01, + "global_step": 2584, + "learning_rate": 0.0004900500834724541, + "loss": 1.5717, + "loss_base2": 2.2675, + "loss_pixel": 0.1887, + "loss_text": 1.383, + "ppl": 4.8148, + "step": 2584 + }, + { + "epoch": 0.01, + "global_step": 2585, + "learning_rate": 0.0004900459098497496, + "loss": 1.6754, + "loss_base2": 2.4171, + "loss_pixel": 0.1894, + "loss_text": 1.486, + "ppl": 5.3409, + "step": 2585 + }, + { + "epoch": 0.01, + "global_step": 2586, + "learning_rate": 0.000490041736227045, + "loss": 1.6523, + "loss_base2": 2.3838, + "loss_pixel": 0.188, + "loss_text": 1.4644, + "ppl": 5.219, + "step": 2586 + }, + { + "epoch": 0.01, + "global_step": 2587, + "learning_rate": 0.0004900375626043405, + "loss": 1.5732, + "loss_base2": 2.2696, + "loss_pixel": 0.1882, + "loss_text": 1.385, + "ppl": 4.8221, + "step": 2587 + }, + { + "epoch": 0.01, + "global_step": 2588, + "learning_rate": 0.000490033388981636, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1886, + "loss_text": 1.4138, + "ppl": 4.9649, + "step": 2588 + }, + { + "epoch": 0.01, + "global_step": 2589, + "learning_rate": 0.0004900292153589315, + "loss": 1.5883, + "loss_base2": 2.2914, + "loss_pixel": 0.1872, + "loss_text": 1.4011, + "ppl": 4.8954, + "step": 2589 + }, + { + "epoch": 0.01, + "global_step": 2590, + "learning_rate": 0.000490025041736227, + "loss": 1.6023, + "loss_base2": 2.3116, + "loss_pixel": 0.1879, + "loss_text": 1.4144, + "ppl": 4.9644, + "step": 2590 + }, + { + "epoch": 0.01, + "global_step": 2591, + "learning_rate": 0.0004900208681135226, + "loss": 1.5711, + "loss_base2": 2.2666, + "loss_pixel": 0.1889, + "loss_text": 1.3822, + "ppl": 4.8119, + "step": 2591 + }, + { + "epoch": 0.01, + "global_step": 2592, + "learning_rate": 0.0004900166944908181, + "loss": 1.6016, + "loss_base2": 2.3106, + "loss_pixel": 0.1882, + "loss_text": 1.4135, + "ppl": 4.961, + "step": 2592 + }, + { + "epoch": 0.01, + "global_step": 2593, + "learning_rate": 0.0004900125208681136, + "loss": 1.5786, + "loss_base2": 2.2774, + "loss_pixel": 0.1891, + "loss_text": 1.3895, + "ppl": 4.8482, + "step": 2593 + }, + { + "epoch": 0.01, + "global_step": 2594, + "learning_rate": 0.0004900083472454091, + "loss": 1.7216, + "loss_base2": 2.4837, + "loss_pixel": 0.188, + "loss_text": 1.5336, + "ppl": 5.5935, + "step": 2594 + }, + { + "epoch": 0.01, + "global_step": 2595, + "learning_rate": 0.0004900041736227045, + "loss": 1.8367, + "loss_base2": 2.6498, + "loss_pixel": 0.1879, + "loss_text": 1.6488, + "ppl": 6.2758, + "step": 2595 + }, + { + "epoch": 0.01, + "global_step": 2596, + "learning_rate": 0.00049, + "loss": 1.8296, + "loss_base2": 2.6396, + "loss_pixel": 0.1889, + "loss_text": 1.6407, + "ppl": 6.2314, + "step": 2596 + }, + { + "epoch": 0.01, + "global_step": 2597, + "learning_rate": 0.0004899958263772955, + "loss": 1.8257, + "loss_base2": 2.6339, + "loss_pixel": 0.1887, + "loss_text": 1.637, + "ppl": 6.2071, + "step": 2597 + }, + { + "epoch": 0.01, + "global_step": 2598, + "learning_rate": 0.000489991652754591, + "loss": 1.8228, + "loss_base2": 2.6297, + "loss_pixel": 0.1884, + "loss_text": 1.6344, + "ppl": 6.1892, + "step": 2598 + }, + { + "epoch": 0.01, + "global_step": 2599, + "learning_rate": 0.0004899874791318865, + "loss": 1.8328, + "loss_base2": 2.6442, + "loss_pixel": 0.1891, + "loss_text": 1.6436, + "ppl": 6.2514, + "step": 2599 + }, + { + "epoch": 0.01, + "global_step": 2600, + "learning_rate": 0.000489983305509182, + "loss": 1.8274, + "loss_base2": 2.6364, + "loss_pixel": 0.1887, + "loss_text": 1.6387, + "ppl": 6.2177, + "step": 2600 + }, + { + "epoch": 0.01, + "global_step": 2601, + "learning_rate": 0.0004899791318864775, + "loss": 1.8244, + "loss_base2": 2.6321, + "loss_pixel": 0.1873, + "loss_text": 1.6371, + "ppl": 6.1991, + "step": 2601 + }, + { + "epoch": 0.01, + "global_step": 2602, + "learning_rate": 0.000489974958263773, + "loss": 1.8115, + "loss_base2": 2.6134, + "loss_pixel": 0.1876, + "loss_text": 1.6239, + "ppl": 6.1196, + "step": 2602 + }, + { + "epoch": 0.01, + "global_step": 2603, + "learning_rate": 0.0004899707846410684, + "loss": 1.8202, + "loss_base2": 2.626, + "loss_pixel": 0.1872, + "loss_text": 1.6331, + "ppl": 6.1731, + "step": 2603 + }, + { + "epoch": 0.01, + "global_step": 2604, + "learning_rate": 0.0004899666110183639, + "loss": 1.8316, + "loss_base2": 2.6424, + "loss_pixel": 0.1876, + "loss_text": 1.6441, + "ppl": 6.2439, + "step": 2604 + }, + { + "epoch": 0.01, + "global_step": 2605, + "learning_rate": 0.0004899624373956594, + "loss": 1.8151, + "loss_base2": 2.6186, + "loss_pixel": 0.1881, + "loss_text": 1.6269, + "ppl": 6.1417, + "step": 2605 + }, + { + "epoch": 0.01, + "global_step": 2606, + "learning_rate": 0.000489958263772955, + "loss": 1.8144, + "loss_base2": 2.6176, + "loss_pixel": 0.1881, + "loss_text": 1.6263, + "ppl": 6.1374, + "step": 2606 + }, + { + "epoch": 0.01, + "global_step": 2607, + "learning_rate": 0.0004899540901502505, + "loss": 1.8095, + "loss_base2": 2.6106, + "loss_pixel": 0.1882, + "loss_text": 1.6213, + "ppl": 6.1074, + "step": 2607 + }, + { + "epoch": 0.01, + "global_step": 2608, + "learning_rate": 0.000489949916527546, + "loss": 1.7961, + "loss_base2": 2.5912, + "loss_pixel": 0.1884, + "loss_text": 1.6077, + "ppl": 6.0261, + "step": 2608 + }, + { + "epoch": 0.01, + "global_step": 2609, + "learning_rate": 0.0004899457429048414, + "loss": 1.8234, + "loss_base2": 2.6306, + "loss_pixel": 0.1868, + "loss_text": 1.6366, + "ppl": 6.1929, + "step": 2609 + }, + { + "epoch": 0.01, + "global_step": 2610, + "learning_rate": 0.0004899415692821369, + "loss": 1.8165, + "loss_base2": 2.6207, + "loss_pixel": 0.1875, + "loss_text": 1.629, + "ppl": 6.1503, + "step": 2610 + }, + { + "epoch": 0.01, + "global_step": 2611, + "learning_rate": 0.0004899373956594324, + "loss": 1.8007, + "loss_base2": 2.5979, + "loss_pixel": 0.1881, + "loss_text": 1.6126, + "ppl": 6.0539, + "step": 2611 + }, + { + "epoch": 0.01, + "global_step": 2612, + "learning_rate": 0.0004899332220367279, + "loss": 1.8179, + "loss_base2": 2.6227, + "loss_pixel": 0.1872, + "loss_text": 1.6307, + "ppl": 6.1589, + "step": 2612 + }, + { + "epoch": 0.01, + "global_step": 2613, + "learning_rate": 0.0004899290484140234, + "loss": 1.8231, + "loss_base2": 2.6302, + "loss_pixel": 0.1885, + "loss_text": 1.6345, + "ppl": 6.191, + "step": 2613 + }, + { + "epoch": 0.01, + "global_step": 2614, + "learning_rate": 0.0004899248747913189, + "loss": 1.8213, + "loss_base2": 2.6276, + "loss_pixel": 0.1837, + "loss_text": 1.6376, + "ppl": 6.1799, + "step": 2614 + }, + { + "epoch": 0.01, + "global_step": 2615, + "learning_rate": 0.0004899207011686144, + "loss": 1.7876, + "loss_base2": 2.579, + "loss_pixel": 0.1849, + "loss_text": 1.6027, + "ppl": 5.9751, + "step": 2615 + }, + { + "epoch": 0.01, + "global_step": 2616, + "learning_rate": 0.0004899165275459099, + "loss": 1.7939, + "loss_base2": 2.5881, + "loss_pixel": 0.1812, + "loss_text": 1.6127, + "ppl": 6.0129, + "step": 2616 + }, + { + "epoch": 0.01, + "global_step": 2617, + "learning_rate": 0.0004899123539232054, + "loss": 1.8054, + "loss_base2": 2.6046, + "loss_pixel": 0.1809, + "loss_text": 1.6244, + "ppl": 6.0824, + "step": 2617 + }, + { + "epoch": 0.01, + "global_step": 2618, + "learning_rate": 0.0004899081803005008, + "loss": 1.813, + "loss_base2": 2.6156, + "loss_pixel": 0.1831, + "loss_text": 1.6299, + "ppl": 6.1288, + "step": 2618 + }, + { + "epoch": 0.01, + "global_step": 2619, + "learning_rate": 0.0004899040066777963, + "loss": 1.796, + "loss_base2": 2.5911, + "loss_pixel": 0.1798, + "loss_text": 1.6162, + "ppl": 6.0255, + "step": 2619 + }, + { + "epoch": 0.01, + "global_step": 2620, + "learning_rate": 0.0004898998330550918, + "loss": 1.8078, + "loss_base2": 2.6081, + "loss_pixel": 0.1818, + "loss_text": 1.6261, + "ppl": 6.097, + "step": 2620 + }, + { + "epoch": 0.01, + "global_step": 2621, + "learning_rate": 0.0004898956594323873, + "loss": 1.7952, + "loss_base2": 2.5899, + "loss_pixel": 0.1805, + "loss_text": 1.6146, + "ppl": 6.0207, + "step": 2621 + }, + { + "epoch": 0.01, + "global_step": 2622, + "learning_rate": 0.0004898914858096827, + "loss": 1.815, + "loss_base2": 2.6185, + "loss_pixel": 0.1798, + "loss_text": 1.6352, + "ppl": 6.1411, + "step": 2622 + }, + { + "epoch": 0.01, + "global_step": 2623, + "learning_rate": 0.0004898873121869782, + "loss": 1.8128, + "loss_base2": 2.6153, + "loss_pixel": 0.1807, + "loss_text": 1.6321, + "ppl": 6.1276, + "step": 2623 + }, + { + "epoch": 0.01, + "global_step": 2624, + "learning_rate": 0.0004898831385642738, + "loss": 1.8005, + "loss_base2": 2.5976, + "loss_pixel": 0.1821, + "loss_text": 1.6183, + "ppl": 6.0527, + "step": 2624 + }, + { + "epoch": 0.01, + "global_step": 2625, + "learning_rate": 0.0004898789649415693, + "loss": 1.8041, + "loss_base2": 2.6028, + "loss_pixel": 0.1809, + "loss_text": 1.6232, + "ppl": 6.0745, + "step": 2625 + }, + { + "epoch": 0.01, + "global_step": 2626, + "learning_rate": 0.0004898747913188648, + "loss": 1.803, + "loss_base2": 2.6012, + "loss_pixel": 0.1801, + "loss_text": 1.6229, + "ppl": 6.0678, + "step": 2626 + }, + { + "epoch": 0.01, + "global_step": 2627, + "learning_rate": 0.0004898706176961603, + "loss": 1.7965, + "loss_base2": 2.5918, + "loss_pixel": 0.1808, + "loss_text": 1.6157, + "ppl": 6.0285, + "step": 2627 + }, + { + "epoch": 0.01, + "global_step": 2628, + "learning_rate": 0.0004898664440734558, + "loss": 1.7972, + "loss_base2": 2.5928, + "loss_pixel": 0.1821, + "loss_text": 1.6151, + "ppl": 6.0327, + "step": 2628 + }, + { + "epoch": 0.01, + "global_step": 2629, + "learning_rate": 0.0004898622704507513, + "loss": 1.8172, + "loss_base2": 2.6217, + "loss_pixel": 0.1788, + "loss_text": 1.6385, + "ppl": 6.1546, + "step": 2629 + }, + { + "epoch": 0.01, + "global_step": 2630, + "learning_rate": 0.0004898580968280468, + "loss": 1.7971, + "loss_base2": 2.5927, + "loss_pixel": 0.1799, + "loss_text": 1.6173, + "ppl": 6.0321, + "step": 2630 + }, + { + "epoch": 0.01, + "global_step": 2631, + "learning_rate": 0.0004898539232053422, + "loss": 1.8019, + "loss_base2": 2.5996, + "loss_pixel": 0.1804, + "loss_text": 1.6215, + "ppl": 6.0612, + "step": 2631 + }, + { + "epoch": 0.01, + "global_step": 2632, + "learning_rate": 0.0004898497495826377, + "loss": 1.8024, + "loss_base2": 2.6003, + "loss_pixel": 0.1788, + "loss_text": 1.6236, + "ppl": 6.0642, + "step": 2632 + }, + { + "epoch": 0.01, + "global_step": 2633, + "learning_rate": 0.0004898455759599332, + "loss": 1.7896, + "loss_base2": 2.5818, + "loss_pixel": 0.1787, + "loss_text": 1.6109, + "ppl": 5.9871, + "step": 2633 + }, + { + "epoch": 0.01, + "global_step": 2634, + "learning_rate": 0.0004898414023372287, + "loss": 1.8157, + "loss_base2": 2.6195, + "loss_pixel": 0.1788, + "loss_text": 1.6369, + "ppl": 6.1454, + "step": 2634 + }, + { + "epoch": 0.01, + "global_step": 2635, + "learning_rate": 0.0004898372287145242, + "loss": 1.7881, + "loss_base2": 2.5797, + "loss_pixel": 0.1794, + "loss_text": 1.6087, + "ppl": 5.9781, + "step": 2635 + }, + { + "epoch": 0.01, + "global_step": 2636, + "learning_rate": 0.0004898330550918197, + "loss": 1.8061, + "loss_base2": 2.6057, + "loss_pixel": 0.1787, + "loss_text": 1.6274, + "ppl": 6.0867, + "step": 2636 + }, + { + "epoch": 0.01, + "global_step": 2637, + "learning_rate": 0.0004898288814691152, + "loss": 1.788, + "loss_base2": 2.5795, + "loss_pixel": 0.1797, + "loss_text": 1.6083, + "ppl": 5.9775, + "step": 2637 + }, + { + "epoch": 0.01, + "global_step": 2638, + "learning_rate": 0.0004898247078464107, + "loss": 1.6087, + "loss_base2": 2.3209, + "loss_pixel": 0.1779, + "loss_text": 1.4309, + "ppl": 4.9963, + "step": 2638 + }, + { + "epoch": 0.01, + "global_step": 2639, + "learning_rate": 0.0004898205342237063, + "loss": 1.564, + "loss_base2": 2.2564, + "loss_pixel": 0.1803, + "loss_text": 1.3838, + "ppl": 4.7779, + "step": 2639 + }, + { + "epoch": 0.01, + "global_step": 2640, + "learning_rate": 0.0004898163606010017, + "loss": 1.5644, + "loss_base2": 2.257, + "loss_pixel": 0.1796, + "loss_text": 1.3849, + "ppl": 4.7798, + "step": 2640 + }, + { + "epoch": 0.01, + "global_step": 2641, + "learning_rate": 0.0004898121869782972, + "loss": 1.5868, + "loss_base2": 2.2893, + "loss_pixel": 0.1787, + "loss_text": 1.4081, + "ppl": 4.8881, + "step": 2641 + }, + { + "epoch": 0.01, + "global_step": 2642, + "learning_rate": 0.0004898080133555927, + "loss": 1.548, + "loss_base2": 2.2333, + "loss_pixel": 0.1789, + "loss_text": 1.3691, + "ppl": 4.7021, + "step": 2642 + }, + { + "epoch": 0.01, + "global_step": 2643, + "learning_rate": 0.0004898038397328882, + "loss": 1.5564, + "loss_base2": 2.2454, + "loss_pixel": 0.1766, + "loss_text": 1.3798, + "ppl": 4.7417, + "step": 2643 + }, + { + "epoch": 0.01, + "global_step": 2644, + "learning_rate": 0.0004897996661101837, + "loss": 1.5512, + "loss_base2": 2.2379, + "loss_pixel": 0.1789, + "loss_text": 1.3723, + "ppl": 4.7171, + "step": 2644 + }, + { + "epoch": 0.01, + "global_step": 2645, + "learning_rate": 0.0004897954924874791, + "loss": 1.5551, + "loss_base2": 2.2435, + "loss_pixel": 0.1793, + "loss_text": 1.3758, + "ppl": 4.7356, + "step": 2645 + }, + { + "epoch": 0.01, + "global_step": 2646, + "learning_rate": 0.0004897913188647746, + "loss": 1.7094, + "loss_base2": 2.4661, + "loss_pixel": 0.1778, + "loss_text": 1.5315, + "ppl": 5.5256, + "step": 2646 + }, + { + "epoch": 0.01, + "global_step": 2647, + "learning_rate": 0.0004897871452420701, + "loss": 1.6076, + "loss_base2": 2.3193, + "loss_pixel": 0.1899, + "loss_text": 1.4177, + "ppl": 4.9908, + "step": 2647 + }, + { + "epoch": 0.01, + "global_step": 2648, + "learning_rate": 0.0004897829716193656, + "loss": 1.5928, + "loss_base2": 2.2979, + "loss_pixel": 0.1994, + "loss_text": 1.3934, + "ppl": 4.9175, + "step": 2648 + }, + { + "epoch": 0.01, + "global_step": 2649, + "learning_rate": 0.0004897787979966611, + "loss": 1.5811, + "loss_base2": 2.281, + "loss_pixel": 0.2001, + "loss_text": 1.381, + "ppl": 4.8603, + "step": 2649 + }, + { + "epoch": 0.01, + "global_step": 2650, + "learning_rate": 0.0004897746243739566, + "loss": 1.5933, + "loss_base2": 2.2986, + "loss_pixel": 0.1987, + "loss_text": 1.3946, + "ppl": 4.92, + "step": 2650 + }, + { + "epoch": 0.01, + "global_step": 2651, + "learning_rate": 0.0004897704507512521, + "loss": 1.5611, + "loss_base2": 2.2522, + "loss_pixel": 0.1975, + "loss_text": 1.3636, + "ppl": 4.7641, + "step": 2651 + }, + { + "epoch": 0.01, + "global_step": 2652, + "learning_rate": 0.0004897662771285476, + "loss": 1.5939, + "loss_base2": 2.2995, + "loss_pixel": 0.1917, + "loss_text": 1.4022, + "ppl": 4.9229, + "step": 2652 + }, + { + "epoch": 0.01, + "global_step": 2653, + "learning_rate": 0.0004897621035058431, + "loss": 1.5743, + "loss_base2": 2.2712, + "loss_pixel": 0.1841, + "loss_text": 1.3901, + "ppl": 4.8274, + "step": 2653 + }, + { + "epoch": 0.01, + "global_step": 2654, + "learning_rate": 0.0004897579298831385, + "loss": 1.5706, + "loss_base2": 2.2659, + "loss_pixel": 0.1831, + "loss_text": 1.3875, + "ppl": 4.8095, + "step": 2654 + }, + { + "epoch": 0.01, + "global_step": 2655, + "learning_rate": 0.000489753756260434, + "loss": 1.7459, + "loss_base2": 2.5188, + "loss_pixel": 0.1841, + "loss_text": 1.5618, + "ppl": 5.7311, + "step": 2655 + }, + { + "epoch": 0.01, + "global_step": 2656, + "learning_rate": 0.0004897495826377296, + "loss": 1.8385, + "loss_base2": 2.6524, + "loss_pixel": 0.1818, + "loss_text": 1.6568, + "ppl": 6.2871, + "step": 2656 + }, + { + "epoch": 0.01, + "global_step": 2657, + "learning_rate": 0.0004897454090150251, + "loss": 1.8349, + "loss_base2": 2.6472, + "loss_pixel": 0.1836, + "loss_text": 1.6513, + "ppl": 6.2645, + "step": 2657 + }, + { + "epoch": 0.01, + "global_step": 2658, + "learning_rate": 0.0004897412353923206, + "loss": 1.8299, + "loss_base2": 2.64, + "loss_pixel": 0.1815, + "loss_text": 1.6484, + "ppl": 6.2333, + "step": 2658 + }, + { + "epoch": 0.01, + "global_step": 2659, + "learning_rate": 0.000489737061769616, + "loss": 1.8271, + "loss_base2": 2.6359, + "loss_pixel": 0.186, + "loss_text": 1.6411, + "ppl": 6.2158, + "step": 2659 + }, + { + "epoch": 0.01, + "global_step": 2660, + "learning_rate": 0.0004897328881469115, + "loss": 1.8218, + "loss_base2": 2.6283, + "loss_pixel": 0.185, + "loss_text": 1.6368, + "ppl": 6.183, + "step": 2660 + }, + { + "epoch": 0.01, + "global_step": 2661, + "learning_rate": 0.000489728714524207, + "loss": 1.8416, + "loss_base2": 2.6569, + "loss_pixel": 0.1954, + "loss_text": 1.6462, + "ppl": 6.3066, + "step": 2661 + }, + { + "epoch": 0.01, + "global_step": 2662, + "learning_rate": 0.0004897245409015025, + "loss": 1.9177, + "loss_base2": 2.7667, + "loss_pixel": 0.2977, + "loss_text": 1.62, + "ppl": 6.8053, + "step": 2662 + }, + { + "epoch": 0.01, + "global_step": 2663, + "learning_rate": 0.000489720367278798, + "loss": 1.9201, + "loss_base2": 2.7701, + "loss_pixel": 0.2891, + "loss_text": 1.6309, + "ppl": 6.8216, + "step": 2663 + }, + { + "epoch": 0.01, + "global_step": 2664, + "learning_rate": 0.0004897161936560935, + "loss": 1.9357, + "loss_base2": 2.7926, + "loss_pixel": 0.3036, + "loss_text": 1.6321, + "ppl": 6.9289, + "step": 2664 + }, + { + "epoch": 0.01, + "global_step": 2665, + "learning_rate": 0.000489712020033389, + "loss": 1.9559, + "loss_base2": 2.8218, + "loss_pixel": 0.3118, + "loss_text": 1.6441, + "ppl": 7.0703, + "step": 2665 + }, + { + "epoch": 0.01, + "global_step": 2666, + "learning_rate": 0.0004897078464106845, + "loss": 1.9584, + "loss_base2": 2.8254, + "loss_pixel": 0.3226, + "loss_text": 1.6357, + "ppl": 7.088, + "step": 2666 + }, + { + "epoch": 0.01, + "global_step": 2667, + "learning_rate": 0.00048970367278798, + "loss": 1.9361, + "loss_base2": 2.7932, + "loss_pixel": 0.3169, + "loss_text": 1.6192, + "ppl": 6.9317, + "step": 2667 + }, + { + "epoch": 0.01, + "global_step": 2668, + "learning_rate": 0.0004896994991652754, + "loss": 1.9608, + "loss_base2": 2.8288, + "loss_pixel": 0.3245, + "loss_text": 1.6363, + "ppl": 7.105, + "step": 2668 + }, + { + "epoch": 0.01, + "global_step": 2669, + "learning_rate": 0.0004896953255425709, + "loss": 1.9954, + "loss_base2": 2.8788, + "loss_pixel": 0.3675, + "loss_text": 1.6279, + "ppl": 7.3551, + "step": 2669 + }, + { + "epoch": 0.01, + "global_step": 2670, + "learning_rate": 0.0004896911519198664, + "loss": 2.0224, + "loss_base2": 2.9177, + "loss_pixel": 0.3955, + "loss_text": 1.6269, + "ppl": 7.5564, + "step": 2670 + }, + { + "epoch": 0.01, + "global_step": 2671, + "learning_rate": 0.000489686978297162, + "loss": 2.0599, + "loss_base2": 2.9718, + "loss_pixel": 0.3881, + "loss_text": 1.6717, + "ppl": 7.8452, + "step": 2671 + }, + { + "epoch": 0.01, + "global_step": 2672, + "learning_rate": 0.0004896828046744575, + "loss": 6.1862, + "loss_base2": 8.9248, + "loss_pixel": 0.3971, + "loss_text": 5.7891, + "ppl": 485.9958, + "step": 2672 + }, + { + "epoch": 0.01, + "global_step": 2673, + "learning_rate": 0.000489678631051753, + "loss": 4.4942, + "loss_base2": 6.4838, + "loss_pixel": 0.6728, + "loss_text": 3.8214, + "ppl": 89.4965, + "step": 2673 + }, + { + "epoch": 0.01, + "global_step": 2674, + "learning_rate": 0.0004896744574290485, + "loss": 2.6966, + "loss_base2": 3.8904, + "loss_pixel": 0.6359, + "loss_text": 2.0607, + "ppl": 14.8292, + "step": 2674 + }, + { + "epoch": 0.01, + "global_step": 2675, + "learning_rate": 0.000489670283806344, + "loss": 4.5821, + "loss_base2": 6.6106, + "loss_pixel": 0.5076, + "loss_text": 4.0745, + "ppl": 97.7194, + "step": 2675 + }, + { + "epoch": 0.01, + "global_step": 2676, + "learning_rate": 0.0004896661101836395, + "loss": 4.2881, + "loss_base2": 6.1864, + "loss_pixel": 0.5092, + "loss_text": 3.7789, + "ppl": 72.828, + "step": 2676 + }, + { + "epoch": 0.01, + "global_step": 2677, + "learning_rate": 0.0004896619365609349, + "loss": 4.1852, + "loss_base2": 6.038, + "loss_pixel": 0.4724, + "loss_text": 3.7128, + "ppl": 65.7066, + "step": 2677 + }, + { + "epoch": 0.01, + "global_step": 2678, + "learning_rate": 0.0004896577629382304, + "loss": 4.55, + "loss_base2": 6.5643, + "loss_pixel": 0.5207, + "loss_text": 4.0293, + "ppl": 94.6324, + "step": 2678 + }, + { + "epoch": 0.01, + "global_step": 2679, + "learning_rate": 0.0004896535893155259, + "loss": 4.2985, + "loss_base2": 6.2014, + "loss_pixel": 0.7696, + "loss_text": 3.5289, + "ppl": 73.5893, + "step": 2679 + }, + { + "epoch": 0.01, + "global_step": 2680, + "learning_rate": 0.0004896494156928214, + "loss": 4.2002, + "loss_base2": 6.0596, + "loss_pixel": 0.584, + "loss_text": 3.6162, + "ppl": 66.6997, + "step": 2680 + }, + { + "epoch": 0.01, + "global_step": 2681, + "learning_rate": 0.0004896452420701168, + "loss": 4.4981, + "loss_base2": 6.4894, + "loss_pixel": 0.4899, + "loss_text": 4.0082, + "ppl": 89.8463, + "step": 2681 + }, + { + "epoch": 0.01, + "global_step": 2682, + "learning_rate": 0.0004896410684474123, + "loss": 4.186, + "loss_base2": 6.0391, + "loss_pixel": 0.4277, + "loss_text": 3.7583, + "ppl": 65.7592, + "step": 2682 + }, + { + "epoch": 0.01, + "global_step": 2683, + "learning_rate": 0.0004896368948247078, + "loss": 4.6744, + "loss_base2": 6.7437, + "loss_pixel": 0.4286, + "loss_text": 4.2458, + "ppl": 107.1682, + "step": 2683 + }, + { + "epoch": 0.01, + "global_step": 2684, + "learning_rate": 0.0004896327212020033, + "loss": 4.4995, + "loss_base2": 6.4914, + "loss_pixel": 0.4629, + "loss_text": 4.0367, + "ppl": 89.9721, + "step": 2684 + }, + { + "epoch": 0.01, + "global_step": 2685, + "learning_rate": 0.0004896285475792988, + "loss": 4.5292, + "loss_base2": 6.5343, + "loss_pixel": 0.4188, + "loss_text": 4.1104, + "ppl": 92.6844, + "step": 2685 + }, + { + "epoch": 0.01, + "global_step": 2686, + "learning_rate": 0.0004896243739565943, + "loss": 4.2726, + "loss_base2": 6.1641, + "loss_pixel": 0.4378, + "loss_text": 3.8348, + "ppl": 71.7078, + "step": 2686 + }, + { + "epoch": 0.01, + "global_step": 2687, + "learning_rate": 0.0004896202003338898, + "loss": 4.1406, + "loss_base2": 5.9736, + "loss_pixel": 0.4083, + "loss_text": 3.7323, + "ppl": 62.8405, + "step": 2687 + }, + { + "epoch": 0.01, + "global_step": 2688, + "learning_rate": 0.0004896160267111854, + "loss": 4.1882, + "loss_base2": 6.0423, + "loss_pixel": 0.4336, + "loss_text": 3.7545, + "ppl": 65.9041, + "step": 2688 + }, + { + "epoch": 0.01, + "global_step": 2689, + "learning_rate": 0.0004896118530884809, + "loss": 3.9484, + "loss_base2": 5.6963, + "loss_pixel": 0.4044, + "loss_text": 3.5441, + "ppl": 51.8523, + "step": 2689 + }, + { + "epoch": 0.01, + "global_step": 2690, + "learning_rate": 0.0004896076794657763, + "loss": 3.8541, + "loss_base2": 5.5603, + "loss_pixel": 0.4163, + "loss_text": 3.4378, + "ppl": 47.1861, + "step": 2690 + }, + { + "epoch": 0.01, + "global_step": 2691, + "learning_rate": 0.0004896035058430718, + "loss": 3.7927, + "loss_base2": 5.4717, + "loss_pixel": 0.4007, + "loss_text": 3.392, + "ppl": 44.3761, + "step": 2691 + }, + { + "epoch": 0.01, + "global_step": 2692, + "learning_rate": 0.0004895993322203673, + "loss": 3.7523, + "loss_base2": 5.4134, + "loss_pixel": 0.4164, + "loss_text": 3.3358, + "ppl": 42.619, + "step": 2692 + }, + { + "epoch": 0.01, + "global_step": 2693, + "learning_rate": 0.0004895951585976628, + "loss": 3.7095, + "loss_base2": 5.3517, + "loss_pixel": 0.4037, + "loss_text": 3.3058, + "ppl": 40.8334, + "step": 2693 + }, + { + "epoch": 0.01, + "global_step": 2694, + "learning_rate": 0.0004895909849749583, + "loss": 3.6677, + "loss_base2": 5.2914, + "loss_pixel": 0.4057, + "loss_text": 3.262, + "ppl": 39.1617, + "step": 2694 + }, + { + "epoch": 0.01, + "global_step": 2695, + "learning_rate": 0.0004895868113522538, + "loss": 3.6302, + "loss_base2": 5.2373, + "loss_pixel": 0.4058, + "loss_text": 3.2244, + "ppl": 37.7204, + "step": 2695 + }, + { + "epoch": 0.01, + "global_step": 2696, + "learning_rate": 0.0004895826377295492, + "loss": 3.5935, + "loss_base2": 5.1843, + "loss_pixel": 0.4005, + "loss_text": 3.193, + "ppl": 36.3611, + "step": 2696 + }, + { + "epoch": 0.01, + "global_step": 2697, + "learning_rate": 0.0004895784641068447, + "loss": 3.5779, + "loss_base2": 5.1618, + "loss_pixel": 0.3999, + "loss_text": 3.1781, + "ppl": 35.7983, + "step": 2697 + }, + { + "epoch": 0.01, + "global_step": 2698, + "learning_rate": 0.0004895742904841402, + "loss": 3.5486, + "loss_base2": 5.1195, + "loss_pixel": 0.4001, + "loss_text": 3.1485, + "ppl": 34.7646, + "step": 2698 + }, + { + "epoch": 0.01, + "global_step": 2699, + "learning_rate": 0.0004895701168614357, + "loss": 3.5286, + "loss_base2": 5.0907, + "loss_pixel": 0.3969, + "loss_text": 3.1317, + "ppl": 34.0762, + "step": 2699 + }, + { + "epoch": 0.01, + "global_step": 2700, + "learning_rate": 0.0004895659432387312, + "loss": 3.5089, + "loss_base2": 5.0623, + "loss_pixel": 0.3936, + "loss_text": 3.1153, + "ppl": 33.4115, + "step": 2700 + }, + { + "epoch": 0.01, + "global_step": 2701, + "learning_rate": 0.0004895617696160267, + "loss": 3.4851, + "loss_base2": 5.0279, + "loss_pixel": 0.3927, + "loss_text": 3.0925, + "ppl": 32.6257, + "step": 2701 + }, + { + "epoch": 0.01, + "global_step": 2702, + "learning_rate": 0.0004895575959933222, + "loss": 3.4697, + "loss_base2": 5.0057, + "loss_pixel": 0.3912, + "loss_text": 3.0785, + "ppl": 32.1271, + "step": 2702 + }, + { + "epoch": 0.01, + "global_step": 2703, + "learning_rate": 0.0004895534223706177, + "loss": 3.4711, + "loss_base2": 5.0077, + "loss_pixel": 0.3901, + "loss_text": 3.081, + "ppl": 32.1721, + "step": 2703 + }, + { + "epoch": 0.01, + "global_step": 2704, + "learning_rate": 0.0004895492487479131, + "loss": 3.4215, + "loss_base2": 4.9362, + "loss_pixel": 0.3886, + "loss_text": 3.0329, + "ppl": 30.6153, + "step": 2704 + }, + { + "epoch": 0.01, + "global_step": 2705, + "learning_rate": 0.0004895450751252087, + "loss": 3.3898, + "loss_base2": 4.8904, + "loss_pixel": 0.388, + "loss_text": 3.0018, + "ppl": 29.66, + "step": 2705 + }, + { + "epoch": 0.01, + "global_step": 2706, + "learning_rate": 0.0004895409015025042, + "loss": 3.4319, + "loss_base2": 4.9512, + "loss_pixel": 0.3868, + "loss_text": 3.0451, + "ppl": 30.9354, + "step": 2706 + }, + { + "epoch": 0.01, + "global_step": 2707, + "learning_rate": 0.0004895367278797997, + "loss": 3.4206, + "loss_base2": 4.9349, + "loss_pixel": 0.3866, + "loss_text": 3.034, + "ppl": 30.5878, + "step": 2707 + }, + { + "epoch": 0.01, + "global_step": 2708, + "learning_rate": 0.0004895325542570952, + "loss": 3.3242, + "loss_base2": 4.7958, + "loss_pixel": 0.3871, + "loss_text": 2.9371, + "ppl": 27.7768, + "step": 2708 + }, + { + "epoch": 0.01, + "global_step": 2709, + "learning_rate": 0.0004895283806343907, + "loss": 3.2666, + "loss_base2": 4.7127, + "loss_pixel": 0.3864, + "loss_text": 2.8802, + "ppl": 26.222, + "step": 2709 + }, + { + "epoch": 0.01, + "global_step": 2710, + "learning_rate": 0.0004895242070116862, + "loss": 3.2576, + "loss_base2": 4.6997, + "loss_pixel": 0.3854, + "loss_text": 2.8722, + "ppl": 25.9871, + "step": 2710 + }, + { + "epoch": 0.01, + "global_step": 2711, + "learning_rate": 0.0004895200333889817, + "loss": 3.2785, + "loss_base2": 4.7299, + "loss_pixel": 0.3869, + "loss_text": 2.8916, + "ppl": 26.5359, + "step": 2711 + }, + { + "epoch": 0.01, + "global_step": 2712, + "learning_rate": 0.0004895158597662772, + "loss": 3.2189, + "loss_base2": 4.6439, + "loss_pixel": 0.3858, + "loss_text": 2.8331, + "ppl": 25.0006, + "step": 2712 + }, + { + "epoch": 0.01, + "global_step": 2713, + "learning_rate": 0.0004895116861435726, + "loss": 3.2078, + "loss_base2": 4.6279, + "loss_pixel": 0.3881, + "loss_text": 2.8197, + "ppl": 24.7246, + "step": 2713 + }, + { + "epoch": 0.01, + "global_step": 2714, + "learning_rate": 0.0004895075125208681, + "loss": 3.1777, + "loss_base2": 4.5845, + "loss_pixel": 0.3851, + "loss_text": 2.7926, + "ppl": 23.9915, + "step": 2714 + }, + { + "epoch": 0.01, + "global_step": 2715, + "learning_rate": 0.0004895033388981636, + "loss": 3.148, + "loss_base2": 4.5416, + "loss_pixel": 0.3863, + "loss_text": 2.7616, + "ppl": 23.2894, + "step": 2715 + }, + { + "epoch": 0.01, + "global_step": 2716, + "learning_rate": 0.0004894991652754591, + "loss": 3.1311, + "loss_base2": 4.5172, + "loss_pixel": 0.3843, + "loss_text": 2.7468, + "ppl": 22.8992, + "step": 2716 + }, + { + "epoch": 0.01, + "global_step": 2717, + "learning_rate": 0.0004894949916527546, + "loss": 3.1089, + "loss_base2": 4.4852, + "loss_pixel": 0.3855, + "loss_text": 2.7234, + "ppl": 22.3964, + "step": 2717 + }, + { + "epoch": 0.01, + "global_step": 2718, + "learning_rate": 0.00048949081803005, + "loss": 3.0846, + "loss_base2": 4.4501, + "loss_pixel": 0.3838, + "loss_text": 2.7008, + "ppl": 21.8587, + "step": 2718 + }, + { + "epoch": 0.01, + "global_step": 2719, + "learning_rate": 0.0004894866444073455, + "loss": 3.0771, + "loss_base2": 4.4393, + "loss_pixel": 0.3833, + "loss_text": 2.6938, + "ppl": 21.6954, + "step": 2719 + }, + { + "epoch": 0.01, + "global_step": 2720, + "learning_rate": 0.000489482470784641, + "loss": 3.0558, + "loss_base2": 4.4086, + "loss_pixel": 0.3845, + "loss_text": 2.6713, + "ppl": 21.2382, + "step": 2720 + }, + { + "epoch": 0.01, + "global_step": 2721, + "learning_rate": 0.0004894782971619366, + "loss": 3.0261, + "loss_base2": 4.3657, + "loss_pixel": 0.3832, + "loss_text": 2.6429, + "ppl": 20.6167, + "step": 2721 + }, + { + "epoch": 0.01, + "global_step": 2722, + "learning_rate": 0.0004894741235392321, + "loss": 2.9943, + "loss_base2": 4.3199, + "loss_pixel": 0.3839, + "loss_text": 2.6104, + "ppl": 19.9714, + "step": 2722 + }, + { + "epoch": 0.01, + "global_step": 2723, + "learning_rate": 0.0004894699499165276, + "loss": 3.0677, + "loss_base2": 4.4258, + "loss_pixel": 0.3827, + "loss_text": 2.685, + "ppl": 21.4924, + "step": 2723 + }, + { + "epoch": 0.01, + "global_step": 2724, + "learning_rate": 0.0004894657762938231, + "loss": 3.3846, + "loss_base2": 4.8829, + "loss_pixel": 0.3826, + "loss_text": 3.0019, + "ppl": 29.5062, + "step": 2724 + }, + { + "epoch": 0.01, + "global_step": 2725, + "learning_rate": 0.0004894616026711186, + "loss": 3.3068, + "loss_base2": 4.7707, + "loss_pixel": 0.3825, + "loss_text": 2.9243, + "ppl": 27.2976, + "step": 2725 + }, + { + "epoch": 0.01, + "global_step": 2726, + "learning_rate": 0.0004894574290484141, + "loss": 3.2447, + "loss_base2": 4.6811, + "loss_pixel": 0.3822, + "loss_text": 2.8625, + "ppl": 25.654, + "step": 2726 + }, + { + "epoch": 0.01, + "global_step": 2727, + "learning_rate": 0.0004894532554257095, + "loss": 3.2063, + "loss_base2": 4.6257, + "loss_pixel": 0.384, + "loss_text": 2.8223, + "ppl": 24.6876, + "step": 2727 + }, + { + "epoch": 0.01, + "global_step": 2728, + "learning_rate": 0.000489449081803005, + "loss": 3.1871, + "loss_base2": 4.598, + "loss_pixel": 0.3828, + "loss_text": 2.8043, + "ppl": 24.2181, + "step": 2728 + }, + { + "epoch": 0.01, + "global_step": 2729, + "learning_rate": 0.0004894449081803005, + "loss": 3.1834, + "loss_base2": 4.5927, + "loss_pixel": 0.3826, + "loss_text": 2.8008, + "ppl": 24.1287, + "step": 2729 + }, + { + "epoch": 0.01, + "global_step": 2730, + "learning_rate": 0.000489440734557596, + "loss": 3.1381, + "loss_base2": 4.5273, + "loss_pixel": 0.3823, + "loss_text": 2.7557, + "ppl": 23.06, + "step": 2730 + }, + { + "epoch": 0.01, + "global_step": 2731, + "learning_rate": 0.0004894365609348915, + "loss": 3.1196, + "loss_base2": 4.5006, + "loss_pixel": 0.3814, + "loss_text": 2.7382, + "ppl": 22.6373, + "step": 2731 + }, + { + "epoch": 0.01, + "global_step": 2732, + "learning_rate": 0.000489432387312187, + "loss": 3.0812, + "loss_base2": 4.4452, + "loss_pixel": 0.3819, + "loss_text": 2.6993, + "ppl": 21.7845, + "step": 2732 + }, + { + "epoch": 0.01, + "global_step": 2733, + "learning_rate": 0.0004894282136894825, + "loss": 3.059, + "loss_base2": 4.4132, + "loss_pixel": 0.3812, + "loss_text": 2.6778, + "ppl": 21.3062, + "step": 2733 + }, + { + "epoch": 0.01, + "global_step": 2734, + "learning_rate": 0.0004894240400667779, + "loss": 3.025, + "loss_base2": 4.3642, + "loss_pixel": 0.3812, + "loss_text": 2.6438, + "ppl": 20.594, + "step": 2734 + }, + { + "epoch": 0.01, + "global_step": 2735, + "learning_rate": 0.0004894198664440734, + "loss": 2.994, + "loss_base2": 4.3194, + "loss_pixel": 0.3812, + "loss_text": 2.6128, + "ppl": 19.9654, + "step": 2735 + }, + { + "epoch": 0.01, + "global_step": 2736, + "learning_rate": 0.000489415692821369, + "loss": 2.9636, + "loss_base2": 4.2756, + "loss_pixel": 0.3814, + "loss_text": 2.5822, + "ppl": 19.3676, + "step": 2736 + }, + { + "epoch": 0.01, + "global_step": 2737, + "learning_rate": 0.0004894115191986645, + "loss": 2.9216, + "loss_base2": 4.215, + "loss_pixel": 0.3811, + "loss_text": 2.5405, + "ppl": 18.571, + "step": 2737 + }, + { + "epoch": 0.01, + "global_step": 2738, + "learning_rate": 0.00048940734557596, + "loss": 2.9175, + "loss_base2": 4.2091, + "loss_pixel": 0.3809, + "loss_text": 2.5366, + "ppl": 18.495, + "step": 2738 + }, + { + "epoch": 0.01, + "global_step": 2739, + "learning_rate": 0.0004894031719532555, + "loss": 3.056, + "loss_base2": 4.4089, + "loss_pixel": 0.3816, + "loss_text": 2.6744, + "ppl": 21.2424, + "step": 2739 + }, + { + "epoch": 0.01, + "global_step": 2740, + "learning_rate": 0.0004893989983305509, + "loss": 3.204, + "loss_base2": 4.6224, + "loss_pixel": 0.3812, + "loss_text": 2.8228, + "ppl": 24.6309, + "step": 2740 + }, + { + "epoch": 0.01, + "global_step": 2741, + "learning_rate": 0.0004893948247078464, + "loss": 3.1711, + "loss_base2": 4.5749, + "loss_pixel": 0.3822, + "loss_text": 2.7889, + "ppl": 23.8337, + "step": 2741 + }, + { + "epoch": 0.01, + "global_step": 2742, + "learning_rate": 0.0004893906510851419, + "loss": 3.0967, + "loss_base2": 4.4676, + "loss_pixel": 0.3819, + "loss_text": 2.7148, + "ppl": 22.1248, + "step": 2742 + }, + { + "epoch": 0.01, + "global_step": 2743, + "learning_rate": 0.0004893864774624374, + "loss": 3.113, + "loss_base2": 4.4911, + "loss_pixel": 0.3819, + "loss_text": 2.7311, + "ppl": 22.4884, + "step": 2743 + }, + { + "epoch": 0.01, + "global_step": 2744, + "learning_rate": 0.0004893823038397329, + "loss": 3.0893, + "loss_base2": 4.4569, + "loss_pixel": 0.3818, + "loss_text": 2.7075, + "ppl": 21.9617, + "step": 2744 + }, + { + "epoch": 0.01, + "global_step": 2745, + "learning_rate": 0.0004893781302170284, + "loss": 3.0631, + "loss_base2": 4.4191, + "loss_pixel": 0.3814, + "loss_text": 2.6816, + "ppl": 21.3938, + "step": 2745 + }, + { + "epoch": 0.01, + "global_step": 2746, + "learning_rate": 0.0004893739565943239, + "loss": 3.0425, + "loss_base2": 4.3894, + "loss_pixel": 0.3813, + "loss_text": 2.6612, + "ppl": 20.9576, + "step": 2746 + }, + { + "epoch": 0.01, + "global_step": 2747, + "learning_rate": 0.0004893697829716194, + "loss": 3.0518, + "loss_base2": 4.4028, + "loss_pixel": 0.3812, + "loss_text": 2.6706, + "ppl": 21.1534, + "step": 2747 + }, + { + "epoch": 0.01, + "global_step": 2748, + "learning_rate": 0.0004893656093489149, + "loss": 3.0085, + "loss_base2": 4.3403, + "loss_pixel": 0.3817, + "loss_text": 2.6268, + "ppl": 20.257, + "step": 2748 + }, + { + "epoch": 0.01, + "global_step": 2749, + "learning_rate": 0.0004893614357262103, + "loss": 2.9946, + "loss_base2": 4.3203, + "loss_pixel": 0.3817, + "loss_text": 2.6128, + "ppl": 19.9774, + "step": 2749 + }, + { + "epoch": 0.01, + "global_step": 2750, + "learning_rate": 0.0004893572621035058, + "loss": 2.9772, + "loss_base2": 4.2952, + "loss_pixel": 0.381, + "loss_text": 2.5963, + "ppl": 19.6328, + "step": 2750 + }, + { + "epoch": 0.02, + "global_step": 2751, + "learning_rate": 0.0004893530884808013, + "loss": 2.9541, + "loss_base2": 4.2619, + "loss_pixel": 0.381, + "loss_text": 2.5732, + "ppl": 19.1844, + "step": 2751 + }, + { + "epoch": 0.02, + "global_step": 2752, + "learning_rate": 0.0004893489148580968, + "loss": 2.9401, + "loss_base2": 4.2417, + "loss_pixel": 0.3806, + "loss_text": 2.5595, + "ppl": 18.9177, + "step": 2752 + }, + { + "epoch": 0.02, + "global_step": 2753, + "learning_rate": 0.0004893447412353924, + "loss": 2.9026, + "loss_base2": 4.1876, + "loss_pixel": 0.3805, + "loss_text": 2.5221, + "ppl": 18.2215, + "step": 2753 + }, + { + "epoch": 0.02, + "global_step": 2754, + "learning_rate": 0.0004893405676126878, + "loss": 2.8934, + "loss_base2": 4.1743, + "loss_pixel": 0.3806, + "loss_text": 2.5129, + "ppl": 18.0546, + "step": 2754 + }, + { + "epoch": 0.02, + "global_step": 2755, + "learning_rate": 0.0004893363939899833, + "loss": 2.8688, + "loss_base2": 4.1388, + "loss_pixel": 0.3801, + "loss_text": 2.4887, + "ppl": 17.6159, + "step": 2755 + }, + { + "epoch": 0.02, + "global_step": 2756, + "learning_rate": 0.0004893322203672788, + "loss": 2.8617, + "loss_base2": 4.1286, + "loss_pixel": 0.3798, + "loss_text": 2.4818, + "ppl": 17.4912, + "step": 2756 + }, + { + "epoch": 0.02, + "global_step": 2757, + "learning_rate": 0.0004893280467445743, + "loss": 2.8296, + "loss_base2": 4.0822, + "loss_pixel": 0.3802, + "loss_text": 2.4494, + "ppl": 16.9387, + "step": 2757 + }, + { + "epoch": 0.02, + "global_step": 2758, + "learning_rate": 0.0004893238731218698, + "loss": 2.8018, + "loss_base2": 4.0421, + "loss_pixel": 0.3798, + "loss_text": 2.422, + "ppl": 16.4743, + "step": 2758 + }, + { + "epoch": 0.02, + "global_step": 2759, + "learning_rate": 0.0004893196994991653, + "loss": 2.7731, + "loss_base2": 4.0007, + "loss_pixel": 0.3785, + "loss_text": 2.3946, + "ppl": 16.0082, + "step": 2759 + }, + { + "epoch": 0.02, + "global_step": 2760, + "learning_rate": 0.0004893155258764608, + "loss": 2.7609, + "loss_base2": 3.9831, + "loss_pixel": 0.3788, + "loss_text": 2.3821, + "ppl": 15.8141, + "step": 2760 + }, + { + "epoch": 0.02, + "global_step": 2761, + "learning_rate": 0.0004893113522537563, + "loss": 2.752, + "loss_base2": 3.9703, + "loss_pixel": 0.3783, + "loss_text": 2.3737, + "ppl": 15.6739, + "step": 2761 + }, + { + "epoch": 0.02, + "global_step": 2762, + "learning_rate": 0.0004893071786310518, + "loss": 2.7314, + "loss_base2": 3.9406, + "loss_pixel": 0.3789, + "loss_text": 2.3525, + "ppl": 15.3544, + "step": 2762 + }, + { + "epoch": 0.02, + "global_step": 2763, + "learning_rate": 0.0004893030050083472, + "loss": 2.776, + "loss_base2": 4.0049, + "loss_pixel": 0.3816, + "loss_text": 2.3944, + "ppl": 16.0547, + "step": 2763 + }, + { + "epoch": 0.02, + "global_step": 2764, + "learning_rate": 0.0004892988313856427, + "loss": 2.7599, + "loss_base2": 3.9817, + "loss_pixel": 0.3993, + "loss_text": 2.3606, + "ppl": 15.7983, + "step": 2764 + }, + { + "epoch": 0.02, + "global_step": 2765, + "learning_rate": 0.0004892946577629382, + "loss": 2.8579, + "loss_base2": 4.1231, + "loss_pixel": 0.4283, + "loss_text": 2.4296, + "ppl": 17.4249, + "step": 2765 + }, + { + "epoch": 0.02, + "global_step": 2766, + "learning_rate": 0.0004892904841402337, + "loss": 2.8386, + "loss_base2": 4.0952, + "loss_pixel": 0.3885, + "loss_text": 2.4501, + "ppl": 17.0918, + "step": 2766 + }, + { + "epoch": 0.02, + "global_step": 2767, + "learning_rate": 0.0004892863105175292, + "loss": 2.7974, + "loss_base2": 4.0358, + "loss_pixel": 0.3851, + "loss_text": 2.4123, + "ppl": 16.4019, + "step": 2767 + }, + { + "epoch": 0.02, + "global_step": 2768, + "learning_rate": 0.0004892821368948247, + "loss": 2.7825, + "loss_base2": 4.0143, + "loss_pixel": 0.3909, + "loss_text": 2.3917, + "ppl": 16.1594, + "step": 2768 + }, + { + "epoch": 0.02, + "global_step": 2769, + "learning_rate": 0.0004892779632721203, + "loss": 2.7517, + "loss_base2": 3.9699, + "loss_pixel": 0.3898, + "loss_text": 2.3619, + "ppl": 15.6692, + "step": 2769 + }, + { + "epoch": 0.02, + "global_step": 2770, + "learning_rate": 0.0004892737896494158, + "loss": 2.7258, + "loss_base2": 3.9325, + "loss_pixel": 0.3861, + "loss_text": 2.3397, + "ppl": 15.2686, + "step": 2770 + }, + { + "epoch": 0.02, + "global_step": 2771, + "learning_rate": 0.0004892696160267113, + "loss": 2.7125, + "loss_base2": 3.9133, + "loss_pixel": 0.3846, + "loss_text": 2.3279, + "ppl": 15.0669, + "step": 2771 + }, + { + "epoch": 0.02, + "global_step": 2772, + "learning_rate": 0.0004892654424040067, + "loss": 2.6918, + "loss_base2": 3.8834, + "loss_pixel": 0.3839, + "loss_text": 2.3079, + "ppl": 14.7582, + "step": 2772 + }, + { + "epoch": 0.02, + "global_step": 2773, + "learning_rate": 0.0004892612687813022, + "loss": 2.6702, + "loss_base2": 3.8523, + "loss_pixel": 0.3846, + "loss_text": 2.2856, + "ppl": 14.4429, + "step": 2773 + }, + { + "epoch": 0.02, + "global_step": 2774, + "learning_rate": 0.0004892570951585977, + "loss": 2.6513, + "loss_base2": 3.825, + "loss_pixel": 0.3856, + "loss_text": 2.2658, + "ppl": 14.1725, + "step": 2774 + }, + { + "epoch": 0.02, + "global_step": 2775, + "learning_rate": 0.0004892529215358932, + "loss": 2.6529, + "loss_base2": 3.8273, + "loss_pixel": 0.3849, + "loss_text": 2.268, + "ppl": 14.1951, + "step": 2775 + }, + { + "epoch": 0.02, + "global_step": 2776, + "learning_rate": 0.0004892487479131887, + "loss": 2.6302, + "loss_base2": 3.7946, + "loss_pixel": 0.3844, + "loss_text": 2.2458, + "ppl": 13.8765, + "step": 2776 + }, + { + "epoch": 0.02, + "global_step": 2777, + "learning_rate": 0.0004892445742904841, + "loss": 2.6287, + "loss_base2": 3.7924, + "loss_pixel": 0.3829, + "loss_text": 2.2458, + "ppl": 13.8557, + "step": 2777 + }, + { + "epoch": 0.02, + "global_step": 2778, + "learning_rate": 0.0004892404006677796, + "loss": 2.612, + "loss_base2": 3.7683, + "loss_pixel": 0.383, + "loss_text": 2.2291, + "ppl": 13.6263, + "step": 2778 + }, + { + "epoch": 0.02, + "global_step": 2779, + "learning_rate": 0.0004892362270450751, + "loss": 2.5943, + "loss_base2": 3.7428, + "loss_pixel": 0.3822, + "loss_text": 2.2121, + "ppl": 13.3872, + "step": 2779 + }, + { + "epoch": 0.02, + "global_step": 2780, + "learning_rate": 0.0004892320534223706, + "loss": 2.5748, + "loss_base2": 3.7147, + "loss_pixel": 0.383, + "loss_text": 2.1918, + "ppl": 13.1287, + "step": 2780 + }, + { + "epoch": 0.02, + "global_step": 2781, + "learning_rate": 0.0004892278797996661, + "loss": 2.5449, + "loss_base2": 3.6715, + "loss_pixel": 0.3821, + "loss_text": 2.1628, + "ppl": 12.742, + "step": 2781 + }, + { + "epoch": 0.02, + "global_step": 2782, + "learning_rate": 0.0004892237061769616, + "loss": 2.5418, + "loss_base2": 3.667, + "loss_pixel": 0.3819, + "loss_text": 2.1598, + "ppl": 12.7025, + "step": 2782 + }, + { + "epoch": 0.02, + "global_step": 2783, + "learning_rate": 0.0004892195325542571, + "loss": 2.5682, + "loss_base2": 3.7051, + "loss_pixel": 0.3816, + "loss_text": 2.1866, + "ppl": 13.0423, + "step": 2783 + }, + { + "epoch": 0.02, + "global_step": 2784, + "learning_rate": 0.0004892153589315526, + "loss": 2.5407, + "loss_base2": 3.6655, + "loss_pixel": 0.3809, + "loss_text": 2.1597, + "ppl": 12.6885, + "step": 2784 + }, + { + "epoch": 0.02, + "global_step": 2785, + "learning_rate": 0.0004892111853088482, + "loss": 2.5428, + "loss_base2": 3.6685, + "loss_pixel": 0.3808, + "loss_text": 2.162, + "ppl": 12.7152, + "step": 2785 + }, + { + "epoch": 0.02, + "global_step": 2786, + "learning_rate": 0.0004892070116861436, + "loss": 2.5377, + "loss_base2": 3.6611, + "loss_pixel": 0.381, + "loss_text": 2.1567, + "ppl": 12.6505, + "step": 2786 + }, + { + "epoch": 0.02, + "global_step": 2787, + "learning_rate": 0.0004892028380634391, + "loss": 2.5244, + "loss_base2": 3.6419, + "loss_pixel": 0.3817, + "loss_text": 2.1427, + "ppl": 12.4834, + "step": 2787 + }, + { + "epoch": 0.02, + "global_step": 2788, + "learning_rate": 0.0004891986644407346, + "loss": 2.4979, + "loss_base2": 3.6037, + "loss_pixel": 0.381, + "loss_text": 2.1169, + "ppl": 12.1569, + "step": 2788 + }, + { + "epoch": 0.02, + "global_step": 2789, + "learning_rate": 0.0004891944908180301, + "loss": 2.4909, + "loss_base2": 3.5936, + "loss_pixel": 0.3812, + "loss_text": 2.1097, + "ppl": 12.0721, + "step": 2789 + }, + { + "epoch": 0.02, + "global_step": 2790, + "learning_rate": 0.0004891903171953255, + "loss": 2.4738, + "loss_base2": 3.5689, + "loss_pixel": 0.3807, + "loss_text": 2.0931, + "ppl": 11.8675, + "step": 2790 + }, + { + "epoch": 0.02, + "global_step": 2791, + "learning_rate": 0.000489186143572621, + "loss": 2.4763, + "loss_base2": 3.5725, + "loss_pixel": 0.381, + "loss_text": 2.0953, + "ppl": 11.8972, + "step": 2791 + }, + { + "epoch": 0.02, + "global_step": 2792, + "learning_rate": 0.0004891819699499165, + "loss": 2.4256, + "loss_base2": 3.4994, + "loss_pixel": 0.3803, + "loss_text": 2.0453, + "ppl": 11.309, + "step": 2792 + }, + { + "epoch": 0.02, + "global_step": 2793, + "learning_rate": 0.000489177796327212, + "loss": 2.4334, + "loss_base2": 3.5107, + "loss_pixel": 0.3808, + "loss_text": 2.0526, + "ppl": 11.3976, + "step": 2793 + }, + { + "epoch": 0.02, + "global_step": 2794, + "learning_rate": 0.0004891736227045075, + "loss": 2.437, + "loss_base2": 3.5158, + "loss_pixel": 0.3804, + "loss_text": 2.0565, + "ppl": 11.4387, + "step": 2794 + }, + { + "epoch": 0.02, + "global_step": 2795, + "learning_rate": 0.000489169449081803, + "loss": 2.5052, + "loss_base2": 3.6142, + "loss_pixel": 0.3807, + "loss_text": 2.1244, + "ppl": 12.246, + "step": 2795 + }, + { + "epoch": 0.02, + "global_step": 2796, + "learning_rate": 0.0004891652754590985, + "loss": 2.4848, + "loss_base2": 3.5848, + "loss_pixel": 0.3819, + "loss_text": 2.1029, + "ppl": 11.9987, + "step": 2796 + }, + { + "epoch": 0.02, + "global_step": 2797, + "learning_rate": 0.000489161101836394, + "loss": 2.6167, + "loss_base2": 3.7751, + "loss_pixel": 0.3809, + "loss_text": 2.2358, + "ppl": 13.6905, + "step": 2797 + }, + { + "epoch": 0.02, + "global_step": 2798, + "learning_rate": 0.0004891569282136895, + "loss": 2.7079, + "loss_base2": 3.9067, + "loss_pixel": 0.3806, + "loss_text": 2.3273, + "ppl": 14.9977, + "step": 2798 + }, + { + "epoch": 0.02, + "global_step": 2799, + "learning_rate": 0.0004891527545909849, + "loss": 2.578, + "loss_base2": 3.7193, + "loss_pixel": 0.3805, + "loss_text": 2.1976, + "ppl": 13.1708, + "step": 2799 + }, + { + "epoch": 0.02, + "global_step": 2800, + "learning_rate": 0.0004891485809682804, + "loss": 2.5569, + "loss_base2": 3.6888, + "loss_pixel": 0.3803, + "loss_text": 2.1766, + "ppl": 12.8958, + "step": 2800 + }, + { + "epoch": 0.02, + "global_step": 2801, + "learning_rate": 0.000489144407345576, + "loss": 2.51, + "loss_base2": 3.6212, + "loss_pixel": 0.38, + "loss_text": 2.13, + "ppl": 12.3049, + "step": 2801 + }, + { + "epoch": 0.02, + "global_step": 2802, + "learning_rate": 0.0004891402337228715, + "loss": 2.4749, + "loss_base2": 3.5705, + "loss_pixel": 0.3804, + "loss_text": 2.0945, + "ppl": 11.8805, + "step": 2802 + }, + { + "epoch": 0.02, + "global_step": 2803, + "learning_rate": 0.000489136060100167, + "loss": 2.5167, + "loss_base2": 3.6308, + "loss_pixel": 0.3799, + "loss_text": 2.1368, + "ppl": 12.3876, + "step": 2803 + }, + { + "epoch": 0.02, + "global_step": 2804, + "learning_rate": 0.0004891318864774625, + "loss": 2.6577, + "loss_base2": 3.8343, + "loss_pixel": 0.3801, + "loss_text": 2.2776, + "ppl": 14.2634, + "step": 2804 + }, + { + "epoch": 0.02, + "global_step": 2805, + "learning_rate": 0.000489127712854758, + "loss": 2.6257, + "loss_base2": 3.7881, + "loss_pixel": 0.381, + "loss_text": 2.2447, + "ppl": 13.8142, + "step": 2805 + }, + { + "epoch": 0.02, + "global_step": 2806, + "learning_rate": 0.0004891235392320535, + "loss": 2.5947, + "loss_base2": 3.7434, + "loss_pixel": 0.38, + "loss_text": 2.2147, + "ppl": 13.3926, + "step": 2806 + }, + { + "epoch": 0.02, + "global_step": 2807, + "learning_rate": 0.000489119365609349, + "loss": 2.566, + "loss_base2": 3.702, + "loss_pixel": 0.3802, + "loss_text": 2.1859, + "ppl": 13.0137, + "step": 2807 + }, + { + "epoch": 0.02, + "global_step": 2808, + "learning_rate": 0.0004891151919866444, + "loss": 2.5614, + "loss_base2": 3.6953, + "loss_pixel": 0.3796, + "loss_text": 2.1819, + "ppl": 12.9539, + "step": 2808 + }, + { + "epoch": 0.02, + "global_step": 2809, + "learning_rate": 0.0004891110183639399, + "loss": 2.5544, + "loss_base2": 3.6852, + "loss_pixel": 0.38, + "loss_text": 2.1744, + "ppl": 12.8636, + "step": 2809 + }, + { + "epoch": 0.02, + "global_step": 2810, + "learning_rate": 0.0004891068447412354, + "loss": 2.5271, + "loss_base2": 3.6458, + "loss_pixel": 0.3809, + "loss_text": 2.1462, + "ppl": 12.5172, + "step": 2810 + }, + { + "epoch": 0.02, + "global_step": 2811, + "learning_rate": 0.0004891026711185309, + "loss": 2.4976, + "loss_base2": 3.6033, + "loss_pixel": 0.38, + "loss_text": 2.1176, + "ppl": 12.1533, + "step": 2811 + }, + { + "epoch": 0.02, + "global_step": 2812, + "learning_rate": 0.0004890984974958264, + "loss": 2.4875, + "loss_base2": 3.5887, + "loss_pixel": 0.3797, + "loss_text": 2.1078, + "ppl": 12.0312, + "step": 2812 + }, + { + "epoch": 0.02, + "global_step": 2813, + "learning_rate": 0.0004890943238731218, + "loss": 2.4803, + "loss_base2": 3.5783, + "loss_pixel": 0.3797, + "loss_text": 2.1006, + "ppl": 11.9448, + "step": 2813 + }, + { + "epoch": 0.02, + "global_step": 2814, + "learning_rate": 0.0004890901502504173, + "loss": 2.4604, + "loss_base2": 3.5496, + "loss_pixel": 0.3811, + "loss_text": 2.0793, + "ppl": 11.7095, + "step": 2814 + }, + { + "epoch": 0.02, + "global_step": 2815, + "learning_rate": 0.0004890859766277128, + "loss": 2.4427, + "loss_base2": 3.5241, + "loss_pixel": 0.3835, + "loss_text": 2.0591, + "ppl": 11.5041, + "step": 2815 + }, + { + "epoch": 0.02, + "global_step": 2816, + "learning_rate": 0.0004890818030050083, + "loss": 2.4512, + "loss_base2": 3.5363, + "loss_pixel": 0.384, + "loss_text": 2.0673, + "ppl": 11.6023, + "step": 2816 + }, + { + "epoch": 0.02, + "global_step": 2817, + "learning_rate": 0.0004890776293823038, + "loss": 2.4332, + "loss_base2": 3.5104, + "loss_pixel": 0.3805, + "loss_text": 2.0527, + "ppl": 11.3953, + "step": 2817 + }, + { + "epoch": 0.02, + "global_step": 2818, + "learning_rate": 0.0004890734557595994, + "loss": 2.4354, + "loss_base2": 3.5135, + "loss_pixel": 0.3788, + "loss_text": 2.0566, + "ppl": 11.4204, + "step": 2818 + }, + { + "epoch": 0.02, + "global_step": 2819, + "learning_rate": 0.0004890692821368949, + "loss": 2.4492, + "loss_base2": 3.5334, + "loss_pixel": 0.3786, + "loss_text": 2.0706, + "ppl": 11.5791, + "step": 2819 + }, + { + "epoch": 0.02, + "global_step": 2820, + "learning_rate": 0.0004890651085141904, + "loss": 2.4529, + "loss_base2": 3.5388, + "loss_pixel": 0.3788, + "loss_text": 2.0741, + "ppl": 11.622, + "step": 2820 + }, + { + "epoch": 0.02, + "global_step": 2821, + "learning_rate": 0.0004890609348914859, + "loss": 2.4371, + "loss_base2": 3.516, + "loss_pixel": 0.3789, + "loss_text": 2.0582, + "ppl": 11.4398, + "step": 2821 + }, + { + "epoch": 0.02, + "global_step": 2822, + "learning_rate": 0.0004890567612687813, + "loss": 2.4505, + "loss_base2": 3.5353, + "loss_pixel": 0.3791, + "loss_text": 2.0714, + "ppl": 11.5941, + "step": 2822 + }, + { + "epoch": 0.02, + "global_step": 2823, + "learning_rate": 0.0004890525876460768, + "loss": 2.4114, + "loss_base2": 3.4789, + "loss_pixel": 0.3791, + "loss_text": 2.0323, + "ppl": 11.1496, + "step": 2823 + }, + { + "epoch": 0.02, + "global_step": 2824, + "learning_rate": 0.0004890484140233723, + "loss": 2.4006, + "loss_base2": 3.4633, + "loss_pixel": 0.3788, + "loss_text": 2.0218, + "ppl": 11.0298, + "step": 2824 + }, + { + "epoch": 0.02, + "global_step": 2825, + "learning_rate": 0.0004890442404006678, + "loss": 2.3953, + "loss_base2": 3.4557, + "loss_pixel": 0.3785, + "loss_text": 2.0168, + "ppl": 10.9715, + "step": 2825 + }, + { + "epoch": 0.02, + "global_step": 2826, + "learning_rate": 0.0004890400667779633, + "loss": 2.3852, + "loss_base2": 3.4411, + "loss_pixel": 0.378, + "loss_text": 2.0072, + "ppl": 10.8612, + "step": 2826 + }, + { + "epoch": 0.02, + "global_step": 2827, + "learning_rate": 0.0004890358931552588, + "loss": 2.3739, + "loss_base2": 3.4248, + "loss_pixel": 0.3775, + "loss_text": 1.9965, + "ppl": 10.7392, + "step": 2827 + }, + { + "epoch": 0.02, + "global_step": 2828, + "learning_rate": 0.0004890317195325542, + "loss": 2.3694, + "loss_base2": 3.4183, + "loss_pixel": 0.3778, + "loss_text": 1.9916, + "ppl": 10.691, + "step": 2828 + }, + { + "epoch": 0.02, + "global_step": 2829, + "learning_rate": 0.0004890275459098497, + "loss": 2.3766, + "loss_base2": 3.4287, + "loss_pixel": 0.3771, + "loss_text": 1.9995, + "ppl": 10.7682, + "step": 2829 + }, + { + "epoch": 0.02, + "global_step": 2830, + "learning_rate": 0.0004890233722871452, + "loss": 2.3619, + "loss_base2": 3.4075, + "loss_pixel": 0.377, + "loss_text": 1.985, + "ppl": 10.6111, + "step": 2830 + }, + { + "epoch": 0.02, + "global_step": 2831, + "learning_rate": 0.0004890191986644407, + "loss": 2.3443, + "loss_base2": 3.3821, + "loss_pixel": 0.3768, + "loss_text": 1.9675, + "ppl": 10.426, + "step": 2831 + }, + { + "epoch": 0.02, + "global_step": 2832, + "learning_rate": 0.0004890150250417362, + "loss": 2.3267, + "loss_base2": 3.3567, + "loss_pixel": 0.3756, + "loss_text": 1.9512, + "ppl": 10.2441, + "step": 2832 + }, + { + "epoch": 0.02, + "global_step": 2833, + "learning_rate": 0.0004890108514190317, + "loss": 2.3192, + "loss_base2": 3.3459, + "loss_pixel": 0.3756, + "loss_text": 1.9436, + "ppl": 10.1675, + "step": 2833 + }, + { + "epoch": 0.02, + "global_step": 2834, + "learning_rate": 0.0004890066777963273, + "loss": 2.3423, + "loss_base2": 3.3792, + "loss_pixel": 0.3746, + "loss_text": 1.9677, + "ppl": 10.4051, + "step": 2834 + }, + { + "epoch": 0.02, + "global_step": 2835, + "learning_rate": 0.0004890025041736228, + "loss": 2.3216, + "loss_base2": 3.3494, + "loss_pixel": 0.3745, + "loss_text": 1.9471, + "ppl": 10.192, + "step": 2835 + }, + { + "epoch": 0.02, + "global_step": 2836, + "learning_rate": 0.0004889983305509182, + "loss": 2.3071, + "loss_base2": 3.3284, + "loss_pixel": 0.3728, + "loss_text": 1.9343, + "ppl": 10.0453, + "step": 2836 + }, + { + "epoch": 0.02, + "global_step": 2837, + "learning_rate": 0.0004889941569282137, + "loss": 2.3065, + "loss_base2": 3.3276, + "loss_pixel": 0.3715, + "loss_text": 1.935, + "ppl": 10.0392, + "step": 2837 + }, + { + "epoch": 0.02, + "global_step": 2838, + "learning_rate": 0.0004889899833055092, + "loss": 2.3839, + "loss_base2": 3.4392, + "loss_pixel": 0.4483, + "loss_text": 1.9356, + "ppl": 10.8471, + "step": 2838 + }, + { + "epoch": 0.02, + "global_step": 2839, + "learning_rate": 0.0004889858096828047, + "loss": 2.5407, + "loss_base2": 3.6655, + "loss_pixel": 0.6142, + "loss_text": 1.9266, + "ppl": 12.6885, + "step": 2839 + }, + { + "epoch": 0.02, + "global_step": 2840, + "learning_rate": 0.0004889816360601002, + "loss": 2.3262, + "loss_base2": 3.356, + "loss_pixel": 0.4103, + "loss_text": 1.9159, + "ppl": 10.239, + "step": 2840 + }, + { + "epoch": 0.02, + "global_step": 2841, + "learning_rate": 0.0004889774624373957, + "loss": 2.3175, + "loss_base2": 3.3434, + "loss_pixel": 0.3995, + "loss_text": 1.9181, + "ppl": 10.1503, + "step": 2841 + }, + { + "epoch": 0.02, + "global_step": 2842, + "learning_rate": 0.0004889732888146912, + "loss": 2.2991, + "loss_base2": 3.3169, + "loss_pixel": 0.4011, + "loss_text": 1.898, + "ppl": 9.9652, + "step": 2842 + }, + { + "epoch": 0.02, + "global_step": 2843, + "learning_rate": 0.0004889691151919867, + "loss": 2.3061, + "loss_base2": 3.327, + "loss_pixel": 0.4007, + "loss_text": 1.9053, + "ppl": 10.0352, + "step": 2843 + }, + { + "epoch": 0.02, + "global_step": 2844, + "learning_rate": 0.0004889649415692822, + "loss": 2.2937, + "loss_base2": 3.3091, + "loss_pixel": 0.3976, + "loss_text": 1.8961, + "ppl": 9.9115, + "step": 2844 + }, + { + "epoch": 0.02, + "global_step": 2845, + "learning_rate": 0.0004889607679465776, + "loss": 2.2938, + "loss_base2": 3.3093, + "loss_pixel": 0.3929, + "loss_text": 1.9009, + "ppl": 9.9125, + "step": 2845 + }, + { + "epoch": 0.02, + "global_step": 2846, + "learning_rate": 0.0004889565943238731, + "loss": 2.2633, + "loss_base2": 3.2653, + "loss_pixel": 0.39, + "loss_text": 1.8733, + "ppl": 9.6148, + "step": 2846 + }, + { + "epoch": 0.02, + "global_step": 2847, + "learning_rate": 0.0004889524207011686, + "loss": 2.1412, + "loss_base2": 3.0891, + "loss_pixel": 0.3895, + "loss_text": 1.7516, + "ppl": 8.5096, + "step": 2847 + }, + { + "epoch": 0.02, + "global_step": 2848, + "learning_rate": 0.0004889482470784641, + "loss": 2.134, + "loss_base2": 3.0787, + "loss_pixel": 0.3915, + "loss_text": 1.7425, + "ppl": 8.4486, + "step": 2848 + }, + { + "epoch": 0.02, + "global_step": 2849, + "learning_rate": 0.0004889440734557595, + "loss": 2.1517, + "loss_base2": 3.1042, + "loss_pixel": 0.3923, + "loss_text": 1.7594, + "ppl": 8.5995, + "step": 2849 + }, + { + "epoch": 0.02, + "global_step": 2850, + "learning_rate": 0.000488939899833055, + "loss": 2.1512, + "loss_base2": 3.1035, + "loss_pixel": 0.3904, + "loss_text": 1.7607, + "ppl": 8.5952, + "step": 2850 + }, + { + "epoch": 0.02, + "global_step": 2851, + "learning_rate": 0.0004889357262103506, + "loss": 2.1476, + "loss_base2": 3.0983, + "loss_pixel": 0.3881, + "loss_text": 1.7595, + "ppl": 8.5643, + "step": 2851 + }, + { + "epoch": 0.02, + "global_step": 2852, + "learning_rate": 0.0004889315525876461, + "loss": 2.1113, + "loss_base2": 3.046, + "loss_pixel": 0.3863, + "loss_text": 1.7251, + "ppl": 8.259, + "step": 2852 + }, + { + "epoch": 0.02, + "global_step": 2853, + "learning_rate": 0.0004889273789649416, + "loss": 2.1038, + "loss_base2": 3.0351, + "loss_pixel": 0.3845, + "loss_text": 1.7193, + "ppl": 8.1973, + "step": 2853 + }, + { + "epoch": 0.02, + "global_step": 2854, + "learning_rate": 0.0004889232053422371, + "loss": 2.1006, + "loss_base2": 3.0305, + "loss_pixel": 0.3842, + "loss_text": 1.7164, + "ppl": 8.1711, + "step": 2854 + }, + { + "epoch": 0.02, + "global_step": 2855, + "learning_rate": 0.0004889190317195326, + "loss": 2.0773, + "loss_base2": 2.9969, + "loss_pixel": 0.3854, + "loss_text": 1.6919, + "ppl": 7.9829, + "step": 2855 + }, + { + "epoch": 0.02, + "global_step": 2856, + "learning_rate": 0.0004889148580968281, + "loss": 2.069, + "loss_base2": 2.9849, + "loss_pixel": 0.3846, + "loss_text": 1.6843, + "ppl": 7.9169, + "step": 2856 + }, + { + "epoch": 0.02, + "global_step": 2857, + "learning_rate": 0.0004889106844741236, + "loss": 2.0541, + "loss_base2": 2.9634, + "loss_pixel": 0.3847, + "loss_text": 1.6694, + "ppl": 7.7998, + "step": 2857 + }, + { + "epoch": 0.02, + "global_step": 2858, + "learning_rate": 0.000488906510851419, + "loss": 2.0391, + "loss_base2": 2.9418, + "loss_pixel": 0.3845, + "loss_text": 1.6546, + "ppl": 7.6837, + "step": 2858 + }, + { + "epoch": 0.02, + "global_step": 2859, + "learning_rate": 0.0004889023372287145, + "loss": 2.03, + "loss_base2": 2.9287, + "loss_pixel": 0.3842, + "loss_text": 1.6458, + "ppl": 7.6141, + "step": 2859 + }, + { + "epoch": 0.02, + "global_step": 2860, + "learning_rate": 0.00048889816360601, + "loss": 2.0206, + "loss_base2": 2.9151, + "loss_pixel": 0.383, + "loss_text": 1.6376, + "ppl": 7.5428, + "step": 2860 + }, + { + "epoch": 0.02, + "global_step": 2861, + "learning_rate": 0.0004888939899833055, + "loss": 2.0146, + "loss_base2": 2.9065, + "loss_pixel": 0.382, + "loss_text": 1.6325, + "ppl": 7.4977, + "step": 2861 + }, + { + "epoch": 0.02, + "global_step": 2862, + "learning_rate": 0.000488889816360601, + "loss": 2.0044, + "loss_base2": 2.8917, + "loss_pixel": 0.3822, + "loss_text": 1.6221, + "ppl": 7.4216, + "step": 2862 + }, + { + "epoch": 0.02, + "global_step": 2863, + "learning_rate": 0.0004888856427378965, + "loss": 2.3256, + "loss_base2": 3.3551, + "loss_pixel": 0.383, + "loss_text": 1.9426, + "ppl": 10.2328, + "step": 2863 + }, + { + "epoch": 0.02, + "global_step": 2864, + "learning_rate": 0.000488881469115192, + "loss": 2.2903, + "loss_base2": 3.3042, + "loss_pixel": 0.3822, + "loss_text": 1.9081, + "ppl": 9.8779, + "step": 2864 + }, + { + "epoch": 0.02, + "global_step": 2865, + "learning_rate": 0.0004888772954924874, + "loss": 2.3048, + "loss_base2": 3.3251, + "loss_pixel": 0.3835, + "loss_text": 1.9212, + "ppl": 10.0222, + "step": 2865 + }, + { + "epoch": 0.02, + "global_step": 2866, + "learning_rate": 0.000488873121869783, + "loss": 2.28, + "loss_base2": 3.2893, + "loss_pixel": 0.3823, + "loss_text": 1.8977, + "ppl": 9.7767, + "step": 2866 + }, + { + "epoch": 0.02, + "global_step": 2867, + "learning_rate": 0.0004888689482470785, + "loss": 2.2718, + "loss_base2": 3.2775, + "loss_pixel": 0.3817, + "loss_text": 1.8902, + "ppl": 9.6968, + "step": 2867 + }, + { + "epoch": 0.02, + "global_step": 2868, + "learning_rate": 0.000488864774624374, + "loss": 2.2585, + "loss_base2": 3.2583, + "loss_pixel": 0.3824, + "loss_text": 1.8761, + "ppl": 9.5687, + "step": 2868 + }, + { + "epoch": 0.02, + "global_step": 2869, + "learning_rate": 0.0004888606010016695, + "loss": 2.2497, + "loss_base2": 3.2456, + "loss_pixel": 0.3822, + "loss_text": 1.8675, + "ppl": 9.4849, + "step": 2869 + }, + { + "epoch": 0.02, + "global_step": 2870, + "learning_rate": 0.000488856427378965, + "loss": 2.2369, + "loss_base2": 3.2272, + "loss_pixel": 0.3809, + "loss_text": 1.856, + "ppl": 9.3643, + "step": 2870 + }, + { + "epoch": 0.02, + "global_step": 2871, + "learning_rate": 0.0004888522537562605, + "loss": 2.242, + "loss_base2": 3.2345, + "loss_pixel": 0.3813, + "loss_text": 1.8607, + "ppl": 9.4121, + "step": 2871 + }, + { + "epoch": 0.02, + "global_step": 2872, + "learning_rate": 0.0004888480801335559, + "loss": 2.2284, + "loss_base2": 3.2149, + "loss_pixel": 0.3807, + "loss_text": 1.8477, + "ppl": 9.285, + "step": 2872 + }, + { + "epoch": 0.02, + "global_step": 2873, + "learning_rate": 0.0004888439065108514, + "loss": 2.2274, + "loss_base2": 3.2135, + "loss_pixel": 0.3808, + "loss_text": 1.8466, + "ppl": 9.2757, + "step": 2873 + }, + { + "epoch": 0.02, + "global_step": 2874, + "learning_rate": 0.0004888397328881469, + "loss": 2.2187, + "loss_base2": 3.2009, + "loss_pixel": 0.3812, + "loss_text": 1.8375, + "ppl": 9.1954, + "step": 2874 + }, + { + "epoch": 0.02, + "global_step": 2875, + "learning_rate": 0.0004888355592654424, + "loss": 2.2184, + "loss_base2": 3.2005, + "loss_pixel": 0.3809, + "loss_text": 1.8375, + "ppl": 9.1926, + "step": 2875 + }, + { + "epoch": 0.02, + "global_step": 2876, + "learning_rate": 0.0004888313856427379, + "loss": 2.187, + "loss_base2": 3.1552, + "loss_pixel": 0.3809, + "loss_text": 1.8061, + "ppl": 8.9084, + "step": 2876 + }, + { + "epoch": 0.02, + "global_step": 2877, + "learning_rate": 0.0004888272120200334, + "loss": 2.2185, + "loss_base2": 3.2006, + "loss_pixel": 0.3849, + "loss_text": 1.8336, + "ppl": 9.1935, + "step": 2877 + }, + { + "epoch": 0.02, + "global_step": 2878, + "learning_rate": 0.0004888230383973289, + "loss": 2.2009, + "loss_base2": 3.1752, + "loss_pixel": 0.3831, + "loss_text": 1.8178, + "ppl": 9.0331, + "step": 2878 + }, + { + "epoch": 0.02, + "global_step": 2879, + "learning_rate": 0.0004888188647746244, + "loss": 2.2143, + "loss_base2": 3.1946, + "loss_pixel": 0.3823, + "loss_text": 1.832, + "ppl": 9.155, + "step": 2879 + }, + { + "epoch": 0.02, + "global_step": 2880, + "learning_rate": 0.0004888146911519199, + "loss": 2.2168, + "loss_base2": 3.1982, + "loss_pixel": 0.3816, + "loss_text": 1.8352, + "ppl": 9.1779, + "step": 2880 + }, + { + "epoch": 0.02, + "global_step": 2881, + "learning_rate": 0.0004888105175292153, + "loss": 2.1994, + "loss_base2": 3.1731, + "loss_pixel": 0.384, + "loss_text": 1.8154, + "ppl": 9.0196, + "step": 2881 + }, + { + "epoch": 0.02, + "global_step": 2882, + "learning_rate": 0.0004888063439065108, + "loss": 2.1857, + "loss_base2": 3.1533, + "loss_pixel": 0.3823, + "loss_text": 1.8033, + "ppl": 8.8969, + "step": 2882 + }, + { + "epoch": 0.02, + "global_step": 2883, + "learning_rate": 0.0004888021702838064, + "loss": 2.1871, + "loss_base2": 3.1553, + "loss_pixel": 0.3825, + "loss_text": 1.8046, + "ppl": 8.9093, + "step": 2883 + }, + { + "epoch": 0.02, + "global_step": 2884, + "learning_rate": 0.0004887979966611019, + "loss": 2.1957, + "loss_base2": 3.1677, + "loss_pixel": 0.3822, + "loss_text": 1.8135, + "ppl": 8.9863, + "step": 2884 + }, + { + "epoch": 0.02, + "global_step": 2885, + "learning_rate": 0.0004887938230383973, + "loss": 2.2002, + "loss_base2": 3.1742, + "loss_pixel": 0.386, + "loss_text": 1.8142, + "ppl": 9.0268, + "step": 2885 + }, + { + "epoch": 0.02, + "global_step": 2886, + "learning_rate": 0.0004887896494156928, + "loss": 2.2129, + "loss_base2": 3.1925, + "loss_pixel": 0.3829, + "loss_text": 1.83, + "ppl": 9.1422, + "step": 2886 + }, + { + "epoch": 0.02, + "global_step": 2887, + "learning_rate": 0.0004887854757929883, + "loss": 2.1765, + "loss_base2": 3.14, + "loss_pixel": 0.384, + "loss_text": 1.7926, + "ppl": 8.8154, + "step": 2887 + }, + { + "epoch": 0.02, + "global_step": 2888, + "learning_rate": 0.0004887813021702838, + "loss": 2.1699, + "loss_base2": 3.1305, + "loss_pixel": 0.3819, + "loss_text": 1.788, + "ppl": 8.7574, + "step": 2888 + }, + { + "epoch": 0.02, + "global_step": 2889, + "learning_rate": 0.0004887771285475793, + "loss": 2.1737, + "loss_base2": 3.136, + "loss_pixel": 0.3828, + "loss_text": 1.7909, + "ppl": 8.7907, + "step": 2889 + }, + { + "epoch": 0.02, + "global_step": 2890, + "learning_rate": 0.0004887729549248748, + "loss": 2.1915, + "loss_base2": 3.1617, + "loss_pixel": 0.3826, + "loss_text": 1.8089, + "ppl": 8.9486, + "step": 2890 + }, + { + "epoch": 0.02, + "global_step": 2891, + "learning_rate": 0.0004887687813021703, + "loss": 2.1687, + "loss_base2": 3.1288, + "loss_pixel": 0.3834, + "loss_text": 1.7853, + "ppl": 8.7469, + "step": 2891 + }, + { + "epoch": 0.02, + "global_step": 2892, + "learning_rate": 0.0004887646076794658, + "loss": 2.1713, + "loss_base2": 3.1325, + "loss_pixel": 0.383, + "loss_text": 1.7882, + "ppl": 8.7697, + "step": 2892 + }, + { + "epoch": 0.02, + "global_step": 2893, + "learning_rate": 0.0004887604340567613, + "loss": 2.1739, + "loss_base2": 3.1363, + "loss_pixel": 0.3804, + "loss_text": 1.7935, + "ppl": 8.7925, + "step": 2893 + }, + { + "epoch": 0.02, + "global_step": 2894, + "learning_rate": 0.0004887562604340568, + "loss": 2.1641, + "loss_base2": 3.1221, + "loss_pixel": 0.3818, + "loss_text": 1.7823, + "ppl": 8.7068, + "step": 2894 + }, + { + "epoch": 0.02, + "global_step": 2895, + "learning_rate": 0.0004887520868113522, + "loss": 2.155, + "loss_base2": 3.109, + "loss_pixel": 0.3812, + "loss_text": 1.7738, + "ppl": 8.6279, + "step": 2895 + }, + { + "epoch": 0.02, + "global_step": 2896, + "learning_rate": 0.0004887479131886477, + "loss": 2.1449, + "loss_base2": 3.0944, + "loss_pixel": 0.3809, + "loss_text": 1.764, + "ppl": 8.5412, + "step": 2896 + }, + { + "epoch": 0.02, + "global_step": 2897, + "learning_rate": 0.0004887437395659432, + "loss": 2.1455, + "loss_base2": 3.0953, + "loss_pixel": 0.3807, + "loss_text": 1.7648, + "ppl": 8.5463, + "step": 2897 + }, + { + "epoch": 0.02, + "global_step": 2898, + "learning_rate": 0.0004887395659432387, + "loss": 2.1544, + "loss_base2": 3.1081, + "loss_pixel": 0.3801, + "loss_text": 1.7743, + "ppl": 8.6227, + "step": 2898 + }, + { + "epoch": 0.02, + "global_step": 2899, + "learning_rate": 0.0004887353923205343, + "loss": 2.1424, + "loss_base2": 3.0908, + "loss_pixel": 0.3811, + "loss_text": 1.7613, + "ppl": 8.5199, + "step": 2899 + }, + { + "epoch": 0.02, + "global_step": 2900, + "learning_rate": 0.0004887312186978298, + "loss": 2.1422, + "loss_base2": 3.0905, + "loss_pixel": 0.3805, + "loss_text": 1.7617, + "ppl": 8.5182, + "step": 2900 + }, + { + "epoch": 0.02, + "global_step": 2901, + "learning_rate": 0.0004887270450751253, + "loss": 2.1429, + "loss_base2": 3.0916, + "loss_pixel": 0.3805, + "loss_text": 1.7623, + "ppl": 8.5241, + "step": 2901 + }, + { + "epoch": 0.02, + "global_step": 2902, + "learning_rate": 0.0004887228714524208, + "loss": 2.1587, + "loss_base2": 3.1143, + "loss_pixel": 0.3806, + "loss_text": 1.778, + "ppl": 8.6599, + "step": 2902 + }, + { + "epoch": 0.02, + "global_step": 2903, + "learning_rate": 0.0004887186978297162, + "loss": 2.1459, + "loss_base2": 3.0959, + "loss_pixel": 0.3807, + "loss_text": 1.7652, + "ppl": 8.5497, + "step": 2903 + }, + { + "epoch": 0.02, + "global_step": 2904, + "learning_rate": 0.0004887145242070117, + "loss": 2.1375, + "loss_base2": 3.0838, + "loss_pixel": 0.3803, + "loss_text": 1.7571, + "ppl": 8.4782, + "step": 2904 + }, + { + "epoch": 0.02, + "global_step": 2905, + "learning_rate": 0.0004887103505843072, + "loss": 2.1393, + "loss_base2": 3.0864, + "loss_pixel": 0.3805, + "loss_text": 1.7588, + "ppl": 8.4935, + "step": 2905 + }, + { + "epoch": 0.02, + "global_step": 2906, + "learning_rate": 0.0004887061769616027, + "loss": 2.1206, + "loss_base2": 3.0594, + "loss_pixel": 0.3807, + "loss_text": 1.7399, + "ppl": 8.3361, + "step": 2906 + }, + { + "epoch": 0.02, + "global_step": 2907, + "learning_rate": 0.0004887020033388982, + "loss": 2.1431, + "loss_base2": 3.0918, + "loss_pixel": 0.3807, + "loss_text": 1.7624, + "ppl": 8.5258, + "step": 2907 + }, + { + "epoch": 0.02, + "global_step": 2908, + "learning_rate": 0.0004886978297161936, + "loss": 2.143, + "loss_base2": 3.0917, + "loss_pixel": 0.3805, + "loss_text": 1.7625, + "ppl": 8.525, + "step": 2908 + }, + { + "epoch": 0.02, + "global_step": 2909, + "learning_rate": 0.0004886936560934891, + "loss": 2.1364, + "loss_base2": 3.0822, + "loss_pixel": 0.3805, + "loss_text": 1.7559, + "ppl": 8.4689, + "step": 2909 + }, + { + "epoch": 0.02, + "global_step": 2910, + "learning_rate": 0.0004886894824707846, + "loss": 2.1136, + "loss_base2": 3.0493, + "loss_pixel": 0.3808, + "loss_text": 1.7328, + "ppl": 8.278, + "step": 2910 + }, + { + "epoch": 0.02, + "global_step": 2911, + "learning_rate": 0.0004886853088480801, + "loss": 2.0162, + "loss_base2": 2.9088, + "loss_pixel": 0.3809, + "loss_text": 1.6353, + "ppl": 7.5097, + "step": 2911 + }, + { + "epoch": 0.02, + "global_step": 2912, + "learning_rate": 0.0004886811352253756, + "loss": 1.9198, + "loss_base2": 2.7697, + "loss_pixel": 0.3802, + "loss_text": 1.5397, + "ppl": 6.8196, + "step": 2912 + }, + { + "epoch": 0.02, + "global_step": 2913, + "learning_rate": 0.0004886769616026711, + "loss": 1.9316, + "loss_base2": 2.7867, + "loss_pixel": 0.3805, + "loss_text": 1.5511, + "ppl": 6.9005, + "step": 2913 + }, + { + "epoch": 0.02, + "global_step": 2914, + "learning_rate": 0.0004886727879799666, + "loss": 1.9122, + "loss_base2": 2.7587, + "loss_pixel": 0.3807, + "loss_text": 1.5315, + "ppl": 6.768, + "step": 2914 + }, + { + "epoch": 0.02, + "global_step": 2915, + "learning_rate": 0.0004886686143572622, + "loss": 1.9079, + "loss_base2": 2.7525, + "loss_pixel": 0.3812, + "loss_text": 1.5267, + "ppl": 6.7389, + "step": 2915 + }, + { + "epoch": 0.02, + "global_step": 2916, + "learning_rate": 0.0004886644407345577, + "loss": 1.9206, + "loss_base2": 2.7708, + "loss_pixel": 0.3803, + "loss_text": 1.5403, + "ppl": 6.8251, + "step": 2916 + }, + { + "epoch": 0.02, + "global_step": 2917, + "learning_rate": 0.0004886602671118531, + "loss": 1.8739, + "loss_base2": 2.7035, + "loss_pixel": 0.3799, + "loss_text": 1.494, + "ppl": 6.5137, + "step": 2917 + }, + { + "epoch": 0.02, + "global_step": 2918, + "learning_rate": 0.0004886560934891486, + "loss": 1.9044, + "loss_base2": 2.7475, + "loss_pixel": 0.3804, + "loss_text": 1.524, + "ppl": 6.7154, + "step": 2918 + }, + { + "epoch": 0.02, + "global_step": 2919, + "learning_rate": 0.0004886519198664441, + "loss": 2.0675, + "loss_base2": 2.9828, + "loss_pixel": 0.3813, + "loss_text": 1.6862, + "ppl": 7.905, + "step": 2919 + }, + { + "epoch": 0.02, + "global_step": 2920, + "learning_rate": 0.0004886477462437396, + "loss": 1.9401, + "loss_base2": 2.799, + "loss_pixel": 0.3801, + "loss_text": 1.56, + "ppl": 6.9594, + "step": 2920 + }, + { + "epoch": 0.02, + "global_step": 2921, + "learning_rate": 0.0004886435726210351, + "loss": 1.9066, + "loss_base2": 2.7506, + "loss_pixel": 0.3808, + "loss_text": 1.5258, + "ppl": 6.7302, + "step": 2921 + }, + { + "epoch": 0.02, + "global_step": 2922, + "learning_rate": 0.0004886393989983305, + "loss": 1.9147, + "loss_base2": 2.7623, + "loss_pixel": 0.3806, + "loss_text": 1.5342, + "ppl": 6.7849, + "step": 2922 + }, + { + "epoch": 0.02, + "global_step": 2923, + "learning_rate": 0.000488635225375626, + "loss": 1.8888, + "loss_base2": 2.725, + "loss_pixel": 0.3805, + "loss_text": 1.5083, + "ppl": 6.6114, + "step": 2923 + }, + { + "epoch": 0.02, + "global_step": 2924, + "learning_rate": 0.0004886310517529215, + "loss": 1.8992, + "loss_base2": 2.74, + "loss_pixel": 0.3814, + "loss_text": 1.5179, + "ppl": 6.6805, + "step": 2924 + }, + { + "epoch": 0.02, + "global_step": 2925, + "learning_rate": 0.000488626878130217, + "loss": 1.8927, + "loss_base2": 2.7306, + "loss_pixel": 0.3803, + "loss_text": 1.5125, + "ppl": 6.6373, + "step": 2925 + }, + { + "epoch": 0.02, + "global_step": 2926, + "learning_rate": 0.0004886227045075125, + "loss": 1.8869, + "loss_base2": 2.7222, + "loss_pixel": 0.3812, + "loss_text": 1.5057, + "ppl": 6.5989, + "step": 2926 + }, + { + "epoch": 0.02, + "global_step": 2927, + "learning_rate": 0.000488618530884808, + "loss": 2.0166, + "loss_base2": 2.9093, + "loss_pixel": 0.38, + "loss_text": 1.6366, + "ppl": 7.5127, + "step": 2927 + }, + { + "epoch": 0.02, + "global_step": 2928, + "learning_rate": 0.0004886143572621035, + "loss": 2.1602, + "loss_base2": 3.1165, + "loss_pixel": 0.3808, + "loss_text": 1.7794, + "ppl": 8.6729, + "step": 2928 + }, + { + "epoch": 0.02, + "global_step": 2929, + "learning_rate": 0.000488610183639399, + "loss": 2.1557, + "loss_base2": 3.11, + "loss_pixel": 0.3809, + "loss_text": 1.7748, + "ppl": 8.6339, + "step": 2929 + }, + { + "epoch": 0.02, + "global_step": 2930, + "learning_rate": 0.0004886060100166945, + "loss": 2.1302, + "loss_base2": 3.0732, + "loss_pixel": 0.3799, + "loss_text": 1.7503, + "ppl": 8.4165, + "step": 2930 + }, + { + "epoch": 0.02, + "global_step": 2931, + "learning_rate": 0.00048860183639399, + "loss": 2.1373, + "loss_base2": 3.0835, + "loss_pixel": 0.3802, + "loss_text": 1.7571, + "ppl": 8.4765, + "step": 2931 + }, + { + "epoch": 0.02, + "global_step": 2932, + "learning_rate": 0.0004885976627712855, + "loss": 2.1449, + "loss_base2": 3.0944, + "loss_pixel": 0.3803, + "loss_text": 1.7647, + "ppl": 8.5412, + "step": 2932 + }, + { + "epoch": 0.02, + "global_step": 2933, + "learning_rate": 0.000488593489148581, + "loss": 2.1378, + "loss_base2": 3.0842, + "loss_pixel": 0.3799, + "loss_text": 1.7579, + "ppl": 8.4808, + "step": 2933 + }, + { + "epoch": 0.02, + "global_step": 2934, + "learning_rate": 0.0004885893155258765, + "loss": 2.1319, + "loss_base2": 3.0757, + "loss_pixel": 0.3797, + "loss_text": 1.7522, + "ppl": 8.4309, + "step": 2934 + }, + { + "epoch": 0.02, + "global_step": 2935, + "learning_rate": 0.000488585141903172, + "loss": 2.1241, + "loss_base2": 3.0644, + "loss_pixel": 0.38, + "loss_text": 1.7441, + "ppl": 8.3654, + "step": 2935 + }, + { + "epoch": 0.02, + "global_step": 2936, + "learning_rate": 0.0004885809682804675, + "loss": 2.1285, + "loss_base2": 3.0708, + "loss_pixel": 0.3802, + "loss_text": 1.7483, + "ppl": 8.4023, + "step": 2936 + }, + { + "epoch": 0.02, + "global_step": 2937, + "learning_rate": 0.000488576794657763, + "loss": 2.1084, + "loss_base2": 3.0418, + "loss_pixel": 0.3799, + "loss_text": 1.7285, + "ppl": 8.2351, + "step": 2937 + }, + { + "epoch": 0.02, + "global_step": 2938, + "learning_rate": 0.0004885726210350585, + "loss": 2.0685, + "loss_base2": 2.9842, + "loss_pixel": 0.3807, + "loss_text": 1.6879, + "ppl": 7.9129, + "step": 2938 + }, + { + "epoch": 0.02, + "global_step": 2939, + "learning_rate": 0.000488568447412354, + "loss": 2.1201, + "loss_base2": 3.0587, + "loss_pixel": 0.3811, + "loss_text": 1.739, + "ppl": 8.332, + "step": 2939 + }, + { + "epoch": 0.02, + "global_step": 2940, + "learning_rate": 0.0004885642737896494, + "loss": 2.1084, + "loss_base2": 3.0418, + "loss_pixel": 0.3809, + "loss_text": 1.7276, + "ppl": 8.2351, + "step": 2940 + }, + { + "epoch": 0.02, + "global_step": 2941, + "learning_rate": 0.0004885601001669449, + "loss": 2.0979, + "loss_base2": 3.0266, + "loss_pixel": 0.3812, + "loss_text": 1.7167, + "ppl": 8.149, + "step": 2941 + }, + { + "epoch": 0.02, + "global_step": 2942, + "learning_rate": 0.0004885559265442404, + "loss": 2.1021, + "loss_base2": 3.0327, + "loss_pixel": 0.3804, + "loss_text": 1.7217, + "ppl": 8.1833, + "step": 2942 + }, + { + "epoch": 0.02, + "global_step": 2943, + "learning_rate": 0.0004885517529215359, + "loss": 2.0924, + "loss_base2": 3.0187, + "loss_pixel": 0.3798, + "loss_text": 1.7126, + "ppl": 8.1043, + "step": 2943 + }, + { + "epoch": 0.02, + "global_step": 2944, + "learning_rate": 0.0004885475792988313, + "loss": 2.0911, + "loss_base2": 3.0168, + "loss_pixel": 0.38, + "loss_text": 1.7111, + "ppl": 8.0938, + "step": 2944 + }, + { + "epoch": 0.02, + "global_step": 2945, + "learning_rate": 0.0004885434056761268, + "loss": 2.1038, + "loss_base2": 3.0351, + "loss_pixel": 0.3798, + "loss_text": 1.7241, + "ppl": 8.1973, + "step": 2945 + }, + { + "epoch": 0.02, + "global_step": 2946, + "learning_rate": 0.0004885392320534223, + "loss": 2.1002, + "loss_base2": 3.0299, + "loss_pixel": 0.3797, + "loss_text": 1.7205, + "ppl": 8.1678, + "step": 2946 + }, + { + "epoch": 0.02, + "global_step": 2947, + "learning_rate": 0.0004885350584307178, + "loss": 2.1061, + "loss_base2": 3.0385, + "loss_pixel": 0.38, + "loss_text": 1.7261, + "ppl": 8.2161, + "step": 2947 + }, + { + "epoch": 0.02, + "global_step": 2948, + "learning_rate": 0.0004885308848080134, + "loss": 2.102, + "loss_base2": 3.0325, + "loss_pixel": 0.3809, + "loss_text": 1.7211, + "ppl": 8.1825, + "step": 2948 + }, + { + "epoch": 0.02, + "global_step": 2949, + "learning_rate": 0.0004885267111853089, + "loss": 2.0956, + "loss_base2": 3.0233, + "loss_pixel": 0.3796, + "loss_text": 1.7159, + "ppl": 8.1303, + "step": 2949 + }, + { + "epoch": 0.02, + "global_step": 2950, + "learning_rate": 0.0004885225375626044, + "loss": 2.095, + "loss_base2": 3.0224, + "loss_pixel": 0.3795, + "loss_text": 1.7154, + "ppl": 8.1254, + "step": 2950 + }, + { + "epoch": 0.02, + "global_step": 2951, + "learning_rate": 0.0004885183639398999, + "loss": 2.1093, + "loss_base2": 3.0431, + "loss_pixel": 0.3833, + "loss_text": 1.7259, + "ppl": 8.2425, + "step": 2951 + }, + { + "epoch": 0.02, + "global_step": 2952, + "learning_rate": 0.0004885141903171954, + "loss": 2.108, + "loss_base2": 3.0412, + "loss_pixel": 0.3875, + "loss_text": 1.7205, + "ppl": 8.2318, + "step": 2952 + }, + { + "epoch": 0.02, + "global_step": 2953, + "learning_rate": 0.0004885100166944909, + "loss": 2.3572, + "loss_base2": 3.4007, + "loss_pixel": 0.4251, + "loss_text": 1.9321, + "ppl": 10.5613, + "step": 2953 + }, + { + "epoch": 0.02, + "global_step": 2954, + "learning_rate": 0.0004885058430717863, + "loss": 2.1689, + "loss_base2": 3.1291, + "loss_pixel": 0.4318, + "loss_text": 1.737, + "ppl": 8.7487, + "step": 2954 + }, + { + "epoch": 0.02, + "global_step": 2955, + "learning_rate": 0.0004885016694490818, + "loss": 2.1582, + "loss_base2": 3.1136, + "loss_pixel": 0.4058, + "loss_text": 1.7525, + "ppl": 8.6555, + "step": 2955 + }, + { + "epoch": 0.02, + "global_step": 2956, + "learning_rate": 0.0004884974958263773, + "loss": 2.1517, + "loss_base2": 3.1042, + "loss_pixel": 0.3865, + "loss_text": 1.7652, + "ppl": 8.5995, + "step": 2956 + }, + { + "epoch": 0.02, + "global_step": 2957, + "learning_rate": 0.0004884933222036728, + "loss": 2.1425, + "loss_base2": 3.091, + "loss_pixel": 0.3899, + "loss_text": 1.7526, + "ppl": 8.5207, + "step": 2957 + }, + { + "epoch": 0.02, + "global_step": 2958, + "learning_rate": 0.0004884891485809683, + "loss": 2.1523, + "loss_base2": 3.1051, + "loss_pixel": 0.3972, + "loss_text": 1.7552, + "ppl": 8.6046, + "step": 2958 + }, + { + "epoch": 0.02, + "global_step": 2959, + "learning_rate": 0.0004884849749582637, + "loss": 2.1549, + "loss_base2": 3.1089, + "loss_pixel": 0.3964, + "loss_text": 1.7585, + "ppl": 8.627, + "step": 2959 + }, + { + "epoch": 0.02, + "global_step": 2960, + "learning_rate": 0.0004884808013355592, + "loss": 2.1507, + "loss_base2": 3.1028, + "loss_pixel": 0.3919, + "loss_text": 1.7588, + "ppl": 8.5909, + "step": 2960 + }, + { + "epoch": 0.02, + "global_step": 2961, + "learning_rate": 0.0004884766277128547, + "loss": 2.1168, + "loss_base2": 3.0539, + "loss_pixel": 0.3903, + "loss_text": 1.7266, + "ppl": 8.3045, + "step": 2961 + }, + { + "epoch": 0.02, + "global_step": 2962, + "learning_rate": 0.0004884724540901502, + "loss": 2.1128, + "loss_base2": 3.0481, + "loss_pixel": 0.3901, + "loss_text": 1.7228, + "ppl": 8.2714, + "step": 2962 + }, + { + "epoch": 0.02, + "global_step": 2963, + "learning_rate": 0.0004884682804674457, + "loss": 2.1212, + "loss_base2": 3.0602, + "loss_pixel": 0.3889, + "loss_text": 1.7323, + "ppl": 8.3411, + "step": 2963 + }, + { + "epoch": 0.02, + "global_step": 2964, + "learning_rate": 0.0004884641068447413, + "loss": 2.108, + "loss_base2": 3.0412, + "loss_pixel": 0.386, + "loss_text": 1.722, + "ppl": 8.2318, + "step": 2964 + }, + { + "epoch": 0.02, + "global_step": 2965, + "learning_rate": 0.0004884599332220368, + "loss": 2.1102, + "loss_base2": 3.0444, + "loss_pixel": 0.3843, + "loss_text": 1.7259, + "ppl": 8.2499, + "step": 2965 + }, + { + "epoch": 0.02, + "global_step": 2966, + "learning_rate": 0.0004884557595993323, + "loss": 2.1046, + "loss_base2": 3.0363, + "loss_pixel": 0.3847, + "loss_text": 1.7199, + "ppl": 8.2038, + "step": 2966 + }, + { + "epoch": 0.02, + "global_step": 2967, + "learning_rate": 0.0004884515859766277, + "loss": 2.1059, + "loss_base2": 3.0382, + "loss_pixel": 0.3861, + "loss_text": 1.7198, + "ppl": 8.2145, + "step": 2967 + }, + { + "epoch": 0.02, + "global_step": 2968, + "learning_rate": 0.0004884474123539232, + "loss": 2.0884, + "loss_base2": 3.0129, + "loss_pixel": 0.3851, + "loss_text": 1.7033, + "ppl": 8.072, + "step": 2968 + }, + { + "epoch": 0.02, + "global_step": 2969, + "learning_rate": 0.0004884432387312187, + "loss": 2.0842, + "loss_base2": 3.0069, + "loss_pixel": 0.3845, + "loss_text": 1.6997, + "ppl": 8.0382, + "step": 2969 + }, + { + "epoch": 0.02, + "global_step": 2970, + "learning_rate": 0.0004884390651085142, + "loss": 2.0869, + "loss_base2": 3.0108, + "loss_pixel": 0.3836, + "loss_text": 1.7033, + "ppl": 8.0599, + "step": 2970 + }, + { + "epoch": 0.02, + "global_step": 2971, + "learning_rate": 0.0004884348914858097, + "loss": 2.1006, + "loss_base2": 3.0305, + "loss_pixel": 0.3835, + "loss_text": 1.7171, + "ppl": 8.1711, + "step": 2971 + }, + { + "epoch": 0.02, + "global_step": 2972, + "learning_rate": 0.0004884307178631052, + "loss": 2.088, + "loss_base2": 3.0123, + "loss_pixel": 0.3832, + "loss_text": 1.7048, + "ppl": 8.0688, + "step": 2972 + }, + { + "epoch": 0.02, + "global_step": 2973, + "learning_rate": 0.0004884265442404007, + "loss": 2.0966, + "loss_base2": 3.0248, + "loss_pixel": 0.3833, + "loss_text": 1.7133, + "ppl": 8.1385, + "step": 2973 + }, + { + "epoch": 0.02, + "global_step": 2974, + "learning_rate": 0.0004884223706176962, + "loss": 2.1016, + "loss_base2": 3.032, + "loss_pixel": 0.3828, + "loss_text": 1.7188, + "ppl": 8.1792, + "step": 2974 + }, + { + "epoch": 0.02, + "global_step": 2975, + "learning_rate": 0.0004884181969949917, + "loss": 2.0868, + "loss_base2": 3.0106, + "loss_pixel": 0.3824, + "loss_text": 1.7044, + "ppl": 8.0591, + "step": 2975 + }, + { + "epoch": 0.02, + "global_step": 2976, + "learning_rate": 0.0004884140233722871, + "loss": 2.0805, + "loss_base2": 3.0015, + "loss_pixel": 0.3826, + "loss_text": 1.6979, + "ppl": 8.0085, + "step": 2976 + }, + { + "epoch": 0.02, + "global_step": 2977, + "learning_rate": 0.0004884098497495826, + "loss": 2.0769, + "loss_base2": 2.9963, + "loss_pixel": 0.382, + "loss_text": 1.695, + "ppl": 7.9797, + "step": 2977 + }, + { + "epoch": 0.02, + "global_step": 2978, + "learning_rate": 0.0004884056761268781, + "loss": 2.0894, + "loss_base2": 3.0144, + "loss_pixel": 0.382, + "loss_text": 1.7074, + "ppl": 8.0801, + "step": 2978 + }, + { + "epoch": 0.02, + "global_step": 2979, + "learning_rate": 0.0004884015025041736, + "loss": 2.0682, + "loss_base2": 2.9838, + "loss_pixel": 0.3821, + "loss_text": 1.686, + "ppl": 7.9106, + "step": 2979 + }, + { + "epoch": 0.02, + "global_step": 2980, + "learning_rate": 0.0004883973288814692, + "loss": 2.0797, + "loss_base2": 3.0004, + "loss_pixel": 0.3817, + "loss_text": 1.6981, + "ppl": 8.0021, + "step": 2980 + }, + { + "epoch": 0.02, + "global_step": 2981, + "learning_rate": 0.0004883931552587646, + "loss": 2.0805, + "loss_base2": 3.0015, + "loss_pixel": 0.3813, + "loss_text": 1.6992, + "ppl": 8.0085, + "step": 2981 + }, + { + "epoch": 0.02, + "global_step": 2982, + "learning_rate": 0.0004883889816360601, + "loss": 2.0532, + "loss_base2": 2.9621, + "loss_pixel": 0.3809, + "loss_text": 1.6723, + "ppl": 7.7928, + "step": 2982 + }, + { + "epoch": 0.02, + "global_step": 2983, + "learning_rate": 0.0004883848080133556, + "loss": 2.0705, + "loss_base2": 2.9871, + "loss_pixel": 0.3811, + "loss_text": 1.6894, + "ppl": 7.9288, + "step": 2983 + }, + { + "epoch": 0.02, + "global_step": 2984, + "learning_rate": 0.0004883806343906511, + "loss": 2.0502, + "loss_base2": 2.9578, + "loss_pixel": 0.3817, + "loss_text": 1.6685, + "ppl": 7.7695, + "step": 2984 + }, + { + "epoch": 0.02, + "global_step": 2985, + "learning_rate": 0.0004883764607679466, + "loss": 2.0685, + "loss_base2": 2.9842, + "loss_pixel": 0.3809, + "loss_text": 1.6876, + "ppl": 7.9129, + "step": 2985 + }, + { + "epoch": 0.02, + "global_step": 2986, + "learning_rate": 0.0004883722871452421, + "loss": 2.0725, + "loss_base2": 2.99, + "loss_pixel": 0.3808, + "loss_text": 1.6917, + "ppl": 7.9447, + "step": 2986 + }, + { + "epoch": 0.02, + "global_step": 2987, + "learning_rate": 0.0004883681135225376, + "loss": 2.0842, + "loss_base2": 3.0069, + "loss_pixel": 0.3811, + "loss_text": 1.7031, + "ppl": 8.0382, + "step": 2987 + }, + { + "epoch": 0.02, + "global_step": 2988, + "learning_rate": 0.0004883639398998331, + "loss": 2.0746, + "loss_base2": 2.993, + "loss_pixel": 0.3807, + "loss_text": 1.6939, + "ppl": 7.9614, + "step": 2988 + }, + { + "epoch": 0.02, + "global_step": 2989, + "learning_rate": 0.0004883597662771286, + "loss": 2.0836, + "loss_base2": 3.006, + "loss_pixel": 0.3809, + "loss_text": 1.7027, + "ppl": 8.0333, + "step": 2989 + }, + { + "epoch": 0.02, + "global_step": 2990, + "learning_rate": 0.000488355592654424, + "loss": 2.0847, + "loss_base2": 3.0076, + "loss_pixel": 0.3819, + "loss_text": 1.7028, + "ppl": 8.0422, + "step": 2990 + }, + { + "epoch": 0.02, + "global_step": 2991, + "learning_rate": 0.0004883514190317195, + "loss": 2.0563, + "loss_base2": 2.9666, + "loss_pixel": 0.3813, + "loss_text": 1.675, + "ppl": 7.817, + "step": 2991 + }, + { + "epoch": 0.02, + "global_step": 2992, + "learning_rate": 0.000488347245409015, + "loss": 2.0604, + "loss_base2": 2.9725, + "loss_pixel": 0.3805, + "loss_text": 1.6799, + "ppl": 7.8491, + "step": 2992 + }, + { + "epoch": 0.02, + "global_step": 2993, + "learning_rate": 0.0004883430717863105, + "loss": 2.0694, + "loss_base2": 2.9855, + "loss_pixel": 0.3814, + "loss_text": 1.6881, + "ppl": 7.9201, + "step": 2993 + }, + { + "epoch": 0.02, + "global_step": 2994, + "learning_rate": 0.000488338898163606, + "loss": 2.0543, + "loss_base2": 2.9637, + "loss_pixel": 0.3809, + "loss_text": 1.6734, + "ppl": 7.8014, + "step": 2994 + }, + { + "epoch": 0.02, + "global_step": 2995, + "learning_rate": 0.0004883347245409015, + "loss": 2.0665, + "loss_base2": 2.9813, + "loss_pixel": 0.3803, + "loss_text": 1.6861, + "ppl": 7.8971, + "step": 2995 + }, + { + "epoch": 0.02, + "global_step": 2996, + "learning_rate": 0.0004883305509181971, + "loss": 2.063, + "loss_base2": 2.9763, + "loss_pixel": 0.3805, + "loss_text": 1.6825, + "ppl": 7.8695, + "step": 2996 + }, + { + "epoch": 0.02, + "global_step": 2997, + "learning_rate": 0.0004883263772954925, + "loss": 2.0586, + "loss_base2": 2.9699, + "loss_pixel": 0.381, + "loss_text": 1.6776, + "ppl": 7.835, + "step": 2997 + }, + { + "epoch": 0.02, + "global_step": 2998, + "learning_rate": 0.000488322203672788, + "loss": 2.0797, + "loss_base2": 3.0004, + "loss_pixel": 0.3802, + "loss_text": 1.6995, + "ppl": 8.0021, + "step": 2998 + }, + { + "epoch": 0.02, + "global_step": 2999, + "learning_rate": 0.0004883180300500835, + "loss": 1.882, + "loss_base2": 2.7152, + "loss_pixel": 0.3803, + "loss_text": 1.5017, + "ppl": 6.5666, + "step": 2999 + }, + { + "epoch": 0.02, + "global_step": 3000, + "learning_rate": 0.000488313856427379, + "loss": 1.8523, + "loss_base2": 2.6723, + "loss_pixel": 0.3803, + "loss_text": 1.472, + "ppl": 6.3745, + "step": 3000 + }, + { + "epoch": 0.02, + "global_step": 3001, + "learning_rate": 0.0004883096828046745, + "loss": 1.8466, + "loss_base2": 2.6641, + "loss_pixel": 0.3804, + "loss_text": 1.4663, + "ppl": 6.3382, + "step": 3001 + }, + { + "epoch": 0.02, + "global_step": 3002, + "learning_rate": 0.00048830550918197, + "loss": 1.8699, + "loss_base2": 2.6977, + "loss_pixel": 0.3807, + "loss_text": 1.4892, + "ppl": 6.4876, + "step": 3002 + }, + { + "epoch": 0.02, + "global_step": 3003, + "learning_rate": 0.0004883013355592654, + "loss": 1.8405, + "loss_base2": 2.6553, + "loss_pixel": 0.3808, + "loss_text": 1.4597, + "ppl": 6.2997, + "step": 3003 + }, + { + "epoch": 0.02, + "global_step": 3004, + "learning_rate": 0.0004882971619365609, + "loss": 1.8471, + "loss_base2": 2.6648, + "loss_pixel": 0.3808, + "loss_text": 1.4663, + "ppl": 6.3414, + "step": 3004 + }, + { + "epoch": 0.02, + "global_step": 3005, + "learning_rate": 0.0004882929883138564, + "loss": 1.8242, + "loss_base2": 2.6318, + "loss_pixel": 0.3807, + "loss_text": 1.4435, + "ppl": 6.1978, + "step": 3005 + }, + { + "epoch": 0.02, + "global_step": 3006, + "learning_rate": 0.0004882888146911519, + "loss": 1.9556, + "loss_base2": 2.8213, + "loss_pixel": 0.3802, + "loss_text": 1.5754, + "ppl": 7.0682, + "step": 3006 + }, + { + "epoch": 0.02, + "global_step": 3007, + "learning_rate": 0.0004882846410684474, + "loss": 2.077, + "loss_base2": 2.9965, + "loss_pixel": 0.3807, + "loss_text": 1.6963, + "ppl": 7.9805, + "step": 3007 + }, + { + "epoch": 0.02, + "global_step": 3008, + "learning_rate": 0.0004882804674457429, + "loss": 2.0898, + "loss_base2": 3.0149, + "loss_pixel": 0.3803, + "loss_text": 1.7095, + "ppl": 8.0833, + "step": 3008 + }, + { + "epoch": 0.02, + "global_step": 3009, + "learning_rate": 0.0004882762938230384, + "loss": 2.0982, + "loss_base2": 3.0271, + "loss_pixel": 0.3803, + "loss_text": 1.7179, + "ppl": 8.1515, + "step": 3009 + }, + { + "epoch": 0.02, + "global_step": 3010, + "learning_rate": 0.0004882721202003339, + "loss": 2.0756, + "loss_base2": 2.9945, + "loss_pixel": 0.3805, + "loss_text": 1.6951, + "ppl": 7.9693, + "step": 3010 + }, + { + "epoch": 0.02, + "global_step": 3011, + "learning_rate": 0.0004882679465776294, + "loss": 2.075, + "loss_base2": 2.9936, + "loss_pixel": 0.3805, + "loss_text": 1.6945, + "ppl": 7.9645, + "step": 3011 + }, + { + "epoch": 0.02, + "global_step": 3012, + "learning_rate": 0.0004882637729549249, + "loss": 2.0652, + "loss_base2": 2.9795, + "loss_pixel": 0.3806, + "loss_text": 1.6846, + "ppl": 7.8869, + "step": 3012 + }, + { + "epoch": 0.02, + "global_step": 3013, + "learning_rate": 0.00048825959933222036, + "loss": 2.0609, + "loss_base2": 2.9733, + "loss_pixel": 0.3825, + "loss_text": 1.6784, + "ppl": 7.853, + "step": 3013 + }, + { + "epoch": 0.02, + "global_step": 3014, + "learning_rate": 0.00048825542570951586, + "loss": 2.0741, + "loss_base2": 2.9923, + "loss_pixel": 0.3817, + "loss_text": 1.6924, + "ppl": 7.9574, + "step": 3014 + }, + { + "epoch": 0.02, + "global_step": 3015, + "learning_rate": 0.00048825125208681137, + "loss": 2.0587, + "loss_base2": 2.9701, + "loss_pixel": 0.3823, + "loss_text": 1.6764, + "ppl": 7.8358, + "step": 3015 + }, + { + "epoch": 0.02, + "global_step": 3016, + "learning_rate": 0.0004882470784641069, + "loss": 2.0673, + "loss_base2": 2.9825, + "loss_pixel": 0.3816, + "loss_text": 1.6856, + "ppl": 7.9035, + "step": 3016 + }, + { + "epoch": 0.02, + "global_step": 3017, + "learning_rate": 0.00048824290484140233, + "loss": 2.0542, + "loss_base2": 2.9636, + "loss_pixel": 0.3823, + "loss_text": 1.672, + "ppl": 7.8006, + "step": 3017 + }, + { + "epoch": 0.02, + "global_step": 3018, + "learning_rate": 0.00048823873121869784, + "loss": 2.068, + "loss_base2": 2.9835, + "loss_pixel": 0.3833, + "loss_text": 1.6847, + "ppl": 7.909, + "step": 3018 + }, + { + "epoch": 0.02, + "global_step": 3019, + "learning_rate": 0.00048823455759599335, + "loss": 2.0634, + "loss_base2": 2.9769, + "loss_pixel": 0.3819, + "loss_text": 1.6815, + "ppl": 7.8727, + "step": 3019 + }, + { + "epoch": 0.02, + "global_step": 3020, + "learning_rate": 0.00048823038397328885, + "loss": 2.0569, + "loss_base2": 2.9675, + "loss_pixel": 0.3844, + "loss_text": 1.6726, + "ppl": 7.8217, + "step": 3020 + }, + { + "epoch": 0.02, + "global_step": 3021, + "learning_rate": 0.00048822621035058436, + "loss": 2.0544, + "loss_base2": 2.9639, + "loss_pixel": 0.3819, + "loss_text": 1.6725, + "ppl": 7.8022, + "step": 3021 + }, + { + "epoch": 0.02, + "global_step": 3022, + "learning_rate": 0.0004882220367278798, + "loss": 2.0695, + "loss_base2": 2.9857, + "loss_pixel": 0.3816, + "loss_text": 1.6879, + "ppl": 7.9209, + "step": 3022 + }, + { + "epoch": 0.02, + "global_step": 3023, + "learning_rate": 0.0004882178631051753, + "loss": 2.0528, + "loss_base2": 2.9616, + "loss_pixel": 0.3833, + "loss_text": 1.6695, + "ppl": 7.7897, + "step": 3023 + }, + { + "epoch": 0.02, + "global_step": 3024, + "learning_rate": 0.00048821368948247083, + "loss": 2.0637, + "loss_base2": 2.9773, + "loss_pixel": 0.3809, + "loss_text": 1.6828, + "ppl": 7.8751, + "step": 3024 + }, + { + "epoch": 0.02, + "global_step": 3025, + "learning_rate": 0.0004882095158597663, + "loss": 2.0609, + "loss_base2": 2.9733, + "loss_pixel": 0.3826, + "loss_text": 1.6783, + "ppl": 7.853, + "step": 3025 + }, + { + "epoch": 0.02, + "global_step": 3026, + "learning_rate": 0.00048820534223706173, + "loss": 2.0471, + "loss_base2": 2.9533, + "loss_pixel": 0.3826, + "loss_text": 1.6645, + "ppl": 7.7454, + "step": 3026 + }, + { + "epoch": 0.02, + "global_step": 3027, + "learning_rate": 0.00048820116861435724, + "loss": 2.0392, + "loss_base2": 2.9419, + "loss_pixel": 0.382, + "loss_text": 1.6572, + "ppl": 7.6845, + "step": 3027 + }, + { + "epoch": 0.02, + "global_step": 3028, + "learning_rate": 0.00048819699499165275, + "loss": 2.0814, + "loss_base2": 3.0028, + "loss_pixel": 0.383, + "loss_text": 1.6984, + "ppl": 8.0157, + "step": 3028 + }, + { + "epoch": 0.02, + "global_step": 3029, + "learning_rate": 0.00048819282136894826, + "loss": 2.0246, + "loss_base2": 2.9209, + "loss_pixel": 0.3833, + "loss_text": 1.6414, + "ppl": 7.5731, + "step": 3029 + }, + { + "epoch": 0.02, + "global_step": 3030, + "learning_rate": 0.00048818864774624376, + "loss": 1.8401, + "loss_base2": 2.6547, + "loss_pixel": 0.384, + "loss_text": 1.4562, + "ppl": 6.2972, + "step": 3030 + }, + { + "epoch": 0.02, + "global_step": 3031, + "learning_rate": 0.0004881844741235392, + "loss": 1.8394, + "loss_base2": 2.6537, + "loss_pixel": 0.383, + "loss_text": 1.4564, + "ppl": 6.2928, + "step": 3031 + }, + { + "epoch": 0.02, + "global_step": 3032, + "learning_rate": 0.0004881803005008347, + "loss": 1.8403, + "loss_base2": 2.655, + "loss_pixel": 0.3822, + "loss_text": 1.4582, + "ppl": 6.2984, + "step": 3032 + }, + { + "epoch": 0.02, + "global_step": 3033, + "learning_rate": 0.00048817612687813023, + "loss": 1.8144, + "loss_base2": 2.6176, + "loss_pixel": 0.3818, + "loss_text": 1.4326, + "ppl": 6.1374, + "step": 3033 + }, + { + "epoch": 0.02, + "global_step": 3034, + "learning_rate": 0.00048817195325542574, + "loss": 1.8194, + "loss_base2": 2.6248, + "loss_pixel": 0.3835, + "loss_text": 1.4359, + "ppl": 6.1682, + "step": 3034 + }, + { + "epoch": 0.02, + "global_step": 3035, + "learning_rate": 0.0004881677796327212, + "loss": 1.8257, + "loss_base2": 2.6339, + "loss_pixel": 0.3822, + "loss_text": 1.4435, + "ppl": 6.2071, + "step": 3035 + }, + { + "epoch": 0.02, + "global_step": 3036, + "learning_rate": 0.0004881636060100167, + "loss": 1.815, + "loss_base2": 2.6185, + "loss_pixel": 0.382, + "loss_text": 1.433, + "ppl": 6.1411, + "step": 3036 + }, + { + "epoch": 0.02, + "global_step": 3037, + "learning_rate": 0.0004881594323873122, + "loss": 1.8023, + "loss_base2": 2.6002, + "loss_pixel": 0.3817, + "loss_text": 1.4206, + "ppl": 6.0636, + "step": 3037 + }, + { + "epoch": 0.02, + "global_step": 3038, + "learning_rate": 0.0004881552587646077, + "loss": 1.8053, + "loss_base2": 2.6045, + "loss_pixel": 0.3821, + "loss_text": 1.4231, + "ppl": 6.0818, + "step": 3038 + }, + { + "epoch": 0.02, + "global_step": 3039, + "learning_rate": 0.0004881510851419032, + "loss": 1.8103, + "loss_base2": 2.6117, + "loss_pixel": 0.3823, + "loss_text": 1.428, + "ppl": 6.1123, + "step": 3039 + }, + { + "epoch": 0.02, + "global_step": 3040, + "learning_rate": 0.0004881469115191987, + "loss": 1.81, + "loss_base2": 2.6113, + "loss_pixel": 0.3824, + "loss_text": 1.4276, + "ppl": 6.1104, + "step": 3040 + }, + { + "epoch": 0.02, + "global_step": 3041, + "learning_rate": 0.0004881427378964942, + "loss": 1.8188, + "loss_base2": 2.624, + "loss_pixel": 0.3813, + "loss_text": 1.4374, + "ppl": 6.1645, + "step": 3041 + }, + { + "epoch": 0.02, + "global_step": 3042, + "learning_rate": 0.0004881385642737897, + "loss": 1.809, + "loss_base2": 2.6098, + "loss_pixel": 0.3808, + "loss_text": 1.4283, + "ppl": 6.1043, + "step": 3042 + }, + { + "epoch": 0.02, + "global_step": 3043, + "learning_rate": 0.0004881343906510852, + "loss": 1.8035, + "loss_base2": 2.6019, + "loss_pixel": 0.383, + "loss_text": 1.4205, + "ppl": 6.0709, + "step": 3043 + }, + { + "epoch": 0.02, + "global_step": 3044, + "learning_rate": 0.0004881302170283806, + "loss": 1.8234, + "loss_base2": 2.6306, + "loss_pixel": 0.3817, + "loss_text": 1.4417, + "ppl": 6.1929, + "step": 3044 + }, + { + "epoch": 0.02, + "global_step": 3045, + "learning_rate": 0.0004881260434056761, + "loss": 1.823, + "loss_base2": 2.63, + "loss_pixel": 0.381, + "loss_text": 1.442, + "ppl": 6.1904, + "step": 3045 + }, + { + "epoch": 0.02, + "global_step": 3046, + "learning_rate": 0.0004881218697829716, + "loss": 1.9279, + "loss_base2": 2.7814, + "loss_pixel": 0.3816, + "loss_text": 1.5463, + "ppl": 6.8751, + "step": 3046 + }, + { + "epoch": 0.02, + "global_step": 3047, + "learning_rate": 0.0004881176961602671, + "loss": 1.881, + "loss_base2": 2.7137, + "loss_pixel": 0.3794, + "loss_text": 1.5016, + "ppl": 6.5601, + "step": 3047 + }, + { + "epoch": 0.02, + "global_step": 3048, + "learning_rate": 0.0004881135225375626, + "loss": 1.8014, + "loss_base2": 2.5989, + "loss_pixel": 0.38, + "loss_text": 1.4214, + "ppl": 6.0581, + "step": 3048 + }, + { + "epoch": 0.02, + "global_step": 3049, + "learning_rate": 0.0004881093489148581, + "loss": 1.8065, + "loss_base2": 2.6062, + "loss_pixel": 0.3799, + "loss_text": 1.4265, + "ppl": 6.0891, + "step": 3049 + }, + { + "epoch": 0.02, + "global_step": 3050, + "learning_rate": 0.0004881051752921536, + "loss": 1.8077, + "loss_base2": 2.608, + "loss_pixel": 0.3795, + "loss_text": 1.4283, + "ppl": 6.0964, + "step": 3050 + }, + { + "epoch": 0.02, + "global_step": 3051, + "learning_rate": 0.0004881010016694491, + "loss": 1.7856, + "loss_base2": 2.5761, + "loss_pixel": 0.3798, + "loss_text": 1.4058, + "ppl": 5.9632, + "step": 3051 + }, + { + "epoch": 0.02, + "global_step": 3052, + "learning_rate": 0.0004880968280467446, + "loss": 1.8039, + "loss_base2": 2.6025, + "loss_pixel": 0.3801, + "loss_text": 1.4238, + "ppl": 6.0733, + "step": 3052 + }, + { + "epoch": 0.02, + "global_step": 3053, + "learning_rate": 0.00048809265442404005, + "loss": 1.7968, + "loss_base2": 2.5922, + "loss_pixel": 0.3788, + "loss_text": 1.418, + "ppl": 6.0303, + "step": 3053 + }, + { + "epoch": 0.02, + "global_step": 3054, + "learning_rate": 0.00048808848080133556, + "loss": 1.8113, + "loss_base2": 2.6132, + "loss_pixel": 0.3795, + "loss_text": 1.4318, + "ppl": 6.1184, + "step": 3054 + }, + { + "epoch": 0.02, + "global_step": 3055, + "learning_rate": 0.00048808430717863107, + "loss": 1.8031, + "loss_base2": 2.6013, + "loss_pixel": 0.3793, + "loss_text": 1.4238, + "ppl": 6.0684, + "step": 3055 + }, + { + "epoch": 0.02, + "global_step": 3056, + "learning_rate": 0.0004880801335559266, + "loss": 1.8001, + "loss_base2": 2.597, + "loss_pixel": 0.3794, + "loss_text": 1.4207, + "ppl": 6.0503, + "step": 3056 + }, + { + "epoch": 0.02, + "global_step": 3057, + "learning_rate": 0.0004880759599332221, + "loss": 1.7835, + "loss_base2": 2.573, + "loss_pixel": 0.3788, + "loss_text": 1.4047, + "ppl": 5.9506, + "step": 3057 + }, + { + "epoch": 0.02, + "global_step": 3058, + "learning_rate": 0.00048807178631051753, + "loss": 1.828, + "loss_base2": 2.6372, + "loss_pixel": 0.3791, + "loss_text": 1.4489, + "ppl": 6.2214, + "step": 3058 + }, + { + "epoch": 0.02, + "global_step": 3059, + "learning_rate": 0.00048806761268781304, + "loss": 1.8083, + "loss_base2": 2.6088, + "loss_pixel": 0.3789, + "loss_text": 1.4293, + "ppl": 6.1001, + "step": 3059 + }, + { + "epoch": 0.02, + "global_step": 3060, + "learning_rate": 0.00048806343906510855, + "loss": 1.787, + "loss_base2": 2.5781, + "loss_pixel": 0.3795, + "loss_text": 1.4075, + "ppl": 5.9715, + "step": 3060 + }, + { + "epoch": 0.02, + "global_step": 3061, + "learning_rate": 0.00048805926544240406, + "loss": 1.7936, + "loss_base2": 2.5876, + "loss_pixel": 0.3784, + "loss_text": 1.4151, + "ppl": 6.0111, + "step": 3061 + }, + { + "epoch": 0.02, + "global_step": 3062, + "learning_rate": 0.00048805509181969946, + "loss": 1.771, + "loss_base2": 2.555, + "loss_pixel": 0.3788, + "loss_text": 1.3922, + "ppl": 5.8767, + "step": 3062 + }, + { + "epoch": 0.02, + "global_step": 3063, + "learning_rate": 0.00048805091819699496, + "loss": 1.7865, + "loss_base2": 2.5774, + "loss_pixel": 0.3788, + "loss_text": 1.4077, + "ppl": 5.9685, + "step": 3063 + }, + { + "epoch": 0.02, + "global_step": 3064, + "learning_rate": 0.00048804674457429047, + "loss": 1.7941, + "loss_base2": 2.5883, + "loss_pixel": 0.3786, + "loss_text": 1.4155, + "ppl": 6.0141, + "step": 3064 + }, + { + "epoch": 0.02, + "global_step": 3065, + "learning_rate": 0.000488042570951586, + "loss": 1.7869, + "loss_base2": 2.578, + "loss_pixel": 0.3777, + "loss_text": 1.4091, + "ppl": 5.9709, + "step": 3065 + }, + { + "epoch": 0.02, + "global_step": 3066, + "learning_rate": 0.0004880383973288815, + "loss": 1.7767, + "loss_base2": 2.5632, + "loss_pixel": 0.3784, + "loss_text": 1.3982, + "ppl": 5.9103, + "step": 3066 + }, + { + "epoch": 0.02, + "global_step": 3067, + "learning_rate": 0.00048803422370617694, + "loss": 1.7778, + "loss_base2": 2.5648, + "loss_pixel": 0.3772, + "loss_text": 1.4006, + "ppl": 5.9168, + "step": 3067 + }, + { + "epoch": 0.02, + "global_step": 3068, + "learning_rate": 0.00048803005008347245, + "loss": 1.7807, + "loss_base2": 2.569, + "loss_pixel": 0.3786, + "loss_text": 1.4021, + "ppl": 5.934, + "step": 3068 + }, + { + "epoch": 0.02, + "global_step": 3069, + "learning_rate": 0.00048802587646076795, + "loss": 1.8069, + "loss_base2": 2.6068, + "loss_pixel": 0.3898, + "loss_text": 1.4171, + "ppl": 6.0915, + "step": 3069 + }, + { + "epoch": 0.02, + "global_step": 3070, + "learning_rate": 0.00048802170283806346, + "loss": 1.8168, + "loss_base2": 2.6211, + "loss_pixel": 0.4188, + "loss_text": 1.398, + "ppl": 6.1521, + "step": 3070 + }, + { + "epoch": 0.02, + "global_step": 3071, + "learning_rate": 0.00048801752921535897, + "loss": 1.9876, + "loss_base2": 2.8675, + "loss_pixel": 0.3999, + "loss_text": 1.5876, + "ppl": 7.298, + "step": 3071 + }, + { + "epoch": 0.02, + "global_step": 3072, + "learning_rate": 0.0004880133555926544, + "loss": 1.8581, + "loss_base2": 2.6807, + "loss_pixel": 0.3883, + "loss_text": 1.4698, + "ppl": 6.4115, + "step": 3072 + }, + { + "epoch": 0.02, + "global_step": 3073, + "learning_rate": 0.00048800918196994993, + "loss": 1.7928, + "loss_base2": 2.5865, + "loss_pixel": 0.3922, + "loss_text": 1.4006, + "ppl": 6.0062, + "step": 3073 + }, + { + "epoch": 0.02, + "global_step": 3074, + "learning_rate": 0.00048800500834724544, + "loss": 1.7977, + "loss_base2": 2.5935, + "loss_pixel": 0.3919, + "loss_text": 1.4058, + "ppl": 6.0357, + "step": 3074 + }, + { + "epoch": 0.02, + "global_step": 3075, + "learning_rate": 0.00048800083472454094, + "loss": 1.79, + "loss_base2": 2.5824, + "loss_pixel": 0.3899, + "loss_text": 1.4001, + "ppl": 5.9895, + "step": 3075 + }, + { + "epoch": 0.02, + "global_step": 3076, + "learning_rate": 0.0004879966611018364, + "loss": 1.8002, + "loss_base2": 2.5971, + "loss_pixel": 0.3896, + "loss_text": 1.4106, + "ppl": 6.0509, + "step": 3076 + }, + { + "epoch": 0.02, + "global_step": 3077, + "learning_rate": 0.0004879924874791319, + "loss": 1.7989, + "loss_base2": 2.5953, + "loss_pixel": 0.3906, + "loss_text": 1.4084, + "ppl": 6.043, + "step": 3077 + }, + { + "epoch": 0.02, + "global_step": 3078, + "learning_rate": 0.0004879883138564274, + "loss": 1.7926, + "loss_base2": 2.5862, + "loss_pixel": 0.3887, + "loss_text": 1.4039, + "ppl": 6.005, + "step": 3078 + }, + { + "epoch": 0.02, + "global_step": 3079, + "learning_rate": 0.0004879841402337229, + "loss": 1.7997, + "loss_base2": 2.5964, + "loss_pixel": 0.3861, + "loss_text": 1.4137, + "ppl": 6.0478, + "step": 3079 + }, + { + "epoch": 0.02, + "global_step": 3080, + "learning_rate": 0.0004879799666110184, + "loss": 1.8132, + "loss_base2": 2.6159, + "loss_pixel": 0.3857, + "loss_text": 1.4274, + "ppl": 6.13, + "step": 3080 + }, + { + "epoch": 0.02, + "global_step": 3081, + "learning_rate": 0.0004879757929883138, + "loss": 1.9895, + "loss_base2": 2.8702, + "loss_pixel": 0.3844, + "loss_text": 1.6051, + "ppl": 7.3119, + "step": 3081 + }, + { + "epoch": 0.02, + "global_step": 3082, + "learning_rate": 0.00048797161936560933, + "loss": 1.8432, + "loss_base2": 2.6592, + "loss_pixel": 0.3848, + "loss_text": 1.4584, + "ppl": 6.3167, + "step": 3082 + }, + { + "epoch": 0.02, + "global_step": 3083, + "learning_rate": 0.00048796744574290484, + "loss": 1.7802, + "loss_base2": 2.5683, + "loss_pixel": 0.3838, + "loss_text": 1.3964, + "ppl": 5.931, + "step": 3083 + }, + { + "epoch": 0.02, + "global_step": 3084, + "learning_rate": 0.00048796327212020035, + "loss": 1.7855, + "loss_base2": 2.5759, + "loss_pixel": 0.3834, + "loss_text": 1.4021, + "ppl": 5.9626, + "step": 3084 + }, + { + "epoch": 0.02, + "global_step": 3085, + "learning_rate": 0.0004879590984974958, + "loss": 1.7876, + "loss_base2": 2.579, + "loss_pixel": 0.3834, + "loss_text": 1.4043, + "ppl": 5.9751, + "step": 3085 + }, + { + "epoch": 0.02, + "global_step": 3086, + "learning_rate": 0.0004879549248747913, + "loss": 1.7747, + "loss_base2": 2.5604, + "loss_pixel": 0.3832, + "loss_text": 1.3915, + "ppl": 5.8985, + "step": 3086 + }, + { + "epoch": 0.02, + "global_step": 3087, + "learning_rate": 0.0004879507512520868, + "loss": 1.781, + "loss_base2": 2.5694, + "loss_pixel": 0.3839, + "loss_text": 1.3972, + "ppl": 5.9358, + "step": 3087 + }, + { + "epoch": 0.02, + "global_step": 3088, + "learning_rate": 0.0004879465776293823, + "loss": 1.801, + "loss_base2": 2.5983, + "loss_pixel": 0.3826, + "loss_text": 1.4184, + "ppl": 6.0557, + "step": 3088 + }, + { + "epoch": 0.02, + "global_step": 3089, + "learning_rate": 0.00048794240400667783, + "loss": 1.7649, + "loss_base2": 2.5462, + "loss_pixel": 0.3824, + "loss_text": 1.3825, + "ppl": 5.841, + "step": 3089 + }, + { + "epoch": 0.02, + "global_step": 3090, + "learning_rate": 0.0004879382303839733, + "loss": 2.0298, + "loss_base2": 2.9284, + "loss_pixel": 0.3837, + "loss_text": 1.6461, + "ppl": 7.6126, + "step": 3090 + }, + { + "epoch": 0.02, + "global_step": 3091, + "learning_rate": 0.0004879340567612688, + "loss": 2.094, + "loss_base2": 3.021, + "loss_pixel": 0.3821, + "loss_text": 1.712, + "ppl": 8.1173, + "step": 3091 + }, + { + "epoch": 0.02, + "global_step": 3092, + "learning_rate": 0.0004879298831385643, + "loss": 2.0968, + "loss_base2": 3.025, + "loss_pixel": 0.3826, + "loss_text": 1.7142, + "ppl": 8.1401, + "step": 3092 + }, + { + "epoch": 0.02, + "global_step": 3093, + "learning_rate": 0.0004879257095158598, + "loss": 2.0743, + "loss_base2": 2.9926, + "loss_pixel": 0.3813, + "loss_text": 1.693, + "ppl": 7.959, + "step": 3093 + }, + { + "epoch": 0.02, + "global_step": 3094, + "learning_rate": 0.00048792153589315526, + "loss": 2.0972, + "loss_base2": 3.0256, + "loss_pixel": 0.3816, + "loss_text": 1.7156, + "ppl": 8.1433, + "step": 3094 + }, + { + "epoch": 0.02, + "global_step": 3095, + "learning_rate": 0.00048791736227045076, + "loss": 2.0767, + "loss_base2": 2.996, + "loss_pixel": 0.3817, + "loss_text": 1.695, + "ppl": 7.9781, + "step": 3095 + }, + { + "epoch": 0.02, + "global_step": 3096, + "learning_rate": 0.00048791318864774627, + "loss": 2.067, + "loss_base2": 2.9821, + "loss_pixel": 0.3819, + "loss_text": 1.6852, + "ppl": 7.9011, + "step": 3096 + }, + { + "epoch": 0.02, + "global_step": 3097, + "learning_rate": 0.0004879090150250418, + "loss": 2.0762, + "loss_base2": 2.9953, + "loss_pixel": 0.3818, + "loss_text": 1.6943, + "ppl": 7.9741, + "step": 3097 + }, + { + "epoch": 0.02, + "global_step": 3098, + "learning_rate": 0.0004879048414023373, + "loss": 2.0731, + "loss_base2": 2.9909, + "loss_pixel": 0.3824, + "loss_text": 1.6907, + "ppl": 7.9494, + "step": 3098 + }, + { + "epoch": 0.02, + "global_step": 3099, + "learning_rate": 0.00048790066777963274, + "loss": 2.0664, + "loss_base2": 2.9812, + "loss_pixel": 0.3811, + "loss_text": 1.6853, + "ppl": 7.8963, + "step": 3099 + }, + { + "epoch": 0.02, + "global_step": 3100, + "learning_rate": 0.0004878964941569282, + "loss": 2.0767, + "loss_base2": 2.996, + "loss_pixel": 0.3811, + "loss_text": 1.6956, + "ppl": 7.9781, + "step": 3100 + }, + { + "epoch": 0.02, + "global_step": 3101, + "learning_rate": 0.0004878923205342237, + "loss": 2.063, + "loss_base2": 2.9763, + "loss_pixel": 0.3807, + "loss_text": 1.6824, + "ppl": 7.8695, + "step": 3101 + }, + { + "epoch": 0.02, + "global_step": 3102, + "learning_rate": 0.0004878881469115192, + "loss": 2.062, + "loss_base2": 2.9748, + "loss_pixel": 0.3823, + "loss_text": 1.6797, + "ppl": 7.8617, + "step": 3102 + }, + { + "epoch": 0.02, + "global_step": 3103, + "learning_rate": 0.00048788397328881466, + "loss": 2.0698, + "loss_base2": 2.9861, + "loss_pixel": 0.3813, + "loss_text": 1.6885, + "ppl": 7.9232, + "step": 3103 + }, + { + "epoch": 0.02, + "global_step": 3104, + "learning_rate": 0.00048787979966611017, + "loss": 2.0552, + "loss_base2": 2.965, + "loss_pixel": 0.3812, + "loss_text": 1.674, + "ppl": 7.8084, + "step": 3104 + }, + { + "epoch": 0.02, + "global_step": 3105, + "learning_rate": 0.0004878756260434057, + "loss": 2.0691, + "loss_base2": 2.9851, + "loss_pixel": 0.3809, + "loss_text": 1.6882, + "ppl": 7.9177, + "step": 3105 + }, + { + "epoch": 0.02, + "global_step": 3106, + "learning_rate": 0.0004878714524207012, + "loss": 2.0469, + "loss_base2": 2.9531, + "loss_pixel": 0.3814, + "loss_text": 1.6655, + "ppl": 7.7439, + "step": 3106 + }, + { + "epoch": 0.02, + "global_step": 3107, + "learning_rate": 0.0004878672787979967, + "loss": 2.0534, + "loss_base2": 2.9624, + "loss_pixel": 0.3813, + "loss_text": 1.6721, + "ppl": 7.7944, + "step": 3107 + }, + { + "epoch": 0.02, + "global_step": 3108, + "learning_rate": 0.00048786310517529214, + "loss": 2.0554, + "loss_base2": 2.9653, + "loss_pixel": 0.3804, + "loss_text": 1.675, + "ppl": 7.81, + "step": 3108 + }, + { + "epoch": 0.02, + "global_step": 3109, + "learning_rate": 0.00048785893155258765, + "loss": 2.0481, + "loss_base2": 2.9548, + "loss_pixel": 0.3805, + "loss_text": 1.6676, + "ppl": 7.7532, + "step": 3109 + }, + { + "epoch": 0.02, + "global_step": 3110, + "learning_rate": 0.00048785475792988316, + "loss": 2.0504, + "loss_base2": 2.9581, + "loss_pixel": 0.3807, + "loss_text": 1.6697, + "ppl": 7.771, + "step": 3110 + }, + { + "epoch": 0.02, + "global_step": 3111, + "learning_rate": 0.00048785058430717866, + "loss": 2.0551, + "loss_base2": 2.9649, + "loss_pixel": 0.381, + "loss_text": 1.6741, + "ppl": 7.8076, + "step": 3111 + }, + { + "epoch": 0.02, + "global_step": 3112, + "learning_rate": 0.0004878464106844741, + "loss": 2.0454, + "loss_base2": 2.9509, + "loss_pixel": 0.3803, + "loss_text": 1.6651, + "ppl": 7.7323, + "step": 3112 + }, + { + "epoch": 0.02, + "global_step": 3113, + "learning_rate": 0.0004878422370617696, + "loss": 2.06, + "loss_base2": 2.972, + "loss_pixel": 0.3807, + "loss_text": 1.6793, + "ppl": 7.846, + "step": 3113 + }, + { + "epoch": 0.02, + "global_step": 3114, + "learning_rate": 0.00048783806343906513, + "loss": 1.9884, + "loss_base2": 2.8687, + "loss_pixel": 0.3802, + "loss_text": 1.6082, + "ppl": 7.3038, + "step": 3114 + }, + { + "epoch": 0.02, + "global_step": 3115, + "learning_rate": 0.00048783388981636064, + "loss": 1.8107, + "loss_base2": 2.6123, + "loss_pixel": 0.3818, + "loss_text": 1.4289, + "ppl": 6.1147, + "step": 3115 + }, + { + "epoch": 0.02, + "global_step": 3116, + "learning_rate": 0.00048782971619365615, + "loss": 1.7868, + "loss_base2": 2.5778, + "loss_pixel": 0.3806, + "loss_text": 1.4063, + "ppl": 5.9703, + "step": 3116 + }, + { + "epoch": 0.02, + "global_step": 3117, + "learning_rate": 0.0004878255425709516, + "loss": 1.7879, + "loss_base2": 2.5794, + "loss_pixel": 0.3808, + "loss_text": 1.4071, + "ppl": 5.9769, + "step": 3117 + }, + { + "epoch": 0.02, + "global_step": 3118, + "learning_rate": 0.00048782136894824705, + "loss": 1.7971, + "loss_base2": 2.5927, + "loss_pixel": 0.3808, + "loss_text": 1.4163, + "ppl": 6.0321, + "step": 3118 + }, + { + "epoch": 0.02, + "global_step": 3119, + "learning_rate": 0.00048781719532554256, + "loss": 1.768, + "loss_base2": 2.5507, + "loss_pixel": 0.3811, + "loss_text": 1.3869, + "ppl": 5.8591, + "step": 3119 + }, + { + "epoch": 0.02, + "global_step": 3120, + "learning_rate": 0.00048781302170283807, + "loss": 1.761, + "loss_base2": 2.5406, + "loss_pixel": 0.3808, + "loss_text": 1.3802, + "ppl": 5.8183, + "step": 3120 + }, + { + "epoch": 0.02, + "global_step": 3121, + "learning_rate": 0.0004878088480801336, + "loss": 1.7718, + "loss_base2": 2.5562, + "loss_pixel": 0.3804, + "loss_text": 1.3914, + "ppl": 5.8814, + "step": 3121 + }, + { + "epoch": 0.02, + "global_step": 3122, + "learning_rate": 0.00048780467445742903, + "loss": 1.9271, + "loss_base2": 2.7802, + "loss_pixel": 0.3808, + "loss_text": 1.5462, + "ppl": 6.8696, + "step": 3122 + }, + { + "epoch": 0.02, + "global_step": 3123, + "learning_rate": 0.00048780050083472453, + "loss": 2.0619, + "loss_base2": 2.9747, + "loss_pixel": 0.3807, + "loss_text": 1.6813, + "ppl": 7.8609, + "step": 3123 + }, + { + "epoch": 0.02, + "global_step": 3124, + "learning_rate": 0.00048779632721202004, + "loss": 2.0714, + "loss_base2": 2.9884, + "loss_pixel": 0.3803, + "loss_text": 1.6912, + "ppl": 7.9359, + "step": 3124 + }, + { + "epoch": 0.02, + "global_step": 3125, + "learning_rate": 0.00048779215358931555, + "loss": 2.0587, + "loss_base2": 2.9701, + "loss_pixel": 0.38, + "loss_text": 1.6787, + "ppl": 7.8358, + "step": 3125 + }, + { + "epoch": 0.02, + "global_step": 3126, + "learning_rate": 0.000487787979966611, + "loss": 2.0368, + "loss_base2": 2.9385, + "loss_pixel": 0.3808, + "loss_text": 1.6559, + "ppl": 7.666, + "step": 3126 + }, + { + "epoch": 0.02, + "global_step": 3127, + "learning_rate": 0.0004877838063439065, + "loss": 2.0461, + "loss_base2": 2.9519, + "loss_pixel": 0.3805, + "loss_text": 1.6655, + "ppl": 7.7377, + "step": 3127 + }, + { + "epoch": 0.02, + "global_step": 3128, + "learning_rate": 0.000487779632721202, + "loss": 2.0485, + "loss_base2": 2.9554, + "loss_pixel": 0.3806, + "loss_text": 1.6679, + "ppl": 7.7563, + "step": 3128 + }, + { + "epoch": 0.02, + "global_step": 3129, + "learning_rate": 0.0004877754590984975, + "loss": 2.0473, + "loss_base2": 2.9536, + "loss_pixel": 0.3806, + "loss_text": 1.6667, + "ppl": 7.747, + "step": 3129 + }, + { + "epoch": 0.02, + "global_step": 3130, + "learning_rate": 0.00048777128547579303, + "loss": 2.0481, + "loss_base2": 2.9548, + "loss_pixel": 0.3804, + "loss_text": 1.6677, + "ppl": 7.7532, + "step": 3130 + }, + { + "epoch": 0.02, + "global_step": 3131, + "learning_rate": 0.0004877671118530885, + "loss": 2.0465, + "loss_base2": 2.9525, + "loss_pixel": 0.3806, + "loss_text": 1.6658, + "ppl": 7.7408, + "step": 3131 + }, + { + "epoch": 0.02, + "global_step": 3132, + "learning_rate": 0.000487762938230384, + "loss": 2.0347, + "loss_base2": 2.9355, + "loss_pixel": 0.3806, + "loss_text": 1.6541, + "ppl": 7.65, + "step": 3132 + }, + { + "epoch": 0.02, + "global_step": 3133, + "learning_rate": 0.0004877587646076795, + "loss": 2.0423, + "loss_base2": 2.9464, + "loss_pixel": 0.3802, + "loss_text": 1.6621, + "ppl": 7.7083, + "step": 3133 + }, + { + "epoch": 0.02, + "global_step": 3134, + "learning_rate": 0.000487754590984975, + "loss": 2.0427, + "loss_base2": 2.947, + "loss_pixel": 0.3806, + "loss_text": 1.6621, + "ppl": 7.7114, + "step": 3134 + }, + { + "epoch": 0.02, + "global_step": 3135, + "learning_rate": 0.00048775041736227046, + "loss": 2.0488, + "loss_base2": 2.9558, + "loss_pixel": 0.3804, + "loss_text": 1.6684, + "ppl": 7.7586, + "step": 3135 + }, + { + "epoch": 0.02, + "global_step": 3136, + "learning_rate": 0.00048774624373956597, + "loss": 2.0277, + "loss_base2": 2.9254, + "loss_pixel": 0.3809, + "loss_text": 1.6469, + "ppl": 7.5966, + "step": 3136 + }, + { + "epoch": 0.02, + "global_step": 3137, + "learning_rate": 0.0004877420701168614, + "loss": 2.0278, + "loss_base2": 2.9255, + "loss_pixel": 0.3804, + "loss_text": 1.6474, + "ppl": 7.5974, + "step": 3137 + }, + { + "epoch": 0.02, + "global_step": 3138, + "learning_rate": 0.00048773789649415693, + "loss": 2.0425, + "loss_base2": 2.9467, + "loss_pixel": 0.3803, + "loss_text": 1.6622, + "ppl": 7.7099, + "step": 3138 + }, + { + "epoch": 0.02, + "global_step": 3139, + "learning_rate": 0.00048773372287145244, + "loss": 2.0299, + "loss_base2": 2.9285, + "loss_pixel": 0.3799, + "loss_text": 1.65, + "ppl": 7.6133, + "step": 3139 + }, + { + "epoch": 0.02, + "global_step": 3140, + "learning_rate": 0.0004877295492487479, + "loss": 2.0378, + "loss_base2": 2.9399, + "loss_pixel": 0.3806, + "loss_text": 1.6572, + "ppl": 7.6737, + "step": 3140 + }, + { + "epoch": 0.02, + "global_step": 3141, + "learning_rate": 0.0004877253756260434, + "loss": 2.0614, + "loss_base2": 2.974, + "loss_pixel": 0.3804, + "loss_text": 1.681, + "ppl": 7.857, + "step": 3141 + }, + { + "epoch": 0.02, + "global_step": 3142, + "learning_rate": 0.0004877212020033389, + "loss": 2.033, + "loss_base2": 2.933, + "loss_pixel": 0.3802, + "loss_text": 1.6528, + "ppl": 7.637, + "step": 3142 + }, + { + "epoch": 0.02, + "global_step": 3143, + "learning_rate": 0.0004877170283806344, + "loss": 2.0426, + "loss_base2": 2.9468, + "loss_pixel": 0.3808, + "loss_text": 1.6618, + "ppl": 7.7106, + "step": 3143 + }, + { + "epoch": 0.02, + "global_step": 3144, + "learning_rate": 0.00048771285475792986, + "loss": 2.0461, + "loss_base2": 2.9519, + "loss_pixel": 0.3806, + "loss_text": 1.6656, + "ppl": 7.7377, + "step": 3144 + }, + { + "epoch": 0.02, + "global_step": 3145, + "learning_rate": 0.00048770868113522537, + "loss": 2.0334, + "loss_base2": 2.9336, + "loss_pixel": 0.3807, + "loss_text": 1.6527, + "ppl": 7.64, + "step": 3145 + }, + { + "epoch": 0.02, + "global_step": 3146, + "learning_rate": 0.0004877045075125209, + "loss": 2.0342, + "loss_base2": 2.9347, + "loss_pixel": 0.3808, + "loss_text": 1.6535, + "ppl": 7.6461, + "step": 3146 + }, + { + "epoch": 0.02, + "global_step": 3147, + "learning_rate": 0.0004877003338898164, + "loss": 2.0369, + "loss_base2": 2.9386, + "loss_pixel": 0.3808, + "loss_text": 1.6561, + "ppl": 7.6668, + "step": 3147 + }, + { + "epoch": 0.02, + "global_step": 3148, + "learning_rate": 0.0004876961602671119, + "loss": 2.0368, + "loss_base2": 2.9385, + "loss_pixel": 0.3801, + "loss_text": 1.6568, + "ppl": 7.666, + "step": 3148 + }, + { + "epoch": 0.02, + "global_step": 3149, + "learning_rate": 0.00048769198664440735, + "loss": 2.05, + "loss_base2": 2.9575, + "loss_pixel": 0.3805, + "loss_text": 1.6695, + "ppl": 7.7679, + "step": 3149 + }, + { + "epoch": 0.02, + "global_step": 3150, + "learning_rate": 0.00048768781302170285, + "loss": 2.0198, + "loss_base2": 2.914, + "loss_pixel": 0.3803, + "loss_text": 1.6394, + "ppl": 7.5368, + "step": 3150 + }, + { + "epoch": 0.02, + "global_step": 3151, + "learning_rate": 0.00048768363939899836, + "loss": 2.0267, + "loss_base2": 2.9239, + "loss_pixel": 0.3806, + "loss_text": 1.6461, + "ppl": 7.589, + "step": 3151 + }, + { + "epoch": 0.02, + "global_step": 3152, + "learning_rate": 0.00048767946577629387, + "loss": 2.0398, + "loss_base2": 2.9428, + "loss_pixel": 0.3807, + "loss_text": 1.6592, + "ppl": 7.6891, + "step": 3152 + }, + { + "epoch": 0.02, + "global_step": 3153, + "learning_rate": 0.0004876752921535893, + "loss": 2.009, + "loss_base2": 2.8984, + "loss_pixel": 0.3804, + "loss_text": 1.6286, + "ppl": 7.4559, + "step": 3153 + }, + { + "epoch": 0.02, + "global_step": 3154, + "learning_rate": 0.00048767111853088483, + "loss": 2.0265, + "loss_base2": 2.9236, + "loss_pixel": 0.3811, + "loss_text": 1.6454, + "ppl": 7.5875, + "step": 3154 + }, + { + "epoch": 0.02, + "global_step": 3155, + "learning_rate": 0.00048766694490818034, + "loss": 2.0436, + "loss_base2": 2.9483, + "loss_pixel": 0.3808, + "loss_text": 1.6628, + "ppl": 7.7183, + "step": 3155 + }, + { + "epoch": 0.02, + "global_step": 3156, + "learning_rate": 0.0004876627712854758, + "loss": 2.0057, + "loss_base2": 2.8936, + "loss_pixel": 0.3803, + "loss_text": 1.6253, + "ppl": 7.4313, + "step": 3156 + }, + { + "epoch": 0.02, + "global_step": 3157, + "learning_rate": 0.0004876585976627713, + "loss": 2.0128, + "loss_base2": 2.9039, + "loss_pixel": 0.3799, + "loss_text": 1.6328, + "ppl": 7.4842, + "step": 3157 + }, + { + "epoch": 0.02, + "global_step": 3158, + "learning_rate": 0.00048765442404006675, + "loss": 2.0317, + "loss_base2": 2.9311, + "loss_pixel": 0.3808, + "loss_text": 1.6509, + "ppl": 7.627, + "step": 3158 + }, + { + "epoch": 0.02, + "global_step": 3159, + "learning_rate": 0.00048765025041736226, + "loss": 2.0315, + "loss_base2": 2.9308, + "loss_pixel": 0.3805, + "loss_text": 1.651, + "ppl": 7.6255, + "step": 3159 + }, + { + "epoch": 0.02, + "global_step": 3160, + "learning_rate": 0.00048764607679465776, + "loss": 2.022, + "loss_base2": 2.9171, + "loss_pixel": 0.3805, + "loss_text": 1.6415, + "ppl": 7.5534, + "step": 3160 + }, + { + "epoch": 0.02, + "global_step": 3161, + "learning_rate": 0.00048764190317195327, + "loss": 2.0398, + "loss_base2": 2.9428, + "loss_pixel": 0.3807, + "loss_text": 1.6592, + "ppl": 7.6891, + "step": 3161 + }, + { + "epoch": 0.02, + "global_step": 3162, + "learning_rate": 0.0004876377295492487, + "loss": 2.0289, + "loss_base2": 2.9271, + "loss_pixel": 0.3804, + "loss_text": 1.6485, + "ppl": 7.6057, + "step": 3162 + }, + { + "epoch": 0.02, + "global_step": 3163, + "learning_rate": 0.00048763355592654423, + "loss": 2.0317, + "loss_base2": 2.9311, + "loss_pixel": 0.3798, + "loss_text": 1.6519, + "ppl": 7.627, + "step": 3163 + }, + { + "epoch": 0.02, + "global_step": 3164, + "learning_rate": 0.00048762938230383974, + "loss": 2.0366, + "loss_base2": 2.9382, + "loss_pixel": 0.3807, + "loss_text": 1.6559, + "ppl": 7.6645, + "step": 3164 + }, + { + "epoch": 0.02, + "global_step": 3165, + "learning_rate": 0.00048762520868113525, + "loss": 2.0302, + "loss_base2": 2.929, + "loss_pixel": 0.3808, + "loss_text": 1.6494, + "ppl": 7.6156, + "step": 3165 + }, + { + "epoch": 0.02, + "global_step": 3166, + "learning_rate": 0.00048762103505843075, + "loss": 2.0143, + "loss_base2": 2.906, + "loss_pixel": 0.3805, + "loss_text": 1.6338, + "ppl": 7.4955, + "step": 3166 + }, + { + "epoch": 0.02, + "global_step": 3167, + "learning_rate": 0.0004876168614357262, + "loss": 2.0076, + "loss_base2": 2.8964, + "loss_pixel": 0.3804, + "loss_text": 1.6271, + "ppl": 7.4454, + "step": 3167 + }, + { + "epoch": 0.02, + "global_step": 3168, + "learning_rate": 0.0004876126878130217, + "loss": 2.02, + "loss_base2": 2.9142, + "loss_pixel": 0.3801, + "loss_text": 1.6398, + "ppl": 7.5383, + "step": 3168 + }, + { + "epoch": 0.02, + "global_step": 3169, + "learning_rate": 0.0004876085141903172, + "loss": 2.0153, + "loss_base2": 2.9075, + "loss_pixel": 0.3803, + "loss_text": 1.6349, + "ppl": 7.503, + "step": 3169 + }, + { + "epoch": 0.02, + "global_step": 3170, + "learning_rate": 0.00048760434056761273, + "loss": 2.0334, + "loss_base2": 2.9336, + "loss_pixel": 0.3802, + "loss_text": 1.6532, + "ppl": 7.64, + "step": 3170 + }, + { + "epoch": 0.02, + "global_step": 3171, + "learning_rate": 0.0004876001669449082, + "loss": 2.0305, + "loss_base2": 2.9294, + "loss_pixel": 0.3801, + "loss_text": 1.6504, + "ppl": 7.6179, + "step": 3171 + }, + { + "epoch": 0.02, + "global_step": 3172, + "learning_rate": 0.0004875959933222037, + "loss": 2.0178, + "loss_base2": 2.9111, + "loss_pixel": 0.3806, + "loss_text": 1.6372, + "ppl": 7.5218, + "step": 3172 + }, + { + "epoch": 0.02, + "global_step": 3173, + "learning_rate": 0.0004875918196994992, + "loss": 2.0294, + "loss_base2": 2.9278, + "loss_pixel": 0.3801, + "loss_text": 1.6493, + "ppl": 7.6095, + "step": 3173 + }, + { + "epoch": 0.02, + "global_step": 3174, + "learning_rate": 0.0004875876460767947, + "loss": 2.0149, + "loss_base2": 2.9069, + "loss_pixel": 0.3807, + "loss_text": 1.6342, + "ppl": 7.5, + "step": 3174 + }, + { + "epoch": 0.02, + "global_step": 3175, + "learning_rate": 0.00048758347245409016, + "loss": 2.0088, + "loss_base2": 2.8981, + "loss_pixel": 0.38, + "loss_text": 1.6288, + "ppl": 7.4544, + "step": 3175 + }, + { + "epoch": 0.02, + "global_step": 3176, + "learning_rate": 0.0004875792988313856, + "loss": 2.0152, + "loss_base2": 2.9073, + "loss_pixel": 0.3798, + "loss_text": 1.6354, + "ppl": 7.5022, + "step": 3176 + }, + { + "epoch": 0.02, + "global_step": 3177, + "learning_rate": 0.0004875751252086811, + "loss": 2.0098, + "loss_base2": 2.8995, + "loss_pixel": 0.38, + "loss_text": 1.6299, + "ppl": 7.4618, + "step": 3177 + }, + { + "epoch": 0.02, + "global_step": 3178, + "learning_rate": 0.0004875709515859766, + "loss": 2.027, + "loss_base2": 2.9243, + "loss_pixel": 0.3819, + "loss_text": 1.645, + "ppl": 7.5913, + "step": 3178 + }, + { + "epoch": 0.02, + "global_step": 3179, + "learning_rate": 0.00048756677796327213, + "loss": 2.0387, + "loss_base2": 2.9412, + "loss_pixel": 0.385, + "loss_text": 1.6537, + "ppl": 7.6806, + "step": 3179 + }, + { + "epoch": 0.02, + "global_step": 3180, + "learning_rate": 0.00048756260434056764, + "loss": 2.037, + "loss_base2": 2.9388, + "loss_pixel": 0.385, + "loss_text": 1.652, + "ppl": 7.6676, + "step": 3180 + }, + { + "epoch": 0.02, + "global_step": 3181, + "learning_rate": 0.0004875584307178631, + "loss": 2.0189, + "loss_base2": 2.9127, + "loss_pixel": 0.3829, + "loss_text": 1.636, + "ppl": 7.53, + "step": 3181 + }, + { + "epoch": 0.02, + "global_step": 3182, + "learning_rate": 0.0004875542570951586, + "loss": 2.0349, + "loss_base2": 2.9357, + "loss_pixel": 0.3817, + "loss_text": 1.6532, + "ppl": 7.6515, + "step": 3182 + }, + { + "epoch": 0.02, + "global_step": 3183, + "learning_rate": 0.0004875500834724541, + "loss": 2.024, + "loss_base2": 2.92, + "loss_pixel": 0.3826, + "loss_text": 1.6414, + "ppl": 7.5685, + "step": 3183 + }, + { + "epoch": 0.02, + "global_step": 3184, + "learning_rate": 0.0004875459098497496, + "loss": 1.9951, + "loss_base2": 2.8783, + "loss_pixel": 0.3822, + "loss_text": 1.6129, + "ppl": 7.3529, + "step": 3184 + }, + { + "epoch": 0.02, + "global_step": 3185, + "learning_rate": 0.00048754173622704507, + "loss": 2.0095, + "loss_base2": 2.8991, + "loss_pixel": 0.3822, + "loss_text": 1.6273, + "ppl": 7.4596, + "step": 3185 + }, + { + "epoch": 0.02, + "global_step": 3186, + "learning_rate": 0.0004875375626043406, + "loss": 2.002, + "loss_base2": 2.8883, + "loss_pixel": 0.3825, + "loss_text": 1.6195, + "ppl": 7.4038, + "step": 3186 + }, + { + "epoch": 0.02, + "global_step": 3187, + "learning_rate": 0.0004875333889816361, + "loss": 2.0278, + "loss_base2": 2.9255, + "loss_pixel": 0.3804, + "loss_text": 1.6474, + "ppl": 7.5974, + "step": 3187 + }, + { + "epoch": 0.02, + "global_step": 3188, + "learning_rate": 0.0004875292153589316, + "loss": 2.0076, + "loss_base2": 2.8964, + "loss_pixel": 0.3823, + "loss_text": 1.6253, + "ppl": 7.4454, + "step": 3188 + }, + { + "epoch": 0.02, + "global_step": 3189, + "learning_rate": 0.0004875250417362271, + "loss": 2.0342, + "loss_base2": 2.9347, + "loss_pixel": 0.3803, + "loss_text": 1.6539, + "ppl": 7.6461, + "step": 3189 + }, + { + "epoch": 0.02, + "global_step": 3190, + "learning_rate": 0.00048752086811352255, + "loss": 2.034, + "loss_base2": 2.9344, + "loss_pixel": 0.3837, + "loss_text": 1.6503, + "ppl": 7.6446, + "step": 3190 + }, + { + "epoch": 0.02, + "global_step": 3191, + "learning_rate": 0.00048751669449081806, + "loss": 2.0032, + "loss_base2": 2.89, + "loss_pixel": 0.3828, + "loss_text": 1.6204, + "ppl": 7.4127, + "step": 3191 + }, + { + "epoch": 0.02, + "global_step": 3192, + "learning_rate": 0.00048751252086811356, + "loss": 2.0216, + "loss_base2": 2.9166, + "loss_pixel": 0.3816, + "loss_text": 1.6401, + "ppl": 7.5504, + "step": 3192 + }, + { + "epoch": 0.02, + "global_step": 3193, + "learning_rate": 0.00048750834724540907, + "loss": 2.0303, + "loss_base2": 2.9291, + "loss_pixel": 0.3829, + "loss_text": 1.6474, + "ppl": 7.6164, + "step": 3193 + }, + { + "epoch": 0.02, + "global_step": 3194, + "learning_rate": 0.00048750417362270447, + "loss": 2.0135, + "loss_base2": 2.9049, + "loss_pixel": 0.3812, + "loss_text": 1.6323, + "ppl": 7.4895, + "step": 3194 + }, + { + "epoch": 0.02, + "global_step": 3195, + "learning_rate": 0.0004875, + "loss": 2.028, + "loss_base2": 2.9258, + "loss_pixel": 0.38, + "loss_text": 1.648, + "ppl": 7.5989, + "step": 3195 + }, + { + "epoch": 0.02, + "global_step": 3196, + "learning_rate": 0.0004874958263772955, + "loss": 2.0289, + "loss_base2": 2.9271, + "loss_pixel": 0.3809, + "loss_text": 1.648, + "ppl": 7.6057, + "step": 3196 + }, + { + "epoch": 0.02, + "global_step": 3197, + "learning_rate": 0.000487491652754591, + "loss": 2.0345, + "loss_base2": 2.9352, + "loss_pixel": 0.3838, + "loss_text": 1.6508, + "ppl": 7.6484, + "step": 3197 + }, + { + "epoch": 0.02, + "global_step": 3198, + "learning_rate": 0.0004874874791318865, + "loss": 2.0253, + "loss_base2": 2.9219, + "loss_pixel": 0.3833, + "loss_text": 1.6421, + "ppl": 7.5784, + "step": 3198 + }, + { + "epoch": 0.02, + "global_step": 3199, + "learning_rate": 0.00048748330550918195, + "loss": 2.0184, + "loss_base2": 2.9119, + "loss_pixel": 0.3808, + "loss_text": 1.6376, + "ppl": 7.5263, + "step": 3199 + }, + { + "epoch": 0.02, + "global_step": 3200, + "learning_rate": 0.00048747913188647746, + "loss": 2.0192, + "loss_base2": 2.9131, + "loss_pixel": 0.3836, + "loss_text": 1.6356, + "ppl": 7.5323, + "step": 3200 + }, + { + "epoch": 0.02, + "global_step": 3201, + "learning_rate": 0.00048747495826377297, + "loss": 2.0131, + "loss_base2": 2.9043, + "loss_pixel": 0.38, + "loss_text": 1.6331, + "ppl": 7.4865, + "step": 3201 + }, + { + "epoch": 0.02, + "global_step": 3202, + "learning_rate": 0.0004874707846410685, + "loss": 2.0192, + "loss_base2": 2.9131, + "loss_pixel": 0.3796, + "loss_text": 1.6396, + "ppl": 7.5323, + "step": 3202 + }, + { + "epoch": 0.02, + "global_step": 3203, + "learning_rate": 0.00048746661101836393, + "loss": 2.0105, + "loss_base2": 2.9005, + "loss_pixel": 0.3803, + "loss_text": 1.6302, + "ppl": 7.467, + "step": 3203 + }, + { + "epoch": 0.02, + "global_step": 3204, + "learning_rate": 0.00048746243739565944, + "loss": 2.0152, + "loss_base2": 2.9073, + "loss_pixel": 0.3777, + "loss_text": 1.6376, + "ppl": 7.5022, + "step": 3204 + }, + { + "epoch": 0.02, + "global_step": 3205, + "learning_rate": 0.00048745826377295494, + "loss": 2.0164, + "loss_base2": 2.9091, + "loss_pixel": 0.3807, + "loss_text": 1.6357, + "ppl": 7.5112, + "step": 3205 + }, + { + "epoch": 0.02, + "global_step": 3206, + "learning_rate": 0.00048745409015025045, + "loss": 2.0269, + "loss_base2": 2.9242, + "loss_pixel": 0.3933, + "loss_text": 1.6336, + "ppl": 7.5905, + "step": 3206 + }, + { + "epoch": 0.02, + "global_step": 3207, + "learning_rate": 0.00048744991652754596, + "loss": 2.0066, + "loss_base2": 2.8949, + "loss_pixel": 0.3835, + "loss_text": 1.6231, + "ppl": 7.438, + "step": 3207 + }, + { + "epoch": 0.02, + "global_step": 3208, + "learning_rate": 0.0004874457429048414, + "loss": 2.029, + "loss_base2": 2.9272, + "loss_pixel": 0.3846, + "loss_text": 1.6444, + "ppl": 7.6065, + "step": 3208 + }, + { + "epoch": 0.02, + "global_step": 3209, + "learning_rate": 0.0004874415692821369, + "loss": 2.0173, + "loss_base2": 2.9103, + "loss_pixel": 0.3806, + "loss_text": 1.6368, + "ppl": 7.518, + "step": 3209 + }, + { + "epoch": 0.02, + "global_step": 3210, + "learning_rate": 0.0004874373956594324, + "loss": 2.0079, + "loss_base2": 2.8968, + "loss_pixel": 0.3858, + "loss_text": 1.6221, + "ppl": 7.4477, + "step": 3210 + }, + { + "epoch": 0.02, + "global_step": 3211, + "learning_rate": 0.00048743322203672793, + "loss": 2.0045, + "loss_base2": 2.8919, + "loss_pixel": 0.3826, + "loss_text": 1.6219, + "ppl": 7.4224, + "step": 3211 + }, + { + "epoch": 0.02, + "global_step": 3212, + "learning_rate": 0.00048742904841402333, + "loss": 2.0163, + "loss_base2": 2.9089, + "loss_pixel": 0.3833, + "loss_text": 1.633, + "ppl": 7.5105, + "step": 3212 + }, + { + "epoch": 0.02, + "global_step": 3213, + "learning_rate": 0.00048742487479131884, + "loss": 2.0221, + "loss_base2": 2.9173, + "loss_pixel": 0.3826, + "loss_text": 1.6395, + "ppl": 7.5542, + "step": 3213 + }, + { + "epoch": 0.02, + "global_step": 3214, + "learning_rate": 0.00048742070116861435, + "loss": 2.0005, + "loss_base2": 2.8861, + "loss_pixel": 0.3817, + "loss_text": 1.6188, + "ppl": 7.3928, + "step": 3214 + }, + { + "epoch": 0.02, + "global_step": 3215, + "learning_rate": 0.00048741652754590985, + "loss": 2.0155, + "loss_base2": 2.9078, + "loss_pixel": 0.3813, + "loss_text": 1.6342, + "ppl": 7.5045, + "step": 3215 + }, + { + "epoch": 0.02, + "global_step": 3216, + "learning_rate": 0.00048741235392320536, + "loss": 2.0209, + "loss_base2": 2.9155, + "loss_pixel": 0.381, + "loss_text": 1.64, + "ppl": 7.5451, + "step": 3216 + }, + { + "epoch": 0.02, + "global_step": 3217, + "learning_rate": 0.0004874081803005008, + "loss": 2.0191, + "loss_base2": 2.9129, + "loss_pixel": 0.3801, + "loss_text": 1.6389, + "ppl": 7.5315, + "step": 3217 + }, + { + "epoch": 0.02, + "global_step": 3218, + "learning_rate": 0.0004874040066777963, + "loss": 1.9881, + "loss_base2": 2.8682, + "loss_pixel": 0.3804, + "loss_text": 1.6076, + "ppl": 7.3016, + "step": 3218 + }, + { + "epoch": 0.02, + "global_step": 3219, + "learning_rate": 0.00048739983305509183, + "loss": 1.9968, + "loss_base2": 2.8808, + "loss_pixel": 0.3802, + "loss_text": 1.6166, + "ppl": 7.3654, + "step": 3219 + }, + { + "epoch": 0.02, + "global_step": 3220, + "learning_rate": 0.00048739565943238734, + "loss": 2.0049, + "loss_base2": 2.8925, + "loss_pixel": 0.38, + "loss_text": 1.6249, + "ppl": 7.4254, + "step": 3220 + }, + { + "epoch": 0.02, + "global_step": 3221, + "learning_rate": 0.0004873914858096828, + "loss": 1.9868, + "loss_base2": 2.8663, + "loss_pixel": 0.3801, + "loss_text": 1.6067, + "ppl": 7.2922, + "step": 3221 + }, + { + "epoch": 0.02, + "global_step": 3222, + "learning_rate": 0.0004873873121869783, + "loss": 1.9853, + "loss_base2": 2.8642, + "loss_pixel": 0.3799, + "loss_text": 1.6054, + "ppl": 7.2812, + "step": 3222 + }, + { + "epoch": 0.02, + "global_step": 3223, + "learning_rate": 0.0004873831385642738, + "loss": 2.0198, + "loss_base2": 2.914, + "loss_pixel": 0.3798, + "loss_text": 1.64, + "ppl": 7.5368, + "step": 3223 + }, + { + "epoch": 0.02, + "global_step": 3224, + "learning_rate": 0.0004873789649415693, + "loss": 2.0105, + "loss_base2": 2.9005, + "loss_pixel": 0.3793, + "loss_text": 1.6312, + "ppl": 7.467, + "step": 3224 + }, + { + "epoch": 0.02, + "global_step": 3225, + "learning_rate": 0.0004873747913188648, + "loss": 2.0205, + "loss_base2": 2.915, + "loss_pixel": 0.3792, + "loss_text": 1.6413, + "ppl": 7.5421, + "step": 3225 + }, + { + "epoch": 0.02, + "global_step": 3226, + "learning_rate": 0.00048737061769616027, + "loss": 2.0223, + "loss_base2": 2.9176, + "loss_pixel": 0.3793, + "loss_text": 1.643, + "ppl": 7.5557, + "step": 3226 + }, + { + "epoch": 0.02, + "global_step": 3227, + "learning_rate": 0.0004873664440734558, + "loss": 2.018, + "loss_base2": 2.9114, + "loss_pixel": 0.3795, + "loss_text": 1.6385, + "ppl": 7.5233, + "step": 3227 + }, + { + "epoch": 0.02, + "global_step": 3228, + "learning_rate": 0.0004873622704507513, + "loss": 2.009, + "loss_base2": 2.8984, + "loss_pixel": 0.3793, + "loss_text": 1.6296, + "ppl": 7.4559, + "step": 3228 + }, + { + "epoch": 0.02, + "global_step": 3229, + "learning_rate": 0.0004873580968280468, + "loss": 1.9915, + "loss_base2": 2.8731, + "loss_pixel": 0.379, + "loss_text": 1.6125, + "ppl": 7.3265, + "step": 3229 + }, + { + "epoch": 0.02, + "global_step": 3230, + "learning_rate": 0.00048735392320534225, + "loss": 2.0076, + "loss_base2": 2.8964, + "loss_pixel": 0.3785, + "loss_text": 1.6292, + "ppl": 7.4454, + "step": 3230 + }, + { + "epoch": 0.02, + "global_step": 3231, + "learning_rate": 0.0004873497495826377, + "loss": 2.0111, + "loss_base2": 2.9014, + "loss_pixel": 0.3784, + "loss_text": 1.6328, + "ppl": 7.4715, + "step": 3231 + }, + { + "epoch": 0.02, + "global_step": 3232, + "learning_rate": 0.0004873455759599332, + "loss": 2.019, + "loss_base2": 2.9128, + "loss_pixel": 0.3783, + "loss_text": 1.6407, + "ppl": 7.5308, + "step": 3232 + }, + { + "epoch": 0.02, + "global_step": 3233, + "learning_rate": 0.0004873414023372287, + "loss": 1.8123, + "loss_base2": 2.6146, + "loss_pixel": 0.3776, + "loss_text": 1.4346, + "ppl": 6.1245, + "step": 3233 + }, + { + "epoch": 0.02, + "global_step": 3234, + "learning_rate": 0.0004873372287145242, + "loss": 1.7821, + "loss_base2": 2.571, + "loss_pixel": 0.377, + "loss_text": 1.4052, + "ppl": 5.9423, + "step": 3234 + }, + { + "epoch": 0.02, + "global_step": 3235, + "learning_rate": 0.0004873330550918197, + "loss": 1.7883, + "loss_base2": 2.58, + "loss_pixel": 0.3758, + "loss_text": 1.4125, + "ppl": 5.9793, + "step": 3235 + }, + { + "epoch": 0.02, + "global_step": 3236, + "learning_rate": 0.0004873288814691152, + "loss": 1.7779, + "loss_base2": 2.565, + "loss_pixel": 0.3752, + "loss_text": 1.4027, + "ppl": 5.9174, + "step": 3236 + }, + { + "epoch": 0.02, + "global_step": 3237, + "learning_rate": 0.0004873247078464107, + "loss": 1.7602, + "loss_base2": 2.5394, + "loss_pixel": 0.3751, + "loss_text": 1.3851, + "ppl": 5.8136, + "step": 3237 + }, + { + "epoch": 0.02, + "global_step": 3238, + "learning_rate": 0.0004873205342237062, + "loss": 1.7755, + "loss_base2": 2.5615, + "loss_pixel": 0.3751, + "loss_text": 1.4004, + "ppl": 5.9032, + "step": 3238 + }, + { + "epoch": 0.02, + "global_step": 3239, + "learning_rate": 0.0004873163606010017, + "loss": 1.7765, + "loss_base2": 2.5629, + "loss_pixel": 0.3758, + "loss_text": 1.4007, + "ppl": 5.9091, + "step": 3239 + }, + { + "epoch": 0.02, + "global_step": 3240, + "learning_rate": 0.00048731218697829716, + "loss": 1.7697, + "loss_base2": 2.5531, + "loss_pixel": 0.3748, + "loss_text": 1.3949, + "ppl": 5.8691, + "step": 3240 + }, + { + "epoch": 0.02, + "global_step": 3241, + "learning_rate": 0.00048730801335559266, + "loss": 1.8833, + "loss_base2": 2.717, + "loss_pixel": 0.3744, + "loss_text": 1.5089, + "ppl": 6.5752, + "step": 3241 + }, + { + "epoch": 0.02, + "global_step": 3242, + "learning_rate": 0.00048730383973288817, + "loss": 2.0131, + "loss_base2": 2.9043, + "loss_pixel": 0.3741, + "loss_text": 1.639, + "ppl": 7.4865, + "step": 3242 + }, + { + "epoch": 0.02, + "global_step": 3243, + "learning_rate": 0.0004872996661101837, + "loss": 2.021, + "loss_base2": 2.9157, + "loss_pixel": 0.374, + "loss_text": 1.6469, + "ppl": 7.5459, + "step": 3243 + }, + { + "epoch": 0.02, + "global_step": 3244, + "learning_rate": 0.00048729549248747913, + "loss": 2.0007, + "loss_base2": 2.8864, + "loss_pixel": 0.3761, + "loss_text": 1.6246, + "ppl": 7.3942, + "step": 3244 + }, + { + "epoch": 0.02, + "global_step": 3245, + "learning_rate": 0.00048729131886477464, + "loss": 2.0174, + "loss_base2": 2.9105, + "loss_pixel": 0.3726, + "loss_text": 1.6448, + "ppl": 7.5188, + "step": 3245 + }, + { + "epoch": 0.02, + "global_step": 3246, + "learning_rate": 0.00048728714524207015, + "loss": 2.0001, + "loss_base2": 2.8855, + "loss_pixel": 0.372, + "loss_text": 1.628, + "ppl": 7.3898, + "step": 3246 + }, + { + "epoch": 0.02, + "global_step": 3247, + "learning_rate": 0.00048728297161936565, + "loss": 2.0101, + "loss_base2": 2.9, + "loss_pixel": 0.3726, + "loss_text": 1.6374, + "ppl": 7.4641, + "step": 3247 + }, + { + "epoch": 0.02, + "global_step": 3248, + "learning_rate": 0.00048727879799666116, + "loss": 2.016, + "loss_base2": 2.9085, + "loss_pixel": 0.3772, + "loss_text": 1.6389, + "ppl": 7.5082, + "step": 3248 + }, + { + "epoch": 0.02, + "global_step": 3249, + "learning_rate": 0.0004872746243739566, + "loss": 2.0373, + "loss_base2": 2.9392, + "loss_pixel": 0.3747, + "loss_text": 1.6625, + "ppl": 7.6699, + "step": 3249 + }, + { + "epoch": 0.03, + "global_step": 3250, + "learning_rate": 0.00048727045075125207, + "loss": 1.9947, + "loss_base2": 2.8777, + "loss_pixel": 0.3751, + "loss_text": 1.6196, + "ppl": 7.35, + "step": 3250 + }, + { + "epoch": 0.03, + "global_step": 3251, + "learning_rate": 0.0004872662771285476, + "loss": 2.0226, + "loss_base2": 2.918, + "loss_pixel": 0.3753, + "loss_text": 1.6474, + "ppl": 7.558, + "step": 3251 + }, + { + "epoch": 0.03, + "global_step": 3252, + "learning_rate": 0.0004872621035058431, + "loss": 1.998, + "loss_base2": 2.8825, + "loss_pixel": 0.3731, + "loss_text": 1.6249, + "ppl": 7.3743, + "step": 3252 + }, + { + "epoch": 0.03, + "global_step": 3253, + "learning_rate": 0.00048725792988313853, + "loss": 2.0041, + "loss_base2": 2.8913, + "loss_pixel": 0.3726, + "loss_text": 1.6315, + "ppl": 7.4194, + "step": 3253 + }, + { + "epoch": 0.03, + "global_step": 3254, + "learning_rate": 0.00048725375626043404, + "loss": 2.0128, + "loss_base2": 2.9039, + "loss_pixel": 0.3729, + "loss_text": 1.6399, + "ppl": 7.4842, + "step": 3254 + }, + { + "epoch": 0.03, + "global_step": 3255, + "learning_rate": 0.00048724958263772955, + "loss": 2.0015, + "loss_base2": 2.8876, + "loss_pixel": 0.372, + "loss_text": 1.6295, + "ppl": 7.4001, + "step": 3255 + }, + { + "epoch": 0.03, + "global_step": 3256, + "learning_rate": 0.00048724540901502506, + "loss": 2.0134, + "loss_base2": 2.9047, + "loss_pixel": 0.3729, + "loss_text": 1.6405, + "ppl": 7.4887, + "step": 3256 + }, + { + "epoch": 0.03, + "global_step": 3257, + "learning_rate": 0.00048724123539232056, + "loss": 1.9848, + "loss_base2": 2.8635, + "loss_pixel": 0.3721, + "loss_text": 1.6127, + "ppl": 7.2776, + "step": 3257 + }, + { + "epoch": 0.03, + "global_step": 3258, + "learning_rate": 0.000487237061769616, + "loss": 1.9942, + "loss_base2": 2.877, + "loss_pixel": 0.3716, + "loss_text": 1.6226, + "ppl": 7.3463, + "step": 3258 + }, + { + "epoch": 0.03, + "global_step": 3259, + "learning_rate": 0.0004872328881469115, + "loss": 1.9984, + "loss_base2": 2.8831, + "loss_pixel": 0.3717, + "loss_text": 1.6266, + "ppl": 7.3772, + "step": 3259 + }, + { + "epoch": 0.03, + "global_step": 3260, + "learning_rate": 0.00048722871452420703, + "loss": 2.0162, + "loss_base2": 2.9088, + "loss_pixel": 0.3706, + "loss_text": 1.6456, + "ppl": 7.5097, + "step": 3260 + }, + { + "epoch": 0.03, + "global_step": 3261, + "learning_rate": 0.00048722454090150254, + "loss": 1.9968, + "loss_base2": 2.8808, + "loss_pixel": 0.3704, + "loss_text": 1.6264, + "ppl": 7.3654, + "step": 3261 + }, + { + "epoch": 0.03, + "global_step": 3262, + "learning_rate": 0.000487220367278798, + "loss": 2.0059, + "loss_base2": 2.8939, + "loss_pixel": 0.3702, + "loss_text": 1.6357, + "ppl": 7.4328, + "step": 3262 + }, + { + "epoch": 0.03, + "global_step": 3263, + "learning_rate": 0.0004872161936560935, + "loss": 1.9993, + "loss_base2": 2.8844, + "loss_pixel": 0.3699, + "loss_text": 1.6295, + "ppl": 7.3839, + "step": 3263 + }, + { + "epoch": 0.03, + "global_step": 3264, + "learning_rate": 0.000487212020033389, + "loss": 1.99, + "loss_base2": 2.871, + "loss_pixel": 0.3697, + "loss_text": 1.6203, + "ppl": 7.3155, + "step": 3264 + }, + { + "epoch": 0.03, + "global_step": 3265, + "learning_rate": 0.0004872078464106845, + "loss": 1.9718, + "loss_base2": 2.8447, + "loss_pixel": 0.3696, + "loss_text": 1.6022, + "ppl": 7.1836, + "step": 3265 + }, + { + "epoch": 0.03, + "global_step": 3266, + "learning_rate": 0.00048720367278798, + "loss": 1.9881, + "loss_base2": 2.8682, + "loss_pixel": 0.3697, + "loss_text": 1.6184, + "ppl": 7.3016, + "step": 3266 + }, + { + "epoch": 0.03, + "global_step": 3267, + "learning_rate": 0.0004871994991652755, + "loss": 2.0015, + "loss_base2": 2.8876, + "loss_pixel": 0.3696, + "loss_text": 1.6319, + "ppl": 7.4001, + "step": 3267 + }, + { + "epoch": 0.03, + "global_step": 3268, + "learning_rate": 0.000487195325542571, + "loss": 1.9944, + "loss_base2": 2.8773, + "loss_pixel": 0.3687, + "loss_text": 1.6257, + "ppl": 7.3478, + "step": 3268 + }, + { + "epoch": 0.03, + "global_step": 3269, + "learning_rate": 0.00048719115191986644, + "loss": 1.9975, + "loss_base2": 2.8818, + "loss_pixel": 0.3689, + "loss_text": 1.6285, + "ppl": 7.3706, + "step": 3269 + }, + { + "epoch": 0.03, + "global_step": 3270, + "learning_rate": 0.00048718697829716194, + "loss": 2.0082, + "loss_base2": 2.8972, + "loss_pixel": 0.3689, + "loss_text": 1.6393, + "ppl": 7.4499, + "step": 3270 + }, + { + "epoch": 0.03, + "global_step": 3271, + "learning_rate": 0.0004871828046744574, + "loss": 1.9885, + "loss_base2": 2.8688, + "loss_pixel": 0.3685, + "loss_text": 1.62, + "ppl": 7.3046, + "step": 3271 + }, + { + "epoch": 0.03, + "global_step": 3272, + "learning_rate": 0.0004871786310517529, + "loss": 2.0089, + "loss_base2": 2.8982, + "loss_pixel": 0.3685, + "loss_text": 1.6404, + "ppl": 7.4551, + "step": 3272 + }, + { + "epoch": 0.03, + "global_step": 3273, + "learning_rate": 0.0004871744574290484, + "loss": 1.9824, + "loss_base2": 2.86, + "loss_pixel": 0.368, + "loss_text": 1.6144, + "ppl": 7.2601, + "step": 3273 + }, + { + "epoch": 0.03, + "global_step": 3274, + "learning_rate": 0.0004871702838063439, + "loss": 1.9927, + "loss_base2": 2.8749, + "loss_pixel": 0.3676, + "loss_text": 1.6251, + "ppl": 7.3353, + "step": 3274 + }, + { + "epoch": 0.03, + "global_step": 3275, + "learning_rate": 0.0004871661101836394, + "loss": 1.9976, + "loss_base2": 2.8819, + "loss_pixel": 0.367, + "loss_text": 1.6306, + "ppl": 7.3713, + "step": 3275 + }, + { + "epoch": 0.03, + "global_step": 3276, + "learning_rate": 0.0004871619365609349, + "loss": 1.9816, + "loss_base2": 2.8588, + "loss_pixel": 0.3666, + "loss_text": 1.615, + "ppl": 7.2543, + "step": 3276 + }, + { + "epoch": 0.03, + "global_step": 3277, + "learning_rate": 0.0004871577629382304, + "loss": 2.0016, + "loss_base2": 2.8877, + "loss_pixel": 0.3662, + "loss_text": 1.6354, + "ppl": 7.4009, + "step": 3277 + }, + { + "epoch": 0.03, + "global_step": 3278, + "learning_rate": 0.0004871535893155259, + "loss": 1.9784, + "loss_base2": 2.8542, + "loss_pixel": 0.3658, + "loss_text": 1.6126, + "ppl": 7.2312, + "step": 3278 + }, + { + "epoch": 0.03, + "global_step": 3279, + "learning_rate": 0.0004871494156928214, + "loss": 1.9742, + "loss_base2": 2.8482, + "loss_pixel": 0.3659, + "loss_text": 1.6082, + "ppl": 7.2009, + "step": 3279 + }, + { + "epoch": 0.03, + "global_step": 3280, + "learning_rate": 0.00048714524207011685, + "loss": 1.9719, + "loss_base2": 2.8449, + "loss_pixel": 0.3652, + "loss_text": 1.6067, + "ppl": 7.1843, + "step": 3280 + }, + { + "epoch": 0.03, + "global_step": 3281, + "learning_rate": 0.00048714106844741236, + "loss": 1.9907, + "loss_base2": 2.872, + "loss_pixel": 0.3644, + "loss_text": 1.6263, + "ppl": 7.3207, + "step": 3281 + }, + { + "epoch": 0.03, + "global_step": 3282, + "learning_rate": 0.00048713689482470787, + "loss": 1.9821, + "loss_base2": 2.8596, + "loss_pixel": 0.3642, + "loss_text": 1.6179, + "ppl": 7.258, + "step": 3282 + }, + { + "epoch": 0.03, + "global_step": 3283, + "learning_rate": 0.0004871327212020034, + "loss": 1.9861, + "loss_base2": 2.8653, + "loss_pixel": 0.368, + "loss_text": 1.6181, + "ppl": 7.2871, + "step": 3283 + }, + { + "epoch": 0.03, + "global_step": 3284, + "learning_rate": 0.0004871285475792989, + "loss": 1.9823, + "loss_base2": 2.8599, + "loss_pixel": 0.3653, + "loss_text": 1.617, + "ppl": 7.2594, + "step": 3284 + }, + { + "epoch": 0.03, + "global_step": 3285, + "learning_rate": 0.00048712437395659434, + "loss": 1.9726, + "loss_base2": 2.8459, + "loss_pixel": 0.3644, + "loss_text": 1.6082, + "ppl": 7.1893, + "step": 3285 + }, + { + "epoch": 0.03, + "global_step": 3286, + "learning_rate": 0.00048712020033388984, + "loss": 1.9864, + "loss_base2": 2.8658, + "loss_pixel": 0.3642, + "loss_text": 1.6222, + "ppl": 7.2892, + "step": 3286 + }, + { + "epoch": 0.03, + "global_step": 3287, + "learning_rate": 0.0004871160267111853, + "loss": 1.9771, + "loss_base2": 2.8524, + "loss_pixel": 0.3647, + "loss_text": 1.6124, + "ppl": 7.2218, + "step": 3287 + }, + { + "epoch": 0.03, + "global_step": 3288, + "learning_rate": 0.0004871118530884808, + "loss": 1.9682, + "loss_base2": 2.8395, + "loss_pixel": 0.3634, + "loss_text": 1.6047, + "ppl": 7.1578, + "step": 3288 + }, + { + "epoch": 0.03, + "global_step": 3289, + "learning_rate": 0.00048710767946577626, + "loss": 1.9849, + "loss_base2": 2.8636, + "loss_pixel": 0.362, + "loss_text": 1.6229, + "ppl": 7.2783, + "step": 3289 + }, + { + "epoch": 0.03, + "global_step": 3290, + "learning_rate": 0.00048710350584307176, + "loss": 1.9873, + "loss_base2": 2.8671, + "loss_pixel": 0.3637, + "loss_text": 1.6235, + "ppl": 7.2958, + "step": 3290 + }, + { + "epoch": 0.03, + "global_step": 3291, + "learning_rate": 0.00048709933222036727, + "loss": 1.9882, + "loss_base2": 2.8684, + "loss_pixel": 0.3667, + "loss_text": 1.6216, + "ppl": 7.3024, + "step": 3291 + }, + { + "epoch": 0.03, + "global_step": 3292, + "learning_rate": 0.0004870951585976628, + "loss": 1.9678, + "loss_base2": 2.8389, + "loss_pixel": 0.3626, + "loss_text": 1.6053, + "ppl": 7.1549, + "step": 3292 + }, + { + "epoch": 0.03, + "global_step": 3293, + "learning_rate": 0.0004870909849749583, + "loss": 1.9671, + "loss_base2": 2.8379, + "loss_pixel": 0.3636, + "loss_text": 1.6035, + "ppl": 7.1499, + "step": 3293 + }, + { + "epoch": 0.03, + "global_step": 3294, + "learning_rate": 0.00048708681135225374, + "loss": 1.9912, + "loss_base2": 2.8727, + "loss_pixel": 0.365, + "loss_text": 1.6262, + "ppl": 7.3243, + "step": 3294 + }, + { + "epoch": 0.03, + "global_step": 3295, + "learning_rate": 0.00048708263772954925, + "loss": 1.9883, + "loss_base2": 2.8685, + "loss_pixel": 0.3645, + "loss_text": 1.6238, + "ppl": 7.3031, + "step": 3295 + }, + { + "epoch": 0.03, + "global_step": 3296, + "learning_rate": 0.00048707846410684475, + "loss": 2.0026, + "loss_base2": 2.8891, + "loss_pixel": 0.3637, + "loss_text": 1.6389, + "ppl": 7.4083, + "step": 3296 + }, + { + "epoch": 0.03, + "global_step": 3297, + "learning_rate": 0.00048707429048414026, + "loss": 1.9882, + "loss_base2": 2.8684, + "loss_pixel": 0.3635, + "loss_text": 1.6248, + "ppl": 7.3024, + "step": 3297 + }, + { + "epoch": 0.03, + "global_step": 3298, + "learning_rate": 0.00048707011686143577, + "loss": 1.9673, + "loss_base2": 2.8382, + "loss_pixel": 0.3628, + "loss_text": 1.6044, + "ppl": 7.1513, + "step": 3298 + }, + { + "epoch": 0.03, + "global_step": 3299, + "learning_rate": 0.0004870659432387312, + "loss": 1.9682, + "loss_base2": 2.8395, + "loss_pixel": 0.3619, + "loss_text": 1.6064, + "ppl": 7.1578, + "step": 3299 + }, + { + "epoch": 0.03, + "global_step": 3300, + "learning_rate": 0.00048706176961602673, + "loss": 1.9889, + "loss_base2": 2.8694, + "loss_pixel": 0.3612, + "loss_text": 1.6277, + "ppl": 7.3075, + "step": 3300 + }, + { + "epoch": 0.03, + "global_step": 3301, + "learning_rate": 0.00048705759599332224, + "loss": 1.966, + "loss_base2": 2.8363, + "loss_pixel": 0.3601, + "loss_text": 1.6059, + "ppl": 7.1421, + "step": 3301 + }, + { + "epoch": 0.03, + "global_step": 3302, + "learning_rate": 0.00048705342237061774, + "loss": 1.9755, + "loss_base2": 2.85, + "loss_pixel": 0.3592, + "loss_text": 1.6164, + "ppl": 7.2102, + "step": 3302 + }, + { + "epoch": 0.03, + "global_step": 3303, + "learning_rate": 0.0004870492487479132, + "loss": 1.9764, + "loss_base2": 2.8513, + "loss_pixel": 0.3584, + "loss_text": 1.618, + "ppl": 7.2167, + "step": 3303 + }, + { + "epoch": 0.03, + "global_step": 3304, + "learning_rate": 0.0004870450751252087, + "loss": 1.9565, + "loss_base2": 2.8226, + "loss_pixel": 0.3582, + "loss_text": 1.5983, + "ppl": 7.0745, + "step": 3304 + }, + { + "epoch": 0.03, + "global_step": 3305, + "learning_rate": 0.0004870409015025042, + "loss": 1.9643, + "loss_base2": 2.8339, + "loss_pixel": 0.3586, + "loss_text": 1.6057, + "ppl": 7.1299, + "step": 3305 + }, + { + "epoch": 0.03, + "global_step": 3306, + "learning_rate": 0.00048703672787979966, + "loss": 1.9646, + "loss_base2": 2.8343, + "loss_pixel": 0.3577, + "loss_text": 1.6068, + "ppl": 7.1321, + "step": 3306 + }, + { + "epoch": 0.03, + "global_step": 3307, + "learning_rate": 0.00048703255425709517, + "loss": 1.994, + "loss_base2": 2.8767, + "loss_pixel": 0.3595, + "loss_text": 1.6345, + "ppl": 7.3449, + "step": 3307 + }, + { + "epoch": 0.03, + "global_step": 3308, + "learning_rate": 0.0004870283806343906, + "loss": 1.9853, + "loss_base2": 2.8642, + "loss_pixel": 0.3572, + "loss_text": 1.6281, + "ppl": 7.2812, + "step": 3308 + }, + { + "epoch": 0.03, + "global_step": 3309, + "learning_rate": 0.00048702420701168613, + "loss": 1.9833, + "loss_base2": 2.8613, + "loss_pixel": 0.3562, + "loss_text": 1.6271, + "ppl": 7.2667, + "step": 3309 + }, + { + "epoch": 0.03, + "global_step": 3310, + "learning_rate": 0.00048702003338898164, + "loss": 1.9849, + "loss_base2": 2.8636, + "loss_pixel": 0.3566, + "loss_text": 1.6283, + "ppl": 7.2783, + "step": 3310 + }, + { + "epoch": 0.03, + "global_step": 3311, + "learning_rate": 0.00048701585976627715, + "loss": 1.9739, + "loss_base2": 2.8477, + "loss_pixel": 0.354, + "loss_text": 1.6199, + "ppl": 7.1987, + "step": 3311 + }, + { + "epoch": 0.03, + "global_step": 3312, + "learning_rate": 0.0004870116861435726, + "loss": 1.9649, + "loss_base2": 2.8348, + "loss_pixel": 0.3544, + "loss_text": 1.6105, + "ppl": 7.1342, + "step": 3312 + }, + { + "epoch": 0.03, + "global_step": 3313, + "learning_rate": 0.0004870075125208681, + "loss": 1.7458, + "loss_base2": 2.5187, + "loss_pixel": 0.3531, + "loss_text": 1.3928, + "ppl": 5.7305, + "step": 3313 + }, + { + "epoch": 0.03, + "global_step": 3314, + "learning_rate": 0.0004870033388981636, + "loss": 1.7234, + "loss_base2": 2.4863, + "loss_pixel": 0.3523, + "loss_text": 1.3711, + "ppl": 5.6035, + "step": 3314 + }, + { + "epoch": 0.03, + "global_step": 3315, + "learning_rate": 0.0004869991652754591, + "loss": 1.7264, + "loss_base2": 2.4907, + "loss_pixel": 0.3516, + "loss_text": 1.3747, + "ppl": 5.6204, + "step": 3315 + }, + { + "epoch": 0.03, + "global_step": 3316, + "learning_rate": 0.00048699499165275463, + "loss": 1.7492, + "loss_base2": 2.5236, + "loss_pixel": 0.3519, + "loss_text": 1.3973, + "ppl": 5.75, + "step": 3316 + }, + { + "epoch": 0.03, + "global_step": 3317, + "learning_rate": 0.0004869908180300501, + "loss": 1.7512, + "loss_base2": 2.5264, + "loss_pixel": 0.3578, + "loss_text": 1.3934, + "ppl": 5.7615, + "step": 3317 + }, + { + "epoch": 0.03, + "global_step": 3318, + "learning_rate": 0.0004869866444073456, + "loss": 1.7394, + "loss_base2": 2.5094, + "loss_pixel": 0.355, + "loss_text": 1.3844, + "ppl": 5.6939, + "step": 3318 + }, + { + "epoch": 0.03, + "global_step": 3319, + "learning_rate": 0.0004869824707846411, + "loss": 1.7409, + "loss_base2": 2.5116, + "loss_pixel": 0.3602, + "loss_text": 1.3807, + "ppl": 5.7025, + "step": 3319 + }, + { + "epoch": 0.03, + "global_step": 3320, + "learning_rate": 0.0004869782971619366, + "loss": 1.7499, + "loss_base2": 2.5246, + "loss_pixel": 0.3562, + "loss_text": 1.3937, + "ppl": 5.754, + "step": 3320 + }, + { + "epoch": 0.03, + "global_step": 3321, + "learning_rate": 0.00048697412353923206, + "loss": 1.8008, + "loss_base2": 2.598, + "loss_pixel": 0.3593, + "loss_text": 1.4415, + "ppl": 6.0545, + "step": 3321 + }, + { + "epoch": 0.03, + "global_step": 3322, + "learning_rate": 0.00048696994991652756, + "loss": 2.0056, + "loss_base2": 2.8935, + "loss_pixel": 0.353, + "loss_text": 1.6527, + "ppl": 7.4306, + "step": 3322 + }, + { + "epoch": 0.03, + "global_step": 3323, + "learning_rate": 0.00048696577629382307, + "loss": 2.0036, + "loss_base2": 2.8906, + "loss_pixel": 0.362, + "loss_text": 1.6416, + "ppl": 7.4157, + "step": 3323 + }, + { + "epoch": 0.03, + "global_step": 3324, + "learning_rate": 0.0004869616026711186, + "loss": 1.9993, + "loss_base2": 2.8844, + "loss_pixel": 0.3619, + "loss_text": 1.6374, + "ppl": 7.3839, + "step": 3324 + }, + { + "epoch": 0.03, + "global_step": 3325, + "learning_rate": 0.00048695742904841403, + "loss": 1.9975, + "loss_base2": 2.8818, + "loss_pixel": 0.3561, + "loss_text": 1.6414, + "ppl": 7.3706, + "step": 3325 + }, + { + "epoch": 0.03, + "global_step": 3326, + "learning_rate": 0.0004869532554257095, + "loss": 1.9802, + "loss_base2": 2.8568, + "loss_pixel": 0.3559, + "loss_text": 1.6244, + "ppl": 7.2442, + "step": 3326 + }, + { + "epoch": 0.03, + "global_step": 3327, + "learning_rate": 0.000486949081803005, + "loss": 1.9633, + "loss_base2": 2.8324, + "loss_pixel": 0.3501, + "loss_text": 1.6131, + "ppl": 7.1228, + "step": 3327 + }, + { + "epoch": 0.03, + "global_step": 3328, + "learning_rate": 0.0004869449081803005, + "loss": 1.9953, + "loss_base2": 2.8786, + "loss_pixel": 0.3499, + "loss_text": 1.6454, + "ppl": 7.3544, + "step": 3328 + }, + { + "epoch": 0.03, + "global_step": 3329, + "learning_rate": 0.000486940734557596, + "loss": 1.986, + "loss_base2": 2.8652, + "loss_pixel": 0.3496, + "loss_text": 1.6364, + "ppl": 7.2863, + "step": 3329 + }, + { + "epoch": 0.03, + "global_step": 3330, + "learning_rate": 0.00048693656093489146, + "loss": 1.9801, + "loss_base2": 2.8567, + "loss_pixel": 0.3491, + "loss_text": 1.6311, + "ppl": 7.2435, + "step": 3330 + }, + { + "epoch": 0.03, + "global_step": 3331, + "learning_rate": 0.00048693238731218697, + "loss": 1.9787, + "loss_base2": 2.8547, + "loss_pixel": 0.3478, + "loss_text": 1.6309, + "ppl": 7.2333, + "step": 3331 + }, + { + "epoch": 0.03, + "global_step": 3332, + "learning_rate": 0.0004869282136894825, + "loss": 1.9622, + "loss_base2": 2.8309, + "loss_pixel": 0.348, + "loss_text": 1.6141, + "ppl": 7.115, + "step": 3332 + }, + { + "epoch": 0.03, + "global_step": 3333, + "learning_rate": 0.000486924040066778, + "loss": 1.9746, + "loss_base2": 2.8487, + "loss_pixel": 0.3463, + "loss_text": 1.6284, + "ppl": 7.2037, + "step": 3333 + }, + { + "epoch": 0.03, + "global_step": 3334, + "learning_rate": 0.0004869198664440735, + "loss": 1.9767, + "loss_base2": 2.8518, + "loss_pixel": 0.3464, + "loss_text": 1.6303, + "ppl": 7.2189, + "step": 3334 + }, + { + "epoch": 0.03, + "global_step": 3335, + "learning_rate": 0.00048691569282136894, + "loss": 1.9792, + "loss_base2": 2.8554, + "loss_pixel": 0.3459, + "loss_text": 1.6333, + "ppl": 7.237, + "step": 3335 + }, + { + "epoch": 0.03, + "global_step": 3336, + "learning_rate": 0.00048691151919866445, + "loss": 1.962, + "loss_base2": 2.8306, + "loss_pixel": 0.3451, + "loss_text": 1.6169, + "ppl": 7.1135, + "step": 3336 + }, + { + "epoch": 0.03, + "global_step": 3337, + "learning_rate": 0.00048690734557595996, + "loss": 1.9736, + "loss_base2": 2.8473, + "loss_pixel": 0.3451, + "loss_text": 1.6285, + "ppl": 7.1965, + "step": 3337 + }, + { + "epoch": 0.03, + "global_step": 3338, + "learning_rate": 0.00048690317195325546, + "loss": 1.9604, + "loss_base2": 2.8283, + "loss_pixel": 0.3449, + "loss_text": 1.6155, + "ppl": 7.1022, + "step": 3338 + }, + { + "epoch": 0.03, + "global_step": 3339, + "learning_rate": 0.0004868989983305509, + "loss": 1.9516, + "loss_base2": 2.8156, + "loss_pixel": 0.343, + "loss_text": 1.6087, + "ppl": 7.0399, + "step": 3339 + }, + { + "epoch": 0.03, + "global_step": 3340, + "learning_rate": 0.0004868948247078464, + "loss": 1.9395, + "loss_base2": 2.7981, + "loss_pixel": 0.3433, + "loss_text": 1.5961, + "ppl": 6.9553, + "step": 3340 + }, + { + "epoch": 0.03, + "global_step": 3341, + "learning_rate": 0.00048689065108514193, + "loss": 1.9598, + "loss_base2": 2.8274, + "loss_pixel": 0.3423, + "loss_text": 1.6175, + "ppl": 7.0979, + "step": 3341 + }, + { + "epoch": 0.03, + "global_step": 3342, + "learning_rate": 0.00048688647746243744, + "loss": 1.939, + "loss_base2": 2.7974, + "loss_pixel": 0.3424, + "loss_text": 1.5966, + "ppl": 6.9518, + "step": 3342 + }, + { + "epoch": 0.03, + "global_step": 3343, + "learning_rate": 0.00048688230383973295, + "loss": 1.9695, + "loss_base2": 2.8414, + "loss_pixel": 0.341, + "loss_text": 1.6285, + "ppl": 7.1671, + "step": 3343 + }, + { + "epoch": 0.03, + "global_step": 3344, + "learning_rate": 0.00048687813021702835, + "loss": 1.9546, + "loss_base2": 2.8199, + "loss_pixel": 0.3407, + "loss_text": 1.614, + "ppl": 7.0611, + "step": 3344 + }, + { + "epoch": 0.03, + "global_step": 3345, + "learning_rate": 0.00048687395659432385, + "loss": 1.9589, + "loss_base2": 2.8261, + "loss_pixel": 0.3395, + "loss_text": 1.6194, + "ppl": 7.0915, + "step": 3345 + }, + { + "epoch": 0.03, + "global_step": 3346, + "learning_rate": 0.00048686978297161936, + "loss": 1.7215, + "loss_base2": 2.4836, + "loss_pixel": 0.3408, + "loss_text": 1.3807, + "ppl": 5.5929, + "step": 3346 + }, + { + "epoch": 0.03, + "global_step": 3347, + "learning_rate": 0.00048686560934891487, + "loss": 1.7266, + "loss_base2": 2.491, + "loss_pixel": 0.3394, + "loss_text": 1.3872, + "ppl": 5.6215, + "step": 3347 + }, + { + "epoch": 0.03, + "global_step": 3348, + "learning_rate": 0.0004868614357262103, + "loss": 1.7189, + "loss_base2": 2.4798, + "loss_pixel": 0.3384, + "loss_text": 1.3805, + "ppl": 5.5784, + "step": 3348 + }, + { + "epoch": 0.03, + "global_step": 3349, + "learning_rate": 0.00048685726210350583, + "loss": 1.7208, + "loss_base2": 2.4826, + "loss_pixel": 0.338, + "loss_text": 1.3828, + "ppl": 5.589, + "step": 3349 + }, + { + "epoch": 0.03, + "global_step": 3350, + "learning_rate": 0.00048685308848080134, + "loss": 1.7332, + "loss_base2": 2.5005, + "loss_pixel": 0.3374, + "loss_text": 1.3957, + "ppl": 5.6587, + "step": 3350 + }, + { + "epoch": 0.03, + "global_step": 3351, + "learning_rate": 0.00048684891485809684, + "loss": 1.7048, + "loss_base2": 2.4595, + "loss_pixel": 0.336, + "loss_text": 1.3688, + "ppl": 5.5003, + "step": 3351 + }, + { + "epoch": 0.03, + "global_step": 3352, + "learning_rate": 0.00048684474123539235, + "loss": 1.7163, + "loss_base2": 2.4761, + "loss_pixel": 0.3379, + "loss_text": 1.3784, + "ppl": 5.5639, + "step": 3352 + }, + { + "epoch": 0.03, + "global_step": 3353, + "learning_rate": 0.0004868405676126878, + "loss": 1.7571, + "loss_base2": 2.535, + "loss_pixel": 0.3602, + "loss_text": 1.3969, + "ppl": 5.7956, + "step": 3353 + }, + { + "epoch": 0.03, + "global_step": 3354, + "learning_rate": 0.0004868363939899833, + "loss": 1.729, + "loss_base2": 2.4944, + "loss_pixel": 0.3569, + "loss_text": 1.3721, + "ppl": 5.635, + "step": 3354 + }, + { + "epoch": 0.03, + "global_step": 3355, + "learning_rate": 0.0004868322203672788, + "loss": 1.718, + "loss_base2": 2.4786, + "loss_pixel": 0.3507, + "loss_text": 1.3673, + "ppl": 5.5734, + "step": 3355 + }, + { + "epoch": 0.03, + "global_step": 3356, + "learning_rate": 0.0004868280467445743, + "loss": 1.7337, + "loss_base2": 2.5012, + "loss_pixel": 0.3465, + "loss_text": 1.3872, + "ppl": 5.6616, + "step": 3356 + }, + { + "epoch": 0.03, + "global_step": 3357, + "learning_rate": 0.00048682387312186983, + "loss": 1.7324, + "loss_base2": 2.4993, + "loss_pixel": 0.3448, + "loss_text": 1.3875, + "ppl": 5.6542, + "step": 3357 + }, + { + "epoch": 0.03, + "global_step": 3358, + "learning_rate": 0.0004868196994991653, + "loss": 1.7131, + "loss_base2": 2.4715, + "loss_pixel": 0.3417, + "loss_text": 1.3713, + "ppl": 5.5461, + "step": 3358 + }, + { + "epoch": 0.03, + "global_step": 3359, + "learning_rate": 0.0004868155258764608, + "loss": 1.7143, + "loss_base2": 2.4732, + "loss_pixel": 0.3411, + "loss_text": 1.3732, + "ppl": 5.5528, + "step": 3359 + }, + { + "epoch": 0.03, + "global_step": 3360, + "learning_rate": 0.0004868113522537563, + "loss": 1.7037, + "loss_base2": 2.4579, + "loss_pixel": 0.3412, + "loss_text": 1.3625, + "ppl": 5.4942, + "step": 3360 + }, + { + "epoch": 0.03, + "global_step": 3361, + "learning_rate": 0.0004868071786310518, + "loss": 1.7174, + "loss_base2": 2.4777, + "loss_pixel": 0.3389, + "loss_text": 1.3785, + "ppl": 5.57, + "step": 3361 + }, + { + "epoch": 0.03, + "global_step": 3362, + "learning_rate": 0.0004868030050083472, + "loss": 1.9038, + "loss_base2": 2.7466, + "loss_pixel": 0.3388, + "loss_text": 1.565, + "ppl": 6.7113, + "step": 3362 + }, + { + "epoch": 0.03, + "global_step": 3363, + "learning_rate": 0.0004867988313856427, + "loss": 1.9703, + "loss_base2": 2.8425, + "loss_pixel": 0.3373, + "loss_text": 1.633, + "ppl": 7.1728, + "step": 3363 + }, + { + "epoch": 0.03, + "global_step": 3364, + "learning_rate": 0.0004867946577629382, + "loss": 1.9657, + "loss_base2": 2.8359, + "loss_pixel": 0.3369, + "loss_text": 1.6288, + "ppl": 7.1399, + "step": 3364 + }, + { + "epoch": 0.03, + "global_step": 3365, + "learning_rate": 0.00048679048414023373, + "loss": 1.9627, + "loss_base2": 2.8316, + "loss_pixel": 0.3353, + "loss_text": 1.6274, + "ppl": 7.1185, + "step": 3365 + }, + { + "epoch": 0.03, + "global_step": 3366, + "learning_rate": 0.00048678631051752924, + "loss": 1.9643, + "loss_base2": 2.8339, + "loss_pixel": 0.335, + "loss_text": 1.6294, + "ppl": 7.1299, + "step": 3366 + }, + { + "epoch": 0.03, + "global_step": 3367, + "learning_rate": 0.0004867821368948247, + "loss": 1.975, + "loss_base2": 2.8493, + "loss_pixel": 0.337, + "loss_text": 1.638, + "ppl": 7.2066, + "step": 3367 + }, + { + "epoch": 0.03, + "global_step": 3368, + "learning_rate": 0.0004867779632721202, + "loss": 1.9719, + "loss_base2": 2.8449, + "loss_pixel": 0.3525, + "loss_text": 1.6195, + "ppl": 7.1843, + "step": 3368 + }, + { + "epoch": 0.03, + "global_step": 3369, + "learning_rate": 0.0004867737896494157, + "loss": 1.9798, + "loss_base2": 2.8562, + "loss_pixel": 0.3587, + "loss_text": 1.621, + "ppl": 7.2413, + "step": 3369 + }, + { + "epoch": 0.03, + "global_step": 3370, + "learning_rate": 0.0004867696160267112, + "loss": 1.9907, + "loss_base2": 2.872, + "loss_pixel": 0.3566, + "loss_text": 1.6341, + "ppl": 7.3207, + "step": 3370 + }, + { + "epoch": 0.03, + "global_step": 3371, + "learning_rate": 0.00048676544240400666, + "loss": 1.9824, + "loss_base2": 2.86, + "loss_pixel": 0.3563, + "loss_text": 1.6262, + "ppl": 7.2601, + "step": 3371 + }, + { + "epoch": 0.03, + "global_step": 3372, + "learning_rate": 0.00048676126878130217, + "loss": 1.984, + "loss_base2": 2.8623, + "loss_pixel": 0.3574, + "loss_text": 1.6265, + "ppl": 7.2718, + "step": 3372 + }, + { + "epoch": 0.03, + "global_step": 3373, + "learning_rate": 0.0004867570951585977, + "loss": 1.9703, + "loss_base2": 2.8425, + "loss_pixel": 0.3495, + "loss_text": 1.6208, + "ppl": 7.1728, + "step": 3373 + }, + { + "epoch": 0.03, + "global_step": 3374, + "learning_rate": 0.0004867529215358932, + "loss": 1.977, + "loss_base2": 2.8522, + "loss_pixel": 0.3516, + "loss_text": 1.6254, + "ppl": 7.221, + "step": 3374 + }, + { + "epoch": 0.03, + "global_step": 3375, + "learning_rate": 0.0004867487479131887, + "loss": 1.9719, + "loss_base2": 2.8449, + "loss_pixel": 0.3464, + "loss_text": 1.6254, + "ppl": 7.1843, + "step": 3375 + }, + { + "epoch": 0.03, + "global_step": 3376, + "learning_rate": 0.00048674457429048415, + "loss": 1.9665, + "loss_base2": 2.8371, + "loss_pixel": 0.3444, + "loss_text": 1.6221, + "ppl": 7.1456, + "step": 3376 + }, + { + "epoch": 0.03, + "global_step": 3377, + "learning_rate": 0.00048674040066777965, + "loss": 1.9664, + "loss_base2": 2.8369, + "loss_pixel": 0.3435, + "loss_text": 1.623, + "ppl": 7.1449, + "step": 3377 + }, + { + "epoch": 0.03, + "global_step": 3378, + "learning_rate": 0.00048673622704507516, + "loss": 1.9616, + "loss_base2": 2.83, + "loss_pixel": 0.3414, + "loss_text": 1.6201, + "ppl": 7.1107, + "step": 3378 + }, + { + "epoch": 0.03, + "global_step": 3379, + "learning_rate": 0.00048673205342237067, + "loss": 1.9716, + "loss_base2": 2.8444, + "loss_pixel": 0.3398, + "loss_text": 1.6318, + "ppl": 7.1822, + "step": 3379 + }, + { + "epoch": 0.03, + "global_step": 3380, + "learning_rate": 0.0004867278797996661, + "loss": 1.9719, + "loss_base2": 2.8449, + "loss_pixel": 0.3398, + "loss_text": 1.6321, + "ppl": 7.1843, + "step": 3380 + }, + { + "epoch": 0.03, + "global_step": 3381, + "learning_rate": 0.0004867237061769616, + "loss": 1.9513, + "loss_base2": 2.8151, + "loss_pixel": 0.3379, + "loss_text": 1.6134, + "ppl": 7.0378, + "step": 3381 + }, + { + "epoch": 0.03, + "global_step": 3382, + "learning_rate": 0.0004867195325542571, + "loss": 1.9532, + "loss_base2": 2.8179, + "loss_pixel": 0.3363, + "loss_text": 1.6168, + "ppl": 7.0512, + "step": 3382 + }, + { + "epoch": 0.03, + "global_step": 3383, + "learning_rate": 0.0004867153589315526, + "loss": 1.9407, + "loss_base2": 2.7998, + "loss_pixel": 0.3359, + "loss_text": 1.6049, + "ppl": 6.9636, + "step": 3383 + }, + { + "epoch": 0.03, + "global_step": 3384, + "learning_rate": 0.0004867111853088481, + "loss": 1.9548, + "loss_base2": 2.8202, + "loss_pixel": 0.3341, + "loss_text": 1.6207, + "ppl": 7.0625, + "step": 3384 + }, + { + "epoch": 0.03, + "global_step": 3385, + "learning_rate": 0.00048670701168614355, + "loss": 1.9594, + "loss_base2": 2.8268, + "loss_pixel": 0.3331, + "loss_text": 1.6263, + "ppl": 7.0951, + "step": 3385 + }, + { + "epoch": 0.03, + "global_step": 3386, + "learning_rate": 0.00048670283806343906, + "loss": 1.9512, + "loss_base2": 2.815, + "loss_pixel": 0.3321, + "loss_text": 1.6191, + "ppl": 7.0371, + "step": 3386 + }, + { + "epoch": 0.03, + "global_step": 3387, + "learning_rate": 0.00048669866444073456, + "loss": 1.9571, + "loss_base2": 2.8235, + "loss_pixel": 0.3325, + "loss_text": 1.6246, + "ppl": 7.0788, + "step": 3387 + }, + { + "epoch": 0.03, + "global_step": 3388, + "learning_rate": 0.00048669449081803007, + "loss": 1.9589, + "loss_base2": 2.8261, + "loss_pixel": 0.3303, + "loss_text": 1.6286, + "ppl": 7.0915, + "step": 3388 + }, + { + "epoch": 0.03, + "global_step": 3389, + "learning_rate": 0.0004866903171953255, + "loss": 1.9448, + "loss_base2": 2.8058, + "loss_pixel": 0.3297, + "loss_text": 1.6151, + "ppl": 6.9922, + "step": 3389 + }, + { + "epoch": 0.03, + "global_step": 3390, + "learning_rate": 0.00048668614357262103, + "loss": 1.9342, + "loss_base2": 2.7905, + "loss_pixel": 0.3299, + "loss_text": 1.6044, + "ppl": 6.9185, + "step": 3390 + }, + { + "epoch": 0.03, + "global_step": 3391, + "learning_rate": 0.00048668196994991654, + "loss": 1.9481, + "loss_base2": 2.8105, + "loss_pixel": 0.3295, + "loss_text": 1.6185, + "ppl": 7.0153, + "step": 3391 + }, + { + "epoch": 0.03, + "global_step": 3392, + "learning_rate": 0.00048667779632721205, + "loss": 1.9446, + "loss_base2": 2.8055, + "loss_pixel": 0.3308, + "loss_text": 1.6138, + "ppl": 6.9908, + "step": 3392 + }, + { + "epoch": 0.03, + "global_step": 3393, + "learning_rate": 0.00048667362270450755, + "loss": 1.9211, + "loss_base2": 2.7716, + "loss_pixel": 0.332, + "loss_text": 1.5891, + "ppl": 6.8285, + "step": 3393 + }, + { + "epoch": 0.03, + "global_step": 3394, + "learning_rate": 0.000486669449081803, + "loss": 1.9312, + "loss_base2": 2.7861, + "loss_pixel": 0.3302, + "loss_text": 1.601, + "ppl": 6.8978, + "step": 3394 + }, + { + "epoch": 0.03, + "global_step": 3395, + "learning_rate": 0.0004866652754590985, + "loss": 1.9234, + "loss_base2": 2.7749, + "loss_pixel": 0.3286, + "loss_text": 1.5948, + "ppl": 6.8442, + "step": 3395 + }, + { + "epoch": 0.03, + "global_step": 3396, + "learning_rate": 0.000486661101836394, + "loss": 1.9395, + "loss_base2": 2.7981, + "loss_pixel": 0.329, + "loss_text": 1.6105, + "ppl": 6.9553, + "step": 3396 + }, + { + "epoch": 0.03, + "global_step": 3397, + "learning_rate": 0.00048665692821368953, + "loss": 1.9364, + "loss_base2": 2.7936, + "loss_pixel": 0.3282, + "loss_text": 1.6082, + "ppl": 6.9337, + "step": 3397 + }, + { + "epoch": 0.03, + "global_step": 3398, + "learning_rate": 0.000486652754590985, + "loss": 1.9298, + "loss_base2": 2.7841, + "loss_pixel": 0.3258, + "loss_text": 1.604, + "ppl": 6.8881, + "step": 3398 + }, + { + "epoch": 0.03, + "global_step": 3399, + "learning_rate": 0.0004866485809682805, + "loss": 1.9577, + "loss_base2": 2.8244, + "loss_pixel": 0.3254, + "loss_text": 1.6323, + "ppl": 7.083, + "step": 3399 + }, + { + "epoch": 0.03, + "global_step": 3400, + "learning_rate": 0.00048664440734557594, + "loss": 1.9496, + "loss_base2": 2.8127, + "loss_pixel": 0.3251, + "loss_text": 1.6246, + "ppl": 7.0259, + "step": 3400 + }, + { + "epoch": 0.03, + "global_step": 3401, + "learning_rate": 0.00048664023372287145, + "loss": 1.9326, + "loss_base2": 2.7882, + "loss_pixel": 0.3252, + "loss_text": 1.6074, + "ppl": 6.9074, + "step": 3401 + }, + { + "epoch": 0.03, + "global_step": 3402, + "learning_rate": 0.00048663606010016696, + "loss": 1.9229, + "loss_base2": 2.7742, + "loss_pixel": 0.3243, + "loss_text": 1.5987, + "ppl": 6.8408, + "step": 3402 + }, + { + "epoch": 0.03, + "global_step": 3403, + "learning_rate": 0.0004866318864774624, + "loss": 1.9272, + "loss_base2": 2.7804, + "loss_pixel": 0.3221, + "loss_text": 1.6051, + "ppl": 6.8702, + "step": 3403 + }, + { + "epoch": 0.03, + "global_step": 3404, + "learning_rate": 0.0004866277128547579, + "loss": 1.9241, + "loss_base2": 2.7759, + "loss_pixel": 0.3233, + "loss_text": 1.6008, + "ppl": 6.849, + "step": 3404 + }, + { + "epoch": 0.03, + "global_step": 3405, + "learning_rate": 0.0004866235392320534, + "loss": 1.9262, + "loss_base2": 2.7789, + "loss_pixel": 0.3214, + "loss_text": 1.6047, + "ppl": 6.8634, + "step": 3405 + }, + { + "epoch": 0.03, + "global_step": 3406, + "learning_rate": 0.00048661936560934893, + "loss": 1.9088, + "loss_base2": 2.7538, + "loss_pixel": 0.3218, + "loss_text": 1.587, + "ppl": 6.745, + "step": 3406 + }, + { + "epoch": 0.03, + "global_step": 3407, + "learning_rate": 0.0004866151919866444, + "loss": 1.8375, + "loss_base2": 2.651, + "loss_pixel": 0.3203, + "loss_text": 1.5172, + "ppl": 6.2808, + "step": 3407 + }, + { + "epoch": 0.03, + "global_step": 3408, + "learning_rate": 0.0004866110183639399, + "loss": 1.7073, + "loss_base2": 2.4631, + "loss_pixel": 0.3202, + "loss_text": 1.3871, + "ppl": 5.5141, + "step": 3408 + }, + { + "epoch": 0.03, + "global_step": 3409, + "learning_rate": 0.0004866068447412354, + "loss": 1.6853, + "loss_base2": 2.4314, + "loss_pixel": 0.3187, + "loss_text": 1.3666, + "ppl": 5.3941, + "step": 3409 + }, + { + "epoch": 0.03, + "global_step": 3410, + "learning_rate": 0.0004866026711185309, + "loss": 1.7147, + "loss_base2": 2.4738, + "loss_pixel": 0.3183, + "loss_text": 1.3964, + "ppl": 5.555, + "step": 3410 + }, + { + "epoch": 0.03, + "global_step": 3411, + "learning_rate": 0.0004865984974958264, + "loss": 1.7098, + "loss_base2": 2.4667, + "loss_pixel": 0.3179, + "loss_text": 1.392, + "ppl": 5.5279, + "step": 3411 + }, + { + "epoch": 0.03, + "global_step": 3412, + "learning_rate": 0.00048659432387312187, + "loss": 1.7054, + "loss_base2": 2.4604, + "loss_pixel": 0.318, + "loss_text": 1.3874, + "ppl": 5.5036, + "step": 3412 + }, + { + "epoch": 0.03, + "global_step": 3413, + "learning_rate": 0.0004865901502504174, + "loss": 1.6893, + "loss_base2": 2.4371, + "loss_pixel": 0.3181, + "loss_text": 1.3713, + "ppl": 5.4157, + "step": 3413 + }, + { + "epoch": 0.03, + "global_step": 3414, + "learning_rate": 0.0004865859766277129, + "loss": 1.6999, + "loss_base2": 2.4524, + "loss_pixel": 0.3198, + "loss_text": 1.3801, + "ppl": 5.4734, + "step": 3414 + }, + { + "epoch": 0.03, + "global_step": 3415, + "learning_rate": 0.0004865818030050084, + "loss": 1.6947, + "loss_base2": 2.4449, + "loss_pixel": 0.3174, + "loss_text": 1.3773, + "ppl": 5.445, + "step": 3415 + }, + { + "epoch": 0.03, + "global_step": 3416, + "learning_rate": 0.0004865776293823039, + "loss": 1.8769, + "loss_base2": 2.7078, + "loss_pixel": 0.3185, + "loss_text": 1.5584, + "ppl": 6.5332, + "step": 3416 + }, + { + "epoch": 0.03, + "global_step": 3417, + "learning_rate": 0.00048657345575959935, + "loss": 1.9519, + "loss_base2": 2.816, + "loss_pixel": 0.3176, + "loss_text": 1.6343, + "ppl": 7.0421, + "step": 3417 + }, + { + "epoch": 0.03, + "global_step": 3418, + "learning_rate": 0.00048656928213689486, + "loss": 1.9674, + "loss_base2": 2.8384, + "loss_pixel": 0.3176, + "loss_text": 1.6497, + "ppl": 7.1521, + "step": 3418 + }, + { + "epoch": 0.03, + "global_step": 3419, + "learning_rate": 0.0004865651085141903, + "loss": 1.9771, + "loss_base2": 2.8524, + "loss_pixel": 0.3287, + "loss_text": 1.6484, + "ppl": 7.2218, + "step": 3419 + }, + { + "epoch": 0.03, + "global_step": 3420, + "learning_rate": 0.0004865609348914858, + "loss": 1.957, + "loss_base2": 2.8234, + "loss_pixel": 0.3277, + "loss_text": 1.6293, + "ppl": 7.0781, + "step": 3420 + }, + { + "epoch": 0.03, + "global_step": 3421, + "learning_rate": 0.00048655676126878127, + "loss": 1.9521, + "loss_base2": 2.8163, + "loss_pixel": 0.3224, + "loss_text": 1.6297, + "ppl": 7.0435, + "step": 3421 + }, + { + "epoch": 0.03, + "global_step": 3422, + "learning_rate": 0.0004865525876460768, + "loss": 1.9593, + "loss_base2": 2.8267, + "loss_pixel": 0.3185, + "loss_text": 1.6407, + "ppl": 7.0944, + "step": 3422 + }, + { + "epoch": 0.03, + "global_step": 3423, + "learning_rate": 0.0004865484140233723, + "loss": 1.9429, + "loss_base2": 2.803, + "loss_pixel": 0.328, + "loss_text": 1.6149, + "ppl": 6.979, + "step": 3423 + }, + { + "epoch": 0.03, + "global_step": 3424, + "learning_rate": 0.0004865442404006678, + "loss": 1.9484, + "loss_base2": 2.8109, + "loss_pixel": 0.336, + "loss_text": 1.6124, + "ppl": 7.0175, + "step": 3424 + }, + { + "epoch": 0.03, + "global_step": 3425, + "learning_rate": 0.0004865400667779633, + "loss": 1.9491, + "loss_base2": 2.812, + "loss_pixel": 0.3314, + "loss_text": 1.6177, + "ppl": 7.0224, + "step": 3425 + }, + { + "epoch": 0.03, + "global_step": 3426, + "learning_rate": 0.00048653589315525875, + "loss": 1.9329, + "loss_base2": 2.7886, + "loss_pixel": 0.3275, + "loss_text": 1.6053, + "ppl": 6.9095, + "step": 3426 + }, + { + "epoch": 0.03, + "global_step": 3427, + "learning_rate": 0.00048653171953255426, + "loss": 1.9504, + "loss_base2": 2.8138, + "loss_pixel": 0.3278, + "loss_text": 1.6226, + "ppl": 7.0315, + "step": 3427 + }, + { + "epoch": 0.03, + "global_step": 3428, + "learning_rate": 0.00048652754590984977, + "loss": 1.945, + "loss_base2": 2.806, + "loss_pixel": 0.3224, + "loss_text": 1.6225, + "ppl": 6.9936, + "step": 3428 + }, + { + "epoch": 0.03, + "global_step": 3429, + "learning_rate": 0.0004865233722871453, + "loss": 1.9236, + "loss_base2": 2.7752, + "loss_pixel": 0.3192, + "loss_text": 1.6044, + "ppl": 6.8456, + "step": 3429 + }, + { + "epoch": 0.03, + "global_step": 3430, + "learning_rate": 0.00048651919866444073, + "loss": 1.9491, + "loss_base2": 2.812, + "loss_pixel": 0.3193, + "loss_text": 1.6298, + "ppl": 7.0224, + "step": 3430 + }, + { + "epoch": 0.03, + "global_step": 3431, + "learning_rate": 0.00048651502504173624, + "loss": 1.9427, + "loss_base2": 2.8027, + "loss_pixel": 0.3172, + "loss_text": 1.6255, + "ppl": 6.9776, + "step": 3431 + }, + { + "epoch": 0.03, + "global_step": 3432, + "learning_rate": 0.00048651085141903174, + "loss": 1.9162, + "loss_base2": 2.7645, + "loss_pixel": 0.3153, + "loss_text": 1.6009, + "ppl": 6.7951, + "step": 3432 + }, + { + "epoch": 0.03, + "global_step": 3433, + "learning_rate": 0.00048650667779632725, + "loss": 1.9245, + "loss_base2": 2.7765, + "loss_pixel": 0.3143, + "loss_text": 1.6102, + "ppl": 6.8517, + "step": 3433 + }, + { + "epoch": 0.03, + "global_step": 3434, + "learning_rate": 0.00048650250417362276, + "loss": 1.9258, + "loss_base2": 2.7783, + "loss_pixel": 0.3128, + "loss_text": 1.613, + "ppl": 6.8606, + "step": 3434 + }, + { + "epoch": 0.03, + "global_step": 3435, + "learning_rate": 0.0004864983305509182, + "loss": 1.9333, + "loss_base2": 2.7892, + "loss_pixel": 0.3125, + "loss_text": 1.6209, + "ppl": 6.9123, + "step": 3435 + }, + { + "epoch": 0.03, + "global_step": 3436, + "learning_rate": 0.0004864941569282137, + "loss": 1.9349, + "loss_base2": 2.7915, + "loss_pixel": 0.312, + "loss_text": 1.6229, + "ppl": 6.9234, + "step": 3436 + }, + { + "epoch": 0.03, + "global_step": 3437, + "learning_rate": 0.0004864899833055092, + "loss": 1.9059, + "loss_base2": 2.7496, + "loss_pixel": 0.3171, + "loss_text": 1.5887, + "ppl": 6.7255, + "step": 3437 + }, + { + "epoch": 0.03, + "global_step": 3438, + "learning_rate": 0.0004864858096828047, + "loss": 1.9209, + "loss_base2": 2.7713, + "loss_pixel": 0.3141, + "loss_text": 1.6067, + "ppl": 6.8271, + "step": 3438 + }, + { + "epoch": 0.03, + "global_step": 3439, + "learning_rate": 0.00048648163606010013, + "loss": 1.9298, + "loss_base2": 2.7841, + "loss_pixel": 0.313, + "loss_text": 1.6168, + "ppl": 6.8881, + "step": 3439 + }, + { + "epoch": 0.03, + "global_step": 3440, + "learning_rate": 0.00048647746243739564, + "loss": 1.9366, + "loss_base2": 2.7939, + "loss_pixel": 0.3102, + "loss_text": 1.6264, + "ppl": 6.9351, + "step": 3440 + }, + { + "epoch": 0.03, + "global_step": 3441, + "learning_rate": 0.00048647328881469115, + "loss": 1.9041, + "loss_base2": 2.747, + "loss_pixel": 0.3085, + "loss_text": 1.5956, + "ppl": 6.7134, + "step": 3441 + }, + { + "epoch": 0.03, + "global_step": 3442, + "learning_rate": 0.00048646911519198665, + "loss": 1.9197, + "loss_base2": 2.7695, + "loss_pixel": 0.3076, + "loss_text": 1.6121, + "ppl": 6.8189, + "step": 3442 + }, + { + "epoch": 0.03, + "global_step": 3443, + "learning_rate": 0.00048646494156928216, + "loss": 1.8961, + "loss_base2": 2.7355, + "loss_pixel": 0.3057, + "loss_text": 1.5904, + "ppl": 6.6599, + "step": 3443 + }, + { + "epoch": 0.03, + "global_step": 3444, + "learning_rate": 0.0004864607679465776, + "loss": 1.9035, + "loss_base2": 2.7462, + "loss_pixel": 0.3053, + "loss_text": 1.5982, + "ppl": 6.7093, + "step": 3444 + }, + { + "epoch": 0.03, + "global_step": 3445, + "learning_rate": 0.0004864565943238731, + "loss": 1.9066, + "loss_base2": 2.7506, + "loss_pixel": 0.304, + "loss_text": 1.6026, + "ppl": 6.7302, + "step": 3445 + }, + { + "epoch": 0.03, + "global_step": 3446, + "learning_rate": 0.00048645242070116863, + "loss": 1.9117, + "loss_base2": 2.758, + "loss_pixel": 0.3036, + "loss_text": 1.6081, + "ppl": 6.7646, + "step": 3446 + }, + { + "epoch": 0.03, + "global_step": 3447, + "learning_rate": 0.00048644824707846414, + "loss": 1.9161, + "loss_base2": 2.7643, + "loss_pixel": 0.3039, + "loss_text": 1.6121, + "ppl": 6.7944, + "step": 3447 + }, + { + "epoch": 0.03, + "global_step": 3448, + "learning_rate": 0.0004864440734557596, + "loss": 1.9222, + "loss_base2": 2.7731, + "loss_pixel": 0.3018, + "loss_text": 1.6204, + "ppl": 6.836, + "step": 3448 + }, + { + "epoch": 0.03, + "global_step": 3449, + "learning_rate": 0.0004864398998330551, + "loss": 1.8917, + "loss_base2": 2.7291, + "loss_pixel": 0.3002, + "loss_text": 1.5915, + "ppl": 6.6306, + "step": 3449 + }, + { + "epoch": 0.03, + "global_step": 3450, + "learning_rate": 0.0004864357262103506, + "loss": 1.9047, + "loss_base2": 2.7479, + "loss_pixel": 0.3001, + "loss_text": 1.6046, + "ppl": 6.7174, + "step": 3450 + }, + { + "epoch": 0.03, + "global_step": 3451, + "learning_rate": 0.0004864315525876461, + "loss": 1.9089, + "loss_base2": 2.754, + "loss_pixel": 0.2986, + "loss_text": 1.6103, + "ppl": 6.7457, + "step": 3451 + }, + { + "epoch": 0.03, + "global_step": 3452, + "learning_rate": 0.0004864273789649416, + "loss": 1.917, + "loss_base2": 2.7656, + "loss_pixel": 0.2982, + "loss_text": 1.6188, + "ppl": 6.8005, + "step": 3452 + }, + { + "epoch": 0.03, + "global_step": 3453, + "learning_rate": 0.00048642320534223707, + "loss": 1.9134, + "loss_base2": 2.7605, + "loss_pixel": 0.2977, + "loss_text": 1.6156, + "ppl": 6.7761, + "step": 3453 + }, + { + "epoch": 0.03, + "global_step": 3454, + "learning_rate": 0.0004864190317195326, + "loss": 1.9063, + "loss_base2": 2.7502, + "loss_pixel": 0.2967, + "loss_text": 1.6096, + "ppl": 6.7281, + "step": 3454 + }, + { + "epoch": 0.03, + "global_step": 3455, + "learning_rate": 0.0004864148580968281, + "loss": 1.8964, + "loss_base2": 2.7359, + "loss_pixel": 0.2969, + "loss_text": 1.5996, + "ppl": 6.6619, + "step": 3455 + }, + { + "epoch": 0.03, + "global_step": 3456, + "learning_rate": 0.00048641068447412354, + "loss": 1.8781, + "loss_base2": 2.7095, + "loss_pixel": 0.2951, + "loss_text": 1.583, + "ppl": 6.5411, + "step": 3456 + }, + { + "epoch": 0.03, + "global_step": 3457, + "learning_rate": 0.000486406510851419, + "loss": 1.888, + "loss_base2": 2.7238, + "loss_pixel": 0.2944, + "loss_text": 1.5937, + "ppl": 6.6061, + "step": 3457 + }, + { + "epoch": 0.03, + "global_step": 3458, + "learning_rate": 0.0004864023372287145, + "loss": 1.8981, + "loss_base2": 2.7384, + "loss_pixel": 0.2941, + "loss_text": 1.604, + "ppl": 6.6732, + "step": 3458 + }, + { + "epoch": 0.03, + "global_step": 3459, + "learning_rate": 0.00048639816360601, + "loss": 1.9029, + "loss_base2": 2.7453, + "loss_pixel": 0.2937, + "loss_text": 1.6091, + "ppl": 6.7053, + "step": 3459 + }, + { + "epoch": 0.03, + "global_step": 3460, + "learning_rate": 0.0004863939899833055, + "loss": 1.9048, + "loss_base2": 2.748, + "loss_pixel": 0.2922, + "loss_text": 1.6126, + "ppl": 6.7181, + "step": 3460 + }, + { + "epoch": 0.03, + "global_step": 3461, + "learning_rate": 0.000486389816360601, + "loss": 1.8907, + "loss_base2": 2.7277, + "loss_pixel": 0.2918, + "loss_text": 1.5989, + "ppl": 6.624, + "step": 3461 + }, + { + "epoch": 0.03, + "global_step": 3462, + "learning_rate": 0.0004863856427378965, + "loss": 1.91, + "loss_base2": 2.7555, + "loss_pixel": 0.2907, + "loss_text": 1.6194, + "ppl": 6.7531, + "step": 3462 + }, + { + "epoch": 0.03, + "global_step": 3463, + "learning_rate": 0.000486381469115192, + "loss": 1.8954, + "loss_base2": 2.7345, + "loss_pixel": 0.2897, + "loss_text": 1.6057, + "ppl": 6.6552, + "step": 3463 + }, + { + "epoch": 0.03, + "global_step": 3464, + "learning_rate": 0.0004863772954924875, + "loss": 1.8805, + "loss_base2": 2.713, + "loss_pixel": 0.2901, + "loss_text": 1.5904, + "ppl": 6.5568, + "step": 3464 + }, + { + "epoch": 0.03, + "global_step": 3465, + "learning_rate": 0.000486373121869783, + "loss": 1.8797, + "loss_base2": 2.7118, + "loss_pixel": 0.2893, + "loss_text": 1.5903, + "ppl": 6.5515, + "step": 3465 + }, + { + "epoch": 0.03, + "global_step": 3466, + "learning_rate": 0.00048636894824707845, + "loss": 1.8816, + "loss_base2": 2.7146, + "loss_pixel": 0.2923, + "loss_text": 1.5892, + "ppl": 6.564, + "step": 3466 + }, + { + "epoch": 0.03, + "global_step": 3467, + "learning_rate": 0.00048636477462437396, + "loss": 1.8472, + "loss_base2": 2.6649, + "loss_pixel": 0.2996, + "loss_text": 1.5476, + "ppl": 6.342, + "step": 3467 + }, + { + "epoch": 0.03, + "global_step": 3468, + "learning_rate": 0.00048636060100166946, + "loss": 1.8363, + "loss_base2": 2.6492, + "loss_pixel": 0.2958, + "loss_text": 1.5405, + "ppl": 6.2733, + "step": 3468 + }, + { + "epoch": 0.03, + "global_step": 3469, + "learning_rate": 0.00048635642737896497, + "loss": 1.9163, + "loss_base2": 2.7646, + "loss_pixel": 0.2993, + "loss_text": 1.617, + "ppl": 6.7958, + "step": 3469 + }, + { + "epoch": 0.03, + "global_step": 3470, + "learning_rate": 0.0004863522537562605, + "loss": 1.9054, + "loss_base2": 2.7489, + "loss_pixel": 0.2976, + "loss_text": 1.6078, + "ppl": 6.7221, + "step": 3470 + }, + { + "epoch": 0.03, + "global_step": 3471, + "learning_rate": 0.00048634808013355593, + "loss": 1.9112, + "loss_base2": 2.7573, + "loss_pixel": 0.2934, + "loss_text": 1.6178, + "ppl": 6.7612, + "step": 3471 + }, + { + "epoch": 0.03, + "global_step": 3472, + "learning_rate": 0.00048634390651085144, + "loss": 1.8916, + "loss_base2": 2.729, + "loss_pixel": 0.2938, + "loss_text": 1.5978, + "ppl": 6.63, + "step": 3472 + }, + { + "epoch": 0.03, + "global_step": 3473, + "learning_rate": 0.00048633973288814695, + "loss": 1.9227, + "loss_base2": 2.7739, + "loss_pixel": 0.2932, + "loss_text": 1.6295, + "ppl": 6.8394, + "step": 3473 + }, + { + "epoch": 0.03, + "global_step": 3474, + "learning_rate": 0.00048633555926544245, + "loss": 1.9059, + "loss_base2": 2.7496, + "loss_pixel": 0.2915, + "loss_text": 1.6143, + "ppl": 6.7255, + "step": 3474 + }, + { + "epoch": 0.03, + "global_step": 3475, + "learning_rate": 0.0004863313856427379, + "loss": 1.8926, + "loss_base2": 2.7304, + "loss_pixel": 0.2903, + "loss_text": 1.6023, + "ppl": 6.6366, + "step": 3475 + }, + { + "epoch": 0.03, + "global_step": 3476, + "learning_rate": 0.00048632721202003336, + "loss": 1.9202, + "loss_base2": 2.7703, + "loss_pixel": 0.2889, + "loss_text": 1.6313, + "ppl": 6.8223, + "step": 3476 + }, + { + "epoch": 0.03, + "global_step": 3477, + "learning_rate": 0.00048632303839732887, + "loss": 1.9242, + "loss_base2": 2.776, + "loss_pixel": 0.2888, + "loss_text": 1.6354, + "ppl": 6.8497, + "step": 3477 + }, + { + "epoch": 0.03, + "global_step": 3478, + "learning_rate": 0.0004863188647746244, + "loss": 1.8952, + "loss_base2": 2.7342, + "loss_pixel": 0.2883, + "loss_text": 1.6069, + "ppl": 6.6539, + "step": 3478 + }, + { + "epoch": 0.03, + "global_step": 3479, + "learning_rate": 0.0004863146911519199, + "loss": 1.8788, + "loss_base2": 2.7105, + "loss_pixel": 0.2897, + "loss_text": 1.5891, + "ppl": 6.5456, + "step": 3479 + }, + { + "epoch": 0.03, + "global_step": 3480, + "learning_rate": 0.00048631051752921534, + "loss": 1.8903, + "loss_base2": 2.7271, + "loss_pixel": 0.2932, + "loss_text": 1.5971, + "ppl": 6.6214, + "step": 3480 + }, + { + "epoch": 0.03, + "global_step": 3481, + "learning_rate": 0.00048630634390651084, + "loss": 1.9038, + "loss_base2": 2.7466, + "loss_pixel": 0.293, + "loss_text": 1.6109, + "ppl": 6.7113, + "step": 3481 + }, + { + "epoch": 0.03, + "global_step": 3482, + "learning_rate": 0.00048630217028380635, + "loss": 1.8982, + "loss_base2": 2.7385, + "loss_pixel": 0.2937, + "loss_text": 1.6045, + "ppl": 6.6739, + "step": 3482 + }, + { + "epoch": 0.03, + "global_step": 3483, + "learning_rate": 0.00048629799666110186, + "loss": 1.9126, + "loss_base2": 2.7593, + "loss_pixel": 0.2931, + "loss_text": 1.6195, + "ppl": 6.7707, + "step": 3483 + }, + { + "epoch": 0.03, + "global_step": 3484, + "learning_rate": 0.00048629382303839736, + "loss": 1.8862, + "loss_base2": 2.7212, + "loss_pixel": 0.2899, + "loss_text": 1.5963, + "ppl": 6.5943, + "step": 3484 + }, + { + "epoch": 0.03, + "global_step": 3485, + "learning_rate": 0.0004862896494156928, + "loss": 1.8842, + "loss_base2": 2.7183, + "loss_pixel": 0.2877, + "loss_text": 1.5965, + "ppl": 6.5811, + "step": 3485 + }, + { + "epoch": 0.03, + "global_step": 3486, + "learning_rate": 0.0004862854757929883, + "loss": 1.8923, + "loss_base2": 2.73, + "loss_pixel": 0.2875, + "loss_text": 1.6049, + "ppl": 6.6346, + "step": 3486 + }, + { + "epoch": 0.03, + "global_step": 3487, + "learning_rate": 0.00048628130217028383, + "loss": 1.8843, + "loss_base2": 2.7185, + "loss_pixel": 0.2861, + "loss_text": 1.5982, + "ppl": 6.5817, + "step": 3487 + }, + { + "epoch": 0.03, + "global_step": 3488, + "learning_rate": 0.00048627712854757934, + "loss": 1.8991, + "loss_base2": 2.7398, + "loss_pixel": 0.2849, + "loss_text": 1.6141, + "ppl": 6.6799, + "step": 3488 + }, + { + "epoch": 0.03, + "global_step": 3489, + "learning_rate": 0.0004862729549248748, + "loss": 1.8913, + "loss_base2": 2.7286, + "loss_pixel": 0.285, + "loss_text": 1.6063, + "ppl": 6.628, + "step": 3489 + }, + { + "epoch": 0.03, + "global_step": 3490, + "learning_rate": 0.0004862687813021703, + "loss": 1.8897, + "loss_base2": 2.7263, + "loss_pixel": 0.2821, + "loss_text": 1.6076, + "ppl": 6.6174, + "step": 3490 + }, + { + "epoch": 0.03, + "global_step": 3491, + "learning_rate": 0.0004862646076794658, + "loss": 1.8742, + "loss_base2": 2.7039, + "loss_pixel": 0.282, + "loss_text": 1.5921, + "ppl": 6.5156, + "step": 3491 + }, + { + "epoch": 0.03, + "global_step": 3492, + "learning_rate": 0.0004862604340567613, + "loss": 1.8867, + "loss_base2": 2.7219, + "loss_pixel": 0.2823, + "loss_text": 1.6044, + "ppl": 6.5976, + "step": 3492 + }, + { + "epoch": 0.03, + "global_step": 3493, + "learning_rate": 0.0004862562604340568, + "loss": 1.8817, + "loss_base2": 2.7147, + "loss_pixel": 0.2804, + "loss_text": 1.6013, + "ppl": 6.5647, + "step": 3493 + }, + { + "epoch": 0.03, + "global_step": 3494, + "learning_rate": 0.0004862520868113522, + "loss": 1.8823, + "loss_base2": 2.7156, + "loss_pixel": 0.281, + "loss_text": 1.6014, + "ppl": 6.5686, + "step": 3494 + }, + { + "epoch": 0.03, + "global_step": 3495, + "learning_rate": 0.00048624791318864773, + "loss": 1.8879, + "loss_base2": 2.7237, + "loss_pixel": 0.2825, + "loss_text": 1.6054, + "ppl": 6.6055, + "step": 3495 + }, + { + "epoch": 0.03, + "global_step": 3496, + "learning_rate": 0.00048624373956594324, + "loss": 1.8802, + "loss_base2": 2.7126, + "loss_pixel": 0.2804, + "loss_text": 1.5997, + "ppl": 6.5548, + "step": 3496 + }, + { + "epoch": 0.03, + "global_step": 3497, + "learning_rate": 0.00048623956594323874, + "loss": 1.8798, + "loss_base2": 2.712, + "loss_pixel": 0.2785, + "loss_text": 1.6012, + "ppl": 6.5522, + "step": 3497 + }, + { + "epoch": 0.03, + "global_step": 3498, + "learning_rate": 0.0004862353923205342, + "loss": 1.8667, + "loss_base2": 2.6931, + "loss_pixel": 0.2785, + "loss_text": 1.5882, + "ppl": 6.4669, + "step": 3498 + }, + { + "epoch": 0.03, + "global_step": 3499, + "learning_rate": 0.0004862312186978297, + "loss": 1.8749, + "loss_base2": 2.7049, + "loss_pixel": 0.2779, + "loss_text": 1.597, + "ppl": 6.5202, + "step": 3499 + }, + { + "epoch": 0.03, + "global_step": 3500, + "learning_rate": 0.0004862270450751252, + "loss": 1.8686, + "loss_base2": 2.6958, + "loss_pixel": 0.2786, + "loss_text": 1.59, + "ppl": 6.4792, + "step": 3500 + }, + { + "epoch": 0.03, + "global_step": 3501, + "learning_rate": 0.0004862228714524207, + "loss": 1.8809, + "loss_base2": 2.7136, + "loss_pixel": 0.279, + "loss_text": 1.6019, + "ppl": 6.5594, + "step": 3501 + }, + { + "epoch": 0.03, + "global_step": 3502, + "learning_rate": 0.0004862186978297162, + "loss": 1.8813, + "loss_base2": 2.7141, + "loss_pixel": 0.2795, + "loss_text": 1.6018, + "ppl": 6.562, + "step": 3502 + }, + { + "epoch": 0.03, + "global_step": 3503, + "learning_rate": 0.0004862145242070117, + "loss": 1.8802, + "loss_base2": 2.7126, + "loss_pixel": 0.2784, + "loss_text": 1.6019, + "ppl": 6.5548, + "step": 3503 + }, + { + "epoch": 0.03, + "global_step": 3504, + "learning_rate": 0.0004862103505843072, + "loss": 1.8853, + "loss_base2": 2.7199, + "loss_pixel": 0.2774, + "loss_text": 1.608, + "ppl": 6.5883, + "step": 3504 + }, + { + "epoch": 0.03, + "global_step": 3505, + "learning_rate": 0.0004862061769616027, + "loss": 1.8685, + "loss_base2": 2.6957, + "loss_pixel": 0.2762, + "loss_text": 1.5923, + "ppl": 6.4786, + "step": 3505 + }, + { + "epoch": 0.03, + "global_step": 3506, + "learning_rate": 0.0004862020033388982, + "loss": 1.8702, + "loss_base2": 2.6981, + "loss_pixel": 0.2751, + "loss_text": 1.5952, + "ppl": 6.4896, + "step": 3506 + }, + { + "epoch": 0.03, + "global_step": 3507, + "learning_rate": 0.00048619782971619365, + "loss": 1.8815, + "loss_base2": 2.7144, + "loss_pixel": 0.2754, + "loss_text": 1.6062, + "ppl": 6.5633, + "step": 3507 + }, + { + "epoch": 0.03, + "global_step": 3508, + "learning_rate": 0.00048619365609348916, + "loss": 1.8805, + "loss_base2": 2.713, + "loss_pixel": 0.2773, + "loss_text": 1.6031, + "ppl": 6.5568, + "step": 3508 + }, + { + "epoch": 0.03, + "global_step": 3509, + "learning_rate": 0.00048618948247078467, + "loss": 1.8742, + "loss_base2": 2.7039, + "loss_pixel": 0.2749, + "loss_text": 1.5993, + "ppl": 6.5156, + "step": 3509 + }, + { + "epoch": 0.03, + "global_step": 3510, + "learning_rate": 0.0004861853088480802, + "loss": 1.8765, + "loss_base2": 2.7072, + "loss_pixel": 0.2747, + "loss_text": 1.6018, + "ppl": 6.5306, + "step": 3510 + }, + { + "epoch": 0.03, + "global_step": 3511, + "learning_rate": 0.0004861811352253757, + "loss": 1.8741, + "loss_base2": 2.7038, + "loss_pixel": 0.274, + "loss_text": 1.6001, + "ppl": 6.515, + "step": 3511 + }, + { + "epoch": 0.03, + "global_step": 3512, + "learning_rate": 0.0004861769616026711, + "loss": 1.8796, + "loss_base2": 2.7117, + "loss_pixel": 0.276, + "loss_text": 1.6036, + "ppl": 6.5509, + "step": 3512 + }, + { + "epoch": 0.03, + "global_step": 3513, + "learning_rate": 0.0004861727879799666, + "loss": 1.8834, + "loss_base2": 2.7172, + "loss_pixel": 0.2788, + "loss_text": 1.6046, + "ppl": 6.5758, + "step": 3513 + }, + { + "epoch": 0.03, + "global_step": 3514, + "learning_rate": 0.0004861686143572621, + "loss": 1.8778, + "loss_base2": 2.7091, + "loss_pixel": 0.2789, + "loss_text": 1.5989, + "ppl": 6.5391, + "step": 3514 + }, + { + "epoch": 0.03, + "global_step": 3515, + "learning_rate": 0.0004861644407345576, + "loss": 1.8813, + "loss_base2": 2.7141, + "loss_pixel": 0.2798, + "loss_text": 1.6015, + "ppl": 6.562, + "step": 3515 + }, + { + "epoch": 0.03, + "global_step": 3516, + "learning_rate": 0.00048616026711185306, + "loss": 1.7757, + "loss_base2": 2.5618, + "loss_pixel": 0.275, + "loss_text": 1.5007, + "ppl": 5.9044, + "step": 3516 + }, + { + "epoch": 0.03, + "global_step": 3517, + "learning_rate": 0.00048615609348914856, + "loss": 1.6697, + "loss_base2": 2.4089, + "loss_pixel": 0.2762, + "loss_text": 1.3935, + "ppl": 5.3106, + "step": 3517 + }, + { + "epoch": 0.03, + "global_step": 3518, + "learning_rate": 0.00048615191986644407, + "loss": 1.6397, + "loss_base2": 2.3656, + "loss_pixel": 0.2728, + "loss_text": 1.3669, + "ppl": 5.1536, + "step": 3518 + }, + { + "epoch": 0.03, + "global_step": 3519, + "learning_rate": 0.0004861477462437396, + "loss": 1.6498, + "loss_base2": 2.3802, + "loss_pixel": 0.2729, + "loss_text": 1.3769, + "ppl": 5.2059, + "step": 3519 + }, + { + "epoch": 0.03, + "global_step": 3520, + "learning_rate": 0.0004861435726210351, + "loss": 1.6517, + "loss_base2": 2.3829, + "loss_pixel": 0.272, + "loss_text": 1.3796, + "ppl": 5.2158, + "step": 3520 + }, + { + "epoch": 0.03, + "global_step": 3521, + "learning_rate": 0.00048613939899833054, + "loss": 1.6375, + "loss_base2": 2.3624, + "loss_pixel": 0.2701, + "loss_text": 1.3674, + "ppl": 5.1423, + "step": 3521 + }, + { + "epoch": 0.03, + "global_step": 3522, + "learning_rate": 0.00048613522537562605, + "loss": 1.6364, + "loss_base2": 2.3608, + "loss_pixel": 0.2714, + "loss_text": 1.365, + "ppl": 5.1366, + "step": 3522 + }, + { + "epoch": 0.03, + "global_step": 3523, + "learning_rate": 0.00048613105175292155, + "loss": 1.6263, + "loss_base2": 2.3463, + "loss_pixel": 0.271, + "loss_text": 1.3553, + "ppl": 5.085, + "step": 3523 + }, + { + "epoch": 0.03, + "global_step": 3524, + "learning_rate": 0.00048612687813021706, + "loss": 1.6918, + "loss_base2": 2.4408, + "loss_pixel": 0.267, + "loss_text": 1.4248, + "ppl": 5.4292, + "step": 3524 + }, + { + "epoch": 0.03, + "global_step": 3525, + "learning_rate": 0.00048612270450751257, + "loss": 1.9042, + "loss_base2": 2.7472, + "loss_pixel": 0.266, + "loss_text": 1.6382, + "ppl": 6.714, + "step": 3525 + }, + { + "epoch": 0.03, + "global_step": 3526, + "learning_rate": 0.000486118530884808, + "loss": 1.8767, + "loss_base2": 2.7075, + "loss_pixel": 0.2642, + "loss_text": 1.6125, + "ppl": 6.5319, + "step": 3526 + }, + { + "epoch": 0.03, + "global_step": 3527, + "learning_rate": 0.00048611435726210353, + "loss": 1.8624, + "loss_base2": 2.6869, + "loss_pixel": 0.2658, + "loss_text": 1.5966, + "ppl": 6.4392, + "step": 3527 + }, + { + "epoch": 0.03, + "global_step": 3528, + "learning_rate": 0.00048611018363939904, + "loss": 1.8727, + "loss_base2": 2.7017, + "loss_pixel": 0.2677, + "loss_text": 1.605, + "ppl": 6.5058, + "step": 3528 + }, + { + "epoch": 0.03, + "global_step": 3529, + "learning_rate": 0.00048610601001669454, + "loss": 1.8881, + "loss_base2": 2.724, + "loss_pixel": 0.2706, + "loss_text": 1.6175, + "ppl": 6.6068, + "step": 3529 + }, + { + "epoch": 0.03, + "global_step": 3530, + "learning_rate": 0.00048610183639399, + "loss": 1.8692, + "loss_base2": 2.6967, + "loss_pixel": 0.2703, + "loss_text": 1.5989, + "ppl": 6.4831, + "step": 3530 + }, + { + "epoch": 0.03, + "global_step": 3531, + "learning_rate": 0.00048609766277128545, + "loss": 1.8675, + "loss_base2": 2.6942, + "loss_pixel": 0.2676, + "loss_text": 1.6, + "ppl": 6.4721, + "step": 3531 + }, + { + "epoch": 0.03, + "global_step": 3532, + "learning_rate": 0.00048609348914858096, + "loss": 1.8752, + "loss_base2": 2.7053, + "loss_pixel": 0.2638, + "loss_text": 1.6114, + "ppl": 6.5221, + "step": 3532 + }, + { + "epoch": 0.03, + "global_step": 3533, + "learning_rate": 0.00048608931552587646, + "loss": 1.8663, + "loss_base2": 2.6925, + "loss_pixel": 0.2629, + "loss_text": 1.6035, + "ppl": 6.4643, + "step": 3533 + }, + { + "epoch": 0.03, + "global_step": 3534, + "learning_rate": 0.00048608514190317197, + "loss": 1.8675, + "loss_base2": 2.6942, + "loss_pixel": 0.2634, + "loss_text": 1.604, + "ppl": 6.4721, + "step": 3534 + }, + { + "epoch": 0.03, + "global_step": 3535, + "learning_rate": 0.0004860809682804674, + "loss": 1.8424, + "loss_base2": 2.658, + "loss_pixel": 0.261, + "loss_text": 1.5815, + "ppl": 6.3117, + "step": 3535 + }, + { + "epoch": 0.03, + "global_step": 3536, + "learning_rate": 0.00048607679465776293, + "loss": 1.8555, + "loss_base2": 2.6769, + "loss_pixel": 0.2609, + "loss_text": 1.5946, + "ppl": 6.3949, + "step": 3536 + }, + { + "epoch": 0.03, + "global_step": 3537, + "learning_rate": 0.00048607262103505844, + "loss": 1.8587, + "loss_base2": 2.6815, + "loss_pixel": 0.2624, + "loss_text": 1.5963, + "ppl": 6.4154, + "step": 3537 + }, + { + "epoch": 0.03, + "global_step": 3538, + "learning_rate": 0.00048606844741235395, + "loss": 1.8701, + "loss_base2": 2.698, + "loss_pixel": 0.2599, + "loss_text": 1.6102, + "ppl": 6.4889, + "step": 3538 + }, + { + "epoch": 0.03, + "global_step": 3539, + "learning_rate": 0.0004860642737896494, + "loss": 1.8757, + "loss_base2": 2.7061, + "loss_pixel": 0.26, + "loss_text": 1.6158, + "ppl": 6.5254, + "step": 3539 + }, + { + "epoch": 0.03, + "global_step": 3540, + "learning_rate": 0.0004860601001669449, + "loss": 1.8577, + "loss_base2": 2.6801, + "loss_pixel": 0.2595, + "loss_text": 1.5981, + "ppl": 6.409, + "step": 3540 + }, + { + "epoch": 0.03, + "global_step": 3541, + "learning_rate": 0.0004860559265442404, + "loss": 1.8542, + "loss_base2": 2.675, + "loss_pixel": 0.2576, + "loss_text": 1.5966, + "ppl": 6.3866, + "step": 3541 + }, + { + "epoch": 0.03, + "global_step": 3542, + "learning_rate": 0.0004860517529215359, + "loss": 1.8558, + "loss_base2": 2.6774, + "loss_pixel": 0.2573, + "loss_text": 1.5985, + "ppl": 6.3968, + "step": 3542 + }, + { + "epoch": 0.03, + "global_step": 3543, + "learning_rate": 0.00048604757929883143, + "loss": 1.8503, + "loss_base2": 2.6694, + "loss_pixel": 0.2568, + "loss_text": 1.5935, + "ppl": 6.3617, + "step": 3543 + }, + { + "epoch": 0.03, + "global_step": 3544, + "learning_rate": 0.0004860434056761269, + "loss": 1.8441, + "loss_base2": 2.6605, + "loss_pixel": 0.2586, + "loss_text": 1.5855, + "ppl": 6.3224, + "step": 3544 + }, + { + "epoch": 0.03, + "global_step": 3545, + "learning_rate": 0.0004860392320534224, + "loss": 1.8704, + "loss_base2": 2.6984, + "loss_pixel": 0.2574, + "loss_text": 1.613, + "ppl": 6.4909, + "step": 3545 + }, + { + "epoch": 0.03, + "global_step": 3546, + "learning_rate": 0.0004860350584307179, + "loss": 1.8618, + "loss_base2": 2.686, + "loss_pixel": 0.2547, + "loss_text": 1.6071, + "ppl": 6.4353, + "step": 3546 + }, + { + "epoch": 0.03, + "global_step": 3547, + "learning_rate": 0.0004860308848080134, + "loss": 1.8718, + "loss_base2": 2.7004, + "loss_pixel": 0.2557, + "loss_text": 1.616, + "ppl": 6.5, + "step": 3547 + }, + { + "epoch": 0.03, + "global_step": 3548, + "learning_rate": 0.00048602671118530886, + "loss": 1.8332, + "loss_base2": 2.6447, + "loss_pixel": 0.2535, + "loss_text": 1.5797, + "ppl": 6.2539, + "step": 3548 + }, + { + "epoch": 0.03, + "global_step": 3549, + "learning_rate": 0.00048602253756260436, + "loss": 1.792, + "loss_base2": 2.5853, + "loss_pixel": 0.2522, + "loss_text": 1.5399, + "ppl": 6.0014, + "step": 3549 + }, + { + "epoch": 0.03, + "global_step": 3550, + "learning_rate": 0.0004860183639398998, + "loss": 1.845, + "loss_base2": 2.6618, + "loss_pixel": 0.2522, + "loss_text": 1.5928, + "ppl": 6.3281, + "step": 3550 + }, + { + "epoch": 0.03, + "global_step": 3551, + "learning_rate": 0.0004860141903171953, + "loss": 1.8561, + "loss_base2": 2.6778, + "loss_pixel": 0.25, + "loss_text": 1.6061, + "ppl": 6.3987, + "step": 3551 + }, + { + "epoch": 0.03, + "global_step": 3552, + "learning_rate": 0.00048601001669449083, + "loss": 1.8361, + "loss_base2": 2.6489, + "loss_pixel": 0.2496, + "loss_text": 1.5865, + "ppl": 6.272, + "step": 3552 + }, + { + "epoch": 0.03, + "global_step": 3553, + "learning_rate": 0.0004860058430717863, + "loss": 1.8466, + "loss_base2": 2.6641, + "loss_pixel": 0.2511, + "loss_text": 1.5955, + "ppl": 6.3382, + "step": 3553 + }, + { + "epoch": 0.03, + "global_step": 3554, + "learning_rate": 0.0004860016694490818, + "loss": 1.8762, + "loss_base2": 2.7068, + "loss_pixel": 0.2623, + "loss_text": 1.6139, + "ppl": 6.5286, + "step": 3554 + }, + { + "epoch": 0.03, + "global_step": 3555, + "learning_rate": 0.0004859974958263773, + "loss": 1.8492, + "loss_base2": 2.6678, + "loss_pixel": 0.2566, + "loss_text": 1.5926, + "ppl": 6.3547, + "step": 3555 + }, + { + "epoch": 0.03, + "global_step": 3556, + "learning_rate": 0.0004859933222036728, + "loss": 1.8524, + "loss_base2": 2.6724, + "loss_pixel": 0.258, + "loss_text": 1.5944, + "ppl": 6.3751, + "step": 3556 + }, + { + "epoch": 0.03, + "global_step": 3557, + "learning_rate": 0.00048598914858096826, + "loss": 1.8568, + "loss_base2": 2.6788, + "loss_pixel": 0.2572, + "loss_text": 1.5996, + "ppl": 6.4032, + "step": 3557 + }, + { + "epoch": 0.03, + "global_step": 3558, + "learning_rate": 0.00048598497495826377, + "loss": 1.8575, + "loss_base2": 2.6798, + "loss_pixel": 0.2533, + "loss_text": 1.6042, + "ppl": 6.4077, + "step": 3558 + }, + { + "epoch": 0.03, + "global_step": 3559, + "learning_rate": 0.0004859808013355593, + "loss": 1.8394, + "loss_base2": 2.6537, + "loss_pixel": 0.2557, + "loss_text": 1.5837, + "ppl": 6.2928, + "step": 3559 + }, + { + "epoch": 0.03, + "global_step": 3560, + "learning_rate": 0.0004859766277128548, + "loss": 1.8653, + "loss_base2": 2.6911, + "loss_pixel": 0.2515, + "loss_text": 1.6138, + "ppl": 6.4579, + "step": 3560 + }, + { + "epoch": 0.03, + "global_step": 3561, + "learning_rate": 0.0004859724540901503, + "loss": 1.8469, + "loss_base2": 2.6645, + "loss_pixel": 0.2499, + "loss_text": 1.597, + "ppl": 6.3401, + "step": 3561 + }, + { + "epoch": 0.03, + "global_step": 3562, + "learning_rate": 0.00048596828046744574, + "loss": 1.8387, + "loss_base2": 2.6527, + "loss_pixel": 0.2513, + "loss_text": 1.5874, + "ppl": 6.2884, + "step": 3562 + }, + { + "epoch": 0.03, + "global_step": 3563, + "learning_rate": 0.00048596410684474125, + "loss": 1.8287, + "loss_base2": 2.6383, + "loss_pixel": 0.2483, + "loss_text": 1.5803, + "ppl": 6.2258, + "step": 3563 + }, + { + "epoch": 0.03, + "global_step": 3564, + "learning_rate": 0.00048595993322203676, + "loss": 1.8593, + "loss_base2": 2.6824, + "loss_pixel": 0.2478, + "loss_text": 1.6115, + "ppl": 6.4192, + "step": 3564 + }, + { + "epoch": 0.03, + "global_step": 3565, + "learning_rate": 0.00048595575959933226, + "loss": 1.86, + "loss_base2": 2.6834, + "loss_pixel": 0.249, + "loss_text": 1.6111, + "ppl": 6.4237, + "step": 3565 + }, + { + "epoch": 0.03, + "global_step": 3566, + "learning_rate": 0.0004859515859766277, + "loss": 1.8484, + "loss_base2": 2.6667, + "loss_pixel": 0.2519, + "loss_text": 1.5966, + "ppl": 6.3497, + "step": 3566 + }, + { + "epoch": 0.03, + "global_step": 3567, + "learning_rate": 0.0004859474123539232, + "loss": 1.8531, + "loss_base2": 2.6735, + "loss_pixel": 0.2593, + "loss_text": 1.5938, + "ppl": 6.3796, + "step": 3567 + }, + { + "epoch": 0.03, + "global_step": 3568, + "learning_rate": 0.00048594323873121873, + "loss": 1.8556, + "loss_base2": 2.6771, + "loss_pixel": 0.2579, + "loss_text": 1.5977, + "ppl": 6.3955, + "step": 3568 + }, + { + "epoch": 0.03, + "global_step": 3569, + "learning_rate": 0.0004859390651085142, + "loss": 1.8521, + "loss_base2": 2.672, + "loss_pixel": 0.2573, + "loss_text": 1.5948, + "ppl": 6.3732, + "step": 3569 + }, + { + "epoch": 0.03, + "global_step": 3570, + "learning_rate": 0.0004859348914858097, + "loss": 1.8496, + "loss_base2": 2.6684, + "loss_pixel": 0.2563, + "loss_text": 1.5933, + "ppl": 6.3573, + "step": 3570 + }, + { + "epoch": 0.03, + "global_step": 3571, + "learning_rate": 0.00048593071786310515, + "loss": 1.8435, + "loss_base2": 2.6596, + "loss_pixel": 0.254, + "loss_text": 1.5895, + "ppl": 6.3186, + "step": 3571 + }, + { + "epoch": 0.03, + "global_step": 3572, + "learning_rate": 0.00048592654424040065, + "loss": 1.8478, + "loss_base2": 2.6658, + "loss_pixel": 0.2534, + "loss_text": 1.5944, + "ppl": 6.3458, + "step": 3572 + }, + { + "epoch": 0.03, + "global_step": 3573, + "learning_rate": 0.00048592237061769616, + "loss": 1.788, + "loss_base2": 2.5795, + "loss_pixel": 0.2511, + "loss_text": 1.5369, + "ppl": 5.9775, + "step": 3573 + }, + { + "epoch": 0.03, + "global_step": 3574, + "learning_rate": 0.00048591819699499167, + "loss": 1.7842, + "loss_base2": 2.5741, + "loss_pixel": 0.2482, + "loss_text": 1.536, + "ppl": 5.9548, + "step": 3574 + }, + { + "epoch": 0.03, + "global_step": 3575, + "learning_rate": 0.0004859140233722871, + "loss": 1.783, + "loss_base2": 2.5723, + "loss_pixel": 0.2466, + "loss_text": 1.5364, + "ppl": 5.9477, + "step": 3575 + }, + { + "epoch": 0.03, + "global_step": 3576, + "learning_rate": 0.00048590984974958263, + "loss": 1.8536, + "loss_base2": 2.6742, + "loss_pixel": 0.2462, + "loss_text": 1.6075, + "ppl": 6.3828, + "step": 3576 + }, + { + "epoch": 0.03, + "global_step": 3577, + "learning_rate": 0.00048590567612687814, + "loss": 1.8481, + "loss_base2": 2.6662, + "loss_pixel": 0.2448, + "loss_text": 1.6033, + "ppl": 6.3477, + "step": 3577 + }, + { + "epoch": 0.03, + "global_step": 3578, + "learning_rate": 0.00048590150250417364, + "loss": 1.852, + "loss_base2": 2.6719, + "loss_pixel": 0.2444, + "loss_text": 1.6077, + "ppl": 6.3726, + "step": 3578 + }, + { + "epoch": 0.03, + "global_step": 3579, + "learning_rate": 0.00048589732888146915, + "loss": 1.8556, + "loss_base2": 2.6771, + "loss_pixel": 0.2482, + "loss_text": 1.6074, + "ppl": 6.3955, + "step": 3579 + }, + { + "epoch": 0.03, + "global_step": 3580, + "learning_rate": 0.0004858931552587646, + "loss": 1.8611, + "loss_base2": 2.685, + "loss_pixel": 0.2629, + "loss_text": 1.5982, + "ppl": 6.4308, + "step": 3580 + }, + { + "epoch": 0.03, + "global_step": 3581, + "learning_rate": 0.0004858889816360601, + "loss": 1.8695, + "loss_base2": 2.6971, + "loss_pixel": 0.2591, + "loss_text": 1.6104, + "ppl": 6.4851, + "step": 3581 + }, + { + "epoch": 0.03, + "global_step": 3582, + "learning_rate": 0.0004858848080133556, + "loss": 1.8609, + "loss_base2": 2.6847, + "loss_pixel": 0.2515, + "loss_text": 1.6095, + "ppl": 6.4295, + "step": 3582 + }, + { + "epoch": 0.03, + "global_step": 3583, + "learning_rate": 0.0004858806343906511, + "loss": 1.8685, + "loss_base2": 2.6957, + "loss_pixel": 0.2517, + "loss_text": 1.6168, + "ppl": 6.4786, + "step": 3583 + }, + { + "epoch": 0.03, + "global_step": 3584, + "learning_rate": 0.00048587646076794663, + "loss": 1.8629, + "loss_base2": 2.6876, + "loss_pixel": 0.2467, + "loss_text": 1.6163, + "ppl": 6.4424, + "step": 3584 + }, + { + "epoch": 0.03, + "global_step": 3585, + "learning_rate": 0.0004858722871452421, + "loss": 1.8346, + "loss_base2": 2.6468, + "loss_pixel": 0.2434, + "loss_text": 1.5912, + "ppl": 6.2626, + "step": 3585 + }, + { + "epoch": 0.03, + "global_step": 3586, + "learning_rate": 0.0004858681135225376, + "loss": 1.83, + "loss_base2": 2.6401, + "loss_pixel": 0.2427, + "loss_text": 1.5874, + "ppl": 6.2339, + "step": 3586 + }, + { + "epoch": 0.03, + "global_step": 3587, + "learning_rate": 0.0004858639398998331, + "loss": 1.8402, + "loss_base2": 2.6548, + "loss_pixel": 0.2437, + "loss_text": 1.5965, + "ppl": 6.2978, + "step": 3587 + }, + { + "epoch": 0.03, + "global_step": 3588, + "learning_rate": 0.00048585976627712855, + "loss": 1.8236, + "loss_base2": 2.6309, + "loss_pixel": 0.242, + "loss_text": 1.5816, + "ppl": 6.1941, + "step": 3588 + }, + { + "epoch": 0.03, + "global_step": 3589, + "learning_rate": 0.000485855592654424, + "loss": 1.822, + "loss_base2": 2.6286, + "loss_pixel": 0.2409, + "loss_text": 1.5811, + "ppl": 6.1842, + "step": 3589 + }, + { + "epoch": 0.03, + "global_step": 3590, + "learning_rate": 0.0004858514190317195, + "loss": 1.8381, + "loss_base2": 2.6518, + "loss_pixel": 0.2403, + "loss_text": 1.5978, + "ppl": 6.2846, + "step": 3590 + }, + { + "epoch": 0.03, + "global_step": 3591, + "learning_rate": 0.000485847245409015, + "loss": 1.8321, + "loss_base2": 2.6432, + "loss_pixel": 0.2404, + "loss_text": 1.5917, + "ppl": 6.247, + "step": 3591 + }, + { + "epoch": 0.03, + "global_step": 3592, + "learning_rate": 0.00048584307178631053, + "loss": 1.8373, + "loss_base2": 2.6507, + "loss_pixel": 0.2377, + "loss_text": 1.5997, + "ppl": 6.2796, + "step": 3592 + }, + { + "epoch": 0.03, + "global_step": 3593, + "learning_rate": 0.00048583889816360604, + "loss": 1.832, + "loss_base2": 2.643, + "loss_pixel": 0.2378, + "loss_text": 1.5941, + "ppl": 6.2464, + "step": 3593 + }, + { + "epoch": 0.03, + "global_step": 3594, + "learning_rate": 0.0004858347245409015, + "loss": 1.8099, + "loss_base2": 2.6111, + "loss_pixel": 0.2379, + "loss_text": 1.5719, + "ppl": 6.1098, + "step": 3594 + }, + { + "epoch": 0.03, + "global_step": 3595, + "learning_rate": 0.000485830550918197, + "loss": 1.8318, + "loss_base2": 2.6427, + "loss_pixel": 0.2386, + "loss_text": 1.5932, + "ppl": 6.2451, + "step": 3595 + }, + { + "epoch": 0.03, + "global_step": 3596, + "learning_rate": 0.0004858263772954925, + "loss": 1.833, + "loss_base2": 2.6445, + "loss_pixel": 0.2343, + "loss_text": 1.5987, + "ppl": 6.2526, + "step": 3596 + }, + { + "epoch": 0.03, + "global_step": 3597, + "learning_rate": 0.000485822203672788, + "loss": 1.8264, + "loss_base2": 2.6349, + "loss_pixel": 0.2344, + "loss_text": 1.592, + "ppl": 6.2115, + "step": 3597 + }, + { + "epoch": 0.03, + "global_step": 3598, + "learning_rate": 0.00048581803005008346, + "loss": 1.8286, + "loss_base2": 2.6381, + "loss_pixel": 0.2338, + "loss_text": 1.5948, + "ppl": 6.2252, + "step": 3598 + }, + { + "epoch": 0.03, + "global_step": 3599, + "learning_rate": 0.00048581385642737897, + "loss": 1.8205, + "loss_base2": 2.6264, + "loss_pixel": 0.233, + "loss_text": 1.5875, + "ppl": 6.1749, + "step": 3599 + }, + { + "epoch": 0.03, + "global_step": 3600, + "learning_rate": 0.0004858096828046745, + "loss": 1.8081, + "loss_base2": 2.6085, + "loss_pixel": 0.2356, + "loss_text": 1.5725, + "ppl": 6.0988, + "step": 3600 + }, + { + "epoch": 0.03, + "global_step": 3601, + "learning_rate": 0.00048580550918197, + "loss": 1.8369, + "loss_base2": 2.6501, + "loss_pixel": 0.2465, + "loss_text": 1.5904, + "ppl": 6.277, + "step": 3601 + }, + { + "epoch": 0.03, + "global_step": 3602, + "learning_rate": 0.0004858013355592655, + "loss": 1.8372, + "loss_base2": 2.6505, + "loss_pixel": 0.246, + "loss_text": 1.5912, + "ppl": 6.2789, + "step": 3602 + }, + { + "epoch": 0.03, + "global_step": 3603, + "learning_rate": 0.00048579716193656095, + "loss": 1.8268, + "loss_base2": 2.6355, + "loss_pixel": 0.2355, + "loss_text": 1.5914, + "ppl": 6.214, + "step": 3603 + }, + { + "epoch": 0.03, + "global_step": 3604, + "learning_rate": 0.00048579298831385645, + "loss": 1.8254, + "loss_base2": 2.6335, + "loss_pixel": 0.233, + "loss_text": 1.5924, + "ppl": 6.2053, + "step": 3604 + }, + { + "epoch": 0.03, + "global_step": 3605, + "learning_rate": 0.00048578881469115196, + "loss": 1.8275, + "loss_base2": 2.6365, + "loss_pixel": 0.231, + "loss_text": 1.5966, + "ppl": 6.2183, + "step": 3605 + }, + { + "epoch": 0.03, + "global_step": 3606, + "learning_rate": 0.00048578464106844747, + "loss": 1.8425, + "loss_base2": 2.6582, + "loss_pixel": 0.2301, + "loss_text": 1.6123, + "ppl": 6.3123, + "step": 3606 + }, + { + "epoch": 0.03, + "global_step": 3607, + "learning_rate": 0.00048578046744574287, + "loss": 1.8174, + "loss_base2": 2.622, + "loss_pixel": 0.2274, + "loss_text": 1.59, + "ppl": 6.1558, + "step": 3607 + }, + { + "epoch": 0.03, + "global_step": 3608, + "learning_rate": 0.0004857762938230384, + "loss": 1.8024, + "loss_base2": 2.6003, + "loss_pixel": 0.2299, + "loss_text": 1.5724, + "ppl": 6.0642, + "step": 3608 + }, + { + "epoch": 0.03, + "global_step": 3609, + "learning_rate": 0.0004857721202003339, + "loss": 1.8324, + "loss_base2": 2.6436, + "loss_pixel": 0.23, + "loss_text": 1.6024, + "ppl": 6.2489, + "step": 3609 + }, + { + "epoch": 0.03, + "global_step": 3610, + "learning_rate": 0.0004857679465776294, + "loss": 1.8043, + "loss_base2": 2.6031, + "loss_pixel": 0.23, + "loss_text": 1.5744, + "ppl": 6.0757, + "step": 3610 + }, + { + "epoch": 0.03, + "global_step": 3611, + "learning_rate": 0.0004857637729549249, + "loss": 1.8418, + "loss_base2": 2.6572, + "loss_pixel": 0.2343, + "loss_text": 1.6075, + "ppl": 6.3079, + "step": 3611 + }, + { + "epoch": 0.03, + "global_step": 3612, + "learning_rate": 0.00048575959933222035, + "loss": 1.8257, + "loss_base2": 2.6339, + "loss_pixel": 0.2385, + "loss_text": 1.5872, + "ppl": 6.2071, + "step": 3612 + }, + { + "epoch": 0.03, + "global_step": 3613, + "learning_rate": 0.00048575542570951586, + "loss": 1.8553, + "loss_base2": 2.6766, + "loss_pixel": 0.246, + "loss_text": 1.6093, + "ppl": 6.3936, + "step": 3613 + }, + { + "epoch": 0.03, + "global_step": 3614, + "learning_rate": 0.00048575125208681136, + "loss": 1.8311, + "loss_base2": 2.6417, + "loss_pixel": 0.2504, + "loss_text": 1.5807, + "ppl": 6.2407, + "step": 3614 + }, + { + "epoch": 0.03, + "global_step": 3615, + "learning_rate": 0.00048574707846410687, + "loss": 1.8332, + "loss_base2": 2.6447, + "loss_pixel": 0.2496, + "loss_text": 1.5836, + "ppl": 6.2539, + "step": 3615 + }, + { + "epoch": 0.03, + "global_step": 3616, + "learning_rate": 0.0004857429048414023, + "loss": 1.8281, + "loss_base2": 2.6374, + "loss_pixel": 0.2431, + "loss_text": 1.585, + "ppl": 6.2221, + "step": 3616 + }, + { + "epoch": 0.03, + "global_step": 3617, + "learning_rate": 0.00048573873121869783, + "loss": 1.8316, + "loss_base2": 2.6424, + "loss_pixel": 0.2412, + "loss_text": 1.5904, + "ppl": 6.2439, + "step": 3617 + }, + { + "epoch": 0.03, + "global_step": 3618, + "learning_rate": 0.00048573455759599334, + "loss": 1.8126, + "loss_base2": 2.615, + "loss_pixel": 0.2357, + "loss_text": 1.5769, + "ppl": 6.1264, + "step": 3618 + }, + { + "epoch": 0.03, + "global_step": 3619, + "learning_rate": 0.00048573038397328885, + "loss": 1.8499, + "loss_base2": 2.6688, + "loss_pixel": 0.2404, + "loss_text": 1.6096, + "ppl": 6.3592, + "step": 3619 + }, + { + "epoch": 0.03, + "global_step": 3620, + "learning_rate": 0.00048572621035058435, + "loss": 1.8465, + "loss_base2": 2.6639, + "loss_pixel": 0.2493, + "loss_text": 1.5972, + "ppl": 6.3376, + "step": 3620 + }, + { + "epoch": 0.03, + "global_step": 3621, + "learning_rate": 0.0004857220367278798, + "loss": 1.8569, + "loss_base2": 2.6789, + "loss_pixel": 0.2478, + "loss_text": 1.6091, + "ppl": 6.4039, + "step": 3621 + }, + { + "epoch": 0.03, + "global_step": 3622, + "learning_rate": 0.0004857178631051753, + "loss": 1.809, + "loss_base2": 2.6098, + "loss_pixel": 0.2452, + "loss_text": 1.5638, + "ppl": 6.1043, + "step": 3622 + }, + { + "epoch": 0.03, + "global_step": 3623, + "learning_rate": 0.0004857136894824708, + "loss": 1.6916, + "loss_base2": 2.4405, + "loss_pixel": 0.243, + "loss_text": 1.4485, + "ppl": 5.4282, + "step": 3623 + }, + { + "epoch": 0.03, + "global_step": 3624, + "learning_rate": 0.00048570951585976633, + "loss": 1.65, + "loss_base2": 2.3804, + "loss_pixel": 0.241, + "loss_text": 1.409, + "ppl": 5.207, + "step": 3624 + }, + { + "epoch": 0.03, + "global_step": 3625, + "learning_rate": 0.00048570534223706173, + "loss": 1.6202, + "loss_base2": 2.3375, + "loss_pixel": 0.2398, + "loss_text": 1.3804, + "ppl": 5.0541, + "step": 3625 + }, + { + "epoch": 0.03, + "global_step": 3626, + "learning_rate": 0.00048570116861435724, + "loss": 1.607, + "loss_base2": 2.3184, + "loss_pixel": 0.2382, + "loss_text": 1.3688, + "ppl": 4.9878, + "step": 3626 + }, + { + "epoch": 0.03, + "global_step": 3627, + "learning_rate": 0.00048569699499165274, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.2368, + "loss_text": 1.3934, + "ppl": 5.1049, + "step": 3627 + }, + { + "epoch": 0.03, + "global_step": 3628, + "learning_rate": 0.00048569282136894825, + "loss": 1.6155, + "loss_base2": 2.3307, + "loss_pixel": 0.2368, + "loss_text": 1.3787, + "ppl": 5.0304, + "step": 3628 + }, + { + "epoch": 0.03, + "global_step": 3629, + "learning_rate": 0.00048568864774624376, + "loss": 1.6166, + "loss_base2": 2.3323, + "loss_pixel": 0.2355, + "loss_text": 1.3811, + "ppl": 5.0359, + "step": 3629 + }, + { + "epoch": 0.03, + "global_step": 3630, + "learning_rate": 0.0004856844741235392, + "loss": 1.6038, + "loss_base2": 2.3138, + "loss_pixel": 0.2349, + "loss_text": 1.3689, + "ppl": 4.9719, + "step": 3630 + }, + { + "epoch": 0.03, + "global_step": 3631, + "learning_rate": 0.0004856803005008347, + "loss": 1.6049, + "loss_base2": 2.3154, + "loss_pixel": 0.2338, + "loss_text": 1.371, + "ppl": 4.9774, + "step": 3631 + }, + { + "epoch": 0.03, + "global_step": 3632, + "learning_rate": 0.0004856761268781302, + "loss": 1.613, + "loss_base2": 2.3271, + "loss_pixel": 0.2339, + "loss_text": 1.3791, + "ppl": 5.0178, + "step": 3632 + }, + { + "epoch": 0.03, + "global_step": 3633, + "learning_rate": 0.00048567195325542573, + "loss": 1.6289, + "loss_base2": 2.35, + "loss_pixel": 0.2317, + "loss_text": 1.3972, + "ppl": 5.0983, + "step": 3633 + }, + { + "epoch": 0.03, + "global_step": 3634, + "learning_rate": 0.0004856677796327212, + "loss": 1.595, + "loss_base2": 2.3011, + "loss_pixel": 0.231, + "loss_text": 1.3639, + "ppl": 4.9283, + "step": 3634 + }, + { + "epoch": 0.03, + "global_step": 3635, + "learning_rate": 0.0004856636060100167, + "loss": 1.6138, + "loss_base2": 2.3282, + "loss_pixel": 0.2325, + "loss_text": 1.3813, + "ppl": 5.0219, + "step": 3635 + }, + { + "epoch": 0.03, + "global_step": 3636, + "learning_rate": 0.0004856594323873122, + "loss": 1.6094, + "loss_base2": 2.3219, + "loss_pixel": 0.2313, + "loss_text": 1.3781, + "ppl": 4.9998, + "step": 3636 + }, + { + "epoch": 0.03, + "global_step": 3637, + "learning_rate": 0.0004856552587646077, + "loss": 1.6033, + "loss_base2": 2.3131, + "loss_pixel": 0.2298, + "loss_text": 1.3735, + "ppl": 4.9694, + "step": 3637 + }, + { + "epoch": 0.03, + "global_step": 3638, + "learning_rate": 0.0004856510851419032, + "loss": 1.6117, + "loss_base2": 2.3252, + "loss_pixel": 0.232, + "loss_text": 1.3796, + "ppl": 5.0113, + "step": 3638 + }, + { + "epoch": 0.03, + "global_step": 3639, + "learning_rate": 0.00048564691151919867, + "loss": 1.6373, + "loss_base2": 2.3621, + "loss_pixel": 0.2356, + "loss_text": 1.4017, + "ppl": 5.1413, + "step": 3639 + }, + { + "epoch": 0.03, + "global_step": 3640, + "learning_rate": 0.0004856427378964942, + "loss": 1.7754, + "loss_base2": 2.5614, + "loss_pixel": 0.2328, + "loss_text": 1.5426, + "ppl": 5.9026, + "step": 3640 + }, + { + "epoch": 0.03, + "global_step": 3641, + "learning_rate": 0.0004856385642737897, + "loss": 1.7736, + "loss_base2": 2.5588, + "loss_pixel": 0.2329, + "loss_text": 1.5407, + "ppl": 5.892, + "step": 3641 + }, + { + "epoch": 0.03, + "global_step": 3642, + "learning_rate": 0.0004856343906510852, + "loss": 1.8429, + "loss_base2": 2.6587, + "loss_pixel": 0.2316, + "loss_text": 1.6112, + "ppl": 6.3148, + "step": 3642 + }, + { + "epoch": 0.03, + "global_step": 3643, + "learning_rate": 0.0004856302170283807, + "loss": 1.822, + "loss_base2": 2.6286, + "loss_pixel": 0.2293, + "loss_text": 1.5928, + "ppl": 6.1842, + "step": 3643 + }, + { + "epoch": 0.03, + "global_step": 3644, + "learning_rate": 0.0004856260434056761, + "loss": 1.8277, + "loss_base2": 2.6368, + "loss_pixel": 0.2281, + "loss_text": 1.5997, + "ppl": 6.2196, + "step": 3644 + }, + { + "epoch": 0.03, + "global_step": 3645, + "learning_rate": 0.0004856218697829716, + "loss": 1.8435, + "loss_base2": 2.6596, + "loss_pixel": 0.2295, + "loss_text": 1.6141, + "ppl": 6.3186, + "step": 3645 + }, + { + "epoch": 0.03, + "global_step": 3646, + "learning_rate": 0.0004856176961602671, + "loss": 1.8215, + "loss_base2": 2.6279, + "loss_pixel": 0.2275, + "loss_text": 1.594, + "ppl": 6.1811, + "step": 3646 + }, + { + "epoch": 0.03, + "global_step": 3647, + "learning_rate": 0.0004856135225375626, + "loss": 1.833, + "loss_base2": 2.6445, + "loss_pixel": 0.2272, + "loss_text": 1.6058, + "ppl": 6.2526, + "step": 3647 + }, + { + "epoch": 0.03, + "global_step": 3648, + "learning_rate": 0.00048560934891485807, + "loss": 1.8193, + "loss_base2": 2.6247, + "loss_pixel": 0.2258, + "loss_text": 1.5935, + "ppl": 6.1675, + "step": 3648 + }, + { + "epoch": 0.03, + "global_step": 3649, + "learning_rate": 0.0004856051752921536, + "loss": 1.8201, + "loss_base2": 2.6258, + "loss_pixel": 0.2256, + "loss_text": 1.5946, + "ppl": 6.1725, + "step": 3649 + }, + { + "epoch": 0.03, + "global_step": 3650, + "learning_rate": 0.0004856010016694491, + "loss": 1.8171, + "loss_base2": 2.6215, + "loss_pixel": 0.2255, + "loss_text": 1.5916, + "ppl": 6.154, + "step": 3650 + }, + { + "epoch": 0.03, + "global_step": 3651, + "learning_rate": 0.0004855968280467446, + "loss": 1.8335, + "loss_base2": 2.6452, + "loss_pixel": 0.2247, + "loss_text": 1.6088, + "ppl": 6.2557, + "step": 3651 + }, + { + "epoch": 0.03, + "global_step": 3652, + "learning_rate": 0.0004855926544240401, + "loss": 1.806, + "loss_base2": 2.6055, + "loss_pixel": 0.2241, + "loss_text": 1.5819, + "ppl": 6.0861, + "step": 3652 + }, + { + "epoch": 0.03, + "global_step": 3653, + "learning_rate": 0.00048558848080133555, + "loss": 1.8195, + "loss_base2": 2.625, + "loss_pixel": 0.2231, + "loss_text": 1.5964, + "ppl": 6.1688, + "step": 3653 + }, + { + "epoch": 0.03, + "global_step": 3654, + "learning_rate": 0.00048558430717863106, + "loss": 1.8279, + "loss_base2": 2.6371, + "loss_pixel": 0.2234, + "loss_text": 1.6045, + "ppl": 6.2208, + "step": 3654 + }, + { + "epoch": 0.03, + "global_step": 3655, + "learning_rate": 0.00048558013355592657, + "loss": 1.8185, + "loss_base2": 2.6235, + "loss_pixel": 0.2231, + "loss_text": 1.5954, + "ppl": 6.1626, + "step": 3655 + }, + { + "epoch": 0.03, + "global_step": 3656, + "learning_rate": 0.0004855759599332221, + "loss": 1.8187, + "loss_base2": 2.6238, + "loss_pixel": 0.2228, + "loss_text": 1.5959, + "ppl": 6.1638, + "step": 3656 + }, + { + "epoch": 0.03, + "global_step": 3657, + "learning_rate": 0.00048557178631051753, + "loss": 1.8366, + "loss_base2": 2.6497, + "loss_pixel": 0.2208, + "loss_text": 1.6159, + "ppl": 6.2752, + "step": 3657 + }, + { + "epoch": 0.03, + "global_step": 3658, + "learning_rate": 0.00048556761268781304, + "loss": 1.8278, + "loss_base2": 2.637, + "loss_pixel": 0.2211, + "loss_text": 1.6067, + "ppl": 6.2202, + "step": 3658 + }, + { + "epoch": 0.03, + "global_step": 3659, + "learning_rate": 0.00048556343906510854, + "loss": 1.8244, + "loss_base2": 2.6321, + "loss_pixel": 0.2202, + "loss_text": 1.6041, + "ppl": 6.1991, + "step": 3659 + }, + { + "epoch": 0.03, + "global_step": 3660, + "learning_rate": 0.00048555926544240405, + "loss": 1.8111, + "loss_base2": 2.6129, + "loss_pixel": 0.2203, + "loss_text": 1.5907, + "ppl": 6.1172, + "step": 3660 + }, + { + "epoch": 0.03, + "global_step": 3661, + "learning_rate": 0.00048555509181969956, + "loss": 1.8121, + "loss_base2": 2.6143, + "loss_pixel": 0.2203, + "loss_text": 1.5918, + "ppl": 6.1233, + "step": 3661 + }, + { + "epoch": 0.03, + "global_step": 3662, + "learning_rate": 0.000485550918196995, + "loss": 1.8047, + "loss_base2": 2.6036, + "loss_pixel": 0.2195, + "loss_text": 1.5852, + "ppl": 6.0781, + "step": 3662 + }, + { + "epoch": 0.03, + "global_step": 3663, + "learning_rate": 0.00048554674457429046, + "loss": 1.819, + "loss_base2": 2.6243, + "loss_pixel": 0.2204, + "loss_text": 1.5986, + "ppl": 6.1657, + "step": 3663 + }, + { + "epoch": 0.03, + "global_step": 3664, + "learning_rate": 0.00048554257095158597, + "loss": 1.803, + "loss_base2": 2.6012, + "loss_pixel": 0.2206, + "loss_text": 1.5824, + "ppl": 6.0678, + "step": 3664 + }, + { + "epoch": 0.03, + "global_step": 3665, + "learning_rate": 0.0004855383973288815, + "loss": 1.8018, + "loss_base2": 2.5994, + "loss_pixel": 0.2199, + "loss_text": 1.5819, + "ppl": 6.0605, + "step": 3665 + }, + { + "epoch": 0.03, + "global_step": 3666, + "learning_rate": 0.00048553422370617693, + "loss": 1.8055, + "loss_base2": 2.6048, + "loss_pixel": 0.2183, + "loss_text": 1.5872, + "ppl": 6.083, + "step": 3666 + }, + { + "epoch": 0.03, + "global_step": 3667, + "learning_rate": 0.00048553005008347244, + "loss": 1.604, + "loss_base2": 2.3141, + "loss_pixel": 0.22, + "loss_text": 1.3839, + "ppl": 4.9729, + "step": 3667 + }, + { + "epoch": 0.03, + "global_step": 3668, + "learning_rate": 0.00048552587646076795, + "loss": 1.6103, + "loss_base2": 2.3232, + "loss_pixel": 0.2173, + "loss_text": 1.393, + "ppl": 5.0043, + "step": 3668 + }, + { + "epoch": 0.03, + "global_step": 3669, + "learning_rate": 0.00048552170283806345, + "loss": 1.6004, + "loss_base2": 2.3089, + "loss_pixel": 0.218, + "loss_text": 1.3825, + "ppl": 4.955, + "step": 3669 + }, + { + "epoch": 0.03, + "global_step": 3670, + "learning_rate": 0.00048551752921535896, + "loss": 1.6016, + "loss_base2": 2.3106, + "loss_pixel": 0.2181, + "loss_text": 1.3836, + "ppl": 4.961, + "step": 3670 + }, + { + "epoch": 0.03, + "global_step": 3671, + "learning_rate": 0.0004855133555926544, + "loss": 1.5818, + "loss_base2": 2.2821, + "loss_pixel": 0.2172, + "loss_text": 1.3646, + "ppl": 4.8637, + "step": 3671 + }, + { + "epoch": 0.03, + "global_step": 3672, + "learning_rate": 0.0004855091819699499, + "loss": 1.5992, + "loss_base2": 2.3072, + "loss_pixel": 0.216, + "loss_text": 1.3832, + "ppl": 4.9491, + "step": 3672 + }, + { + "epoch": 0.03, + "global_step": 3673, + "learning_rate": 0.00048550500834724543, + "loss": 1.59, + "loss_base2": 2.2939, + "loss_pixel": 0.2168, + "loss_text": 1.3732, + "ppl": 4.9037, + "step": 3673 + }, + { + "epoch": 0.03, + "global_step": 3674, + "learning_rate": 0.00048550083472454094, + "loss": 1.5677, + "loss_base2": 2.2617, + "loss_pixel": 0.2168, + "loss_text": 1.3509, + "ppl": 4.7956, + "step": 3674 + }, + { + "epoch": 0.03, + "global_step": 3675, + "learning_rate": 0.0004854966611018364, + "loss": 1.5574, + "loss_base2": 2.2469, + "loss_pixel": 0.2159, + "loss_text": 1.3415, + "ppl": 4.7465, + "step": 3675 + }, + { + "epoch": 0.03, + "global_step": 3676, + "learning_rate": 0.0004854924874791319, + "loss": 1.5897, + "loss_base2": 2.2935, + "loss_pixel": 0.2137, + "loss_text": 1.376, + "ppl": 4.9023, + "step": 3676 + }, + { + "epoch": 0.03, + "global_step": 3677, + "learning_rate": 0.0004854883138564274, + "loss": 1.5813, + "loss_base2": 2.2813, + "loss_pixel": 0.2153, + "loss_text": 1.366, + "ppl": 4.8613, + "step": 3677 + }, + { + "epoch": 0.03, + "global_step": 3678, + "learning_rate": 0.0004854841402337229, + "loss": 1.5644, + "loss_base2": 2.257, + "loss_pixel": 0.2155, + "loss_text": 1.3489, + "ppl": 4.7798, + "step": 3678 + }, + { + "epoch": 0.03, + "global_step": 3679, + "learning_rate": 0.0004854799666110184, + "loss": 1.575, + "loss_base2": 2.2722, + "loss_pixel": 0.2156, + "loss_text": 1.3594, + "ppl": 4.8307, + "step": 3679 + }, + { + "epoch": 0.03, + "global_step": 3680, + "learning_rate": 0.00048547579298831387, + "loss": 1.5627, + "loss_base2": 2.2545, + "loss_pixel": 0.2171, + "loss_text": 1.3456, + "ppl": 4.7717, + "step": 3680 + }, + { + "epoch": 0.03, + "global_step": 3681, + "learning_rate": 0.0004854716193656093, + "loss": 1.5937, + "loss_base2": 2.2992, + "loss_pixel": 0.2201, + "loss_text": 1.3737, + "ppl": 4.9219, + "step": 3681 + }, + { + "epoch": 0.03, + "global_step": 3682, + "learning_rate": 0.00048546744574290483, + "loss": 1.6988, + "loss_base2": 2.4509, + "loss_pixel": 0.2312, + "loss_text": 1.4676, + "ppl": 5.4674, + "step": 3682 + }, + { + "epoch": 0.03, + "global_step": 3683, + "learning_rate": 0.00048546327212020034, + "loss": 1.7659, + "loss_base2": 2.5477, + "loss_pixel": 0.2412, + "loss_text": 1.5247, + "ppl": 5.8468, + "step": 3683 + }, + { + "epoch": 0.03, + "global_step": 3684, + "learning_rate": 0.0004854590984974958, + "loss": 1.6839, + "loss_base2": 2.4294, + "loss_pixel": 0.2607, + "loss_text": 1.4232, + "ppl": 5.3865, + "step": 3684 + }, + { + "epoch": 0.03, + "global_step": 3685, + "learning_rate": 0.0004854549248747913, + "loss": 1.708, + "loss_base2": 2.4641, + "loss_pixel": 0.3385, + "loss_text": 1.3696, + "ppl": 5.5179, + "step": 3685 + }, + { + "epoch": 0.03, + "global_step": 3686, + "learning_rate": 0.0004854507512520868, + "loss": 1.6888, + "loss_base2": 2.4364, + "loss_pixel": 0.3208, + "loss_text": 1.368, + "ppl": 5.413, + "step": 3686 + }, + { + "epoch": 0.03, + "global_step": 3687, + "learning_rate": 0.0004854465776293823, + "loss": 1.703, + "loss_base2": 2.4569, + "loss_pixel": 0.3386, + "loss_text": 1.3644, + "ppl": 5.4904, + "step": 3687 + }, + { + "epoch": 0.03, + "global_step": 3688, + "learning_rate": 0.0004854424040066778, + "loss": 1.7133, + "loss_base2": 2.4718, + "loss_pixel": 0.3442, + "loss_text": 1.3691, + "ppl": 5.5472, + "step": 3688 + }, + { + "epoch": 0.03, + "global_step": 3689, + "learning_rate": 0.0004854382303839733, + "loss": 1.7404, + "loss_base2": 2.5109, + "loss_pixel": 0.3554, + "loss_text": 1.385, + "ppl": 5.6996, + "step": 3689 + }, + { + "epoch": 0.03, + "global_step": 3690, + "learning_rate": 0.0004854340567612688, + "loss": 1.7162, + "loss_base2": 2.476, + "loss_pixel": 0.3522, + "loss_text": 1.364, + "ppl": 5.5633, + "step": 3690 + }, + { + "epoch": 0.03, + "global_step": 3691, + "learning_rate": 0.0004854298831385643, + "loss": 1.7973, + "loss_base2": 2.593, + "loss_pixel": 0.3438, + "loss_text": 1.4534, + "ppl": 6.0333, + "step": 3691 + }, + { + "epoch": 0.03, + "global_step": 3692, + "learning_rate": 0.0004854257095158598, + "loss": 1.7882, + "loss_base2": 2.5798, + "loss_pixel": 0.3429, + "loss_text": 1.4453, + "ppl": 5.9787, + "step": 3692 + }, + { + "epoch": 0.03, + "global_step": 3693, + "learning_rate": 0.00048542153589315525, + "loss": 1.74, + "loss_base2": 2.5103, + "loss_pixel": 0.3703, + "loss_text": 1.3697, + "ppl": 5.6973, + "step": 3693 + }, + { + "epoch": 0.03, + "global_step": 3694, + "learning_rate": 0.00048541736227045076, + "loss": 1.7393, + "loss_base2": 2.5093, + "loss_pixel": 0.3756, + "loss_text": 1.3636, + "ppl": 5.6934, + "step": 3694 + }, + { + "epoch": 0.03, + "global_step": 3695, + "learning_rate": 0.00048541318864774626, + "loss": 1.7537, + "loss_base2": 2.5301, + "loss_pixel": 0.3746, + "loss_text": 1.3791, + "ppl": 5.7759, + "step": 3695 + }, + { + "epoch": 0.03, + "global_step": 3696, + "learning_rate": 0.00048540901502504177, + "loss": 1.722, + "loss_base2": 2.4843, + "loss_pixel": 0.37, + "loss_text": 1.3519, + "ppl": 5.5957, + "step": 3696 + }, + { + "epoch": 0.03, + "global_step": 3697, + "learning_rate": 0.0004854048414023373, + "loss": 1.7414, + "loss_base2": 2.5123, + "loss_pixel": 0.3669, + "loss_text": 1.3744, + "ppl": 5.7053, + "step": 3697 + }, + { + "epoch": 0.03, + "global_step": 3698, + "learning_rate": 0.00048540066777963273, + "loss": 1.7474, + "loss_base2": 2.521, + "loss_pixel": 0.3689, + "loss_text": 1.3784, + "ppl": 5.7397, + "step": 3698 + }, + { + "epoch": 0.03, + "global_step": 3699, + "learning_rate": 0.00048539649415692824, + "loss": 1.7578, + "loss_base2": 2.536, + "loss_pixel": 0.38, + "loss_text": 1.3778, + "ppl": 5.7997, + "step": 3699 + }, + { + "epoch": 0.03, + "global_step": 3700, + "learning_rate": 0.0004853923205342237, + "loss": 1.8885, + "loss_base2": 2.7245, + "loss_pixel": 0.3683, + "loss_text": 1.5202, + "ppl": 6.6094, + "step": 3700 + }, + { + "epoch": 0.03, + "global_step": 3701, + "learning_rate": 0.0004853881469115192, + "loss": 1.7747, + "loss_base2": 2.5604, + "loss_pixel": 0.3694, + "loss_text": 1.4053, + "ppl": 5.8985, + "step": 3701 + }, + { + "epoch": 0.03, + "global_step": 3702, + "learning_rate": 0.0004853839732888147, + "loss": 1.758, + "loss_base2": 2.5363, + "loss_pixel": 0.3749, + "loss_text": 1.3831, + "ppl": 5.8008, + "step": 3702 + }, + { + "epoch": 0.03, + "global_step": 3703, + "learning_rate": 0.00048537979966611016, + "loss": 1.752, + "loss_base2": 2.5276, + "loss_pixel": 0.3824, + "loss_text": 1.3696, + "ppl": 5.7661, + "step": 3703 + }, + { + "epoch": 0.03, + "global_step": 3704, + "learning_rate": 0.00048537562604340567, + "loss": 1.7554, + "loss_base2": 2.5325, + "loss_pixel": 0.3767, + "loss_text": 1.3787, + "ppl": 5.7858, + "step": 3704 + }, + { + "epoch": 0.03, + "global_step": 3705, + "learning_rate": 0.0004853714524207012, + "loss": 1.747, + "loss_base2": 2.5204, + "loss_pixel": 0.3784, + "loss_text": 1.3686, + "ppl": 5.7374, + "step": 3705 + }, + { + "epoch": 0.03, + "global_step": 3706, + "learning_rate": 0.0004853672787979967, + "loss": 1.7389, + "loss_base2": 2.5087, + "loss_pixel": 0.3777, + "loss_text": 1.3612, + "ppl": 5.6911, + "step": 3706 + }, + { + "epoch": 0.03, + "global_step": 3707, + "learning_rate": 0.00048536310517529214, + "loss": 1.7638, + "loss_base2": 2.5446, + "loss_pixel": 0.3788, + "loss_text": 1.3849, + "ppl": 5.8346, + "step": 3707 + }, + { + "epoch": 0.03, + "global_step": 3708, + "learning_rate": 0.00048535893155258764, + "loss": 1.7596, + "loss_base2": 2.5386, + "loss_pixel": 0.378, + "loss_text": 1.3816, + "ppl": 5.8101, + "step": 3708 + }, + { + "epoch": 0.03, + "global_step": 3709, + "learning_rate": 0.00048535475792988315, + "loss": 1.7316, + "loss_base2": 2.4982, + "loss_pixel": 0.3727, + "loss_text": 1.3589, + "ppl": 5.6497, + "step": 3709 + }, + { + "epoch": 0.03, + "global_step": 3710, + "learning_rate": 0.00048535058430717866, + "loss": 1.7269, + "loss_base2": 2.4914, + "loss_pixel": 0.3729, + "loss_text": 1.354, + "ppl": 5.6232, + "step": 3710 + }, + { + "epoch": 0.03, + "global_step": 3711, + "learning_rate": 0.00048534641068447416, + "loss": 1.7255, + "loss_base2": 2.4894, + "loss_pixel": 0.3698, + "loss_text": 1.3557, + "ppl": 5.6153, + "step": 3711 + }, + { + "epoch": 0.03, + "global_step": 3712, + "learning_rate": 0.0004853422370617696, + "loss": 1.7226, + "loss_base2": 2.4852, + "loss_pixel": 0.3705, + "loss_text": 1.3521, + "ppl": 5.5991, + "step": 3712 + }, + { + "epoch": 0.03, + "global_step": 3713, + "learning_rate": 0.0004853380634390651, + "loss": 1.7143, + "loss_base2": 2.4732, + "loss_pixel": 0.3675, + "loss_text": 1.3468, + "ppl": 5.5528, + "step": 3713 + }, + { + "epoch": 0.03, + "global_step": 3714, + "learning_rate": 0.00048533388981636063, + "loss": 1.7114, + "loss_base2": 2.469, + "loss_pixel": 0.3666, + "loss_text": 1.3448, + "ppl": 5.5367, + "step": 3714 + }, + { + "epoch": 0.03, + "global_step": 3715, + "learning_rate": 0.00048532971619365614, + "loss": 1.717, + "loss_base2": 2.4771, + "loss_pixel": 0.3638, + "loss_text": 1.3532, + "ppl": 5.5678, + "step": 3715 + }, + { + "epoch": 0.03, + "global_step": 3716, + "learning_rate": 0.0004853255425709516, + "loss": 1.7345, + "loss_base2": 2.5024, + "loss_pixel": 0.3634, + "loss_text": 1.3711, + "ppl": 5.6661, + "step": 3716 + }, + { + "epoch": 0.03, + "global_step": 3717, + "learning_rate": 0.0004853213689482471, + "loss": 1.73, + "loss_base2": 2.4959, + "loss_pixel": 0.362, + "loss_text": 1.368, + "ppl": 5.6407, + "step": 3717 + }, + { + "epoch": 0.03, + "global_step": 3718, + "learning_rate": 0.0004853171953255426, + "loss": 1.7207, + "loss_base2": 2.4824, + "loss_pixel": 0.3598, + "loss_text": 1.3609, + "ppl": 5.5884, + "step": 3718 + }, + { + "epoch": 0.03, + "global_step": 3719, + "learning_rate": 0.00048531302170283806, + "loss": 1.7095, + "loss_base2": 2.4663, + "loss_pixel": 0.3573, + "loss_text": 1.3522, + "ppl": 5.5262, + "step": 3719 + }, + { + "epoch": 0.03, + "global_step": 3720, + "learning_rate": 0.00048530884808013357, + "loss": 1.6976, + "loss_base2": 2.4491, + "loss_pixel": 0.3546, + "loss_text": 1.343, + "ppl": 5.4608, + "step": 3720 + }, + { + "epoch": 0.03, + "global_step": 3721, + "learning_rate": 0.000485304674457429, + "loss": 1.7206, + "loss_base2": 2.4823, + "loss_pixel": 0.354, + "loss_text": 1.3667, + "ppl": 5.5879, + "step": 3721 + }, + { + "epoch": 0.03, + "global_step": 3722, + "learning_rate": 0.00048530050083472453, + "loss": 1.6938, + "loss_base2": 2.4436, + "loss_pixel": 0.3503, + "loss_text": 1.3435, + "ppl": 5.4401, + "step": 3722 + }, + { + "epoch": 0.03, + "global_step": 3723, + "learning_rate": 0.00048529632721202004, + "loss": 1.7041, + "loss_base2": 2.4585, + "loss_pixel": 0.349, + "loss_text": 1.3551, + "ppl": 5.4964, + "step": 3723 + }, + { + "epoch": 0.03, + "global_step": 3724, + "learning_rate": 0.00048529215358931554, + "loss": 1.6771, + "loss_base2": 2.4195, + "loss_pixel": 0.3461, + "loss_text": 1.3309, + "ppl": 5.35, + "step": 3724 + }, + { + "epoch": 0.03, + "global_step": 3725, + "learning_rate": 0.000485287979966611, + "loss": 1.8864, + "loss_base2": 2.7215, + "loss_pixel": 0.345, + "loss_text": 1.5414, + "ppl": 6.5956, + "step": 3725 + }, + { + "epoch": 0.03, + "global_step": 3726, + "learning_rate": 0.0004852838063439065, + "loss": 1.9968, + "loss_base2": 2.8808, + "loss_pixel": 0.3428, + "loss_text": 1.654, + "ppl": 7.3654, + "step": 3726 + }, + { + "epoch": 0.03, + "global_step": 3727, + "learning_rate": 0.000485279632721202, + "loss": 1.9835, + "loss_base2": 2.8616, + "loss_pixel": 0.3427, + "loss_text": 1.6409, + "ppl": 7.2681, + "step": 3727 + }, + { + "epoch": 0.03, + "global_step": 3728, + "learning_rate": 0.0004852754590984975, + "loss": 1.9542, + "loss_base2": 2.8193, + "loss_pixel": 0.3383, + "loss_text": 1.6159, + "ppl": 7.0583, + "step": 3728 + }, + { + "epoch": 0.03, + "global_step": 3729, + "learning_rate": 0.000485271285475793, + "loss": 1.9698, + "loss_base2": 2.8418, + "loss_pixel": 0.3363, + "loss_text": 1.6335, + "ppl": 7.1692, + "step": 3729 + }, + { + "epoch": 0.03, + "global_step": 3730, + "learning_rate": 0.0004852671118530885, + "loss": 1.9751, + "loss_base2": 2.8495, + "loss_pixel": 0.3354, + "loss_text": 1.6398, + "ppl": 7.2073, + "step": 3730 + }, + { + "epoch": 0.03, + "global_step": 3731, + "learning_rate": 0.000485262938230384, + "loss": 1.9645, + "loss_base2": 2.8342, + "loss_pixel": 0.3376, + "loss_text": 1.6269, + "ppl": 7.1313, + "step": 3731 + }, + { + "epoch": 0.03, + "global_step": 3732, + "learning_rate": 0.0004852587646076795, + "loss": 1.9874, + "loss_base2": 2.8672, + "loss_pixel": 0.3616, + "loss_text": 1.6257, + "ppl": 7.2965, + "step": 3732 + }, + { + "epoch": 0.03, + "global_step": 3733, + "learning_rate": 0.000485254590984975, + "loss": 1.9573, + "loss_base2": 2.8238, + "loss_pixel": 0.348, + "loss_text": 1.6093, + "ppl": 7.0802, + "step": 3733 + }, + { + "epoch": 0.03, + "global_step": 3734, + "learning_rate": 0.00048525041736227045, + "loss": 1.977, + "loss_base2": 2.8522, + "loss_pixel": 0.3468, + "loss_text": 1.6301, + "ppl": 7.221, + "step": 3734 + }, + { + "epoch": 0.03, + "global_step": 3735, + "learning_rate": 0.00048524624373956596, + "loss": 1.9562, + "loss_base2": 2.8222, + "loss_pixel": 0.3457, + "loss_text": 1.6105, + "ppl": 7.0724, + "step": 3735 + }, + { + "epoch": 0.03, + "global_step": 3736, + "learning_rate": 0.00048524207011686147, + "loss": 1.9651, + "loss_base2": 2.835, + "loss_pixel": 0.3447, + "loss_text": 1.6204, + "ppl": 7.1356, + "step": 3736 + }, + { + "epoch": 0.03, + "global_step": 3737, + "learning_rate": 0.000485237896494157, + "loss": 1.9552, + "loss_base2": 2.8208, + "loss_pixel": 0.3475, + "loss_text": 1.6077, + "ppl": 7.0653, + "step": 3737 + }, + { + "epoch": 0.03, + "global_step": 3738, + "learning_rate": 0.00048523372287145243, + "loss": 1.9512, + "loss_base2": 2.815, + "loss_pixel": 0.3474, + "loss_text": 1.6038, + "ppl": 7.0371, + "step": 3738 + }, + { + "epoch": 0.03, + "global_step": 3739, + "learning_rate": 0.0004852295492487479, + "loss": 1.9434, + "loss_base2": 2.8037, + "loss_pixel": 0.3453, + "loss_text": 1.5981, + "ppl": 6.9825, + "step": 3739 + }, + { + "epoch": 0.03, + "global_step": 3740, + "learning_rate": 0.0004852253756260434, + "loss": 1.9482, + "loss_base2": 2.8107, + "loss_pixel": 0.3466, + "loss_text": 1.6016, + "ppl": 7.016, + "step": 3740 + }, + { + "epoch": 0.03, + "global_step": 3741, + "learning_rate": 0.0004852212020033389, + "loss": 1.9479, + "loss_base2": 2.8102, + "loss_pixel": 0.3415, + "loss_text": 1.6063, + "ppl": 7.0139, + "step": 3741 + }, + { + "epoch": 0.03, + "global_step": 3742, + "learning_rate": 0.0004852170283806344, + "loss": 1.9492, + "loss_base2": 2.8121, + "loss_pixel": 0.3391, + "loss_text": 1.6101, + "ppl": 7.0231, + "step": 3742 + }, + { + "epoch": 0.03, + "global_step": 3743, + "learning_rate": 0.00048521285475792986, + "loss": 1.9466, + "loss_base2": 2.8084, + "loss_pixel": 0.3407, + "loss_text": 1.6059, + "ppl": 7.0048, + "step": 3743 + }, + { + "epoch": 0.03, + "global_step": 3744, + "learning_rate": 0.00048520868113522536, + "loss": 1.9314, + "loss_base2": 2.7864, + "loss_pixel": 0.338, + "loss_text": 1.5934, + "ppl": 6.8992, + "step": 3744 + }, + { + "epoch": 0.03, + "global_step": 3745, + "learning_rate": 0.00048520450751252087, + "loss": 1.9341, + "loss_base2": 2.7903, + "loss_pixel": 0.3344, + "loss_text": 1.5997, + "ppl": 6.9178, + "step": 3745 + }, + { + "epoch": 0.03, + "global_step": 3746, + "learning_rate": 0.0004852003338898164, + "loss": 1.9267, + "loss_base2": 2.7796, + "loss_pixel": 0.3329, + "loss_text": 1.5938, + "ppl": 6.8668, + "step": 3746 + }, + { + "epoch": 0.03, + "global_step": 3747, + "learning_rate": 0.0004851961602671119, + "loss": 1.9221, + "loss_base2": 2.773, + "loss_pixel": 0.3313, + "loss_text": 1.5909, + "ppl": 6.8353, + "step": 3747 + }, + { + "epoch": 0.03, + "global_step": 3748, + "learning_rate": 0.00048519198664440734, + "loss": 1.9473, + "loss_base2": 2.8094, + "loss_pixel": 0.3294, + "loss_text": 1.6179, + "ppl": 7.0097, + "step": 3748 + }, + { + "epoch": 0.03, + "global_step": 3749, + "learning_rate": 0.00048518781302170285, + "loss": 1.9415, + "loss_base2": 2.801, + "loss_pixel": 0.3283, + "loss_text": 1.6132, + "ppl": 6.9692, + "step": 3749 + }, + { + "epoch": 0.03, + "global_step": 3750, + "learning_rate": 0.00048518363939899835, + "loss": 1.8325, + "loss_base2": 2.6437, + "loss_pixel": 0.3284, + "loss_text": 1.5041, + "ppl": 6.2495, + "step": 3750 + }, + { + "epoch": 0.03, + "global_step": 3751, + "learning_rate": 0.00048517946577629386, + "loss": 1.6846, + "loss_base2": 2.4304, + "loss_pixel": 0.3265, + "loss_text": 1.358, + "ppl": 5.3903, + "step": 3751 + }, + { + "epoch": 0.03, + "global_step": 3752, + "learning_rate": 0.0004851752921535893, + "loss": 1.6955, + "loss_base2": 2.4461, + "loss_pixel": 0.3259, + "loss_text": 1.3696, + "ppl": 5.4494, + "step": 3752 + }, + { + "epoch": 0.03, + "global_step": 3753, + "learning_rate": 0.0004851711185308848, + "loss": 1.6881, + "loss_base2": 2.4354, + "loss_pixel": 0.3235, + "loss_text": 1.3645, + "ppl": 5.4092, + "step": 3753 + }, + { + "epoch": 0.03, + "global_step": 3754, + "learning_rate": 0.00048516694490818033, + "loss": 1.6723, + "loss_base2": 2.4126, + "loss_pixel": 0.3225, + "loss_text": 1.3498, + "ppl": 5.3244, + "step": 3754 + }, + { + "epoch": 0.03, + "global_step": 3755, + "learning_rate": 0.00048516277128547584, + "loss": 1.6759, + "loss_base2": 2.4178, + "loss_pixel": 0.3216, + "loss_text": 1.3543, + "ppl": 5.3436, + "step": 3755 + }, + { + "epoch": 0.03, + "global_step": 3756, + "learning_rate": 0.00048515859766277134, + "loss": 1.6805, + "loss_base2": 2.4244, + "loss_pixel": 0.3204, + "loss_text": 1.36, + "ppl": 5.3682, + "step": 3756 + }, + { + "epoch": 0.03, + "global_step": 3757, + "learning_rate": 0.00048515442404006674, + "loss": 1.6676, + "loss_base2": 2.4058, + "loss_pixel": 0.3216, + "loss_text": 1.3459, + "ppl": 5.2994, + "step": 3757 + }, + { + "epoch": 0.03, + "global_step": 3758, + "learning_rate": 0.00048515025041736225, + "loss": 1.7061, + "loss_base2": 2.4614, + "loss_pixel": 0.3179, + "loss_text": 1.3882, + "ppl": 5.5074, + "step": 3758 + }, + { + "epoch": 0.03, + "global_step": 3759, + "learning_rate": 0.00048514607679465776, + "loss": 1.6885, + "loss_base2": 2.436, + "loss_pixel": 0.3179, + "loss_text": 1.3706, + "ppl": 5.4114, + "step": 3759 + }, + { + "epoch": 0.03, + "global_step": 3760, + "learning_rate": 0.00048514190317195326, + "loss": 1.6678, + "loss_base2": 2.4061, + "loss_pixel": 0.3249, + "loss_text": 1.3428, + "ppl": 5.3005, + "step": 3760 + }, + { + "epoch": 0.03, + "global_step": 3761, + "learning_rate": 0.00048513772954924877, + "loss": 1.6857, + "loss_base2": 2.432, + "loss_pixel": 0.3265, + "loss_text": 1.3592, + "ppl": 5.3962, + "step": 3761 + }, + { + "epoch": 0.03, + "global_step": 3762, + "learning_rate": 0.0004851335559265442, + "loss": 1.6844, + "loss_base2": 2.4301, + "loss_pixel": 0.3228, + "loss_text": 1.3616, + "ppl": 5.3892, + "step": 3762 + }, + { + "epoch": 0.03, + "global_step": 3763, + "learning_rate": 0.00048512938230383973, + "loss": 1.6941, + "loss_base2": 2.4441, + "loss_pixel": 0.3256, + "loss_text": 1.3685, + "ppl": 5.4417, + "step": 3763 + }, + { + "epoch": 0.03, + "global_step": 3764, + "learning_rate": 0.00048512520868113524, + "loss": 1.6466, + "loss_base2": 2.3755, + "loss_pixel": 0.3176, + "loss_text": 1.329, + "ppl": 5.1893, + "step": 3764 + }, + { + "epoch": 0.03, + "global_step": 3765, + "learning_rate": 0.00048512103505843075, + "loss": 1.6507, + "loss_base2": 2.3815, + "loss_pixel": 0.3166, + "loss_text": 1.3341, + "ppl": 5.2106, + "step": 3765 + }, + { + "epoch": 0.03, + "global_step": 3766, + "learning_rate": 0.0004851168614357262, + "loss": 1.6857, + "loss_base2": 2.432, + "loss_pixel": 0.3181, + "loss_text": 1.3676, + "ppl": 5.3962, + "step": 3766 + }, + { + "epoch": 0.03, + "global_step": 3767, + "learning_rate": 0.0004851126878130217, + "loss": 1.8394, + "loss_base2": 2.6537, + "loss_pixel": 0.3153, + "loss_text": 1.5241, + "ppl": 6.2928, + "step": 3767 + }, + { + "epoch": 0.03, + "global_step": 3768, + "learning_rate": 0.0004851085141903172, + "loss": 1.8126, + "loss_base2": 2.615, + "loss_pixel": 0.3151, + "loss_text": 1.4975, + "ppl": 6.1264, + "step": 3768 + }, + { + "epoch": 0.03, + "global_step": 3769, + "learning_rate": 0.0004851043405676127, + "loss": 1.6729, + "loss_base2": 2.4135, + "loss_pixel": 0.315, + "loss_text": 1.358, + "ppl": 5.3276, + "step": 3769 + }, + { + "epoch": 0.03, + "global_step": 3770, + "learning_rate": 0.00048510016694490823, + "loss": 1.679, + "loss_base2": 2.4223, + "loss_pixel": 0.3124, + "loss_text": 1.3666, + "ppl": 5.3602, + "step": 3770 + }, + { + "epoch": 0.03, + "global_step": 3771, + "learning_rate": 0.0004850959933222037, + "loss": 1.665, + "loss_base2": 2.4021, + "loss_pixel": 0.3111, + "loss_text": 1.3539, + "ppl": 5.2857, + "step": 3771 + }, + { + "epoch": 0.03, + "global_step": 3772, + "learning_rate": 0.0004850918196994992, + "loss": 1.6815, + "loss_base2": 2.4259, + "loss_pixel": 0.3097, + "loss_text": 1.3718, + "ppl": 5.3736, + "step": 3772 + }, + { + "epoch": 0.03, + "global_step": 3773, + "learning_rate": 0.0004850876460767947, + "loss": 1.6462, + "loss_base2": 2.375, + "loss_pixel": 0.3094, + "loss_text": 1.3368, + "ppl": 5.1872, + "step": 3773 + }, + { + "epoch": 0.03, + "global_step": 3774, + "learning_rate": 0.0004850834724540902, + "loss": 1.6549, + "loss_base2": 2.3875, + "loss_pixel": 0.3073, + "loss_text": 1.3477, + "ppl": 5.2326, + "step": 3774 + }, + { + "epoch": 0.03, + "global_step": 3775, + "learning_rate": 0.0004850792988313856, + "loss": 1.6464, + "loss_base2": 2.3753, + "loss_pixel": 0.3059, + "loss_text": 1.3405, + "ppl": 5.1883, + "step": 3775 + }, + { + "epoch": 0.03, + "global_step": 3776, + "learning_rate": 0.0004850751252086811, + "loss": 1.6453, + "loss_base2": 2.3737, + "loss_pixel": 0.304, + "loss_text": 1.3413, + "ppl": 5.1826, + "step": 3776 + }, + { + "epoch": 0.03, + "global_step": 3777, + "learning_rate": 0.0004850709515859766, + "loss": 1.6514, + "loss_base2": 2.3825, + "loss_pixel": 0.3021, + "loss_text": 1.3493, + "ppl": 5.2143, + "step": 3777 + }, + { + "epoch": 0.03, + "global_step": 3778, + "learning_rate": 0.0004850667779632721, + "loss": 1.6568, + "loss_base2": 2.3903, + "loss_pixel": 0.302, + "loss_text": 1.3548, + "ppl": 5.2425, + "step": 3778 + }, + { + "epoch": 0.03, + "global_step": 3779, + "learning_rate": 0.00048506260434056763, + "loss": 1.6474, + "loss_base2": 2.3767, + "loss_pixel": 0.3019, + "loss_text": 1.3454, + "ppl": 5.1935, + "step": 3779 + }, + { + "epoch": 0.03, + "global_step": 3780, + "learning_rate": 0.0004850584307178631, + "loss": 1.6446, + "loss_base2": 2.3727, + "loss_pixel": 0.3082, + "loss_text": 1.3364, + "ppl": 5.1789, + "step": 3780 + }, + { + "epoch": 0.03, + "global_step": 3781, + "learning_rate": 0.0004850542570951586, + "loss": 1.6521, + "loss_base2": 2.3835, + "loss_pixel": 0.3169, + "loss_text": 1.3351, + "ppl": 5.2179, + "step": 3781 + }, + { + "epoch": 0.03, + "global_step": 3782, + "learning_rate": 0.0004850500834724541, + "loss": 1.6703, + "loss_base2": 2.4097, + "loss_pixel": 0.3093, + "loss_text": 1.361, + "ppl": 5.3138, + "step": 3782 + }, + { + "epoch": 0.03, + "global_step": 3783, + "learning_rate": 0.0004850459098497496, + "loss": 1.6726, + "loss_base2": 2.4131, + "loss_pixel": 0.3155, + "loss_text": 1.3571, + "ppl": 5.326, + "step": 3783 + }, + { + "epoch": 0.03, + "global_step": 3784, + "learning_rate": 0.00048504173622704506, + "loss": 1.642, + "loss_base2": 2.3689, + "loss_pixel": 0.322, + "loss_text": 1.3199, + "ppl": 5.1655, + "step": 3784 + }, + { + "epoch": 0.03, + "global_step": 3785, + "learning_rate": 0.00048503756260434057, + "loss": 1.7307, + "loss_base2": 2.4969, + "loss_pixel": 0.3085, + "loss_text": 1.4222, + "ppl": 5.6446, + "step": 3785 + }, + { + "epoch": 0.03, + "global_step": 3786, + "learning_rate": 0.0004850333889816361, + "loss": 1.9627, + "loss_base2": 2.8316, + "loss_pixel": 0.3102, + "loss_text": 1.6525, + "ppl": 7.1185, + "step": 3786 + }, + { + "epoch": 0.03, + "global_step": 3787, + "learning_rate": 0.0004850292153589316, + "loss": 1.9344, + "loss_base2": 2.7907, + "loss_pixel": 0.3072, + "loss_text": 1.6273, + "ppl": 6.9199, + "step": 3787 + }, + { + "epoch": 0.03, + "global_step": 3788, + "learning_rate": 0.0004850250417362271, + "loss": 1.9267, + "loss_base2": 2.7796, + "loss_pixel": 0.3063, + "loss_text": 1.6204, + "ppl": 6.8668, + "step": 3788 + }, + { + "epoch": 0.03, + "global_step": 3789, + "learning_rate": 0.00048502086811352254, + "loss": 1.9256, + "loss_base2": 2.7781, + "loss_pixel": 0.3021, + "loss_text": 1.6235, + "ppl": 6.8593, + "step": 3789 + }, + { + "epoch": 0.03, + "global_step": 3790, + "learning_rate": 0.00048501669449081805, + "loss": 1.9163, + "loss_base2": 2.7646, + "loss_pixel": 0.3029, + "loss_text": 1.6134, + "ppl": 6.7958, + "step": 3790 + }, + { + "epoch": 0.03, + "global_step": 3791, + "learning_rate": 0.00048501252086811356, + "loss": 1.9091, + "loss_base2": 2.7542, + "loss_pixel": 0.3014, + "loss_text": 1.6077, + "ppl": 6.747, + "step": 3791 + }, + { + "epoch": 0.03, + "global_step": 3792, + "learning_rate": 0.00048500834724540906, + "loss": 1.8962, + "loss_base2": 2.7356, + "loss_pixel": 0.2984, + "loss_text": 1.5978, + "ppl": 6.6605, + "step": 3792 + }, + { + "epoch": 0.03, + "global_step": 3793, + "learning_rate": 0.0004850041736227045, + "loss": 1.8976, + "loss_base2": 2.7377, + "loss_pixel": 0.2994, + "loss_text": 1.5982, + "ppl": 6.6699, + "step": 3793 + }, + { + "epoch": 0.03, + "global_step": 3794, + "learning_rate": 0.00048499999999999997, + "loss": 1.9158, + "loss_base2": 2.7639, + "loss_pixel": 0.3018, + "loss_text": 1.614, + "ppl": 6.7924, + "step": 3794 + }, + { + "epoch": 0.03, + "global_step": 3795, + "learning_rate": 0.0004849958263772955, + "loss": 1.9114, + "loss_base2": 2.7576, + "loss_pixel": 0.299, + "loss_text": 1.6124, + "ppl": 6.7625, + "step": 3795 + }, + { + "epoch": 0.03, + "global_step": 3796, + "learning_rate": 0.000484991652754591, + "loss": 1.9015, + "loss_base2": 2.7433, + "loss_pixel": 0.2967, + "loss_text": 1.6048, + "ppl": 6.6959, + "step": 3796 + }, + { + "epoch": 0.03, + "global_step": 3797, + "learning_rate": 0.0004849874791318865, + "loss": 1.8933, + "loss_base2": 2.7315, + "loss_pixel": 0.2965, + "loss_text": 1.5968, + "ppl": 6.6412, + "step": 3797 + }, + { + "epoch": 0.03, + "global_step": 3798, + "learning_rate": 0.00048498330550918195, + "loss": 1.8983, + "loss_base2": 2.7387, + "loss_pixel": 0.2961, + "loss_text": 1.6022, + "ppl": 6.6745, + "step": 3798 + }, + { + "epoch": 0.03, + "global_step": 3799, + "learning_rate": 0.00048497913188647745, + "loss": 1.909, + "loss_base2": 2.7541, + "loss_pixel": 0.2942, + "loss_text": 1.6148, + "ppl": 6.7463, + "step": 3799 + }, + { + "epoch": 0.03, + "global_step": 3800, + "learning_rate": 0.00048497495826377296, + "loss": 1.8923, + "loss_base2": 2.73, + "loss_pixel": 0.294, + "loss_text": 1.5983, + "ppl": 6.6346, + "step": 3800 + }, + { + "epoch": 0.03, + "global_step": 3801, + "learning_rate": 0.00048497078464106847, + "loss": 1.9094, + "loss_base2": 2.7547, + "loss_pixel": 0.295, + "loss_text": 1.6144, + "ppl": 6.749, + "step": 3801 + }, + { + "epoch": 0.03, + "global_step": 3802, + "learning_rate": 0.0004849666110183639, + "loss": 1.901, + "loss_base2": 2.7426, + "loss_pixel": 0.2965, + "loss_text": 1.6046, + "ppl": 6.6926, + "step": 3802 + }, + { + "epoch": 0.03, + "global_step": 3803, + "learning_rate": 0.00048496243739565943, + "loss": 1.9006, + "loss_base2": 2.742, + "loss_pixel": 0.2958, + "loss_text": 1.6047, + "ppl": 6.6899, + "step": 3803 + }, + { + "epoch": 0.03, + "global_step": 3804, + "learning_rate": 0.00048495826377295494, + "loss": 1.8981, + "loss_base2": 2.7384, + "loss_pixel": 0.2926, + "loss_text": 1.6055, + "ppl": 6.6732, + "step": 3804 + }, + { + "epoch": 0.03, + "global_step": 3805, + "learning_rate": 0.00048495409015025044, + "loss": 1.8769, + "loss_base2": 2.7078, + "loss_pixel": 0.291, + "loss_text": 1.5858, + "ppl": 6.5332, + "step": 3805 + }, + { + "epoch": 0.03, + "global_step": 3806, + "learning_rate": 0.00048494991652754595, + "loss": 1.8878, + "loss_base2": 2.7235, + "loss_pixel": 0.2898, + "loss_text": 1.598, + "ppl": 6.6048, + "step": 3806 + }, + { + "epoch": 0.03, + "global_step": 3807, + "learning_rate": 0.0004849457429048414, + "loss": 1.8954, + "loss_base2": 2.7345, + "loss_pixel": 0.2903, + "loss_text": 1.6051, + "ppl": 6.6552, + "step": 3807 + }, + { + "epoch": 0.03, + "global_step": 3808, + "learning_rate": 0.0004849415692821369, + "loss": 1.8949, + "loss_base2": 2.7338, + "loss_pixel": 0.2879, + "loss_text": 1.6071, + "ppl": 6.6519, + "step": 3808 + }, + { + "epoch": 0.03, + "global_step": 3809, + "learning_rate": 0.0004849373956594324, + "loss": 1.8941, + "loss_base2": 2.7326, + "loss_pixel": 0.2875, + "loss_text": 1.6065, + "ppl": 6.6466, + "step": 3809 + }, + { + "epoch": 0.03, + "global_step": 3810, + "learning_rate": 0.0004849332220367279, + "loss": 1.8644, + "loss_base2": 2.6898, + "loss_pixel": 0.2852, + "loss_text": 1.5791, + "ppl": 6.4521, + "step": 3810 + }, + { + "epoch": 0.03, + "global_step": 3811, + "learning_rate": 0.0004849290484140234, + "loss": 1.8734, + "loss_base2": 2.7027, + "loss_pixel": 0.2846, + "loss_text": 1.5888, + "ppl": 6.5104, + "step": 3811 + }, + { + "epoch": 0.03, + "global_step": 3812, + "learning_rate": 0.0004849248747913189, + "loss": 1.8757, + "loss_base2": 2.7061, + "loss_pixel": 0.2836, + "loss_text": 1.5921, + "ppl": 6.5254, + "step": 3812 + }, + { + "epoch": 0.03, + "global_step": 3813, + "learning_rate": 0.00048492070116861434, + "loss": 1.8393, + "loss_base2": 2.6535, + "loss_pixel": 0.2829, + "loss_text": 1.5564, + "ppl": 6.2921, + "step": 3813 + }, + { + "epoch": 0.03, + "global_step": 3814, + "learning_rate": 0.00048491652754590985, + "loss": 1.8648, + "loss_base2": 2.6903, + "loss_pixel": 0.2815, + "loss_text": 1.5833, + "ppl": 6.4546, + "step": 3814 + }, + { + "epoch": 0.03, + "global_step": 3815, + "learning_rate": 0.00048491235392320535, + "loss": 1.8723, + "loss_base2": 2.7012, + "loss_pixel": 0.2816, + "loss_text": 1.5907, + "ppl": 6.5032, + "step": 3815 + }, + { + "epoch": 0.03, + "global_step": 3816, + "learning_rate": 0.0004849081803005008, + "loss": 1.8635, + "loss_base2": 2.6885, + "loss_pixel": 0.2814, + "loss_text": 1.5821, + "ppl": 6.4463, + "step": 3816 + }, + { + "epoch": 0.03, + "global_step": 3817, + "learning_rate": 0.0004849040066777963, + "loss": 1.8723, + "loss_base2": 2.7012, + "loss_pixel": 0.2797, + "loss_text": 1.5926, + "ppl": 6.5032, + "step": 3817 + }, + { + "epoch": 0.03, + "global_step": 3818, + "learning_rate": 0.0004848998330550918, + "loss": 1.8752, + "loss_base2": 2.7053, + "loss_pixel": 0.2795, + "loss_text": 1.5956, + "ppl": 6.5221, + "step": 3818 + }, + { + "epoch": 0.03, + "global_step": 3819, + "learning_rate": 0.00048489565943238733, + "loss": 1.8544, + "loss_base2": 2.6753, + "loss_pixel": 0.2782, + "loss_text": 1.5762, + "ppl": 6.3879, + "step": 3819 + }, + { + "epoch": 0.03, + "global_step": 3820, + "learning_rate": 0.00048489148580968284, + "loss": 1.8676, + "loss_base2": 2.6944, + "loss_pixel": 0.2765, + "loss_text": 1.5911, + "ppl": 6.4727, + "step": 3820 + }, + { + "epoch": 0.03, + "global_step": 3821, + "learning_rate": 0.0004848873121869783, + "loss": 1.8615, + "loss_base2": 2.6856, + "loss_pixel": 0.2772, + "loss_text": 1.5842, + "ppl": 6.4334, + "step": 3821 + }, + { + "epoch": 0.03, + "global_step": 3822, + "learning_rate": 0.0004848831385642738, + "loss": 1.8624, + "loss_base2": 2.6869, + "loss_pixel": 0.2772, + "loss_text": 1.5852, + "ppl": 6.4392, + "step": 3822 + }, + { + "epoch": 0.03, + "global_step": 3823, + "learning_rate": 0.0004848789649415693, + "loss": 1.831, + "loss_base2": 2.6416, + "loss_pixel": 0.2763, + "loss_text": 1.5547, + "ppl": 6.2401, + "step": 3823 + }, + { + "epoch": 0.03, + "global_step": 3824, + "learning_rate": 0.0004848747913188648, + "loss": 1.878, + "loss_base2": 2.7094, + "loss_pixel": 0.2781, + "loss_text": 1.5999, + "ppl": 6.5404, + "step": 3824 + }, + { + "epoch": 0.03, + "global_step": 3825, + "learning_rate": 0.00048487061769616026, + "loss": 1.8833, + "loss_base2": 2.717, + "loss_pixel": 0.2758, + "loss_text": 1.6075, + "ppl": 6.5752, + "step": 3825 + }, + { + "epoch": 0.03, + "global_step": 3826, + "learning_rate": 0.00048486644407345577, + "loss": 1.8476, + "loss_base2": 2.6655, + "loss_pixel": 0.2779, + "loss_text": 1.5697, + "ppl": 6.3446, + "step": 3826 + }, + { + "epoch": 0.03, + "global_step": 3827, + "learning_rate": 0.0004848622704507513, + "loss": 1.8656, + "loss_base2": 2.6915, + "loss_pixel": 0.2726, + "loss_text": 1.593, + "ppl": 6.4598, + "step": 3827 + }, + { + "epoch": 0.03, + "global_step": 3828, + "learning_rate": 0.0004848580968280468, + "loss": 1.8662, + "loss_base2": 2.6924, + "loss_pixel": 0.2728, + "loss_text": 1.5934, + "ppl": 6.4637, + "step": 3828 + }, + { + "epoch": 0.03, + "global_step": 3829, + "learning_rate": 0.0004848539232053423, + "loss": 1.8675, + "loss_base2": 2.6942, + "loss_pixel": 0.2696, + "loss_text": 1.5979, + "ppl": 6.4721, + "step": 3829 + }, + { + "epoch": 0.03, + "global_step": 3830, + "learning_rate": 0.00048484974958263775, + "loss": 1.8627, + "loss_base2": 2.6873, + "loss_pixel": 0.2694, + "loss_text": 1.5933, + "ppl": 6.4411, + "step": 3830 + }, + { + "epoch": 0.03, + "global_step": 3831, + "learning_rate": 0.00048484557595993325, + "loss": 1.8724, + "loss_base2": 2.7013, + "loss_pixel": 0.2708, + "loss_text": 1.6015, + "ppl": 6.5039, + "step": 3831 + }, + { + "epoch": 0.03, + "global_step": 3832, + "learning_rate": 0.0004848414023372287, + "loss": 1.6851, + "loss_base2": 2.4311, + "loss_pixel": 0.2679, + "loss_text": 1.4172, + "ppl": 5.393, + "step": 3832 + }, + { + "epoch": 0.03, + "global_step": 3833, + "learning_rate": 0.0004848372287145242, + "loss": 1.6245, + "loss_base2": 2.3437, + "loss_pixel": 0.2657, + "loss_text": 1.3589, + "ppl": 5.0759, + "step": 3833 + }, + { + "epoch": 0.03, + "global_step": 3834, + "learning_rate": 0.00048483305509181967, + "loss": 1.6227, + "loss_base2": 2.3411, + "loss_pixel": 0.2656, + "loss_text": 1.3571, + "ppl": 5.0668, + "step": 3834 + }, + { + "epoch": 0.03, + "global_step": 3835, + "learning_rate": 0.0004848288814691152, + "loss": 1.6144, + "loss_base2": 2.3291, + "loss_pixel": 0.2636, + "loss_text": 1.3507, + "ppl": 5.0249, + "step": 3835 + }, + { + "epoch": 0.03, + "global_step": 3836, + "learning_rate": 0.0004848247078464107, + "loss": 1.5887, + "loss_base2": 2.292, + "loss_pixel": 0.2626, + "loss_text": 1.3261, + "ppl": 4.8974, + "step": 3836 + }, + { + "epoch": 0.03, + "global_step": 3837, + "learning_rate": 0.0004848205342237062, + "loss": 1.6093, + "loss_base2": 2.3217, + "loss_pixel": 0.2614, + "loss_text": 1.3479, + "ppl": 4.9993, + "step": 3837 + }, + { + "epoch": 0.03, + "global_step": 3838, + "learning_rate": 0.0004848163606010017, + "loss": 1.6275, + "loss_base2": 2.348, + "loss_pixel": 0.2597, + "loss_text": 1.3679, + "ppl": 5.0911, + "step": 3838 + }, + { + "epoch": 0.03, + "global_step": 3839, + "learning_rate": 0.00048481218697829715, + "loss": 1.6125, + "loss_base2": 2.3263, + "loss_pixel": 0.2586, + "loss_text": 1.3538, + "ppl": 5.0153, + "step": 3839 + }, + { + "epoch": 0.03, + "global_step": 3840, + "learning_rate": 0.00048480801335559266, + "loss": 1.6823, + "loss_base2": 2.427, + "loss_pixel": 0.2586, + "loss_text": 1.4237, + "ppl": 5.3779, + "step": 3840 + }, + { + "epoch": 0.03, + "global_step": 3841, + "learning_rate": 0.00048480383973288816, + "loss": 1.6724, + "loss_base2": 2.4128, + "loss_pixel": 0.265, + "loss_text": 1.4074, + "ppl": 5.3249, + "step": 3841 + }, + { + "epoch": 0.03, + "global_step": 3842, + "learning_rate": 0.00048479966611018367, + "loss": 1.6561, + "loss_base2": 2.3892, + "loss_pixel": 0.3065, + "loss_text": 1.3496, + "ppl": 5.2388, + "step": 3842 + }, + { + "epoch": 0.03, + "global_step": 3843, + "learning_rate": 0.0004847954924874791, + "loss": 1.6759, + "loss_base2": 2.4178, + "loss_pixel": 0.3159, + "loss_text": 1.36, + "ppl": 5.3436, + "step": 3843 + }, + { + "epoch": 0.03, + "global_step": 3844, + "learning_rate": 0.00048479131886477463, + "loss": 1.6741, + "loss_base2": 2.4152, + "loss_pixel": 0.3134, + "loss_text": 1.3608, + "ppl": 5.334, + "step": 3844 + }, + { + "epoch": 0.03, + "global_step": 3845, + "learning_rate": 0.00048478714524207014, + "loss": 1.6485, + "loss_base2": 2.3783, + "loss_pixel": 0.3093, + "loss_text": 1.3392, + "ppl": 5.1992, + "step": 3845 + }, + { + "epoch": 0.03, + "global_step": 3846, + "learning_rate": 0.00048478297161936565, + "loss": 1.6469, + "loss_base2": 2.376, + "loss_pixel": 0.3042, + "loss_text": 1.3427, + "ppl": 5.1909, + "step": 3846 + }, + { + "epoch": 0.03, + "global_step": 3847, + "learning_rate": 0.00048477879799666115, + "loss": 1.6343, + "loss_base2": 2.3578, + "loss_pixel": 0.2964, + "loss_text": 1.3379, + "ppl": 5.1259, + "step": 3847 + }, + { + "epoch": 0.03, + "global_step": 3848, + "learning_rate": 0.0004847746243739566, + "loss": 1.6324, + "loss_base2": 2.3551, + "loss_pixel": 0.2956, + "loss_text": 1.3368, + "ppl": 5.1161, + "step": 3848 + }, + { + "epoch": 0.03, + "global_step": 3849, + "learning_rate": 0.0004847704507512521, + "loss": 1.6313, + "loss_base2": 2.3535, + "loss_pixel": 0.2937, + "loss_text": 1.3377, + "ppl": 5.1105, + "step": 3849 + }, + { + "epoch": 0.03, + "global_step": 3850, + "learning_rate": 0.00048476627712854757, + "loss": 1.6416, + "loss_base2": 2.3683, + "loss_pixel": 0.291, + "loss_text": 1.3506, + "ppl": 5.1634, + "step": 3850 + }, + { + "epoch": 0.03, + "global_step": 3851, + "learning_rate": 0.0004847621035058431, + "loss": 1.6141, + "loss_base2": 2.3287, + "loss_pixel": 0.2887, + "loss_text": 1.3255, + "ppl": 5.0234, + "step": 3851 + }, + { + "epoch": 0.03, + "global_step": 3852, + "learning_rate": 0.00048475792988313853, + "loss": 1.6284, + "loss_base2": 2.3493, + "loss_pixel": 0.2849, + "loss_text": 1.3435, + "ppl": 5.0957, + "step": 3852 + }, + { + "epoch": 0.03, + "global_step": 3853, + "learning_rate": 0.00048475375626043404, + "loss": 1.6331, + "loss_base2": 2.3561, + "loss_pixel": 0.2836, + "loss_text": 1.3495, + "ppl": 5.1197, + "step": 3853 + }, + { + "epoch": 0.03, + "global_step": 3854, + "learning_rate": 0.00048474958263772954, + "loss": 1.606, + "loss_base2": 2.317, + "loss_pixel": 0.2824, + "loss_text": 1.3237, + "ppl": 4.9828, + "step": 3854 + }, + { + "epoch": 0.03, + "global_step": 3855, + "learning_rate": 0.00048474540901502505, + "loss": 1.6132, + "loss_base2": 2.3274, + "loss_pixel": 0.281, + "loss_text": 1.3322, + "ppl": 5.0188, + "step": 3855 + }, + { + "epoch": 0.03, + "global_step": 3856, + "learning_rate": 0.00048474123539232056, + "loss": 1.6262, + "loss_base2": 2.3461, + "loss_pixel": 0.2795, + "loss_text": 1.3467, + "ppl": 5.0845, + "step": 3856 + }, + { + "epoch": 0.03, + "global_step": 3857, + "learning_rate": 0.000484737061769616, + "loss": 1.6071, + "loss_base2": 2.3186, + "loss_pixel": 0.28, + "loss_text": 1.3272, + "ppl": 4.9883, + "step": 3857 + }, + { + "epoch": 0.03, + "global_step": 3858, + "learning_rate": 0.0004847328881469115, + "loss": 1.6245, + "loss_base2": 2.3437, + "loss_pixel": 0.2772, + "loss_text": 1.3472, + "ppl": 5.0759, + "step": 3858 + }, + { + "epoch": 0.03, + "global_step": 3859, + "learning_rate": 0.000484728714524207, + "loss": 1.6103, + "loss_base2": 2.3232, + "loss_pixel": 0.2772, + "loss_text": 1.333, + "ppl": 5.0043, + "step": 3859 + }, + { + "epoch": 0.03, + "global_step": 3860, + "learning_rate": 0.00048472454090150253, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.2738, + "loss_text": 1.3413, + "ppl": 5.0284, + "step": 3860 + }, + { + "epoch": 0.03, + "global_step": 3861, + "learning_rate": 0.000484720367278798, + "loss": 1.5946, + "loss_base2": 2.3005, + "loss_pixel": 0.2731, + "loss_text": 1.3216, + "ppl": 4.9264, + "step": 3861 + }, + { + "epoch": 0.03, + "global_step": 3862, + "learning_rate": 0.0004847161936560935, + "loss": 1.5855, + "loss_base2": 2.2874, + "loss_pixel": 0.2711, + "loss_text": 1.3144, + "ppl": 4.8817, + "step": 3862 + }, + { + "epoch": 0.03, + "global_step": 3863, + "learning_rate": 0.000484712020033389, + "loss": 1.6035, + "loss_base2": 2.3134, + "loss_pixel": 0.2688, + "loss_text": 1.3347, + "ppl": 4.9704, + "step": 3863 + }, + { + "epoch": 0.03, + "global_step": 3864, + "learning_rate": 0.0004847078464106845, + "loss": 1.6161, + "loss_base2": 2.3315, + "loss_pixel": 0.2678, + "loss_text": 1.3483, + "ppl": 5.0334, + "step": 3864 + }, + { + "epoch": 0.03, + "global_step": 3865, + "learning_rate": 0.00048470367278798, + "loss": 1.6014, + "loss_base2": 2.3103, + "loss_pixel": 0.2672, + "loss_text": 1.3342, + "ppl": 4.96, + "step": 3865 + }, + { + "epoch": 0.03, + "global_step": 3866, + "learning_rate": 0.00048469949916527547, + "loss": 1.9076, + "loss_base2": 2.7521, + "loss_pixel": 0.2685, + "loss_text": 1.6391, + "ppl": 6.7369, + "step": 3866 + }, + { + "epoch": 0.03, + "global_step": 3867, + "learning_rate": 0.000484695325542571, + "loss": 1.89, + "loss_base2": 2.7267, + "loss_pixel": 0.27, + "loss_text": 1.62, + "ppl": 6.6194, + "step": 3867 + }, + { + "epoch": 0.03, + "global_step": 3868, + "learning_rate": 0.0004846911519198665, + "loss": 1.8849, + "loss_base2": 2.7193, + "loss_pixel": 0.2693, + "loss_text": 1.6156, + "ppl": 6.5857, + "step": 3868 + }, + { + "epoch": 0.03, + "global_step": 3869, + "learning_rate": 0.00048468697829716194, + "loss": 1.8846, + "loss_base2": 2.7189, + "loss_pixel": 0.266, + "loss_text": 1.6186, + "ppl": 6.5837, + "step": 3869 + }, + { + "epoch": 0.03, + "global_step": 3870, + "learning_rate": 0.0004846828046744574, + "loss": 1.8825, + "loss_base2": 2.7159, + "loss_pixel": 0.2642, + "loss_text": 1.6182, + "ppl": 6.5699, + "step": 3870 + }, + { + "epoch": 0.03, + "global_step": 3871, + "learning_rate": 0.0004846786310517529, + "loss": 1.8778, + "loss_base2": 2.7091, + "loss_pixel": 0.2635, + "loss_text": 1.6143, + "ppl": 6.5391, + "step": 3871 + }, + { + "epoch": 0.03, + "global_step": 3872, + "learning_rate": 0.0004846744574290484, + "loss": 1.8881, + "loss_base2": 2.724, + "loss_pixel": 0.26, + "loss_text": 1.6281, + "ppl": 6.6068, + "step": 3872 + }, + { + "epoch": 0.03, + "global_step": 3873, + "learning_rate": 0.0004846702838063439, + "loss": 1.8661, + "loss_base2": 2.6922, + "loss_pixel": 0.2609, + "loss_text": 1.6052, + "ppl": 6.463, + "step": 3873 + }, + { + "epoch": 0.03, + "global_step": 3874, + "learning_rate": 0.0004846661101836394, + "loss": 1.8512, + "loss_base2": 2.6707, + "loss_pixel": 0.2573, + "loss_text": 1.5939, + "ppl": 6.3675, + "step": 3874 + }, + { + "epoch": 0.03, + "global_step": 3875, + "learning_rate": 0.00048466193656093487, + "loss": 1.8534, + "loss_base2": 2.6739, + "loss_pixel": 0.2565, + "loss_text": 1.5969, + "ppl": 6.3815, + "step": 3875 + }, + { + "epoch": 0.03, + "global_step": 3876, + "learning_rate": 0.0004846577629382304, + "loss": 1.8475, + "loss_base2": 2.6654, + "loss_pixel": 0.2548, + "loss_text": 1.5927, + "ppl": 6.3439, + "step": 3876 + }, + { + "epoch": 0.03, + "global_step": 3877, + "learning_rate": 0.0004846535893155259, + "loss": 1.8511, + "loss_base2": 2.6706, + "loss_pixel": 0.2536, + "loss_text": 1.5975, + "ppl": 6.3668, + "step": 3877 + }, + { + "epoch": 0.03, + "global_step": 3878, + "learning_rate": 0.0004846494156928214, + "loss": 1.8493, + "loss_base2": 2.668, + "loss_pixel": 0.2534, + "loss_text": 1.5959, + "ppl": 6.3554, + "step": 3878 + }, + { + "epoch": 0.03, + "global_step": 3879, + "learning_rate": 0.0004846452420701169, + "loss": 1.85, + "loss_base2": 2.669, + "loss_pixel": 0.2509, + "loss_text": 1.599, + "ppl": 6.3598, + "step": 3879 + }, + { + "epoch": 0.03, + "global_step": 3880, + "learning_rate": 0.00048464106844741235, + "loss": 1.8546, + "loss_base2": 2.6756, + "loss_pixel": 0.2491, + "loss_text": 1.6055, + "ppl": 6.3891, + "step": 3880 + }, + { + "epoch": 0.03, + "global_step": 3881, + "learning_rate": 0.00048463689482470786, + "loss": 1.8448, + "loss_base2": 2.6615, + "loss_pixel": 0.2484, + "loss_text": 1.5965, + "ppl": 6.3268, + "step": 3881 + }, + { + "epoch": 0.03, + "global_step": 3882, + "learning_rate": 0.00048463272120200337, + "loss": 1.8634, + "loss_base2": 2.6883, + "loss_pixel": 0.2468, + "loss_text": 1.6166, + "ppl": 6.4456, + "step": 3882 + }, + { + "epoch": 0.03, + "global_step": 3883, + "learning_rate": 0.0004846285475792989, + "loss": 1.8468, + "loss_base2": 2.6644, + "loss_pixel": 0.2473, + "loss_text": 1.5995, + "ppl": 6.3395, + "step": 3883 + }, + { + "epoch": 0.03, + "global_step": 3884, + "learning_rate": 0.00048462437395659433, + "loss": 1.8518, + "loss_base2": 2.6716, + "loss_pixel": 0.2448, + "loss_text": 1.607, + "ppl": 6.3713, + "step": 3884 + }, + { + "epoch": 0.03, + "global_step": 3885, + "learning_rate": 0.00048462020033388984, + "loss": 1.8532, + "loss_base2": 2.6736, + "loss_pixel": 0.2466, + "loss_text": 1.6067, + "ppl": 6.3802, + "step": 3885 + }, + { + "epoch": 0.03, + "global_step": 3886, + "learning_rate": 0.00048461602671118534, + "loss": 1.8306, + "loss_base2": 2.641, + "loss_pixel": 0.2493, + "loss_text": 1.5813, + "ppl": 6.2376, + "step": 3886 + }, + { + "epoch": 0.03, + "global_step": 3887, + "learning_rate": 0.00048461185308848085, + "loss": 1.8456, + "loss_base2": 2.6626, + "loss_pixel": 0.2464, + "loss_text": 1.5992, + "ppl": 6.3319, + "step": 3887 + }, + { + "epoch": 0.03, + "global_step": 3888, + "learning_rate": 0.0004846076794657763, + "loss": 1.8298, + "loss_base2": 2.6398, + "loss_pixel": 0.2429, + "loss_text": 1.5869, + "ppl": 6.2326, + "step": 3888 + }, + { + "epoch": 0.03, + "global_step": 3889, + "learning_rate": 0.00048460350584307176, + "loss": 1.8329, + "loss_base2": 2.6443, + "loss_pixel": 0.2426, + "loss_text": 1.5902, + "ppl": 6.252, + "step": 3889 + }, + { + "epoch": 0.03, + "global_step": 3890, + "learning_rate": 0.00048459933222036726, + "loss": 1.7334, + "loss_base2": 2.5008, + "loss_pixel": 0.2406, + "loss_text": 1.4928, + "ppl": 5.6599, + "step": 3890 + }, + { + "epoch": 0.03, + "global_step": 3891, + "learning_rate": 0.00048459515859766277, + "loss": 1.6097, + "loss_base2": 2.3223, + "loss_pixel": 0.2404, + "loss_text": 1.3693, + "ppl": 5.0013, + "step": 3891 + }, + { + "epoch": 0.03, + "global_step": 3892, + "learning_rate": 0.0004845909849749583, + "loss": 1.6047, + "loss_base2": 2.3151, + "loss_pixel": 0.2434, + "loss_text": 1.3614, + "ppl": 4.9764, + "step": 3892 + }, + { + "epoch": 0.03, + "global_step": 3893, + "learning_rate": 0.00048458681135225373, + "loss": 1.59, + "loss_base2": 2.2939, + "loss_pixel": 0.2436, + "loss_text": 1.3464, + "ppl": 4.9037, + "step": 3893 + }, + { + "epoch": 0.03, + "global_step": 3894, + "learning_rate": 0.00048458263772954924, + "loss": 1.5898, + "loss_base2": 2.2936, + "loss_pixel": 0.2453, + "loss_text": 1.3445, + "ppl": 4.9028, + "step": 3894 + }, + { + "epoch": 0.03, + "global_step": 3895, + "learning_rate": 0.00048457846410684475, + "loss": 1.5833, + "loss_base2": 2.2842, + "loss_pixel": 0.2409, + "loss_text": 1.3424, + "ppl": 4.871, + "step": 3895 + }, + { + "epoch": 0.03, + "global_step": 3896, + "learning_rate": 0.00048457429048414025, + "loss": 1.5837, + "loss_base2": 2.2848, + "loss_pixel": 0.2389, + "loss_text": 1.3448, + "ppl": 4.873, + "step": 3896 + }, + { + "epoch": 0.03, + "global_step": 3897, + "learning_rate": 0.00048457011686143576, + "loss": 1.5501, + "loss_base2": 2.2363, + "loss_pixel": 0.238, + "loss_text": 1.3121, + "ppl": 4.7119, + "step": 3897 + }, + { + "epoch": 0.03, + "global_step": 3898, + "learning_rate": 0.0004845659432387312, + "loss": 1.7129, + "loss_base2": 2.4712, + "loss_pixel": 0.2357, + "loss_text": 1.4772, + "ppl": 5.545, + "step": 3898 + }, + { + "epoch": 0.03, + "global_step": 3899, + "learning_rate": 0.0004845617696160267, + "loss": 1.7622, + "loss_base2": 2.5423, + "loss_pixel": 0.2359, + "loss_text": 1.5262, + "ppl": 5.8252, + "step": 3899 + }, + { + "epoch": 0.03, + "global_step": 3900, + "learning_rate": 0.00048455759599332223, + "loss": 1.8134, + "loss_base2": 2.6162, + "loss_pixel": 0.232, + "loss_text": 1.5815, + "ppl": 6.1313, + "step": 3900 + }, + { + "epoch": 0.03, + "global_step": 3901, + "learning_rate": 0.00048455342237061774, + "loss": 1.8339, + "loss_base2": 2.6458, + "loss_pixel": 0.232, + "loss_text": 1.602, + "ppl": 6.2582, + "step": 3901 + }, + { + "epoch": 0.03, + "global_step": 3902, + "learning_rate": 0.0004845492487479132, + "loss": 1.8472, + "loss_base2": 2.6649, + "loss_pixel": 0.2294, + "loss_text": 1.6178, + "ppl": 6.342, + "step": 3902 + }, + { + "epoch": 0.03, + "global_step": 3903, + "learning_rate": 0.0004845450751252087, + "loss": 1.8175, + "loss_base2": 2.6221, + "loss_pixel": 0.2297, + "loss_text": 1.5877, + "ppl": 6.1564, + "step": 3903 + }, + { + "epoch": 0.03, + "global_step": 3904, + "learning_rate": 0.0004845409015025042, + "loss": 1.8352, + "loss_base2": 2.6476, + "loss_pixel": 0.229, + "loss_text": 1.6062, + "ppl": 6.2664, + "step": 3904 + }, + { + "epoch": 0.03, + "global_step": 3905, + "learning_rate": 0.0004845367278797997, + "loss": 1.8136, + "loss_base2": 2.6165, + "loss_pixel": 0.2271, + "loss_text": 1.5865, + "ppl": 6.1325, + "step": 3905 + }, + { + "epoch": 0.03, + "global_step": 3906, + "learning_rate": 0.0004845325542570952, + "loss": 1.8194, + "loss_base2": 2.6248, + "loss_pixel": 0.2265, + "loss_text": 1.5929, + "ppl": 6.1682, + "step": 3906 + }, + { + "epoch": 0.03, + "global_step": 3907, + "learning_rate": 0.0004845283806343906, + "loss": 1.835, + "loss_base2": 2.6473, + "loss_pixel": 0.2263, + "loss_text": 1.6087, + "ppl": 6.2651, + "step": 3907 + }, + { + "epoch": 0.03, + "global_step": 3908, + "learning_rate": 0.0004845242070116861, + "loss": 1.82, + "loss_base2": 2.6257, + "loss_pixel": 0.2255, + "loss_text": 1.5946, + "ppl": 6.1719, + "step": 3908 + }, + { + "epoch": 0.03, + "global_step": 3909, + "learning_rate": 0.00048452003338898163, + "loss": 1.8305, + "loss_base2": 2.6409, + "loss_pixel": 0.2271, + "loss_text": 1.6033, + "ppl": 6.237, + "step": 3909 + }, + { + "epoch": 0.03, + "global_step": 3910, + "learning_rate": 0.00048451585976627714, + "loss": 1.8138, + "loss_base2": 2.6168, + "loss_pixel": 0.2232, + "loss_text": 1.5907, + "ppl": 6.1337, + "step": 3910 + }, + { + "epoch": 0.03, + "global_step": 3911, + "learning_rate": 0.0004845116861435726, + "loss": 1.8175, + "loss_base2": 2.6221, + "loss_pixel": 0.2239, + "loss_text": 1.5936, + "ppl": 6.1564, + "step": 3911 + }, + { + "epoch": 0.03, + "global_step": 3912, + "learning_rate": 0.0004845075125208681, + "loss": 1.8177, + "loss_base2": 2.6224, + "loss_pixel": 0.2224, + "loss_text": 1.5953, + "ppl": 6.1577, + "step": 3912 + }, + { + "epoch": 0.03, + "global_step": 3913, + "learning_rate": 0.0004845033388981636, + "loss": 1.8163, + "loss_base2": 2.6204, + "loss_pixel": 0.2219, + "loss_text": 1.5944, + "ppl": 6.1491, + "step": 3913 + }, + { + "epoch": 0.03, + "global_step": 3914, + "learning_rate": 0.0004844991652754591, + "loss": 1.8293, + "loss_base2": 2.6391, + "loss_pixel": 0.2208, + "loss_text": 1.6085, + "ppl": 6.2295, + "step": 3914 + }, + { + "epoch": 0.03, + "global_step": 3915, + "learning_rate": 0.0004844949916527546, + "loss": 1.8127, + "loss_base2": 2.6152, + "loss_pixel": 0.2215, + "loss_text": 1.5913, + "ppl": 6.127, + "step": 3915 + }, + { + "epoch": 0.03, + "global_step": 3916, + "learning_rate": 0.0004844908180300501, + "loss": 1.8071, + "loss_base2": 2.6071, + "loss_pixel": 0.2215, + "loss_text": 1.5857, + "ppl": 6.0928, + "step": 3916 + }, + { + "epoch": 0.03, + "global_step": 3917, + "learning_rate": 0.0004844866444073456, + "loss": 1.8151, + "loss_base2": 2.6186, + "loss_pixel": 0.2218, + "loss_text": 1.5933, + "ppl": 6.1417, + "step": 3917 + }, + { + "epoch": 0.03, + "global_step": 3918, + "learning_rate": 0.0004844824707846411, + "loss": 1.8131, + "loss_base2": 2.6158, + "loss_pixel": 0.2205, + "loss_text": 1.5925, + "ppl": 6.1294, + "step": 3918 + }, + { + "epoch": 0.03, + "global_step": 3919, + "learning_rate": 0.0004844782971619366, + "loss": 1.8067, + "loss_base2": 2.6065, + "loss_pixel": 0.2206, + "loss_text": 1.5861, + "ppl": 6.0903, + "step": 3919 + }, + { + "epoch": 0.03, + "global_step": 3920, + "learning_rate": 0.00048447412353923205, + "loss": 1.8142, + "loss_base2": 2.6173, + "loss_pixel": 0.2201, + "loss_text": 1.5941, + "ppl": 6.1362, + "step": 3920 + }, + { + "epoch": 0.03, + "global_step": 3921, + "learning_rate": 0.00048446994991652756, + "loss": 1.8012, + "loss_base2": 2.5986, + "loss_pixel": 0.2192, + "loss_text": 1.5821, + "ppl": 6.0569, + "step": 3921 + }, + { + "epoch": 0.03, + "global_step": 3922, + "learning_rate": 0.00048446577629382306, + "loss": 1.8145, + "loss_base2": 2.6178, + "loss_pixel": 0.2187, + "loss_text": 1.5959, + "ppl": 6.138, + "step": 3922 + }, + { + "epoch": 0.03, + "global_step": 3923, + "learning_rate": 0.00048446160267111857, + "loss": 1.8049, + "loss_base2": 2.6039, + "loss_pixel": 0.2177, + "loss_text": 1.5872, + "ppl": 6.0794, + "step": 3923 + }, + { + "epoch": 0.03, + "global_step": 3924, + "learning_rate": 0.0004844574290484141, + "loss": 1.8057, + "loss_base2": 2.6051, + "loss_pixel": 0.2167, + "loss_text": 1.589, + "ppl": 6.0842, + "step": 3924 + }, + { + "epoch": 0.03, + "global_step": 3925, + "learning_rate": 0.0004844532554257095, + "loss": 1.8086, + "loss_base2": 2.6093, + "loss_pixel": 0.2169, + "loss_text": 1.5917, + "ppl": 6.1019, + "step": 3925 + }, + { + "epoch": 0.03, + "global_step": 3926, + "learning_rate": 0.000484449081803005, + "loss": 1.7779, + "loss_base2": 2.565, + "loss_pixel": 0.2173, + "loss_text": 1.5606, + "ppl": 5.9174, + "step": 3926 + }, + { + "epoch": 0.03, + "global_step": 3927, + "learning_rate": 0.0004844449081803005, + "loss": 1.8085, + "loss_base2": 2.6091, + "loss_pixel": 0.2163, + "loss_text": 1.5922, + "ppl": 6.1013, + "step": 3927 + }, + { + "epoch": 0.03, + "global_step": 3928, + "learning_rate": 0.000484440734557596, + "loss": 1.7864, + "loss_base2": 2.5772, + "loss_pixel": 0.2164, + "loss_text": 1.57, + "ppl": 5.9679, + "step": 3928 + }, + { + "epoch": 0.03, + "global_step": 3929, + "learning_rate": 0.00048443656093489145, + "loss": 1.8059, + "loss_base2": 2.6054, + "loss_pixel": 0.2137, + "loss_text": 1.5922, + "ppl": 6.0854, + "step": 3929 + }, + { + "epoch": 0.03, + "global_step": 3930, + "learning_rate": 0.00048443238731218696, + "loss": 1.7935, + "loss_base2": 2.5875, + "loss_pixel": 0.2144, + "loss_text": 1.5791, + "ppl": 6.0105, + "step": 3930 + }, + { + "epoch": 0.03, + "global_step": 3931, + "learning_rate": 0.00048442821368948247, + "loss": 1.7984, + "loss_base2": 2.5945, + "loss_pixel": 0.2135, + "loss_text": 1.5848, + "ppl": 6.04, + "step": 3931 + }, + { + "epoch": 0.03, + "global_step": 3932, + "learning_rate": 0.000484424040066778, + "loss": 1.8206, + "loss_base2": 2.6266, + "loss_pixel": 0.2138, + "loss_text": 1.6067, + "ppl": 6.1756, + "step": 3932 + }, + { + "epoch": 0.03, + "global_step": 3933, + "learning_rate": 0.0004844198664440735, + "loss": 1.7926, + "loss_base2": 2.5862, + "loss_pixel": 0.2143, + "loss_text": 1.5784, + "ppl": 6.005, + "step": 3933 + }, + { + "epoch": 0.03, + "global_step": 3934, + "learning_rate": 0.00048441569282136894, + "loss": 1.8076, + "loss_base2": 2.6078, + "loss_pixel": 0.2143, + "loss_text": 1.5932, + "ppl": 6.0958, + "step": 3934 + }, + { + "epoch": 0.03, + "global_step": 3935, + "learning_rate": 0.00048441151919866444, + "loss": 1.7965, + "loss_base2": 2.5918, + "loss_pixel": 0.2138, + "loss_text": 1.5827, + "ppl": 6.0285, + "step": 3935 + }, + { + "epoch": 0.03, + "global_step": 3936, + "learning_rate": 0.00048440734557595995, + "loss": 1.7936, + "loss_base2": 2.5876, + "loss_pixel": 0.2135, + "loss_text": 1.5801, + "ppl": 6.0111, + "step": 3936 + }, + { + "epoch": 0.03, + "global_step": 3937, + "learning_rate": 0.00048440317195325546, + "loss": 1.7878, + "loss_base2": 2.5793, + "loss_pixel": 0.2125, + "loss_text": 1.5754, + "ppl": 5.9763, + "step": 3937 + }, + { + "epoch": 0.03, + "global_step": 3938, + "learning_rate": 0.00048439899833055096, + "loss": 1.7801, + "loss_base2": 2.5681, + "loss_pixel": 0.2132, + "loss_text": 1.5669, + "ppl": 5.9304, + "step": 3938 + }, + { + "epoch": 0.03, + "global_step": 3939, + "learning_rate": 0.0004843948247078464, + "loss": 1.7931, + "loss_base2": 2.5869, + "loss_pixel": 0.2136, + "loss_text": 1.5795, + "ppl": 6.008, + "step": 3939 + }, + { + "epoch": 0.03, + "global_step": 3940, + "learning_rate": 0.0004843906510851419, + "loss": 1.7872, + "loss_base2": 2.5784, + "loss_pixel": 0.2126, + "loss_text": 1.5746, + "ppl": 5.9727, + "step": 3940 + }, + { + "epoch": 0.03, + "global_step": 3941, + "learning_rate": 0.00048438647746243743, + "loss": 1.8048, + "loss_base2": 2.6038, + "loss_pixel": 0.2151, + "loss_text": 1.5897, + "ppl": 6.0788, + "step": 3941 + }, + { + "epoch": 0.03, + "global_step": 3942, + "learning_rate": 0.00048438230383973294, + "loss": 1.8034, + "loss_base2": 2.6018, + "loss_pixel": 0.2119, + "loss_text": 1.5914, + "ppl": 6.0703, + "step": 3942 + }, + { + "epoch": 0.03, + "global_step": 3943, + "learning_rate": 0.0004843781302170284, + "loss": 1.8045, + "loss_base2": 2.6033, + "loss_pixel": 0.2119, + "loss_text": 1.5927, + "ppl": 6.0769, + "step": 3943 + }, + { + "epoch": 0.03, + "global_step": 3944, + "learning_rate": 0.00048437395659432385, + "loss": 1.7903, + "loss_base2": 2.5829, + "loss_pixel": 0.2109, + "loss_text": 1.5794, + "ppl": 5.9912, + "step": 3944 + }, + { + "epoch": 0.03, + "global_step": 3945, + "learning_rate": 0.00048436978297161935, + "loss": 1.8085, + "loss_base2": 2.6091, + "loss_pixel": 0.2116, + "loss_text": 1.5969, + "ppl": 6.1013, + "step": 3945 + }, + { + "epoch": 0.03, + "global_step": 3946, + "learning_rate": 0.00048436560934891486, + "loss": 1.7756, + "loss_base2": 2.5616, + "loss_pixel": 0.2123, + "loss_text": 1.5633, + "ppl": 5.9038, + "step": 3946 + }, + { + "epoch": 0.03, + "global_step": 3947, + "learning_rate": 0.00048436143572621037, + "loss": 1.7879, + "loss_base2": 2.5794, + "loss_pixel": 0.2113, + "loss_text": 1.5766, + "ppl": 5.9769, + "step": 3947 + }, + { + "epoch": 0.03, + "global_step": 3948, + "learning_rate": 0.0004843572621035058, + "loss": 1.7776, + "loss_base2": 2.5645, + "loss_pixel": 0.2123, + "loss_text": 1.5653, + "ppl": 5.9156, + "step": 3948 + }, + { + "epoch": 0.03, + "global_step": 3949, + "learning_rate": 0.00048435308848080133, + "loss": 1.7997, + "loss_base2": 2.5964, + "loss_pixel": 0.2112, + "loss_text": 1.5885, + "ppl": 6.0478, + "step": 3949 + }, + { + "epoch": 0.03, + "global_step": 3950, + "learning_rate": 0.00048434891485809684, + "loss": 1.8047, + "loss_base2": 2.6036, + "loss_pixel": 0.211, + "loss_text": 1.5937, + "ppl": 6.0781, + "step": 3950 + }, + { + "epoch": 0.03, + "global_step": 3951, + "learning_rate": 0.00048434474123539234, + "loss": 1.7922, + "loss_base2": 2.5856, + "loss_pixel": 0.2111, + "loss_text": 1.5811, + "ppl": 6.0026, + "step": 3951 + }, + { + "epoch": 0.03, + "global_step": 3952, + "learning_rate": 0.0004843405676126878, + "loss": 1.791, + "loss_base2": 2.5839, + "loss_pixel": 0.211, + "loss_text": 1.58, + "ppl": 5.9954, + "step": 3952 + }, + { + "epoch": 0.03, + "global_step": 3953, + "learning_rate": 0.0004843363939899833, + "loss": 1.8036, + "loss_base2": 2.602, + "loss_pixel": 0.2105, + "loss_text": 1.5931, + "ppl": 6.0715, + "step": 3953 + }, + { + "epoch": 0.03, + "global_step": 3954, + "learning_rate": 0.0004843322203672788, + "loss": 1.7918, + "loss_base2": 2.585, + "loss_pixel": 0.2102, + "loss_text": 1.5816, + "ppl": 6.0002, + "step": 3954 + }, + { + "epoch": 0.03, + "global_step": 3955, + "learning_rate": 0.0004843280467445743, + "loss": 1.7904, + "loss_base2": 2.583, + "loss_pixel": 0.2105, + "loss_text": 1.5799, + "ppl": 5.9918, + "step": 3955 + }, + { + "epoch": 0.03, + "global_step": 3956, + "learning_rate": 0.0004843238731218698, + "loss": 1.793, + "loss_base2": 2.5868, + "loss_pixel": 0.2095, + "loss_text": 1.5835, + "ppl": 6.0074, + "step": 3956 + }, + { + "epoch": 0.03, + "global_step": 3957, + "learning_rate": 0.0004843196994991653, + "loss": 1.7805, + "loss_base2": 2.5687, + "loss_pixel": 0.2106, + "loss_text": 1.5699, + "ppl": 5.9328, + "step": 3957 + }, + { + "epoch": 0.03, + "global_step": 3958, + "learning_rate": 0.0004843155258764608, + "loss": 1.7853, + "loss_base2": 2.5756, + "loss_pixel": 0.2096, + "loss_text": 1.5756, + "ppl": 5.9614, + "step": 3958 + }, + { + "epoch": 0.03, + "global_step": 3959, + "learning_rate": 0.0004843113522537563, + "loss": 1.7712, + "loss_base2": 2.5553, + "loss_pixel": 0.2088, + "loss_text": 1.5624, + "ppl": 5.8779, + "step": 3959 + }, + { + "epoch": 0.03, + "global_step": 3960, + "learning_rate": 0.0004843071786310518, + "loss": 1.7843, + "loss_base2": 2.5742, + "loss_pixel": 0.2084, + "loss_text": 1.5759, + "ppl": 5.9554, + "step": 3960 + }, + { + "epoch": 0.03, + "global_step": 3961, + "learning_rate": 0.00048430300500834725, + "loss": 1.7722, + "loss_base2": 2.5567, + "loss_pixel": 0.2079, + "loss_text": 1.5643, + "ppl": 5.8838, + "step": 3961 + }, + { + "epoch": 0.03, + "global_step": 3962, + "learning_rate": 0.00048429883138564276, + "loss": 1.802, + "loss_base2": 2.5997, + "loss_pixel": 0.2087, + "loss_text": 1.5933, + "ppl": 6.0618, + "step": 3962 + }, + { + "epoch": 0.03, + "global_step": 3963, + "learning_rate": 0.0004842946577629382, + "loss": 1.8028, + "loss_base2": 2.6009, + "loss_pixel": 0.2071, + "loss_text": 1.5957, + "ppl": 6.0666, + "step": 3963 + }, + { + "epoch": 0.03, + "global_step": 3964, + "learning_rate": 0.0004842904841402337, + "loss": 1.787, + "loss_base2": 2.5781, + "loss_pixel": 0.2081, + "loss_text": 1.5789, + "ppl": 5.9715, + "step": 3964 + }, + { + "epoch": 0.03, + "global_step": 3965, + "learning_rate": 0.00048428631051752923, + "loss": 1.7879, + "loss_base2": 2.5794, + "loss_pixel": 0.2092, + "loss_text": 1.5786, + "ppl": 5.9769, + "step": 3965 + }, + { + "epoch": 0.03, + "global_step": 3966, + "learning_rate": 0.0004842821368948247, + "loss": 1.7776, + "loss_base2": 2.5645, + "loss_pixel": 0.2079, + "loss_text": 1.5698, + "ppl": 5.9156, + "step": 3966 + }, + { + "epoch": 0.03, + "global_step": 3967, + "learning_rate": 0.0004842779632721202, + "loss": 1.8027, + "loss_base2": 2.6007, + "loss_pixel": 0.2109, + "loss_text": 1.5917, + "ppl": 6.066, + "step": 3967 + }, + { + "epoch": 0.03, + "global_step": 3968, + "learning_rate": 0.0004842737896494157, + "loss": 1.7075, + "loss_base2": 2.4634, + "loss_pixel": 0.2086, + "loss_text": 1.4989, + "ppl": 5.5152, + "step": 3968 + }, + { + "epoch": 0.03, + "global_step": 3969, + "learning_rate": 0.0004842696160267112, + "loss": 1.5307, + "loss_base2": 2.2083, + "loss_pixel": 0.2083, + "loss_text": 1.3224, + "ppl": 4.6214, + "step": 3969 + }, + { + "epoch": 0.03, + "global_step": 3970, + "learning_rate": 0.00048426544240400666, + "loss": 1.5627, + "loss_base2": 2.2545, + "loss_pixel": 0.2074, + "loss_text": 1.3553, + "ppl": 4.7717, + "step": 3970 + }, + { + "epoch": 0.03, + "global_step": 3971, + "learning_rate": 0.00048426126878130216, + "loss": 1.5427, + "loss_base2": 2.2256, + "loss_pixel": 0.2074, + "loss_text": 1.3353, + "ppl": 4.6772, + "step": 3971 + }, + { + "epoch": 0.03, + "global_step": 3972, + "learning_rate": 0.00048425709515859767, + "loss": 1.5689, + "loss_base2": 2.2634, + "loss_pixel": 0.2068, + "loss_text": 1.3621, + "ppl": 4.8014, + "step": 3972 + }, + { + "epoch": 0.03, + "global_step": 3973, + "learning_rate": 0.0004842529215358932, + "loss": 1.5482, + "loss_base2": 2.2336, + "loss_pixel": 0.2073, + "loss_text": 1.3409, + "ppl": 4.703, + "step": 3973 + }, + { + "epoch": 0.03, + "global_step": 3974, + "learning_rate": 0.0004842487479131887, + "loss": 1.5353, + "loss_base2": 2.215, + "loss_pixel": 0.21, + "loss_text": 1.3253, + "ppl": 4.6427, + "step": 3974 + }, + { + "epoch": 0.03, + "global_step": 3975, + "learning_rate": 0.00048424457429048414, + "loss": 1.5485, + "loss_base2": 2.234, + "loss_pixel": 0.206, + "loss_text": 1.3426, + "ppl": 4.7044, + "step": 3975 + }, + { + "epoch": 0.03, + "global_step": 3976, + "learning_rate": 0.00048424040066777965, + "loss": 1.5441, + "loss_base2": 2.2277, + "loss_pixel": 0.2054, + "loss_text": 1.3387, + "ppl": 4.6838, + "step": 3976 + }, + { + "epoch": 0.03, + "global_step": 3977, + "learning_rate": 0.00048423622704507515, + "loss": 1.5391, + "loss_base2": 2.2205, + "loss_pixel": 0.2056, + "loss_text": 1.3335, + "ppl": 4.6604, + "step": 3977 + }, + { + "epoch": 0.03, + "global_step": 3978, + "learning_rate": 0.00048423205342237066, + "loss": 1.5373, + "loss_base2": 2.2179, + "loss_pixel": 0.2059, + "loss_text": 1.3313, + "ppl": 4.652, + "step": 3978 + }, + { + "epoch": 0.03, + "global_step": 3979, + "learning_rate": 0.0004842278797996661, + "loss": 1.528, + "loss_base2": 2.2044, + "loss_pixel": 0.2052, + "loss_text": 1.3228, + "ppl": 4.6089, + "step": 3979 + }, + { + "epoch": 0.03, + "global_step": 3980, + "learning_rate": 0.0004842237061769616, + "loss": 1.5343, + "loss_base2": 2.2135, + "loss_pixel": 0.2042, + "loss_text": 1.3301, + "ppl": 4.6381, + "step": 3980 + }, + { + "epoch": 0.03, + "global_step": 3981, + "learning_rate": 0.00048421953255425713, + "loss": 1.5392, + "loss_base2": 2.2206, + "loss_pixel": 0.2041, + "loss_text": 1.3351, + "ppl": 4.6609, + "step": 3981 + }, + { + "epoch": 0.03, + "global_step": 3982, + "learning_rate": 0.0004842153589315526, + "loss": 1.5427, + "loss_base2": 2.2256, + "loss_pixel": 0.2069, + "loss_text": 1.3357, + "ppl": 4.6772, + "step": 3982 + }, + { + "epoch": 0.03, + "global_step": 3983, + "learning_rate": 0.0004842111853088481, + "loss": 1.5143, + "loss_base2": 2.1847, + "loss_pixel": 0.205, + "loss_text": 1.3093, + "ppl": 4.5462, + "step": 3983 + }, + { + "epoch": 0.03, + "global_step": 3984, + "learning_rate": 0.00048420701168614354, + "loss": 1.5313, + "loss_base2": 2.2092, + "loss_pixel": 0.2042, + "loss_text": 1.327, + "ppl": 4.6242, + "step": 3984 + }, + { + "epoch": 0.03, + "global_step": 3985, + "learning_rate": 0.00048420283806343905, + "loss": 1.5329, + "loss_base2": 2.2115, + "loss_pixel": 0.2046, + "loss_text": 1.3283, + "ppl": 4.6316, + "step": 3985 + }, + { + "epoch": 0.03, + "global_step": 3986, + "learning_rate": 0.00048419866444073456, + "loss": 1.7839, + "loss_base2": 2.5736, + "loss_pixel": 0.205, + "loss_text": 1.579, + "ppl": 5.953, + "step": 3986 + }, + { + "epoch": 0.03, + "global_step": 3987, + "learning_rate": 0.00048419449081803006, + "loss": 1.8028, + "loss_base2": 2.6009, + "loss_pixel": 0.205, + "loss_text": 1.5978, + "ppl": 6.0666, + "step": 3987 + }, + { + "epoch": 0.03, + "global_step": 3988, + "learning_rate": 0.00048419031719532557, + "loss": 1.8155, + "loss_base2": 2.6192, + "loss_pixel": 0.2052, + "loss_text": 1.6103, + "ppl": 6.1441, + "step": 3988 + }, + { + "epoch": 0.03, + "global_step": 3989, + "learning_rate": 0.000484186143572621, + "loss": 1.8064, + "loss_base2": 2.6061, + "loss_pixel": 0.206, + "loss_text": 1.6004, + "ppl": 6.0885, + "step": 3989 + }, + { + "epoch": 0.03, + "global_step": 3990, + "learning_rate": 0.00048418196994991653, + "loss": 1.8178, + "loss_base2": 2.6225, + "loss_pixel": 0.2092, + "loss_text": 1.6086, + "ppl": 6.1583, + "step": 3990 + }, + { + "epoch": 0.03, + "global_step": 3991, + "learning_rate": 0.00048417779632721204, + "loss": 1.7988, + "loss_base2": 2.5951, + "loss_pixel": 0.2182, + "loss_text": 1.5807, + "ppl": 6.0424, + "step": 3991 + }, + { + "epoch": 0.03, + "global_step": 3992, + "learning_rate": 0.00048417362270450755, + "loss": 1.8094, + "loss_base2": 2.6104, + "loss_pixel": 0.2163, + "loss_text": 1.5931, + "ppl": 6.1068, + "step": 3992 + }, + { + "epoch": 0.03, + "global_step": 3993, + "learning_rate": 0.000484169449081803, + "loss": 1.7997, + "loss_base2": 2.5964, + "loss_pixel": 0.2185, + "loss_text": 1.5813, + "ppl": 6.0478, + "step": 3993 + }, + { + "epoch": 0.03, + "global_step": 3994, + "learning_rate": 0.0004841652754590985, + "loss": 1.7973, + "loss_base2": 2.593, + "loss_pixel": 0.2232, + "loss_text": 1.574, + "ppl": 6.0333, + "step": 3994 + }, + { + "epoch": 0.03, + "global_step": 3995, + "learning_rate": 0.000484161101836394, + "loss": 1.8303, + "loss_base2": 2.6406, + "loss_pixel": 0.2229, + "loss_text": 1.6074, + "ppl": 6.2358, + "step": 3995 + }, + { + "epoch": 0.03, + "global_step": 3996, + "learning_rate": 0.0004841569282136895, + "loss": 1.8013, + "loss_base2": 2.5987, + "loss_pixel": 0.2225, + "loss_text": 1.5787, + "ppl": 6.0575, + "step": 3996 + }, + { + "epoch": 0.03, + "global_step": 3997, + "learning_rate": 0.00048415275459098503, + "loss": 1.7954, + "loss_base2": 2.5902, + "loss_pixel": 0.2175, + "loss_text": 1.5779, + "ppl": 6.0219, + "step": 3997 + }, + { + "epoch": 0.03, + "global_step": 3998, + "learning_rate": 0.0004841485809682805, + "loss": 1.7938, + "loss_base2": 2.5879, + "loss_pixel": 0.2179, + "loss_text": 1.5759, + "ppl": 6.0123, + "step": 3998 + }, + { + "epoch": 0.03, + "global_step": 3999, + "learning_rate": 0.000484144407345576, + "loss": 1.7909, + "loss_base2": 2.5837, + "loss_pixel": 0.2153, + "loss_text": 1.5756, + "ppl": 5.9948, + "step": 3999 + }, + { + "epoch": 0.03, + "global_step": 4000, + "learning_rate": 0.0004841402337228715, + "loss": 1.8253, + "loss_base2": 2.6334, + "loss_pixel": 0.2151, + "loss_text": 1.6102, + "ppl": 6.2047, + "step": 4000 + }, + { + "epoch": 0.03, + "global_step": 4001, + "learning_rate": 0.00048413606010016695, + "loss": 1.8043, + "loss_base2": 2.6031, + "loss_pixel": 0.2146, + "loss_text": 1.5897, + "ppl": 6.0757, + "step": 4001 + }, + { + "epoch": 0.03, + "global_step": 4002, + "learning_rate": 0.0004841318864774624, + "loss": 1.793, + "loss_base2": 2.5868, + "loss_pixel": 0.2134, + "loss_text": 1.5796, + "ppl": 6.0074, + "step": 4002 + }, + { + "epoch": 0.03, + "global_step": 4003, + "learning_rate": 0.0004841277128547579, + "loss": 1.7821, + "loss_base2": 2.571, + "loss_pixel": 0.211, + "loss_text": 1.571, + "ppl": 5.9423, + "step": 4003 + }, + { + "epoch": 0.03, + "global_step": 4004, + "learning_rate": 0.0004841235392320534, + "loss": 1.7906, + "loss_base2": 2.5833, + "loss_pixel": 0.2111, + "loss_text": 1.5795, + "ppl": 5.993, + "step": 4004 + }, + { + "epoch": 0.03, + "global_step": 4005, + "learning_rate": 0.0004841193656093489, + "loss": 1.7706, + "loss_base2": 2.5544, + "loss_pixel": 0.2101, + "loss_text": 1.5605, + "ppl": 5.8744, + "step": 4005 + }, + { + "epoch": 0.03, + "global_step": 4006, + "learning_rate": 0.00048411519198664443, + "loss": 1.7973, + "loss_base2": 2.593, + "loss_pixel": 0.2094, + "loss_text": 1.5879, + "ppl": 6.0333, + "step": 4006 + }, + { + "epoch": 0.03, + "global_step": 4007, + "learning_rate": 0.0004841110183639399, + "loss": 1.7842, + "loss_base2": 2.5741, + "loss_pixel": 0.21, + "loss_text": 1.5741, + "ppl": 5.9548, + "step": 4007 + }, + { + "epoch": 0.03, + "global_step": 4008, + "learning_rate": 0.0004841068447412354, + "loss": 1.809, + "loss_base2": 2.6098, + "loss_pixel": 0.2091, + "loss_text": 1.5999, + "ppl": 6.1043, + "step": 4008 + }, + { + "epoch": 0.03, + "global_step": 4009, + "learning_rate": 0.0004841026711185309, + "loss": 1.796, + "loss_base2": 2.5911, + "loss_pixel": 0.2078, + "loss_text": 1.5882, + "ppl": 6.0255, + "step": 4009 + }, + { + "epoch": 0.03, + "global_step": 4010, + "learning_rate": 0.0004840984974958264, + "loss": 1.7872, + "loss_base2": 2.5784, + "loss_pixel": 0.208, + "loss_text": 1.5792, + "ppl": 5.9727, + "step": 4010 + }, + { + "epoch": 0.03, + "global_step": 4011, + "learning_rate": 0.00048409432387312186, + "loss": 1.7993, + "loss_base2": 2.5958, + "loss_pixel": 0.2091, + "loss_text": 1.5902, + "ppl": 6.0454, + "step": 4011 + }, + { + "epoch": 0.03, + "global_step": 4012, + "learning_rate": 0.00048409015025041737, + "loss": 1.8177, + "loss_base2": 2.6224, + "loss_pixel": 0.2099, + "loss_text": 1.6078, + "ppl": 6.1577, + "step": 4012 + }, + { + "epoch": 0.03, + "global_step": 4013, + "learning_rate": 0.0004840859766277129, + "loss": 1.8015, + "loss_base2": 2.599, + "loss_pixel": 0.2088, + "loss_text": 1.5926, + "ppl": 6.0587, + "step": 4013 + }, + { + "epoch": 0.03, + "global_step": 4014, + "learning_rate": 0.0004840818030050084, + "loss": 1.7972, + "loss_base2": 2.5928, + "loss_pixel": 0.2085, + "loss_text": 1.5887, + "ppl": 6.0327, + "step": 4014 + }, + { + "epoch": 0.03, + "global_step": 4015, + "learning_rate": 0.0004840776293823039, + "loss": 1.7926, + "loss_base2": 2.5862, + "loss_pixel": 0.2079, + "loss_text": 1.5847, + "ppl": 6.005, + "step": 4015 + }, + { + "epoch": 0.03, + "global_step": 4016, + "learning_rate": 0.00048407345575959934, + "loss": 1.8005, + "loss_base2": 2.5976, + "loss_pixel": 0.206, + "loss_text": 1.5945, + "ppl": 6.0527, + "step": 4016 + }, + { + "epoch": 0.03, + "global_step": 4017, + "learning_rate": 0.00048406928213689485, + "loss": 1.7867, + "loss_base2": 2.5777, + "loss_pixel": 0.2079, + "loss_text": 1.5788, + "ppl": 5.9697, + "step": 4017 + }, + { + "epoch": 0.03, + "global_step": 4018, + "learning_rate": 0.00048406510851419036, + "loss": 1.8014, + "loss_base2": 2.5989, + "loss_pixel": 0.2061, + "loss_text": 1.5952, + "ppl": 6.0581, + "step": 4018 + }, + { + "epoch": 0.03, + "global_step": 4019, + "learning_rate": 0.0004840609348914858, + "loss": 1.781, + "loss_base2": 2.5694, + "loss_pixel": 0.2023, + "loss_text": 1.5787, + "ppl": 5.9358, + "step": 4019 + }, + { + "epoch": 0.03, + "global_step": 4020, + "learning_rate": 0.00048405676126878126, + "loss": 1.7908, + "loss_base2": 2.5836, + "loss_pixel": 0.2039, + "loss_text": 1.5868, + "ppl": 5.9942, + "step": 4020 + }, + { + "epoch": 0.03, + "global_step": 4021, + "learning_rate": 0.00048405258764607677, + "loss": 1.7859, + "loss_base2": 2.5765, + "loss_pixel": 0.2032, + "loss_text": 1.5827, + "ppl": 5.9649, + "step": 4021 + }, + { + "epoch": 0.03, + "global_step": 4022, + "learning_rate": 0.0004840484140233723, + "loss": 1.7828, + "loss_base2": 2.572, + "loss_pixel": 0.2027, + "loss_text": 1.5801, + "ppl": 5.9465, + "step": 4022 + }, + { + "epoch": 0.03, + "global_step": 4023, + "learning_rate": 0.0004840442404006678, + "loss": 1.7943, + "loss_base2": 2.5886, + "loss_pixel": 0.2044, + "loss_text": 1.5899, + "ppl": 6.0153, + "step": 4023 + }, + { + "epoch": 0.03, + "global_step": 4024, + "learning_rate": 0.0004840400667779633, + "loss": 1.7995, + "loss_base2": 2.5961, + "loss_pixel": 0.2007, + "loss_text": 1.5988, + "ppl": 6.0466, + "step": 4024 + }, + { + "epoch": 0.03, + "global_step": 4025, + "learning_rate": 0.00048403589315525875, + "loss": 1.7666, + "loss_base2": 2.5487, + "loss_pixel": 0.2007, + "loss_text": 1.5659, + "ppl": 5.8509, + "step": 4025 + }, + { + "epoch": 0.03, + "global_step": 4026, + "learning_rate": 0.00048403171953255425, + "loss": 1.7783, + "loss_base2": 2.5655, + "loss_pixel": 0.1997, + "loss_text": 1.5786, + "ppl": 5.9198, + "step": 4026 + }, + { + "epoch": 0.03, + "global_step": 4027, + "learning_rate": 0.00048402754590984976, + "loss": 1.7714, + "loss_base2": 2.5556, + "loss_pixel": 0.2005, + "loss_text": 1.5709, + "ppl": 5.8791, + "step": 4027 + }, + { + "epoch": 0.03, + "global_step": 4028, + "learning_rate": 0.00048402337228714527, + "loss": 1.7857, + "loss_base2": 2.5762, + "loss_pixel": 0.2005, + "loss_text": 1.5852, + "ppl": 5.9638, + "step": 4028 + }, + { + "epoch": 0.03, + "global_step": 4029, + "learning_rate": 0.0004840191986644407, + "loss": 1.7992, + "loss_base2": 2.5957, + "loss_pixel": 0.1997, + "loss_text": 1.5994, + "ppl": 6.0448, + "step": 4029 + }, + { + "epoch": 0.03, + "global_step": 4030, + "learning_rate": 0.00048401502504173623, + "loss": 1.7896, + "loss_base2": 2.5818, + "loss_pixel": 0.2098, + "loss_text": 1.5798, + "ppl": 5.9871, + "step": 4030 + }, + { + "epoch": 0.03, + "global_step": 4031, + "learning_rate": 0.00048401085141903174, + "loss": 1.7949, + "loss_base2": 2.5895, + "loss_pixel": 0.2084, + "loss_text": 1.5865, + "ppl": 6.0189, + "step": 4031 + }, + { + "epoch": 0.03, + "global_step": 4032, + "learning_rate": 0.00048400667779632724, + "loss": 1.7998, + "loss_base2": 2.5966, + "loss_pixel": 0.2064, + "loss_text": 1.5934, + "ppl": 6.0484, + "step": 4032 + }, + { + "epoch": 0.03, + "global_step": 4033, + "learning_rate": 0.00048400250417362275, + "loss": 1.7866, + "loss_base2": 2.5775, + "loss_pixel": 0.2062, + "loss_text": 1.5804, + "ppl": 5.9691, + "step": 4033 + }, + { + "epoch": 0.03, + "global_step": 4034, + "learning_rate": 0.0004839983305509182, + "loss": 1.7892, + "loss_base2": 2.5813, + "loss_pixel": 0.2062, + "loss_text": 1.583, + "ppl": 5.9847, + "step": 4034 + }, + { + "epoch": 0.03, + "global_step": 4035, + "learning_rate": 0.0004839941569282137, + "loss": 1.795, + "loss_base2": 2.5896, + "loss_pixel": 0.2069, + "loss_text": 1.5881, + "ppl": 6.0195, + "step": 4035 + }, + { + "epoch": 0.03, + "global_step": 4036, + "learning_rate": 0.0004839899833055092, + "loss": 1.7898, + "loss_base2": 2.5821, + "loss_pixel": 0.2047, + "loss_text": 1.5852, + "ppl": 5.9883, + "step": 4036 + }, + { + "epoch": 0.03, + "global_step": 4037, + "learning_rate": 0.0004839858096828047, + "loss": 1.7827, + "loss_base2": 2.5719, + "loss_pixel": 0.2057, + "loss_text": 1.577, + "ppl": 5.9459, + "step": 4037 + }, + { + "epoch": 0.03, + "global_step": 4038, + "learning_rate": 0.0004839816360601001, + "loss": 1.8125, + "loss_base2": 2.6149, + "loss_pixel": 0.2044, + "loss_text": 1.6081, + "ppl": 6.1257, + "step": 4038 + }, + { + "epoch": 0.03, + "global_step": 4039, + "learning_rate": 0.00048397746243739563, + "loss": 1.7653, + "loss_base2": 2.5468, + "loss_pixel": 0.2038, + "loss_text": 1.5615, + "ppl": 5.8433, + "step": 4039 + }, + { + "epoch": 0.03, + "global_step": 4040, + "learning_rate": 0.00048397328881469114, + "loss": 1.7802, + "loss_base2": 2.5683, + "loss_pixel": 0.2043, + "loss_text": 1.5759, + "ppl": 5.931, + "step": 4040 + }, + { + "epoch": 0.03, + "global_step": 4041, + "learning_rate": 0.00048396911519198665, + "loss": 1.7885, + "loss_base2": 2.5803, + "loss_pixel": 0.2034, + "loss_text": 1.5851, + "ppl": 5.9805, + "step": 4041 + }, + { + "epoch": 0.03, + "global_step": 4042, + "learning_rate": 0.00048396494156928215, + "loss": 1.7796, + "loss_base2": 2.5674, + "loss_pixel": 0.2029, + "loss_text": 1.5767, + "ppl": 5.9275, + "step": 4042 + }, + { + "epoch": 0.03, + "global_step": 4043, + "learning_rate": 0.0004839607679465776, + "loss": 1.7884, + "loss_base2": 2.5801, + "loss_pixel": 0.2044, + "loss_text": 1.584, + "ppl": 5.9799, + "step": 4043 + }, + { + "epoch": 0.03, + "global_step": 4044, + "learning_rate": 0.0004839565943238731, + "loss": 1.7741, + "loss_base2": 2.5595, + "loss_pixel": 0.2027, + "loss_text": 1.5714, + "ppl": 5.895, + "step": 4044 + }, + { + "epoch": 0.03, + "global_step": 4045, + "learning_rate": 0.0004839524207011686, + "loss": 1.7844, + "loss_base2": 2.5743, + "loss_pixel": 0.2018, + "loss_text": 1.5826, + "ppl": 5.956, + "step": 4045 + }, + { + "epoch": 0.03, + "global_step": 4046, + "learning_rate": 0.00048394824707846413, + "loss": 1.7602, + "loss_base2": 2.5394, + "loss_pixel": 0.2021, + "loss_text": 1.5581, + "ppl": 5.8136, + "step": 4046 + }, + { + "epoch": 0.03, + "global_step": 4047, + "learning_rate": 0.00048394407345575964, + "loss": 1.7923, + "loss_base2": 2.5857, + "loss_pixel": 0.2054, + "loss_text": 1.5869, + "ppl": 6.0032, + "step": 4047 + }, + { + "epoch": 0.03, + "global_step": 4048, + "learning_rate": 0.0004839398998330551, + "loss": 1.7903, + "loss_base2": 2.5829, + "loss_pixel": 0.2025, + "loss_text": 1.5878, + "ppl": 5.9912, + "step": 4048 + }, + { + "epoch": 0.03, + "global_step": 4049, + "learning_rate": 0.0004839357262103506, + "loss": 1.7719, + "loss_base2": 2.5563, + "loss_pixel": 0.2032, + "loss_text": 1.5687, + "ppl": 5.882, + "step": 4049 + }, + { + "epoch": 0.03, + "global_step": 4050, + "learning_rate": 0.0004839315525876461, + "loss": 1.7783, + "loss_base2": 2.5655, + "loss_pixel": 0.2023, + "loss_text": 1.576, + "ppl": 5.9198, + "step": 4050 + }, + { + "epoch": 0.03, + "global_step": 4051, + "learning_rate": 0.0004839273789649416, + "loss": 1.7868, + "loss_base2": 2.5778, + "loss_pixel": 0.2035, + "loss_text": 1.5833, + "ppl": 5.9703, + "step": 4051 + }, + { + "epoch": 0.03, + "global_step": 4052, + "learning_rate": 0.00048392320534223706, + "loss": 1.6576, + "loss_base2": 2.3914, + "loss_pixel": 0.2023, + "loss_text": 1.4554, + "ppl": 5.2467, + "step": 4052 + }, + { + "epoch": 0.03, + "global_step": 4053, + "learning_rate": 0.00048391903171953257, + "loss": 1.5426, + "loss_base2": 2.2255, + "loss_pixel": 0.2008, + "loss_text": 1.3417, + "ppl": 4.6767, + "step": 4053 + }, + { + "epoch": 0.03, + "global_step": 4054, + "learning_rate": 0.0004839148580968281, + "loss": 1.5425, + "loss_base2": 2.2254, + "loss_pixel": 0.2006, + "loss_text": 1.342, + "ppl": 4.6763, + "step": 4054 + }, + { + "epoch": 0.03, + "global_step": 4055, + "learning_rate": 0.0004839106844741236, + "loss": 1.5253, + "loss_base2": 2.2005, + "loss_pixel": 0.2013, + "loss_text": 1.324, + "ppl": 4.5965, + "step": 4055 + }, + { + "epoch": 0.03, + "global_step": 4056, + "learning_rate": 0.0004839065108514191, + "loss": 1.5423, + "loss_base2": 2.2251, + "loss_pixel": 0.2005, + "loss_text": 1.3419, + "ppl": 4.6753, + "step": 4056 + }, + { + "epoch": 0.03, + "global_step": 4057, + "learning_rate": 0.0004839023372287145, + "loss": 1.5632, + "loss_base2": 2.2552, + "loss_pixel": 0.2006, + "loss_text": 1.3627, + "ppl": 4.7741, + "step": 4057 + }, + { + "epoch": 0.03, + "global_step": 4058, + "learning_rate": 0.00048389816360601, + "loss": 1.5329, + "loss_base2": 2.2115, + "loss_pixel": 0.1997, + "loss_text": 1.3332, + "ppl": 4.6316, + "step": 4058 + }, + { + "epoch": 0.03, + "global_step": 4059, + "learning_rate": 0.0004838939899833055, + "loss": 1.5288, + "loss_base2": 2.2056, + "loss_pixel": 0.2005, + "loss_text": 1.3282, + "ppl": 4.6126, + "step": 4059 + }, + { + "epoch": 0.03, + "global_step": 4060, + "learning_rate": 0.000483889816360601, + "loss": 1.5404, + "loss_base2": 2.2223, + "loss_pixel": 0.201, + "loss_text": 1.3393, + "ppl": 4.6665, + "step": 4060 + }, + { + "epoch": 0.03, + "global_step": 4061, + "learning_rate": 0.00048388564273789647, + "loss": 1.5327, + "loss_base2": 2.2112, + "loss_pixel": 0.201, + "loss_text": 1.3317, + "ppl": 4.6307, + "step": 4061 + }, + { + "epoch": 0.03, + "global_step": 4062, + "learning_rate": 0.000483881469115192, + "loss": 1.5184, + "loss_base2": 2.1906, + "loss_pixel": 0.2003, + "loss_text": 1.3181, + "ppl": 4.5649, + "step": 4062 + }, + { + "epoch": 0.03, + "global_step": 4063, + "learning_rate": 0.0004838772954924875, + "loss": 1.5437, + "loss_base2": 2.2271, + "loss_pixel": 0.1993, + "loss_text": 1.3444, + "ppl": 4.6819, + "step": 4063 + }, + { + "epoch": 0.03, + "global_step": 4064, + "learning_rate": 0.000483873121869783, + "loss": 1.549, + "loss_base2": 2.2347, + "loss_pixel": 0.1992, + "loss_text": 1.3498, + "ppl": 4.7068, + "step": 4064 + }, + { + "epoch": 0.03, + "global_step": 4065, + "learning_rate": 0.0004838689482470785, + "loss": 1.5259, + "loss_base2": 2.2014, + "loss_pixel": 0.1996, + "loss_text": 1.3263, + "ppl": 4.5993, + "step": 4065 + }, + { + "epoch": 0.03, + "global_step": 4066, + "learning_rate": 0.00048386477462437395, + "loss": 1.5581, + "loss_base2": 2.2479, + "loss_pixel": 0.1995, + "loss_text": 1.3587, + "ppl": 4.7498, + "step": 4066 + }, + { + "epoch": 0.03, + "global_step": 4067, + "learning_rate": 0.00048386060100166946, + "loss": 1.5119, + "loss_base2": 2.1812, + "loss_pixel": 0.1991, + "loss_text": 1.3128, + "ppl": 4.5353, + "step": 4067 + }, + { + "epoch": 0.03, + "global_step": 4068, + "learning_rate": 0.00048385642737896496, + "loss": 1.559, + "loss_base2": 2.2492, + "loss_pixel": 0.2011, + "loss_text": 1.3579, + "ppl": 4.7541, + "step": 4068 + }, + { + "epoch": 0.03, + "global_step": 4069, + "learning_rate": 0.00048385225375626047, + "loss": 1.5364, + "loss_base2": 2.2166, + "loss_pixel": 0.2001, + "loss_text": 1.3363, + "ppl": 4.6478, + "step": 4069 + }, + { + "epoch": 0.03, + "global_step": 4070, + "learning_rate": 0.0004838480801335559, + "loss": 1.5137, + "loss_base2": 2.1838, + "loss_pixel": 0.1992, + "loss_text": 1.3145, + "ppl": 4.5435, + "step": 4070 + }, + { + "epoch": 0.03, + "global_step": 4071, + "learning_rate": 0.00048384390651085143, + "loss": 1.5326, + "loss_base2": 2.2111, + "loss_pixel": 0.1991, + "loss_text": 1.3335, + "ppl": 4.6302, + "step": 4071 + }, + { + "epoch": 0.03, + "global_step": 4072, + "learning_rate": 0.00048383973288814694, + "loss": 1.5368, + "loss_base2": 2.2171, + "loss_pixel": 0.2003, + "loss_text": 1.3366, + "ppl": 4.6497, + "step": 4072 + }, + { + "epoch": 0.03, + "global_step": 4073, + "learning_rate": 0.00048383555926544245, + "loss": 1.5195, + "loss_base2": 2.1922, + "loss_pixel": 0.1992, + "loss_text": 1.3204, + "ppl": 4.5699, + "step": 4073 + }, + { + "epoch": 0.03, + "global_step": 4074, + "learning_rate": 0.00048383138564273795, + "loss": 1.523, + "loss_base2": 2.1972, + "loss_pixel": 0.1992, + "loss_text": 1.3238, + "ppl": 4.586, + "step": 4074 + }, + { + "epoch": 0.03, + "global_step": 4075, + "learning_rate": 0.00048382721202003335, + "loss": 1.5298, + "loss_base2": 2.207, + "loss_pixel": 0.2004, + "loss_text": 1.3294, + "ppl": 4.6173, + "step": 4075 + }, + { + "epoch": 0.03, + "global_step": 4076, + "learning_rate": 0.00048382303839732886, + "loss": 1.5005, + "loss_base2": 2.1648, + "loss_pixel": 0.1997, + "loss_text": 1.3009, + "ppl": 4.4839, + "step": 4076 + }, + { + "epoch": 0.03, + "global_step": 4077, + "learning_rate": 0.00048381886477462437, + "loss": 1.5415, + "loss_base2": 2.2239, + "loss_pixel": 0.2006, + "loss_text": 1.3409, + "ppl": 4.6716, + "step": 4077 + }, + { + "epoch": 0.03, + "global_step": 4078, + "learning_rate": 0.0004838146911519199, + "loss": 1.5156, + "loss_base2": 2.1865, + "loss_pixel": 0.1979, + "loss_text": 1.3177, + "ppl": 4.5522, + "step": 4078 + }, + { + "epoch": 0.03, + "global_step": 4079, + "learning_rate": 0.00048381051752921533, + "loss": 1.5192, + "loss_base2": 2.1917, + "loss_pixel": 0.201, + "loss_text": 1.3182, + "ppl": 4.5686, + "step": 4079 + }, + { + "epoch": 0.03, + "global_step": 4080, + "learning_rate": 0.00048380634390651084, + "loss": 1.5156, + "loss_base2": 2.1865, + "loss_pixel": 0.1999, + "loss_text": 1.3156, + "ppl": 4.5522, + "step": 4080 + }, + { + "epoch": 0.03, + "global_step": 4081, + "learning_rate": 0.00048380217028380634, + "loss": 1.5228, + "loss_base2": 2.1969, + "loss_pixel": 0.1993, + "loss_text": 1.3235, + "ppl": 4.585, + "step": 4081 + }, + { + "epoch": 0.03, + "global_step": 4082, + "learning_rate": 0.00048379799666110185, + "loss": 1.5331, + "loss_base2": 2.2118, + "loss_pixel": 0.1996, + "loss_text": 1.3335, + "ppl": 4.6325, + "step": 4082 + }, + { + "epoch": 0.03, + "global_step": 4083, + "learning_rate": 0.00048379382303839736, + "loss": 1.5463, + "loss_base2": 2.2308, + "loss_pixel": 0.1987, + "loss_text": 1.3475, + "ppl": 4.6941, + "step": 4083 + }, + { + "epoch": 0.03, + "global_step": 4084, + "learning_rate": 0.0004837896494156928, + "loss": 1.6484, + "loss_base2": 2.3781, + "loss_pixel": 0.1992, + "loss_text": 1.4491, + "ppl": 5.1987, + "step": 4084 + }, + { + "epoch": 0.03, + "global_step": 4085, + "learning_rate": 0.0004837854757929883, + "loss": 1.7869, + "loss_base2": 2.578, + "loss_pixel": 0.1984, + "loss_text": 1.5885, + "ppl": 5.9709, + "step": 4085 + }, + { + "epoch": 0.03, + "global_step": 4086, + "learning_rate": 0.0004837813021702838, + "loss": 1.7914, + "loss_base2": 2.5844, + "loss_pixel": 0.198, + "loss_text": 1.5934, + "ppl": 5.9978, + "step": 4086 + }, + { + "epoch": 0.03, + "global_step": 4087, + "learning_rate": 0.00048377712854757933, + "loss": 1.7946, + "loss_base2": 2.5891, + "loss_pixel": 0.1989, + "loss_text": 1.5957, + "ppl": 6.0171, + "step": 4087 + }, + { + "epoch": 0.03, + "global_step": 4088, + "learning_rate": 0.0004837729549248748, + "loss": 1.7913, + "loss_base2": 2.5843, + "loss_pixel": 0.1993, + "loss_text": 1.592, + "ppl": 5.9972, + "step": 4088 + }, + { + "epoch": 0.03, + "global_step": 4089, + "learning_rate": 0.0004837687813021703, + "loss": 1.7884, + "loss_base2": 2.5801, + "loss_pixel": 0.198, + "loss_text": 1.5903, + "ppl": 5.9799, + "step": 4089 + }, + { + "epoch": 0.03, + "global_step": 4090, + "learning_rate": 0.0004837646076794658, + "loss": 1.7779, + "loss_base2": 2.565, + "loss_pixel": 0.1967, + "loss_text": 1.5813, + "ppl": 5.9174, + "step": 4090 + }, + { + "epoch": 0.03, + "global_step": 4091, + "learning_rate": 0.0004837604340567613, + "loss": 1.7881, + "loss_base2": 2.5797, + "loss_pixel": 0.1983, + "loss_text": 1.5898, + "ppl": 5.9781, + "step": 4091 + }, + { + "epoch": 0.03, + "global_step": 4092, + "learning_rate": 0.0004837562604340568, + "loss": 1.7803, + "loss_base2": 2.5684, + "loss_pixel": 0.2002, + "loss_text": 1.5801, + "ppl": 5.9316, + "step": 4092 + }, + { + "epoch": 0.03, + "global_step": 4093, + "learning_rate": 0.00048375208681135227, + "loss": 1.7995, + "loss_base2": 2.5961, + "loss_pixel": 0.1974, + "loss_text": 1.6021, + "ppl": 6.0466, + "step": 4093 + }, + { + "epoch": 0.03, + "global_step": 4094, + "learning_rate": 0.0004837479131886477, + "loss": 1.7874, + "loss_base2": 2.5787, + "loss_pixel": 0.1986, + "loss_text": 1.5889, + "ppl": 5.9739, + "step": 4094 + }, + { + "epoch": 0.03, + "global_step": 4095, + "learning_rate": 0.00048374373956594323, + "loss": 1.7838, + "loss_base2": 2.5735, + "loss_pixel": 0.1978, + "loss_text": 1.586, + "ppl": 5.9524, + "step": 4095 + }, + { + "epoch": 0.03, + "global_step": 4096, + "learning_rate": 0.00048373956594323874, + "loss": 1.7742, + "loss_base2": 2.5596, + "loss_pixel": 0.1973, + "loss_text": 1.5769, + "ppl": 5.8956, + "step": 4096 + }, + { + "epoch": 0.03, + "global_step": 4097, + "learning_rate": 0.0004837353923205342, + "loss": 1.786, + "loss_base2": 2.5767, + "loss_pixel": 0.1994, + "loss_text": 1.5866, + "ppl": 5.9655, + "step": 4097 + }, + { + "epoch": 0.03, + "global_step": 4098, + "learning_rate": 0.0004837312186978297, + "loss": 1.7817, + "loss_base2": 2.5704, + "loss_pixel": 0.1986, + "loss_text": 1.5831, + "ppl": 5.9399, + "step": 4098 + }, + { + "epoch": 0.03, + "global_step": 4099, + "learning_rate": 0.0004837270450751252, + "loss": 1.7612, + "loss_base2": 2.5409, + "loss_pixel": 0.1974, + "loss_text": 1.5637, + "ppl": 5.8194, + "step": 4099 + }, + { + "epoch": 0.03, + "global_step": 4100, + "learning_rate": 0.0004837228714524207, + "loss": 1.787, + "loss_base2": 2.5781, + "loss_pixel": 0.1979, + "loss_text": 1.5891, + "ppl": 5.9715, + "step": 4100 + }, + { + "epoch": 0.03, + "global_step": 4101, + "learning_rate": 0.0004837186978297162, + "loss": 1.7734, + "loss_base2": 2.5585, + "loss_pixel": 0.1969, + "loss_text": 1.5766, + "ppl": 5.8908, + "step": 4101 + }, + { + "epoch": 0.03, + "global_step": 4102, + "learning_rate": 0.00048371452420701167, + "loss": 1.7937, + "loss_base2": 2.5878, + "loss_pixel": 0.1981, + "loss_text": 1.5956, + "ppl": 6.0117, + "step": 4102 + }, + { + "epoch": 0.03, + "global_step": 4103, + "learning_rate": 0.0004837103505843072, + "loss": 1.7781, + "loss_base2": 2.5653, + "loss_pixel": 0.1967, + "loss_text": 1.5815, + "ppl": 5.9186, + "step": 4103 + }, + { + "epoch": 0.03, + "global_step": 4104, + "learning_rate": 0.0004837061769616027, + "loss": 1.7775, + "loss_base2": 2.5644, + "loss_pixel": 0.1972, + "loss_text": 1.5802, + "ppl": 5.9151, + "step": 4104 + }, + { + "epoch": 0.03, + "global_step": 4105, + "learning_rate": 0.0004837020033388982, + "loss": 1.7584, + "loss_base2": 2.5368, + "loss_pixel": 0.1969, + "loss_text": 1.5615, + "ppl": 5.8031, + "step": 4105 + }, + { + "epoch": 0.03, + "global_step": 4106, + "learning_rate": 0.0004836978297161937, + "loss": 1.771, + "loss_base2": 2.555, + "loss_pixel": 0.1964, + "loss_text": 1.5746, + "ppl": 5.8767, + "step": 4106 + }, + { + "epoch": 0.03, + "global_step": 4107, + "learning_rate": 0.00048369365609348915, + "loss": 1.7894, + "loss_base2": 2.5816, + "loss_pixel": 0.1953, + "loss_text": 1.594, + "ppl": 5.9859, + "step": 4107 + }, + { + "epoch": 0.03, + "global_step": 4108, + "learning_rate": 0.00048368948247078466, + "loss": 1.7742, + "loss_base2": 2.5596, + "loss_pixel": 0.1979, + "loss_text": 1.5763, + "ppl": 5.8956, + "step": 4108 + }, + { + "epoch": 0.03, + "global_step": 4109, + "learning_rate": 0.00048368530884808017, + "loss": 1.785, + "loss_base2": 2.5752, + "loss_pixel": 0.1974, + "loss_text": 1.5876, + "ppl": 5.9596, + "step": 4109 + }, + { + "epoch": 0.03, + "global_step": 4110, + "learning_rate": 0.0004836811352253757, + "loss": 1.7545, + "loss_base2": 2.5312, + "loss_pixel": 0.196, + "loss_text": 1.5584, + "ppl": 5.7806, + "step": 4110 + }, + { + "epoch": 0.03, + "global_step": 4111, + "learning_rate": 0.00048367696160267113, + "loss": 1.7749, + "loss_base2": 2.5606, + "loss_pixel": 0.1966, + "loss_text": 1.5783, + "ppl": 5.8997, + "step": 4111 + }, + { + "epoch": 0.03, + "global_step": 4112, + "learning_rate": 0.00048367278797996664, + "loss": 1.7839, + "loss_base2": 2.5736, + "loss_pixel": 0.1975, + "loss_text": 1.5863, + "ppl": 5.953, + "step": 4112 + }, + { + "epoch": 0.03, + "global_step": 4113, + "learning_rate": 0.0004836686143572621, + "loss": 1.7715, + "loss_base2": 2.5557, + "loss_pixel": 0.1963, + "loss_text": 1.5753, + "ppl": 5.8797, + "step": 4113 + }, + { + "epoch": 0.03, + "global_step": 4114, + "learning_rate": 0.0004836644407345576, + "loss": 1.7807, + "loss_base2": 2.569, + "loss_pixel": 0.1965, + "loss_text": 1.5841, + "ppl": 5.934, + "step": 4114 + }, + { + "epoch": 0.03, + "global_step": 4115, + "learning_rate": 0.0004836602671118531, + "loss": 1.7677, + "loss_base2": 2.5503, + "loss_pixel": 0.1951, + "loss_text": 1.5725, + "ppl": 5.8574, + "step": 4115 + }, + { + "epoch": 0.03, + "global_step": 4116, + "learning_rate": 0.00048365609348914856, + "loss": 1.7767, + "loss_base2": 2.5632, + "loss_pixel": 0.1962, + "loss_text": 1.5806, + "ppl": 5.9103, + "step": 4116 + }, + { + "epoch": 0.03, + "global_step": 4117, + "learning_rate": 0.00048365191986644406, + "loss": 1.7672, + "loss_base2": 2.5495, + "loss_pixel": 0.1967, + "loss_text": 1.5705, + "ppl": 5.8544, + "step": 4117 + }, + { + "epoch": 0.03, + "global_step": 4118, + "learning_rate": 0.00048364774624373957, + "loss": 1.769, + "loss_base2": 2.5521, + "loss_pixel": 0.1963, + "loss_text": 1.5727, + "ppl": 5.865, + "step": 4118 + }, + { + "epoch": 0.03, + "global_step": 4119, + "learning_rate": 0.0004836435726210351, + "loss": 1.7875, + "loss_base2": 2.5788, + "loss_pixel": 0.1979, + "loss_text": 1.5896, + "ppl": 5.9745, + "step": 4119 + }, + { + "epoch": 0.03, + "global_step": 4120, + "learning_rate": 0.00048363939899833053, + "loss": 1.7591, + "loss_base2": 2.5378, + "loss_pixel": 0.1978, + "loss_text": 1.5613, + "ppl": 5.8072, + "step": 4120 + }, + { + "epoch": 0.03, + "global_step": 4121, + "learning_rate": 0.00048363522537562604, + "loss": 1.7537, + "loss_base2": 2.5301, + "loss_pixel": 0.1971, + "loss_text": 1.5567, + "ppl": 5.7759, + "step": 4121 + }, + { + "epoch": 0.03, + "global_step": 4122, + "learning_rate": 0.00048363105175292155, + "loss": 1.7695, + "loss_base2": 2.5528, + "loss_pixel": 0.1976, + "loss_text": 1.5719, + "ppl": 5.8679, + "step": 4122 + }, + { + "epoch": 0.03, + "global_step": 4123, + "learning_rate": 0.00048362687813021705, + "loss": 1.7703, + "loss_base2": 2.554, + "loss_pixel": 0.1975, + "loss_text": 1.5728, + "ppl": 5.8726, + "step": 4123 + }, + { + "epoch": 0.03, + "global_step": 4124, + "learning_rate": 0.00048362270450751256, + "loss": 1.7661, + "loss_base2": 2.5479, + "loss_pixel": 0.1988, + "loss_text": 1.5673, + "ppl": 5.848, + "step": 4124 + }, + { + "epoch": 0.03, + "global_step": 4125, + "learning_rate": 0.000483618530884808, + "loss": 1.7386, + "loss_base2": 2.5083, + "loss_pixel": 0.1979, + "loss_text": 1.5407, + "ppl": 5.6894, + "step": 4125 + }, + { + "epoch": 0.03, + "global_step": 4126, + "learning_rate": 0.0004836143572621035, + "loss": 1.7738, + "loss_base2": 2.5591, + "loss_pixel": 0.1963, + "loss_text": 1.5775, + "ppl": 5.8932, + "step": 4126 + }, + { + "epoch": 0.03, + "global_step": 4127, + "learning_rate": 0.00048361018363939903, + "loss": 1.7617, + "loss_base2": 2.5416, + "loss_pixel": 0.1978, + "loss_text": 1.5638, + "ppl": 5.8223, + "step": 4127 + }, + { + "epoch": 0.03, + "global_step": 4128, + "learning_rate": 0.00048360601001669454, + "loss": 1.7822, + "loss_base2": 2.5712, + "loss_pixel": 0.1992, + "loss_text": 1.583, + "ppl": 5.9429, + "step": 4128 + }, + { + "epoch": 0.03, + "global_step": 4129, + "learning_rate": 0.00048360183639399, + "loss": 1.7707, + "loss_base2": 2.5546, + "loss_pixel": 0.198, + "loss_text": 1.5727, + "ppl": 5.875, + "step": 4129 + }, + { + "epoch": 0.03, + "global_step": 4130, + "learning_rate": 0.0004835976627712855, + "loss": 1.7705, + "loss_base2": 2.5543, + "loss_pixel": 0.1943, + "loss_text": 1.5763, + "ppl": 5.8738, + "step": 4130 + }, + { + "epoch": 0.03, + "global_step": 4131, + "learning_rate": 0.000483593489148581, + "loss": 1.7524, + "loss_base2": 2.5282, + "loss_pixel": 0.196, + "loss_text": 1.5565, + "ppl": 5.7684, + "step": 4131 + }, + { + "epoch": 0.03, + "global_step": 4132, + "learning_rate": 0.00048358931552587646, + "loss": 1.7731, + "loss_base2": 2.558, + "loss_pixel": 0.197, + "loss_text": 1.576, + "ppl": 5.8891, + "step": 4132 + }, + { + "epoch": 0.03, + "global_step": 4133, + "learning_rate": 0.00048358514190317196, + "loss": 1.7778, + "loss_base2": 2.5648, + "loss_pixel": 0.197, + "loss_text": 1.5808, + "ppl": 5.9168, + "step": 4133 + }, + { + "epoch": 0.03, + "global_step": 4134, + "learning_rate": 0.0004835809682804674, + "loss": 1.7758, + "loss_base2": 2.5619, + "loss_pixel": 0.1954, + "loss_text": 1.5804, + "ppl": 5.905, + "step": 4134 + }, + { + "epoch": 0.03, + "global_step": 4135, + "learning_rate": 0.0004835767946577629, + "loss": 1.7561, + "loss_base2": 2.5335, + "loss_pixel": 0.1965, + "loss_text": 1.5596, + "ppl": 5.7898, + "step": 4135 + }, + { + "epoch": 0.03, + "global_step": 4136, + "learning_rate": 0.00048357262103505843, + "loss": 1.7761, + "loss_base2": 2.5624, + "loss_pixel": 0.1977, + "loss_text": 1.5784, + "ppl": 5.9068, + "step": 4136 + }, + { + "epoch": 0.03, + "global_step": 4137, + "learning_rate": 0.00048356844741235394, + "loss": 1.7734, + "loss_base2": 2.5585, + "loss_pixel": 0.1956, + "loss_text": 1.5778, + "ppl": 5.8908, + "step": 4137 + }, + { + "epoch": 0.03, + "global_step": 4138, + "learning_rate": 0.0004835642737896494, + "loss": 1.7667, + "loss_base2": 2.5488, + "loss_pixel": 0.1959, + "loss_text": 1.5708, + "ppl": 5.8515, + "step": 4138 + }, + { + "epoch": 0.03, + "global_step": 4139, + "learning_rate": 0.0004835601001669449, + "loss": 1.7484, + "loss_base2": 2.5224, + "loss_pixel": 0.1962, + "loss_text": 1.5521, + "ppl": 5.7454, + "step": 4139 + }, + { + "epoch": 0.03, + "global_step": 4140, + "learning_rate": 0.0004835559265442404, + "loss": 1.7599, + "loss_base2": 2.539, + "loss_pixel": 0.1961, + "loss_text": 1.5638, + "ppl": 5.8119, + "step": 4140 + }, + { + "epoch": 0.03, + "global_step": 4141, + "learning_rate": 0.0004835517529215359, + "loss": 1.7435, + "loss_base2": 2.5153, + "loss_pixel": 0.1947, + "loss_text": 1.5488, + "ppl": 5.7173, + "step": 4141 + }, + { + "epoch": 0.03, + "global_step": 4142, + "learning_rate": 0.0004835475792988314, + "loss": 1.7605, + "loss_base2": 2.5399, + "loss_pixel": 0.1959, + "loss_text": 1.5646, + "ppl": 5.8153, + "step": 4142 + }, + { + "epoch": 0.03, + "global_step": 4143, + "learning_rate": 0.0004835434056761269, + "loss": 1.7648, + "loss_base2": 2.5461, + "loss_pixel": 0.1951, + "loss_text": 1.5697, + "ppl": 5.8404, + "step": 4143 + }, + { + "epoch": 0.03, + "global_step": 4144, + "learning_rate": 0.0004835392320534224, + "loss": 1.767, + "loss_base2": 2.5492, + "loss_pixel": 0.195, + "loss_text": 1.572, + "ppl": 5.8533, + "step": 4144 + }, + { + "epoch": 0.03, + "global_step": 4145, + "learning_rate": 0.0004835350584307179, + "loss": 1.7362, + "loss_base2": 2.5048, + "loss_pixel": 0.1945, + "loss_text": 1.5417, + "ppl": 5.6757, + "step": 4145 + }, + { + "epoch": 0.03, + "global_step": 4146, + "learning_rate": 0.0004835308848080134, + "loss": 1.7658, + "loss_base2": 2.5475, + "loss_pixel": 0.1957, + "loss_text": 1.5701, + "ppl": 5.8462, + "step": 4146 + }, + { + "epoch": 0.03, + "global_step": 4147, + "learning_rate": 0.00048352671118530885, + "loss": 1.7697, + "loss_base2": 2.5531, + "loss_pixel": 0.1948, + "loss_text": 1.5749, + "ppl": 5.8691, + "step": 4147 + }, + { + "epoch": 0.03, + "global_step": 4148, + "learning_rate": 0.00048352253756260436, + "loss": 1.7751, + "loss_base2": 2.5609, + "loss_pixel": 0.1947, + "loss_text": 1.5803, + "ppl": 5.9009, + "step": 4148 + }, + { + "epoch": 0.03, + "global_step": 4149, + "learning_rate": 0.00048351836393989987, + "loss": 1.7665, + "loss_base2": 2.5485, + "loss_pixel": 0.194, + "loss_text": 1.5725, + "ppl": 5.8503, + "step": 4149 + }, + { + "epoch": 0.03, + "global_step": 4150, + "learning_rate": 0.00048351419031719537, + "loss": 1.7729, + "loss_base2": 2.5578, + "loss_pixel": 0.195, + "loss_text": 1.5779, + "ppl": 5.8879, + "step": 4150 + }, + { + "epoch": 0.03, + "global_step": 4151, + "learning_rate": 0.0004835100166944908, + "loss": 1.7838, + "loss_base2": 2.5735, + "loss_pixel": 0.1952, + "loss_text": 1.5886, + "ppl": 5.9524, + "step": 4151 + }, + { + "epoch": 0.03, + "global_step": 4152, + "learning_rate": 0.0004835058430717863, + "loss": 1.7514, + "loss_base2": 2.5267, + "loss_pixel": 0.1951, + "loss_text": 1.5563, + "ppl": 5.7627, + "step": 4152 + }, + { + "epoch": 0.03, + "global_step": 4153, + "learning_rate": 0.0004835016694490818, + "loss": 1.7542, + "loss_base2": 2.5308, + "loss_pixel": 0.1946, + "loss_text": 1.5596, + "ppl": 5.7788, + "step": 4153 + }, + { + "epoch": 0.03, + "global_step": 4154, + "learning_rate": 0.0004834974958263773, + "loss": 1.7591, + "loss_base2": 2.5378, + "loss_pixel": 0.1937, + "loss_text": 1.5653, + "ppl": 5.8072, + "step": 4154 + }, + { + "epoch": 0.03, + "global_step": 4155, + "learning_rate": 0.0004834933222036728, + "loss": 1.6556, + "loss_base2": 2.3885, + "loss_pixel": 0.1953, + "loss_text": 1.4602, + "ppl": 5.2362, + "step": 4155 + }, + { + "epoch": 0.03, + "global_step": 4156, + "learning_rate": 0.00048348914858096825, + "loss": 1.5662, + "loss_base2": 2.2595, + "loss_pixel": 0.1956, + "loss_text": 1.3706, + "ppl": 4.7884, + "step": 4156 + }, + { + "epoch": 0.03, + "global_step": 4157, + "learning_rate": 0.00048348497495826376, + "loss": 1.5275, + "loss_base2": 2.2037, + "loss_pixel": 0.1956, + "loss_text": 1.3319, + "ppl": 4.6066, + "step": 4157 + }, + { + "epoch": 0.03, + "global_step": 4158, + "learning_rate": 0.00048348080133555927, + "loss": 1.5339, + "loss_base2": 2.2129, + "loss_pixel": 0.1962, + "loss_text": 1.3377, + "ppl": 4.6362, + "step": 4158 + }, + { + "epoch": 0.03, + "global_step": 4159, + "learning_rate": 0.0004834766277128548, + "loss": 1.5371, + "loss_base2": 2.2176, + "loss_pixel": 0.196, + "loss_text": 1.3411, + "ppl": 4.6511, + "step": 4159 + }, + { + "epoch": 0.03, + "global_step": 4160, + "learning_rate": 0.0004834724540901503, + "loss": 1.5042, + "loss_base2": 2.1701, + "loss_pixel": 0.1958, + "loss_text": 1.3085, + "ppl": 4.5006, + "step": 4160 + }, + { + "epoch": 0.03, + "global_step": 4161, + "learning_rate": 0.00048346828046744574, + "loss": 1.5376, + "loss_base2": 2.2183, + "loss_pixel": 0.2, + "loss_text": 1.3376, + "ppl": 4.6534, + "step": 4161 + }, + { + "epoch": 0.03, + "global_step": 4162, + "learning_rate": 0.00048346410684474124, + "loss": 1.5292, + "loss_base2": 2.2062, + "loss_pixel": 0.1994, + "loss_text": 1.3298, + "ppl": 4.6145, + "step": 4162 + }, + { + "epoch": 0.03, + "global_step": 4163, + "learning_rate": 0.00048345993322203675, + "loss": 1.6268, + "loss_base2": 2.347, + "loss_pixel": 0.1961, + "loss_text": 1.4307, + "ppl": 5.0876, + "step": 4163 + }, + { + "epoch": 0.03, + "global_step": 4164, + "learning_rate": 0.00048345575959933226, + "loss": 1.7936, + "loss_base2": 2.5876, + "loss_pixel": 0.1951, + "loss_text": 1.5986, + "ppl": 6.0111, + "step": 4164 + }, + { + "epoch": 0.03, + "global_step": 4165, + "learning_rate": 0.00048345158597662777, + "loss": 1.7901, + "loss_base2": 2.5826, + "loss_pixel": 0.1949, + "loss_text": 1.5952, + "ppl": 5.9901, + "step": 4165 + }, + { + "epoch": 0.03, + "global_step": 4166, + "learning_rate": 0.0004834474123539232, + "loss": 1.7614, + "loss_base2": 2.5412, + "loss_pixel": 0.1954, + "loss_text": 1.5661, + "ppl": 5.8206, + "step": 4166 + }, + { + "epoch": 0.03, + "global_step": 4167, + "learning_rate": 0.0004834432387312187, + "loss": 1.7815, + "loss_base2": 2.5702, + "loss_pixel": 0.1961, + "loss_text": 1.5854, + "ppl": 5.9388, + "step": 4167 + }, + { + "epoch": 0.03, + "global_step": 4168, + "learning_rate": 0.00048343906510851423, + "loss": 1.7735, + "loss_base2": 2.5586, + "loss_pixel": 0.1943, + "loss_text": 1.5792, + "ppl": 5.8914, + "step": 4168 + }, + { + "epoch": 0.03, + "global_step": 4169, + "learning_rate": 0.00048343489148580974, + "loss": 1.7885, + "loss_base2": 2.5803, + "loss_pixel": 0.1959, + "loss_text": 1.5927, + "ppl": 5.9805, + "step": 4169 + }, + { + "epoch": 0.03, + "global_step": 4170, + "learning_rate": 0.00048343071786310514, + "loss": 1.7808, + "loss_base2": 2.5692, + "loss_pixel": 0.1953, + "loss_text": 1.5855, + "ppl": 5.9346, + "step": 4170 + }, + { + "epoch": 0.03, + "global_step": 4171, + "learning_rate": 0.00048342654424040065, + "loss": 1.7692, + "loss_base2": 2.5524, + "loss_pixel": 0.1938, + "loss_text": 1.5755, + "ppl": 5.8662, + "step": 4171 + }, + { + "epoch": 0.03, + "global_step": 4172, + "learning_rate": 0.00048342237061769615, + "loss": 1.7852, + "loss_base2": 2.5755, + "loss_pixel": 0.1943, + "loss_text": 1.5909, + "ppl": 5.9608, + "step": 4172 + }, + { + "epoch": 0.03, + "global_step": 4173, + "learning_rate": 0.00048341819699499166, + "loss": 1.7705, + "loss_base2": 2.5543, + "loss_pixel": 0.1936, + "loss_text": 1.5769, + "ppl": 5.8738, + "step": 4173 + }, + { + "epoch": 0.03, + "global_step": 4174, + "learning_rate": 0.00048341402337228717, + "loss": 1.757, + "loss_base2": 2.5348, + "loss_pixel": 0.1936, + "loss_text": 1.5634, + "ppl": 5.795, + "step": 4174 + }, + { + "epoch": 0.03, + "global_step": 4175, + "learning_rate": 0.0004834098497495826, + "loss": 1.7764, + "loss_base2": 2.5628, + "loss_pixel": 0.1961, + "loss_text": 1.5803, + "ppl": 5.9085, + "step": 4175 + }, + { + "epoch": 0.03, + "global_step": 4176, + "learning_rate": 0.00048340567612687813, + "loss": 1.7638, + "loss_base2": 2.5446, + "loss_pixel": 0.1944, + "loss_text": 1.5694, + "ppl": 5.8346, + "step": 4176 + }, + { + "epoch": 0.03, + "global_step": 4177, + "learning_rate": 0.00048340150250417364, + "loss": 1.7796, + "loss_base2": 2.5674, + "loss_pixel": 0.195, + "loss_text": 1.5846, + "ppl": 5.9275, + "step": 4177 + }, + { + "epoch": 0.03, + "global_step": 4178, + "learning_rate": 0.00048339732888146914, + "loss": 1.763, + "loss_base2": 2.5435, + "loss_pixel": 0.1943, + "loss_text": 1.5687, + "ppl": 5.8299, + "step": 4178 + }, + { + "epoch": 0.03, + "global_step": 4179, + "learning_rate": 0.0004833931552587646, + "loss": 1.7721, + "loss_base2": 2.5566, + "loss_pixel": 0.1939, + "loss_text": 1.5782, + "ppl": 5.8832, + "step": 4179 + }, + { + "epoch": 0.03, + "global_step": 4180, + "learning_rate": 0.0004833889816360601, + "loss": 1.7572, + "loss_base2": 2.5351, + "loss_pixel": 0.194, + "loss_text": 1.5632, + "ppl": 5.7962, + "step": 4180 + }, + { + "epoch": 0.03, + "global_step": 4181, + "learning_rate": 0.0004833848080133556, + "loss": 1.7787, + "loss_base2": 2.5661, + "loss_pixel": 0.1948, + "loss_text": 1.584, + "ppl": 5.9222, + "step": 4181 + }, + { + "epoch": 0.03, + "global_step": 4182, + "learning_rate": 0.0004833806343906511, + "loss": 1.761, + "loss_base2": 2.5406, + "loss_pixel": 0.1927, + "loss_text": 1.5682, + "ppl": 5.8183, + "step": 4182 + }, + { + "epoch": 0.03, + "global_step": 4183, + "learning_rate": 0.0004833764607679466, + "loss": 1.7671, + "loss_base2": 2.5494, + "loss_pixel": 0.1938, + "loss_text": 1.5733, + "ppl": 5.8539, + "step": 4183 + }, + { + "epoch": 0.03, + "global_step": 4184, + "learning_rate": 0.0004833722871452421, + "loss": 1.7783, + "loss_base2": 2.5655, + "loss_pixel": 0.1948, + "loss_text": 1.5834, + "ppl": 5.9198, + "step": 4184 + }, + { + "epoch": 0.03, + "global_step": 4185, + "learning_rate": 0.0004833681135225376, + "loss": 1.7782, + "loss_base2": 2.5654, + "loss_pixel": 0.1938, + "loss_text": 1.5844, + "ppl": 5.9192, + "step": 4185 + }, + { + "epoch": 0.03, + "global_step": 4186, + "learning_rate": 0.0004833639398998331, + "loss": 1.7752, + "loss_base2": 2.5611, + "loss_pixel": 0.1929, + "loss_text": 1.5823, + "ppl": 5.9015, + "step": 4186 + }, + { + "epoch": 0.03, + "global_step": 4187, + "learning_rate": 0.0004833597662771286, + "loss": 1.747, + "loss_base2": 2.5204, + "loss_pixel": 0.192, + "loss_text": 1.555, + "ppl": 5.7374, + "step": 4187 + }, + { + "epoch": 0.03, + "global_step": 4188, + "learning_rate": 0.000483355592654424, + "loss": 1.628, + "loss_base2": 2.3487, + "loss_pixel": 0.1935, + "loss_text": 1.4345, + "ppl": 5.0937, + "step": 4188 + }, + { + "epoch": 0.03, + "global_step": 4189, + "learning_rate": 0.0004833514190317195, + "loss": 1.557, + "loss_base2": 2.2463, + "loss_pixel": 0.1935, + "loss_text": 1.3635, + "ppl": 4.7446, + "step": 4189 + }, + { + "epoch": 0.03, + "global_step": 4190, + "learning_rate": 0.000483347245409015, + "loss": 1.5173, + "loss_base2": 2.189, + "loss_pixel": 0.1932, + "loss_text": 1.324, + "ppl": 4.5599, + "step": 4190 + }, + { + "epoch": 0.03, + "global_step": 4191, + "learning_rate": 0.0004833430717863105, + "loss": 1.5105, + "loss_base2": 2.1792, + "loss_pixel": 0.1941, + "loss_text": 1.3164, + "ppl": 4.529, + "step": 4191 + }, + { + "epoch": 0.03, + "global_step": 4192, + "learning_rate": 0.00048333889816360603, + "loss": 1.5319, + "loss_base2": 2.2101, + "loss_pixel": 0.1945, + "loss_text": 1.3374, + "ppl": 4.627, + "step": 4192 + }, + { + "epoch": 0.03, + "global_step": 4193, + "learning_rate": 0.0004833347245409015, + "loss": 1.5266, + "loss_base2": 2.2024, + "loss_pixel": 0.1931, + "loss_text": 1.3335, + "ppl": 4.6025, + "step": 4193 + }, + { + "epoch": 0.03, + "global_step": 4194, + "learning_rate": 0.000483330550918197, + "loss": 1.5337, + "loss_base2": 2.2127, + "loss_pixel": 0.1919, + "loss_text": 1.3418, + "ppl": 4.6353, + "step": 4194 + }, + { + "epoch": 0.03, + "global_step": 4195, + "learning_rate": 0.0004833263772954925, + "loss": 1.5132, + "loss_base2": 2.1831, + "loss_pixel": 0.1941, + "loss_text": 1.319, + "ppl": 4.5412, + "step": 4195 + }, + { + "epoch": 0.03, + "global_step": 4196, + "learning_rate": 0.000483322203672788, + "loss": 1.4998, + "loss_base2": 2.1638, + "loss_pixel": 0.1936, + "loss_text": 1.3061, + "ppl": 4.4808, + "step": 4196 + }, + { + "epoch": 0.03, + "global_step": 4197, + "learning_rate": 0.00048331803005008346, + "loss": 1.5247, + "loss_base2": 2.1997, + "loss_pixel": 0.1927, + "loss_text": 1.332, + "ppl": 4.5938, + "step": 4197 + }, + { + "epoch": 0.03, + "global_step": 4198, + "learning_rate": 0.00048331385642737896, + "loss": 1.5319, + "loss_base2": 2.2101, + "loss_pixel": 0.1927, + "loss_text": 1.3393, + "ppl": 4.627, + "step": 4198 + }, + { + "epoch": 0.03, + "global_step": 4199, + "learning_rate": 0.00048330968280467447, + "loss": 1.5203, + "loss_base2": 2.1933, + "loss_pixel": 0.1941, + "loss_text": 1.3261, + "ppl": 4.5736, + "step": 4199 + }, + { + "epoch": 0.03, + "global_step": 4200, + "learning_rate": 0.00048330550918197, + "loss": 1.5153, + "loss_base2": 2.1861, + "loss_pixel": 0.1929, + "loss_text": 1.3225, + "ppl": 4.5508, + "step": 4200 + }, + { + "epoch": 0.03, + "global_step": 4201, + "learning_rate": 0.0004833013355592655, + "loss": 1.4976, + "loss_base2": 2.1606, + "loss_pixel": 0.1921, + "loss_text": 1.3054, + "ppl": 4.4709, + "step": 4201 + }, + { + "epoch": 0.03, + "global_step": 4202, + "learning_rate": 0.00048329716193656094, + "loss": 1.5461, + "loss_base2": 2.2306, + "loss_pixel": 0.1929, + "loss_text": 1.3532, + "ppl": 4.6931, + "step": 4202 + }, + { + "epoch": 0.03, + "global_step": 4203, + "learning_rate": 0.00048329298831385645, + "loss": 1.531, + "loss_base2": 2.2088, + "loss_pixel": 0.1932, + "loss_text": 1.3378, + "ppl": 4.6228, + "step": 4203 + }, + { + "epoch": 0.03, + "global_step": 4204, + "learning_rate": 0.00048328881469115195, + "loss": 1.5024, + "loss_base2": 2.1675, + "loss_pixel": 0.1937, + "loss_text": 1.3086, + "ppl": 4.4925, + "step": 4204 + }, + { + "epoch": 0.03, + "global_step": 4205, + "learning_rate": 0.00048328464106844746, + "loss": 1.6751, + "loss_base2": 2.4167, + "loss_pixel": 0.1926, + "loss_text": 1.4825, + "ppl": 5.3393, + "step": 4205 + }, + { + "epoch": 0.03, + "global_step": 4206, + "learning_rate": 0.0004832804674457429, + "loss": 1.7885, + "loss_base2": 2.5803, + "loss_pixel": 0.1926, + "loss_text": 1.5959, + "ppl": 5.9805, + "step": 4206 + }, + { + "epoch": 0.03, + "global_step": 4207, + "learning_rate": 0.00048327629382303837, + "loss": 1.7788, + "loss_base2": 2.5663, + "loss_pixel": 0.193, + "loss_text": 1.5857, + "ppl": 5.9227, + "step": 4207 + }, + { + "epoch": 0.03, + "global_step": 4208, + "learning_rate": 0.0004832721202003339, + "loss": 1.7656, + "loss_base2": 2.5472, + "loss_pixel": 0.1921, + "loss_text": 1.5735, + "ppl": 5.8451, + "step": 4208 + }, + { + "epoch": 0.03, + "global_step": 4209, + "learning_rate": 0.0004832679465776294, + "loss": 1.7833, + "loss_base2": 2.5728, + "loss_pixel": 0.1932, + "loss_text": 1.5901, + "ppl": 5.9495, + "step": 4209 + }, + { + "epoch": 0.03, + "global_step": 4210, + "learning_rate": 0.0004832637729549249, + "loss": 1.7941, + "loss_base2": 2.5883, + "loss_pixel": 0.1941, + "loss_text": 1.6, + "ppl": 6.0141, + "step": 4210 + }, + { + "epoch": 0.03, + "global_step": 4211, + "learning_rate": 0.00048325959933222034, + "loss": 1.7922, + "loss_base2": 2.5856, + "loss_pixel": 0.1938, + "loss_text": 1.5984, + "ppl": 6.0026, + "step": 4211 + }, + { + "epoch": 0.03, + "global_step": 4212, + "learning_rate": 0.00048325542570951585, + "loss": 1.7722, + "loss_base2": 2.5567, + "loss_pixel": 0.1925, + "loss_text": 1.5797, + "ppl": 5.8838, + "step": 4212 + }, + { + "epoch": 0.03, + "global_step": 4213, + "learning_rate": 0.00048325125208681136, + "loss": 1.7663, + "loss_base2": 2.5482, + "loss_pixel": 0.1937, + "loss_text": 1.5726, + "ppl": 5.8492, + "step": 4213 + }, + { + "epoch": 0.03, + "global_step": 4214, + "learning_rate": 0.00048324707846410686, + "loss": 1.7637, + "loss_base2": 2.5445, + "loss_pixel": 0.193, + "loss_text": 1.5707, + "ppl": 5.834, + "step": 4214 + }, + { + "epoch": 0.03, + "global_step": 4215, + "learning_rate": 0.0004832429048414023, + "loss": 1.7667, + "loss_base2": 2.5488, + "loss_pixel": 0.193, + "loss_text": 1.5737, + "ppl": 5.8515, + "step": 4215 + }, + { + "epoch": 0.03, + "global_step": 4216, + "learning_rate": 0.0004832387312186978, + "loss": 1.7647, + "loss_base2": 2.5459, + "loss_pixel": 0.1932, + "loss_text": 1.5715, + "ppl": 5.8398, + "step": 4216 + }, + { + "epoch": 0.03, + "global_step": 4217, + "learning_rate": 0.00048323455759599333, + "loss": 1.7674, + "loss_base2": 2.5498, + "loss_pixel": 0.1927, + "loss_text": 1.5747, + "ppl": 5.8556, + "step": 4217 + }, + { + "epoch": 0.03, + "global_step": 4218, + "learning_rate": 0.00048323038397328884, + "loss": 1.7707, + "loss_base2": 2.5546, + "loss_pixel": 0.193, + "loss_text": 1.5777, + "ppl": 5.875, + "step": 4218 + }, + { + "epoch": 0.03, + "global_step": 4219, + "learning_rate": 0.00048322621035058435, + "loss": 1.7729, + "loss_base2": 2.5578, + "loss_pixel": 0.193, + "loss_text": 1.5799, + "ppl": 5.8879, + "step": 4219 + }, + { + "epoch": 0.03, + "global_step": 4220, + "learning_rate": 0.0004832220367278798, + "loss": 1.772, + "loss_base2": 2.5565, + "loss_pixel": 0.1937, + "loss_text": 1.5783, + "ppl": 5.8826, + "step": 4220 + }, + { + "epoch": 0.03, + "global_step": 4221, + "learning_rate": 0.0004832178631051753, + "loss": 1.7657, + "loss_base2": 2.5474, + "loss_pixel": 0.1914, + "loss_text": 1.5743, + "ppl": 5.8457, + "step": 4221 + }, + { + "epoch": 0.03, + "global_step": 4222, + "learning_rate": 0.0004832136894824708, + "loss": 1.7685, + "loss_base2": 2.5514, + "loss_pixel": 0.1918, + "loss_text": 1.5767, + "ppl": 5.8621, + "step": 4222 + }, + { + "epoch": 0.03, + "global_step": 4223, + "learning_rate": 0.0004832095158597663, + "loss": 1.7576, + "loss_base2": 2.5357, + "loss_pixel": 0.1916, + "loss_text": 1.566, + "ppl": 5.7985, + "step": 4223 + }, + { + "epoch": 0.03, + "global_step": 4224, + "learning_rate": 0.00048320534223706183, + "loss": 1.7512, + "loss_base2": 2.5264, + "loss_pixel": 0.1926, + "loss_text": 1.5586, + "ppl": 5.7615, + "step": 4224 + }, + { + "epoch": 0.03, + "global_step": 4225, + "learning_rate": 0.0004832011686143573, + "loss": 1.7582, + "loss_base2": 2.5365, + "loss_pixel": 0.1924, + "loss_text": 1.5659, + "ppl": 5.802, + "step": 4225 + }, + { + "epoch": 0.03, + "global_step": 4226, + "learning_rate": 0.00048319699499165274, + "loss": 1.7664, + "loss_base2": 2.5484, + "loss_pixel": 0.1925, + "loss_text": 1.5738, + "ppl": 5.8498, + "step": 4226 + }, + { + "epoch": 0.03, + "global_step": 4227, + "learning_rate": 0.00048319282136894824, + "loss": 1.7643, + "loss_base2": 2.5453, + "loss_pixel": 0.1932, + "loss_text": 1.571, + "ppl": 5.8375, + "step": 4227 + }, + { + "epoch": 0.03, + "global_step": 4228, + "learning_rate": 0.00048318864774624375, + "loss": 1.7148, + "loss_base2": 2.4739, + "loss_pixel": 0.1926, + "loss_text": 1.5221, + "ppl": 5.5556, + "step": 4228 + }, + { + "epoch": 0.03, + "global_step": 4229, + "learning_rate": 0.0004831844741235392, + "loss": 1.5966, + "loss_base2": 2.3034, + "loss_pixel": 0.1946, + "loss_text": 1.402, + "ppl": 4.9362, + "step": 4229 + }, + { + "epoch": 0.03, + "global_step": 4230, + "learning_rate": 0.0004831803005008347, + "loss": 1.5446, + "loss_base2": 2.2284, + "loss_pixel": 0.197, + "loss_text": 1.3476, + "ppl": 4.6861, + "step": 4230 + }, + { + "epoch": 0.03, + "global_step": 4231, + "learning_rate": 0.0004831761268781302, + "loss": 1.519, + "loss_base2": 2.1915, + "loss_pixel": 0.1947, + "loss_text": 1.3243, + "ppl": 4.5677, + "step": 4231 + }, + { + "epoch": 0.03, + "global_step": 4232, + "learning_rate": 0.0004831719532554257, + "loss": 1.5233, + "loss_base2": 2.1977, + "loss_pixel": 0.1933, + "loss_text": 1.33, + "ppl": 4.5873, + "step": 4232 + }, + { + "epoch": 0.03, + "global_step": 4233, + "learning_rate": 0.00048316777963272123, + "loss": 1.5284, + "loss_base2": 2.205, + "loss_pixel": 0.194, + "loss_text": 1.3344, + "ppl": 4.6108, + "step": 4233 + }, + { + "epoch": 0.03, + "global_step": 4234, + "learning_rate": 0.0004831636060100167, + "loss": 1.536, + "loss_base2": 2.216, + "loss_pixel": 0.1913, + "loss_text": 1.3447, + "ppl": 4.646, + "step": 4234 + }, + { + "epoch": 0.03, + "global_step": 4235, + "learning_rate": 0.0004831594323873122, + "loss": 1.5089, + "loss_base2": 2.1769, + "loss_pixel": 0.1906, + "loss_text": 1.3183, + "ppl": 4.5218, + "step": 4235 + }, + { + "epoch": 0.03, + "global_step": 4236, + "learning_rate": 0.0004831552587646077, + "loss": 1.6357, + "loss_base2": 2.3598, + "loss_pixel": 0.1898, + "loss_text": 1.4459, + "ppl": 5.133, + "step": 4236 + }, + { + "epoch": 0.03, + "global_step": 4237, + "learning_rate": 0.0004831510851419032, + "loss": 1.7868, + "loss_base2": 2.5778, + "loss_pixel": 0.1903, + "loss_text": 1.5965, + "ppl": 5.9703, + "step": 4237 + }, + { + "epoch": 0.03, + "global_step": 4238, + "learning_rate": 0.00048314691151919866, + "loss": 1.7869, + "loss_base2": 2.578, + "loss_pixel": 0.195, + "loss_text": 1.5919, + "ppl": 5.9709, + "step": 4238 + }, + { + "epoch": 0.03, + "global_step": 4239, + "learning_rate": 0.00048314273789649417, + "loss": 1.8003, + "loss_base2": 2.5973, + "loss_pixel": 0.193, + "loss_text": 1.6074, + "ppl": 6.0515, + "step": 4239 + }, + { + "epoch": 0.03, + "global_step": 4240, + "learning_rate": 0.0004831385642737897, + "loss": 1.7774, + "loss_base2": 2.5642, + "loss_pixel": 0.192, + "loss_text": 1.5854, + "ppl": 5.9145, + "step": 4240 + }, + { + "epoch": 0.03, + "global_step": 4241, + "learning_rate": 0.0004831343906510852, + "loss": 1.7683, + "loss_base2": 2.5511, + "loss_pixel": 0.1896, + "loss_text": 1.5787, + "ppl": 5.8609, + "step": 4241 + }, + { + "epoch": 0.03, + "global_step": 4242, + "learning_rate": 0.0004831302170283807, + "loss": 1.7628, + "loss_base2": 2.5432, + "loss_pixel": 0.1895, + "loss_text": 1.5734, + "ppl": 5.8287, + "step": 4242 + }, + { + "epoch": 0.03, + "global_step": 4243, + "learning_rate": 0.00048312604340567614, + "loss": 1.766, + "loss_base2": 2.5478, + "loss_pixel": 0.1929, + "loss_text": 1.5731, + "ppl": 5.8474, + "step": 4243 + }, + { + "epoch": 0.03, + "global_step": 4244, + "learning_rate": 0.0004831218697829716, + "loss": 1.7603, + "loss_base2": 2.5396, + "loss_pixel": 0.1982, + "loss_text": 1.5621, + "ppl": 5.8142, + "step": 4244 + }, + { + "epoch": 0.03, + "global_step": 4245, + "learning_rate": 0.0004831176961602671, + "loss": 1.7773, + "loss_base2": 2.5641, + "loss_pixel": 0.2012, + "loss_text": 1.5761, + "ppl": 5.9139, + "step": 4245 + }, + { + "epoch": 0.03, + "global_step": 4246, + "learning_rate": 0.0004831135225375626, + "loss": 1.7977, + "loss_base2": 2.5935, + "loss_pixel": 0.2225, + "loss_text": 1.5752, + "ppl": 6.0357, + "step": 4246 + }, + { + "epoch": 0.03, + "global_step": 4247, + "learning_rate": 0.00048310934891485806, + "loss": 1.8031, + "loss_base2": 2.6013, + "loss_pixel": 0.24, + "loss_text": 1.5631, + "ppl": 6.0684, + "step": 4247 + }, + { + "epoch": 0.03, + "global_step": 4248, + "learning_rate": 0.00048310517529215357, + "loss": 1.8209, + "loss_base2": 2.627, + "loss_pixel": 0.2439, + "loss_text": 1.577, + "ppl": 6.1774, + "step": 4248 + }, + { + "epoch": 0.03, + "global_step": 4249, + "learning_rate": 0.0004831010016694491, + "loss": 1.8163, + "loss_base2": 2.6204, + "loss_pixel": 0.2366, + "loss_text": 1.5797, + "ppl": 6.1491, + "step": 4249 + }, + { + "epoch": 0.03, + "global_step": 4250, + "learning_rate": 0.0004830968280467446, + "loss": 1.8105, + "loss_base2": 2.612, + "loss_pixel": 0.2305, + "loss_text": 1.58, + "ppl": 6.1135, + "step": 4250 + }, + { + "epoch": 0.03, + "global_step": 4251, + "learning_rate": 0.0004830926544240401, + "loss": 1.7961, + "loss_base2": 2.5912, + "loss_pixel": 0.2262, + "loss_text": 1.5699, + "ppl": 6.0261, + "step": 4251 + }, + { + "epoch": 0.03, + "global_step": 4252, + "learning_rate": 0.00048308848080133555, + "loss": 1.8096, + "loss_base2": 2.6107, + "loss_pixel": 0.2238, + "loss_text": 1.5857, + "ppl": 6.108, + "step": 4252 + }, + { + "epoch": 0.03, + "global_step": 4253, + "learning_rate": 0.00048308430717863105, + "loss": 1.8015, + "loss_base2": 2.599, + "loss_pixel": 0.2294, + "loss_text": 1.5721, + "ppl": 6.0587, + "step": 4253 + }, + { + "epoch": 0.03, + "global_step": 4254, + "learning_rate": 0.00048308013355592656, + "loss": 1.7986, + "loss_base2": 2.5948, + "loss_pixel": 0.2211, + "loss_text": 1.5776, + "ppl": 6.0412, + "step": 4254 + }, + { + "epoch": 0.03, + "global_step": 4255, + "learning_rate": 0.00048307595993322207, + "loss": 1.8019, + "loss_base2": 2.5996, + "loss_pixel": 0.2207, + "loss_text": 1.5812, + "ppl": 6.0612, + "step": 4255 + }, + { + "epoch": 0.03, + "global_step": 4256, + "learning_rate": 0.0004830717863105175, + "loss": 1.784, + "loss_base2": 2.5738, + "loss_pixel": 0.2167, + "loss_text": 1.5673, + "ppl": 5.9536, + "step": 4256 + }, + { + "epoch": 0.03, + "global_step": 4257, + "learning_rate": 0.00048306761268781303, + "loss": 1.7705, + "loss_base2": 2.5543, + "loss_pixel": 0.2132, + "loss_text": 1.5573, + "ppl": 5.8738, + "step": 4257 + }, + { + "epoch": 0.03, + "global_step": 4258, + "learning_rate": 0.00048306343906510854, + "loss": 1.7926, + "loss_base2": 2.5862, + "loss_pixel": 0.2111, + "loss_text": 1.5815, + "ppl": 6.005, + "step": 4258 + }, + { + "epoch": 0.03, + "global_step": 4259, + "learning_rate": 0.00048305926544240404, + "loss": 1.7816, + "loss_base2": 2.5703, + "loss_pixel": 0.2106, + "loss_text": 1.571, + "ppl": 5.9394, + "step": 4259 + }, + { + "epoch": 0.03, + "global_step": 4260, + "learning_rate": 0.00048305509181969955, + "loss": 1.7869, + "loss_base2": 2.578, + "loss_pixel": 0.2082, + "loss_text": 1.5788, + "ppl": 5.9709, + "step": 4260 + }, + { + "epoch": 0.03, + "global_step": 4261, + "learning_rate": 0.000483050918196995, + "loss": 1.7748, + "loss_base2": 2.5605, + "loss_pixel": 0.2074, + "loss_text": 1.5675, + "ppl": 5.8991, + "step": 4261 + }, + { + "epoch": 0.03, + "global_step": 4262, + "learning_rate": 0.0004830467445742905, + "loss": 1.7913, + "loss_base2": 2.5843, + "loss_pixel": 0.2062, + "loss_text": 1.5852, + "ppl": 5.9972, + "step": 4262 + }, + { + "epoch": 0.03, + "global_step": 4263, + "learning_rate": 0.00048304257095158596, + "loss": 1.7756, + "loss_base2": 2.5616, + "loss_pixel": 0.2058, + "loss_text": 1.5698, + "ppl": 5.9038, + "step": 4263 + }, + { + "epoch": 0.03, + "global_step": 4264, + "learning_rate": 0.00048303839732888147, + "loss": 1.7671, + "loss_base2": 2.5494, + "loss_pixel": 0.2036, + "loss_text": 1.5635, + "ppl": 5.8539, + "step": 4264 + }, + { + "epoch": 0.03, + "global_step": 4265, + "learning_rate": 0.0004830342237061769, + "loss": 1.7646, + "loss_base2": 2.5458, + "loss_pixel": 0.204, + "loss_text": 1.5606, + "ppl": 5.8392, + "step": 4265 + }, + { + "epoch": 0.03, + "global_step": 4266, + "learning_rate": 0.00048303005008347243, + "loss": 1.7654, + "loss_base2": 2.5469, + "loss_pixel": 0.2035, + "loss_text": 1.5619, + "ppl": 5.8439, + "step": 4266 + }, + { + "epoch": 0.03, + "global_step": 4267, + "learning_rate": 0.00048302587646076794, + "loss": 1.7876, + "loss_base2": 2.579, + "loss_pixel": 0.2014, + "loss_text": 1.5862, + "ppl": 5.9751, + "step": 4267 + }, + { + "epoch": 0.03, + "global_step": 4268, + "learning_rate": 0.00048302170283806345, + "loss": 1.7598, + "loss_base2": 2.5389, + "loss_pixel": 0.2015, + "loss_text": 1.5583, + "ppl": 5.8113, + "step": 4268 + }, + { + "epoch": 0.03, + "global_step": 4269, + "learning_rate": 0.00048301752921535895, + "loss": 1.771, + "loss_base2": 2.555, + "loss_pixel": 0.1995, + "loss_text": 1.5715, + "ppl": 5.8767, + "step": 4269 + }, + { + "epoch": 0.03, + "global_step": 4270, + "learning_rate": 0.0004830133555926544, + "loss": 1.7631, + "loss_base2": 2.5436, + "loss_pixel": 0.2009, + "loss_text": 1.5622, + "ppl": 5.8305, + "step": 4270 + }, + { + "epoch": 0.03, + "global_step": 4271, + "learning_rate": 0.0004830091819699499, + "loss": 1.7715, + "loss_base2": 2.5557, + "loss_pixel": 0.1996, + "loss_text": 1.5719, + "ppl": 5.8797, + "step": 4271 + }, + { + "epoch": 0.03, + "global_step": 4272, + "learning_rate": 0.0004830050083472454, + "loss": 1.7764, + "loss_base2": 2.5628, + "loss_pixel": 0.1995, + "loss_text": 1.5769, + "ppl": 5.9085, + "step": 4272 + }, + { + "epoch": 0.03, + "global_step": 4273, + "learning_rate": 0.00048300083472454093, + "loss": 1.7567, + "loss_base2": 2.5344, + "loss_pixel": 0.1997, + "loss_text": 1.5569, + "ppl": 5.7933, + "step": 4273 + }, + { + "epoch": 0.03, + "global_step": 4274, + "learning_rate": 0.0004829966611018364, + "loss": 1.7697, + "loss_base2": 2.5531, + "loss_pixel": 0.1994, + "loss_text": 1.5704, + "ppl": 5.8691, + "step": 4274 + }, + { + "epoch": 0.03, + "global_step": 4275, + "learning_rate": 0.0004829924874791319, + "loss": 1.7618, + "loss_base2": 2.5417, + "loss_pixel": 0.1988, + "loss_text": 1.5631, + "ppl": 5.8229, + "step": 4275 + }, + { + "epoch": 0.03, + "global_step": 4276, + "learning_rate": 0.0004829883138564274, + "loss": 1.766, + "loss_base2": 2.5478, + "loss_pixel": 0.1982, + "loss_text": 1.5678, + "ppl": 5.8474, + "step": 4276 + }, + { + "epoch": 0.03, + "global_step": 4277, + "learning_rate": 0.0004829841402337229, + "loss": 1.7693, + "loss_base2": 2.5526, + "loss_pixel": 0.1974, + "loss_text": 1.572, + "ppl": 5.8667, + "step": 4277 + }, + { + "epoch": 0.03, + "global_step": 4278, + "learning_rate": 0.0004829799666110184, + "loss": 1.7561, + "loss_base2": 2.5335, + "loss_pixel": 0.1968, + "loss_text": 1.5593, + "ppl": 5.7898, + "step": 4278 + }, + { + "epoch": 0.03, + "global_step": 4279, + "learning_rate": 0.00048297579298831386, + "loss": 1.7455, + "loss_base2": 2.5182, + "loss_pixel": 0.1972, + "loss_text": 1.5483, + "ppl": 5.7288, + "step": 4279 + }, + { + "epoch": 0.03, + "global_step": 4280, + "learning_rate": 0.00048297161936560937, + "loss": 1.7461, + "loss_base2": 2.5191, + "loss_pixel": 0.1973, + "loss_text": 1.5488, + "ppl": 5.7322, + "step": 4280 + }, + { + "epoch": 0.03, + "global_step": 4281, + "learning_rate": 0.0004829674457429049, + "loss": 1.7484, + "loss_base2": 2.5224, + "loss_pixel": 0.1969, + "loss_text": 1.5515, + "ppl": 5.7454, + "step": 4281 + }, + { + "epoch": 0.03, + "global_step": 4282, + "learning_rate": 0.00048296327212020033, + "loss": 1.7618, + "loss_base2": 2.5417, + "loss_pixel": 0.1954, + "loss_text": 1.5665, + "ppl": 5.8229, + "step": 4282 + }, + { + "epoch": 0.03, + "global_step": 4283, + "learning_rate": 0.00048295909849749584, + "loss": 1.7479, + "loss_base2": 2.5217, + "loss_pixel": 0.1949, + "loss_text": 1.553, + "ppl": 5.7425, + "step": 4283 + }, + { + "epoch": 0.03, + "global_step": 4284, + "learning_rate": 0.0004829549248747913, + "loss": 1.7505, + "loss_base2": 2.5254, + "loss_pixel": 0.1966, + "loss_text": 1.5539, + "ppl": 5.7575, + "step": 4284 + }, + { + "epoch": 0.03, + "global_step": 4285, + "learning_rate": 0.0004829507512520868, + "loss": 1.7169, + "loss_base2": 2.477, + "loss_pixel": 0.1956, + "loss_text": 1.5212, + "ppl": 5.5672, + "step": 4285 + }, + { + "epoch": 0.03, + "global_step": 4286, + "learning_rate": 0.0004829465776293823, + "loss": 1.5977, + "loss_base2": 2.305, + "loss_pixel": 0.1953, + "loss_text": 1.4024, + "ppl": 4.9417, + "step": 4286 + }, + { + "epoch": 0.03, + "global_step": 4287, + "learning_rate": 0.0004829424040066778, + "loss": 1.5433, + "loss_base2": 2.2265, + "loss_pixel": 0.1949, + "loss_text": 1.3483, + "ppl": 4.68, + "step": 4287 + }, + { + "epoch": 0.03, + "global_step": 4288, + "learning_rate": 0.00048293823038397327, + "loss": 1.5486, + "loss_base2": 2.2342, + "loss_pixel": 0.1948, + "loss_text": 1.3537, + "ppl": 4.7049, + "step": 4288 + }, + { + "epoch": 0.03, + "global_step": 4289, + "learning_rate": 0.0004829340567612688, + "loss": 1.5075, + "loss_base2": 2.1749, + "loss_pixel": 0.1944, + "loss_text": 1.3131, + "ppl": 4.5154, + "step": 4289 + }, + { + "epoch": 0.03, + "global_step": 4290, + "learning_rate": 0.0004829298831385643, + "loss": 1.5082, + "loss_base2": 2.1759, + "loss_pixel": 0.1948, + "loss_text": 1.3134, + "ppl": 4.5186, + "step": 4290 + }, + { + "epoch": 0.03, + "global_step": 4291, + "learning_rate": 0.0004829257095158598, + "loss": 1.5291, + "loss_base2": 2.206, + "loss_pixel": 0.195, + "loss_text": 1.3341, + "ppl": 4.614, + "step": 4291 + }, + { + "epoch": 0.03, + "global_step": 4292, + "learning_rate": 0.0004829215358931553, + "loss": 1.5222, + "loss_base2": 2.1961, + "loss_pixel": 0.1934, + "loss_text": 1.3288, + "ppl": 4.5823, + "step": 4292 + }, + { + "epoch": 0.03, + "global_step": 4293, + "learning_rate": 0.00048291736227045075, + "loss": 1.5149, + "loss_base2": 2.1855, + "loss_pixel": 0.1936, + "loss_text": 1.3214, + "ppl": 4.549, + "step": 4293 + }, + { + "epoch": 0.03, + "global_step": 4294, + "learning_rate": 0.00048291318864774626, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.1936, + "loss_text": 1.4328, + "ppl": 5.0855, + "step": 4294 + }, + { + "epoch": 0.03, + "global_step": 4295, + "learning_rate": 0.00048290901502504177, + "loss": 1.6992, + "loss_base2": 2.4514, + "loss_pixel": 0.1933, + "loss_text": 1.506, + "ppl": 5.4696, + "step": 4295 + }, + { + "epoch": 0.03, + "global_step": 4296, + "learning_rate": 0.00048290484140233727, + "loss": 1.5655, + "loss_base2": 2.2585, + "loss_pixel": 0.1943, + "loss_text": 1.3712, + "ppl": 4.7851, + "step": 4296 + }, + { + "epoch": 0.03, + "global_step": 4297, + "learning_rate": 0.0004829006677796327, + "loss": 1.5183, + "loss_base2": 2.1904, + "loss_pixel": 0.1919, + "loss_text": 1.3264, + "ppl": 4.5645, + "step": 4297 + }, + { + "epoch": 0.03, + "global_step": 4298, + "learning_rate": 0.00048289649415692823, + "loss": 1.507, + "loss_base2": 2.1741, + "loss_pixel": 0.1934, + "loss_text": 1.3136, + "ppl": 4.5132, + "step": 4298 + }, + { + "epoch": 0.03, + "global_step": 4299, + "learning_rate": 0.00048289232053422374, + "loss": 1.5351, + "loss_base2": 2.2147, + "loss_pixel": 0.1944, + "loss_text": 1.3407, + "ppl": 4.6418, + "step": 4299 + }, + { + "epoch": 0.03, + "global_step": 4300, + "learning_rate": 0.00048288814691151925, + "loss": 1.5302, + "loss_base2": 2.2076, + "loss_pixel": 0.1949, + "loss_text": 1.3352, + "ppl": 4.6191, + "step": 4300 + }, + { + "epoch": 0.03, + "global_step": 4301, + "learning_rate": 0.0004828839732888147, + "loss": 1.5148, + "loss_base2": 2.1854, + "loss_pixel": 0.1935, + "loss_text": 1.3212, + "ppl": 4.5485, + "step": 4301 + }, + { + "epoch": 0.03, + "global_step": 4302, + "learning_rate": 0.00048287979966611015, + "loss": 1.4981, + "loss_base2": 2.1613, + "loss_pixel": 0.1936, + "loss_text": 1.3045, + "ppl": 4.4732, + "step": 4302 + }, + { + "epoch": 0.03, + "global_step": 4303, + "learning_rate": 0.00048287562604340566, + "loss": 1.5437, + "loss_base2": 2.2271, + "loss_pixel": 0.1935, + "loss_text": 1.3502, + "ppl": 4.6819, + "step": 4303 + }, + { + "epoch": 0.03, + "global_step": 4304, + "learning_rate": 0.00048287145242070117, + "loss": 1.6501, + "loss_base2": 2.3806, + "loss_pixel": 0.1936, + "loss_text": 1.4565, + "ppl": 5.2075, + "step": 4304 + }, + { + "epoch": 0.03, + "global_step": 4305, + "learning_rate": 0.0004828672787979967, + "loss": 1.7555, + "loss_base2": 2.5327, + "loss_pixel": 0.1934, + "loss_text": 1.5621, + "ppl": 5.7863, + "step": 4305 + }, + { + "epoch": 0.03, + "global_step": 4306, + "learning_rate": 0.00048286310517529213, + "loss": 1.7983, + "loss_base2": 2.5944, + "loss_pixel": 0.1932, + "loss_text": 1.6051, + "ppl": 6.0394, + "step": 4306 + }, + { + "epoch": 0.03, + "global_step": 4307, + "learning_rate": 0.00048285893155258764, + "loss": 1.7787, + "loss_base2": 2.5661, + "loss_pixel": 0.1939, + "loss_text": 1.5848, + "ppl": 5.9222, + "step": 4307 + }, + { + "epoch": 0.03, + "global_step": 4308, + "learning_rate": 0.00048285475792988314, + "loss": 1.787, + "loss_base2": 2.5781, + "loss_pixel": 0.1913, + "loss_text": 1.5957, + "ppl": 5.9715, + "step": 4308 + }, + { + "epoch": 0.03, + "global_step": 4309, + "learning_rate": 0.00048285058430717865, + "loss": 1.7827, + "loss_base2": 2.5719, + "loss_pixel": 0.1924, + "loss_text": 1.5902, + "ppl": 5.9459, + "step": 4309 + }, + { + "epoch": 0.03, + "global_step": 4310, + "learning_rate": 0.00048284641068447416, + "loss": 1.7746, + "loss_base2": 2.5602, + "loss_pixel": 0.1915, + "loss_text": 1.5831, + "ppl": 5.8979, + "step": 4310 + }, + { + "epoch": 0.03, + "global_step": 4311, + "learning_rate": 0.0004828422370617696, + "loss": 1.7707, + "loss_base2": 2.5546, + "loss_pixel": 0.1922, + "loss_text": 1.5785, + "ppl": 5.875, + "step": 4311 + }, + { + "epoch": 0.03, + "global_step": 4312, + "learning_rate": 0.0004828380634390651, + "loss": 1.7653, + "loss_base2": 2.5468, + "loss_pixel": 0.1922, + "loss_text": 1.5731, + "ppl": 5.8433, + "step": 4312 + }, + { + "epoch": 0.03, + "global_step": 4313, + "learning_rate": 0.0004828338898163606, + "loss": 1.7638, + "loss_base2": 2.5446, + "loss_pixel": 0.1919, + "loss_text": 1.5719, + "ppl": 5.8346, + "step": 4313 + }, + { + "epoch": 0.03, + "global_step": 4314, + "learning_rate": 0.00048282971619365613, + "loss": 1.7672, + "loss_base2": 2.5495, + "loss_pixel": 0.1917, + "loss_text": 1.5755, + "ppl": 5.8544, + "step": 4314 + }, + { + "epoch": 0.03, + "global_step": 4315, + "learning_rate": 0.0004828255425709516, + "loss": 1.7671, + "loss_base2": 2.5494, + "loss_pixel": 0.1959, + "loss_text": 1.5712, + "ppl": 5.8539, + "step": 4315 + }, + { + "epoch": 0.03, + "global_step": 4316, + "learning_rate": 0.0004828213689482471, + "loss": 1.7612, + "loss_base2": 2.5409, + "loss_pixel": 0.1947, + "loss_text": 1.5665, + "ppl": 5.8194, + "step": 4316 + }, + { + "epoch": 0.03, + "global_step": 4317, + "learning_rate": 0.0004828171953255426, + "loss": 1.7609, + "loss_base2": 2.5404, + "loss_pixel": 0.1909, + "loss_text": 1.57, + "ppl": 5.8177, + "step": 4317 + }, + { + "epoch": 0.03, + "global_step": 4318, + "learning_rate": 0.0004828130217028381, + "loss": 1.7596, + "loss_base2": 2.5386, + "loss_pixel": 0.1903, + "loss_text": 1.5694, + "ppl": 5.8101, + "step": 4318 + }, + { + "epoch": 0.03, + "global_step": 4319, + "learning_rate": 0.0004828088480801336, + "loss": 1.753, + "loss_base2": 2.529, + "loss_pixel": 0.1906, + "loss_text": 1.5623, + "ppl": 5.7719, + "step": 4319 + }, + { + "epoch": 0.03, + "global_step": 4320, + "learning_rate": 0.000482804674457429, + "loss": 1.7543, + "loss_base2": 2.5309, + "loss_pixel": 0.1895, + "loss_text": 1.5648, + "ppl": 5.7794, + "step": 4320 + }, + { + "epoch": 0.03, + "global_step": 4321, + "learning_rate": 0.0004828005008347245, + "loss": 1.7726, + "loss_base2": 2.5573, + "loss_pixel": 0.1902, + "loss_text": 1.5825, + "ppl": 5.8861, + "step": 4321 + }, + { + "epoch": 0.03, + "global_step": 4322, + "learning_rate": 0.00048279632721202003, + "loss": 1.7383, + "loss_base2": 2.5078, + "loss_pixel": 0.1862, + "loss_text": 1.552, + "ppl": 5.6877, + "step": 4322 + }, + { + "epoch": 0.03, + "global_step": 4323, + "learning_rate": 0.00048279215358931554, + "loss": 1.7637, + "loss_base2": 2.5445, + "loss_pixel": 0.1913, + "loss_text": 1.5725, + "ppl": 5.834, + "step": 4323 + }, + { + "epoch": 0.03, + "global_step": 4324, + "learning_rate": 0.000482787979966611, + "loss": 1.7655, + "loss_base2": 2.5471, + "loss_pixel": 0.19, + "loss_text": 1.5755, + "ppl": 5.8445, + "step": 4324 + }, + { + "epoch": 0.03, + "global_step": 4325, + "learning_rate": 0.0004827838063439065, + "loss": 1.7774, + "loss_base2": 2.5642, + "loss_pixel": 0.1907, + "loss_text": 1.5866, + "ppl": 5.9145, + "step": 4325 + }, + { + "epoch": 0.03, + "global_step": 4326, + "learning_rate": 0.000482779632721202, + "loss": 1.7477, + "loss_base2": 2.5214, + "loss_pixel": 0.1888, + "loss_text": 1.5589, + "ppl": 5.7414, + "step": 4326 + }, + { + "epoch": 0.03, + "global_step": 4327, + "learning_rate": 0.0004827754590984975, + "loss": 1.7477, + "loss_base2": 2.5214, + "loss_pixel": 0.1867, + "loss_text": 1.5611, + "ppl": 5.7414, + "step": 4327 + }, + { + "epoch": 0.03, + "global_step": 4328, + "learning_rate": 0.000482771285475793, + "loss": 1.7572, + "loss_base2": 2.5351, + "loss_pixel": 0.1875, + "loss_text": 1.5697, + "ppl": 5.7962, + "step": 4328 + }, + { + "epoch": 0.03, + "global_step": 4329, + "learning_rate": 0.00048276711185308847, + "loss": 1.7531, + "loss_base2": 2.5292, + "loss_pixel": 0.187, + "loss_text": 1.5661, + "ppl": 5.7725, + "step": 4329 + }, + { + "epoch": 0.03, + "global_step": 4330, + "learning_rate": 0.000482762938230384, + "loss": 1.7422, + "loss_base2": 2.5135, + "loss_pixel": 0.1861, + "loss_text": 1.5561, + "ppl": 5.7099, + "step": 4330 + }, + { + "epoch": 0.03, + "global_step": 4331, + "learning_rate": 0.0004827587646076795, + "loss": 1.7816, + "loss_base2": 2.5703, + "loss_pixel": 0.1876, + "loss_text": 1.594, + "ppl": 5.9394, + "step": 4331 + }, + { + "epoch": 0.03, + "global_step": 4332, + "learning_rate": 0.000482754590984975, + "loss": 1.7479, + "loss_base2": 2.5217, + "loss_pixel": 0.1864, + "loss_text": 1.5615, + "ppl": 5.7425, + "step": 4332 + }, + { + "epoch": 0.03, + "global_step": 4333, + "learning_rate": 0.00048275041736227045, + "loss": 1.7396, + "loss_base2": 2.5097, + "loss_pixel": 0.1898, + "loss_text": 1.5499, + "ppl": 5.6951, + "step": 4333 + }, + { + "epoch": 0.03, + "global_step": 4334, + "learning_rate": 0.00048274624373956595, + "loss": 1.7553, + "loss_base2": 2.5324, + "loss_pixel": 0.1855, + "loss_text": 1.5698, + "ppl": 5.7852, + "step": 4334 + }, + { + "epoch": 0.03, + "global_step": 4335, + "learning_rate": 0.00048274207011686146, + "loss": 1.7538, + "loss_base2": 2.5302, + "loss_pixel": 0.1864, + "loss_text": 1.5674, + "ppl": 5.7765, + "step": 4335 + }, + { + "epoch": 0.03, + "global_step": 4336, + "learning_rate": 0.00048273789649415697, + "loss": 1.7538, + "loss_base2": 2.5302, + "loss_pixel": 0.1882, + "loss_text": 1.5655, + "ppl": 5.7765, + "step": 4336 + }, + { + "epoch": 0.03, + "global_step": 4337, + "learning_rate": 0.0004827337228714525, + "loss": 1.7451, + "loss_base2": 2.5176, + "loss_pixel": 0.1855, + "loss_text": 1.5595, + "ppl": 5.7265, + "step": 4337 + }, + { + "epoch": 0.03, + "global_step": 4338, + "learning_rate": 0.0004827295492487479, + "loss": 1.7495, + "loss_base2": 2.524, + "loss_pixel": 0.1837, + "loss_text": 1.5658, + "ppl": 5.7517, + "step": 4338 + }, + { + "epoch": 0.03, + "global_step": 4339, + "learning_rate": 0.0004827253756260434, + "loss": 1.7549, + "loss_base2": 2.5318, + "loss_pixel": 0.1869, + "loss_text": 1.5679, + "ppl": 5.7829, + "step": 4339 + }, + { + "epoch": 0.03, + "global_step": 4340, + "learning_rate": 0.0004827212020033389, + "loss": 1.745, + "loss_base2": 2.5175, + "loss_pixel": 0.1864, + "loss_text": 1.5585, + "ppl": 5.7259, + "step": 4340 + }, + { + "epoch": 0.03, + "global_step": 4341, + "learning_rate": 0.0004827170283806344, + "loss": 1.7583, + "loss_base2": 2.5367, + "loss_pixel": 0.1861, + "loss_text": 1.5723, + "ppl": 5.8026, + "step": 4341 + }, + { + "epoch": 0.03, + "global_step": 4342, + "learning_rate": 0.0004827128547579299, + "loss": 1.763, + "loss_base2": 2.5435, + "loss_pixel": 0.1856, + "loss_text": 1.5774, + "ppl": 5.8299, + "step": 4342 + }, + { + "epoch": 0.03, + "global_step": 4343, + "learning_rate": 0.00048270868113522536, + "loss": 1.7509, + "loss_base2": 2.526, + "loss_pixel": 0.1847, + "loss_text": 1.5663, + "ppl": 5.7598, + "step": 4343 + }, + { + "epoch": 0.03, + "global_step": 4344, + "learning_rate": 0.00048270450751252086, + "loss": 1.7579, + "loss_base2": 2.5361, + "loss_pixel": 0.184, + "loss_text": 1.5738, + "ppl": 5.8002, + "step": 4344 + }, + { + "epoch": 0.03, + "global_step": 4345, + "learning_rate": 0.00048270033388981637, + "loss": 1.7593, + "loss_base2": 2.5381, + "loss_pixel": 0.186, + "loss_text": 1.5734, + "ppl": 5.8084, + "step": 4345 + }, + { + "epoch": 0.03, + "global_step": 4346, + "learning_rate": 0.0004826961602671119, + "loss": 1.7628, + "loss_base2": 2.5432, + "loss_pixel": 0.1856, + "loss_text": 1.5772, + "ppl": 5.8287, + "step": 4346 + }, + { + "epoch": 0.03, + "global_step": 4347, + "learning_rate": 0.00048269198664440733, + "loss": 1.751, + "loss_base2": 2.5262, + "loss_pixel": 0.1838, + "loss_text": 1.5672, + "ppl": 5.7604, + "step": 4347 + }, + { + "epoch": 0.03, + "global_step": 4348, + "learning_rate": 0.00048268781302170284, + "loss": 1.7505, + "loss_base2": 2.5254, + "loss_pixel": 0.1897, + "loss_text": 1.5608, + "ppl": 5.7575, + "step": 4348 + }, + { + "epoch": 0.03, + "global_step": 4349, + "learning_rate": 0.00048268363939899835, + "loss": 1.566, + "loss_base2": 2.2593, + "loss_pixel": 0.1944, + "loss_text": 1.3716, + "ppl": 4.7875, + "step": 4349 + }, + { + "epoch": 0.03, + "global_step": 4350, + "learning_rate": 0.00048267946577629385, + "loss": 1.5165, + "loss_base2": 2.1878, + "loss_pixel": 0.1945, + "loss_text": 1.322, + "ppl": 4.5563, + "step": 4350 + }, + { + "epoch": 0.03, + "global_step": 4351, + "learning_rate": 0.00048267529215358936, + "loss": 1.5157, + "loss_base2": 2.1867, + "loss_pixel": 0.1938, + "loss_text": 1.322, + "ppl": 4.5526, + "step": 4351 + }, + { + "epoch": 0.03, + "global_step": 4352, + "learning_rate": 0.0004826711185308848, + "loss": 1.5355, + "loss_base2": 2.2153, + "loss_pixel": 0.1936, + "loss_text": 1.3419, + "ppl": 4.6436, + "step": 4352 + }, + { + "epoch": 0.03, + "global_step": 4353, + "learning_rate": 0.0004826669449081803, + "loss": 1.5307, + "loss_base2": 2.2083, + "loss_pixel": 0.1925, + "loss_text": 1.3382, + "ppl": 4.6214, + "step": 4353 + }, + { + "epoch": 0.03, + "global_step": 4354, + "learning_rate": 0.00048266277128547583, + "loss": 1.5154, + "loss_base2": 2.1863, + "loss_pixel": 0.1926, + "loss_text": 1.3229, + "ppl": 4.5512, + "step": 4354 + }, + { + "epoch": 0.03, + "global_step": 4355, + "learning_rate": 0.00048265859766277134, + "loss": 1.5133, + "loss_base2": 2.1832, + "loss_pixel": 0.1927, + "loss_text": 1.3207, + "ppl": 4.5417, + "step": 4355 + }, + { + "epoch": 0.03, + "global_step": 4356, + "learning_rate": 0.0004826544240400668, + "loss": 1.6762, + "loss_base2": 2.4182, + "loss_pixel": 0.1941, + "loss_text": 1.4821, + "ppl": 5.3452, + "step": 4356 + }, + { + "epoch": 0.03, + "global_step": 4357, + "learning_rate": 0.00048265025041736224, + "loss": 1.7705, + "loss_base2": 2.5543, + "loss_pixel": 0.1916, + "loss_text": 1.5789, + "ppl": 5.8738, + "step": 4357 + }, + { + "epoch": 0.03, + "global_step": 4358, + "learning_rate": 0.00048264607679465775, + "loss": 1.7543, + "loss_base2": 2.5309, + "loss_pixel": 0.1918, + "loss_text": 1.5625, + "ppl": 5.7794, + "step": 4358 + }, + { + "epoch": 0.03, + "global_step": 4359, + "learning_rate": 0.00048264190317195326, + "loss": 1.7754, + "loss_base2": 2.5614, + "loss_pixel": 0.1915, + "loss_text": 1.5838, + "ppl": 5.9026, + "step": 4359 + }, + { + "epoch": 0.03, + "global_step": 4360, + "learning_rate": 0.00048263772954924877, + "loss": 1.7791, + "loss_base2": 2.5667, + "loss_pixel": 0.1922, + "loss_text": 1.5869, + "ppl": 5.9245, + "step": 4360 + }, + { + "epoch": 0.03, + "global_step": 4361, + "learning_rate": 0.0004826335559265442, + "loss": 1.7539, + "loss_base2": 2.5303, + "loss_pixel": 0.1927, + "loss_text": 1.5612, + "ppl": 5.7771, + "step": 4361 + }, + { + "epoch": 0.03, + "global_step": 4362, + "learning_rate": 0.0004826293823038397, + "loss": 1.7594, + "loss_base2": 2.5383, + "loss_pixel": 0.1926, + "loss_text": 1.5667, + "ppl": 5.809, + "step": 4362 + }, + { + "epoch": 0.03, + "global_step": 4363, + "learning_rate": 0.00048262520868113523, + "loss": 1.7575, + "loss_base2": 2.5355, + "loss_pixel": 0.1909, + "loss_text": 1.5666, + "ppl": 5.7979, + "step": 4363 + }, + { + "epoch": 0.03, + "global_step": 4364, + "learning_rate": 0.00048262103505843074, + "loss": 1.7652, + "loss_base2": 2.5466, + "loss_pixel": 0.1912, + "loss_text": 1.574, + "ppl": 5.8427, + "step": 4364 + }, + { + "epoch": 0.03, + "global_step": 4365, + "learning_rate": 0.0004826168614357262, + "loss": 1.7507, + "loss_base2": 2.5257, + "loss_pixel": 0.1917, + "loss_text": 1.559, + "ppl": 5.7586, + "step": 4365 + }, + { + "epoch": 0.03, + "global_step": 4366, + "learning_rate": 0.0004826126878130217, + "loss": 1.7651, + "loss_base2": 2.5465, + "loss_pixel": 0.1918, + "loss_text": 1.5734, + "ppl": 5.8422, + "step": 4366 + }, + { + "epoch": 0.03, + "global_step": 4367, + "learning_rate": 0.0004826085141903172, + "loss": 1.7566, + "loss_base2": 2.5342, + "loss_pixel": 0.1911, + "loss_text": 1.5655, + "ppl": 5.7927, + "step": 4367 + }, + { + "epoch": 0.03, + "global_step": 4368, + "learning_rate": 0.0004826043405676127, + "loss": 1.7535, + "loss_base2": 2.5298, + "loss_pixel": 0.1907, + "loss_text": 1.5628, + "ppl": 5.7748, + "step": 4368 + }, + { + "epoch": 0.03, + "global_step": 4369, + "learning_rate": 0.0004826001669449082, + "loss": 1.7637, + "loss_base2": 2.5445, + "loss_pixel": 0.1921, + "loss_text": 1.5716, + "ppl": 5.834, + "step": 4369 + }, + { + "epoch": 0.03, + "global_step": 4370, + "learning_rate": 0.0004825959933222037, + "loss": 1.7486, + "loss_base2": 2.5227, + "loss_pixel": 0.192, + "loss_text": 1.5566, + "ppl": 5.7466, + "step": 4370 + }, + { + "epoch": 0.03, + "global_step": 4371, + "learning_rate": 0.0004825918196994992, + "loss": 1.7568, + "loss_base2": 2.5345, + "loss_pixel": 0.1912, + "loss_text": 1.5656, + "ppl": 5.7939, + "step": 4371 + }, + { + "epoch": 0.03, + "global_step": 4372, + "learning_rate": 0.0004825876460767947, + "loss": 1.7602, + "loss_base2": 2.5394, + "loss_pixel": 0.1921, + "loss_text": 1.5681, + "ppl": 5.8136, + "step": 4372 + }, + { + "epoch": 0.03, + "global_step": 4373, + "learning_rate": 0.0004825834724540902, + "loss": 1.7506, + "loss_base2": 2.5256, + "loss_pixel": 0.1901, + "loss_text": 1.5605, + "ppl": 5.7581, + "step": 4373 + }, + { + "epoch": 0.03, + "global_step": 4374, + "learning_rate": 0.00048257929883138565, + "loss": 1.7645, + "loss_base2": 2.5456, + "loss_pixel": 0.1923, + "loss_text": 1.5722, + "ppl": 5.8387, + "step": 4374 + }, + { + "epoch": 0.03, + "global_step": 4375, + "learning_rate": 0.00048257512520868116, + "loss": 1.7571, + "loss_base2": 2.535, + "loss_pixel": 0.1906, + "loss_text": 1.5664, + "ppl": 5.7956, + "step": 4375 + }, + { + "epoch": 0.03, + "global_step": 4376, + "learning_rate": 0.0004825709515859766, + "loss": 1.7316, + "loss_base2": 2.4982, + "loss_pixel": 0.191, + "loss_text": 1.5406, + "ppl": 5.6497, + "step": 4376 + }, + { + "epoch": 0.03, + "global_step": 4377, + "learning_rate": 0.0004825667779632721, + "loss": 1.7491, + "loss_base2": 2.5234, + "loss_pixel": 0.1916, + "loss_text": 1.5574, + "ppl": 5.7494, + "step": 4377 + }, + { + "epoch": 0.03, + "global_step": 4378, + "learning_rate": 0.0004825626043405676, + "loss": 1.67, + "loss_base2": 2.4093, + "loss_pixel": 0.1914, + "loss_text": 1.4786, + "ppl": 5.3122, + "step": 4378 + }, + { + "epoch": 0.03, + "global_step": 4379, + "learning_rate": 0.0004825584307178631, + "loss": 1.5333, + "loss_base2": 2.2121, + "loss_pixel": 0.1916, + "loss_text": 1.3417, + "ppl": 4.6334, + "step": 4379 + }, + { + "epoch": 0.03, + "global_step": 4380, + "learning_rate": 0.0004825542570951586, + "loss": 1.5167, + "loss_base2": 2.1881, + "loss_pixel": 0.1915, + "loss_text": 1.3252, + "ppl": 4.5572, + "step": 4380 + }, + { + "epoch": 0.03, + "global_step": 4381, + "learning_rate": 0.0004825500834724541, + "loss": 1.5316, + "loss_base2": 2.2096, + "loss_pixel": 0.1906, + "loss_text": 1.341, + "ppl": 4.6256, + "step": 4381 + }, + { + "epoch": 0.03, + "global_step": 4382, + "learning_rate": 0.0004825459098497496, + "loss": 1.5313, + "loss_base2": 2.2092, + "loss_pixel": 0.1899, + "loss_text": 1.3414, + "ppl": 4.6242, + "step": 4382 + }, + { + "epoch": 0.03, + "global_step": 4383, + "learning_rate": 0.00048254173622704505, + "loss": 1.5133, + "loss_base2": 2.1832, + "loss_pixel": 0.19, + "loss_text": 1.3233, + "ppl": 4.5417, + "step": 4383 + }, + { + "epoch": 0.03, + "global_step": 4384, + "learning_rate": 0.00048253756260434056, + "loss": 1.5112, + "loss_base2": 2.1802, + "loss_pixel": 0.1897, + "loss_text": 1.3215, + "ppl": 4.5322, + "step": 4384 + }, + { + "epoch": 0.03, + "global_step": 4385, + "learning_rate": 0.00048253338898163607, + "loss": 1.5227, + "loss_base2": 2.1968, + "loss_pixel": 0.1914, + "loss_text": 1.3313, + "ppl": 4.5846, + "step": 4385 + }, + { + "epoch": 0.03, + "global_step": 4386, + "learning_rate": 0.0004825292153589316, + "loss": 1.5016, + "loss_base2": 2.1664, + "loss_pixel": 0.1899, + "loss_text": 1.3117, + "ppl": 4.4889, + "step": 4386 + }, + { + "epoch": 0.03, + "global_step": 4387, + "learning_rate": 0.0004825250417362271, + "loss": 1.5012, + "loss_base2": 2.1658, + "loss_pixel": 0.191, + "loss_text": 1.3102, + "ppl": 4.4871, + "step": 4387 + }, + { + "epoch": 0.03, + "global_step": 4388, + "learning_rate": 0.00048252086811352254, + "loss": 1.506, + "loss_base2": 2.1727, + "loss_pixel": 0.1896, + "loss_text": 1.3164, + "ppl": 4.5087, + "step": 4388 + }, + { + "epoch": 0.03, + "global_step": 4389, + "learning_rate": 0.00048251669449081804, + "loss": 1.5247, + "loss_base2": 2.1997, + "loss_pixel": 0.1901, + "loss_text": 1.3346, + "ppl": 4.5938, + "step": 4389 + }, + { + "epoch": 0.03, + "global_step": 4390, + "learning_rate": 0.00048251252086811355, + "loss": 1.4968, + "loss_base2": 2.1594, + "loss_pixel": 0.1894, + "loss_text": 1.3074, + "ppl": 4.4674, + "step": 4390 + }, + { + "epoch": 0.03, + "global_step": 4391, + "learning_rate": 0.00048250834724540906, + "loss": 1.4979, + "loss_base2": 2.161, + "loss_pixel": 0.1901, + "loss_text": 1.3079, + "ppl": 4.4723, + "step": 4391 + }, + { + "epoch": 0.03, + "global_step": 4392, + "learning_rate": 0.00048250417362270457, + "loss": 1.4907, + "loss_base2": 2.1506, + "loss_pixel": 0.1899, + "loss_text": 1.3008, + "ppl": 4.4402, + "step": 4392 + }, + { + "epoch": 0.03, + "global_step": 4393, + "learning_rate": 0.0004825, + "loss": 1.5216, + "loss_base2": 2.1952, + "loss_pixel": 0.1904, + "loss_text": 1.3311, + "ppl": 4.5795, + "step": 4393 + }, + { + "epoch": 0.03, + "global_step": 4394, + "learning_rate": 0.0004824958263772955, + "loss": 1.5137, + "loss_base2": 2.1838, + "loss_pixel": 0.1899, + "loss_text": 1.3238, + "ppl": 4.5435, + "step": 4394 + }, + { + "epoch": 0.03, + "global_step": 4395, + "learning_rate": 0.000482491652754591, + "loss": 1.503, + "loss_base2": 2.1684, + "loss_pixel": 0.1901, + "loss_text": 1.3129, + "ppl": 4.4952, + "step": 4395 + }, + { + "epoch": 0.03, + "global_step": 4396, + "learning_rate": 0.0004824874791318865, + "loss": 1.513, + "loss_base2": 2.1828, + "loss_pixel": 0.1886, + "loss_text": 1.3244, + "ppl": 4.5403, + "step": 4396 + }, + { + "epoch": 0.03, + "global_step": 4397, + "learning_rate": 0.00048248330550918194, + "loss": 1.49, + "loss_base2": 2.1496, + "loss_pixel": 0.1888, + "loss_text": 1.3012, + "ppl": 4.4371, + "step": 4397 + }, + { + "epoch": 0.03, + "global_step": 4398, + "learning_rate": 0.00048247913188647745, + "loss": 1.5394, + "loss_base2": 2.2209, + "loss_pixel": 0.1906, + "loss_text": 1.3488, + "ppl": 4.6618, + "step": 4398 + }, + { + "epoch": 0.03, + "global_step": 4399, + "learning_rate": 0.00048247495826377295, + "loss": 1.5037, + "loss_base2": 2.1694, + "loss_pixel": 0.1915, + "loss_text": 1.3121, + "ppl": 4.4983, + "step": 4399 + }, + { + "epoch": 0.03, + "global_step": 4400, + "learning_rate": 0.00048247078464106846, + "loss": 1.5003, + "loss_base2": 2.1645, + "loss_pixel": 0.1916, + "loss_text": 1.3087, + "ppl": 4.483, + "step": 4400 + }, + { + "epoch": 0.03, + "global_step": 4401, + "learning_rate": 0.00048246661101836397, + "loss": 1.5138, + "loss_base2": 2.184, + "loss_pixel": 0.1893, + "loss_text": 1.3245, + "ppl": 4.544, + "step": 4401 + }, + { + "epoch": 0.03, + "global_step": 4402, + "learning_rate": 0.0004824624373956594, + "loss": 1.4864, + "loss_base2": 2.1444, + "loss_pixel": 0.1907, + "loss_text": 1.2957, + "ppl": 4.4212, + "step": 4402 + }, + { + "epoch": 0.03, + "global_step": 4403, + "learning_rate": 0.00048245826377295493, + "loss": 1.4994, + "loss_base2": 2.1632, + "loss_pixel": 0.19, + "loss_text": 1.3093, + "ppl": 4.479, + "step": 4403 + }, + { + "epoch": 0.03, + "global_step": 4404, + "learning_rate": 0.00048245409015025044, + "loss": 1.505, + "loss_base2": 2.1713, + "loss_pixel": 0.1903, + "loss_text": 1.3147, + "ppl": 4.5042, + "step": 4404 + }, + { + "epoch": 0.03, + "global_step": 4405, + "learning_rate": 0.00048244991652754594, + "loss": 1.5212, + "loss_base2": 2.1946, + "loss_pixel": 0.1897, + "loss_text": 1.3314, + "ppl": 4.5777, + "step": 4405 + }, + { + "epoch": 0.03, + "global_step": 4406, + "learning_rate": 0.0004824457429048414, + "loss": 1.5029, + "loss_base2": 2.1682, + "loss_pixel": 0.1886, + "loss_text": 1.3144, + "ppl": 4.4947, + "step": 4406 + }, + { + "epoch": 0.03, + "global_step": 4407, + "learning_rate": 0.0004824415692821369, + "loss": 1.5073, + "loss_base2": 2.1746, + "loss_pixel": 0.1898, + "loss_text": 1.3175, + "ppl": 4.5145, + "step": 4407 + }, + { + "epoch": 0.03, + "global_step": 4408, + "learning_rate": 0.0004824373956594324, + "loss": 1.4996, + "loss_base2": 2.1635, + "loss_pixel": 0.1901, + "loss_text": 1.3095, + "ppl": 4.4799, + "step": 4408 + }, + { + "epoch": 0.03, + "global_step": 4409, + "learning_rate": 0.0004824332220367279, + "loss": 1.5116, + "loss_base2": 2.1808, + "loss_pixel": 0.1921, + "loss_text": 1.3196, + "ppl": 4.534, + "step": 4409 + }, + { + "epoch": 0.03, + "global_step": 4410, + "learning_rate": 0.0004824290484140234, + "loss": 1.5039, + "loss_base2": 2.1697, + "loss_pixel": 0.1906, + "loss_text": 1.3133, + "ppl": 4.4992, + "step": 4410 + }, + { + "epoch": 0.03, + "global_step": 4411, + "learning_rate": 0.0004824248747913189, + "loss": 1.4947, + "loss_base2": 2.1564, + "loss_pixel": 0.1903, + "loss_text": 1.3044, + "ppl": 4.458, + "step": 4411 + }, + { + "epoch": 0.03, + "global_step": 4412, + "learning_rate": 0.0004824207011686144, + "loss": 1.4961, + "loss_base2": 2.1584, + "loss_pixel": 0.189, + "loss_text": 1.307, + "ppl": 4.4642, + "step": 4412 + }, + { + "epoch": 0.03, + "global_step": 4413, + "learning_rate": 0.00048241652754590984, + "loss": 1.5084, + "loss_base2": 2.1762, + "loss_pixel": 0.191, + "loss_text": 1.3175, + "ppl": 4.5195, + "step": 4413 + }, + { + "epoch": 0.03, + "global_step": 4414, + "learning_rate": 0.00048241235392320535, + "loss": 1.5113, + "loss_base2": 2.1803, + "loss_pixel": 0.1887, + "loss_text": 1.3226, + "ppl": 4.5326, + "step": 4414 + }, + { + "epoch": 0.03, + "global_step": 4415, + "learning_rate": 0.0004824081803005008, + "loss": 1.491, + "loss_base2": 2.1511, + "loss_pixel": 0.1902, + "loss_text": 1.3008, + "ppl": 4.4415, + "step": 4415 + }, + { + "epoch": 0.03, + "global_step": 4416, + "learning_rate": 0.0004824040066777963, + "loss": 1.4882, + "loss_base2": 2.147, + "loss_pixel": 0.1886, + "loss_text": 1.2996, + "ppl": 4.4291, + "step": 4416 + }, + { + "epoch": 0.03, + "global_step": 4417, + "learning_rate": 0.0004823998330550918, + "loss": 1.5215, + "loss_base2": 2.1951, + "loss_pixel": 0.1898, + "loss_text": 1.3318, + "ppl": 4.5791, + "step": 4417 + }, + { + "epoch": 0.03, + "global_step": 4418, + "learning_rate": 0.0004823956594323873, + "loss": 1.4804, + "loss_base2": 2.1358, + "loss_pixel": 0.1895, + "loss_text": 1.2908, + "ppl": 4.3947, + "step": 4418 + }, + { + "epoch": 0.03, + "global_step": 4419, + "learning_rate": 0.00048239148580968283, + "loss": 1.5024, + "loss_base2": 2.1675, + "loss_pixel": 0.1892, + "loss_text": 1.3132, + "ppl": 4.4925, + "step": 4419 + }, + { + "epoch": 0.03, + "global_step": 4420, + "learning_rate": 0.0004823873121869783, + "loss": 1.6853, + "loss_base2": 2.4314, + "loss_pixel": 0.1887, + "loss_text": 1.4966, + "ppl": 5.3941, + "step": 4420 + }, + { + "epoch": 0.03, + "global_step": 4421, + "learning_rate": 0.0004823831385642738, + "loss": 1.5348, + "loss_base2": 2.2142, + "loss_pixel": 0.189, + "loss_text": 1.3458, + "ppl": 4.6404, + "step": 4421 + }, + { + "epoch": 0.03, + "global_step": 4422, + "learning_rate": 0.0004823789649415693, + "loss": 1.5031, + "loss_base2": 2.1685, + "loss_pixel": 0.1897, + "loss_text": 1.3135, + "ppl": 4.4956, + "step": 4422 + }, + { + "epoch": 0.03, + "global_step": 4423, + "learning_rate": 0.0004823747913188648, + "loss": 1.493, + "loss_base2": 2.1539, + "loss_pixel": 0.1895, + "loss_text": 1.3036, + "ppl": 4.4504, + "step": 4423 + }, + { + "epoch": 0.03, + "global_step": 4424, + "learning_rate": 0.00048237061769616026, + "loss": 1.5097, + "loss_base2": 2.178, + "loss_pixel": 0.1884, + "loss_text": 1.3213, + "ppl": 4.5254, + "step": 4424 + }, + { + "epoch": 0.03, + "global_step": 4425, + "learning_rate": 0.00048236644407345577, + "loss": 1.4895, + "loss_base2": 2.1489, + "loss_pixel": 0.1886, + "loss_text": 1.3009, + "ppl": 4.4349, + "step": 4425 + }, + { + "epoch": 0.03, + "global_step": 4426, + "learning_rate": 0.00048236227045075127, + "loss": 1.4929, + "loss_base2": 2.1538, + "loss_pixel": 0.1883, + "loss_text": 1.3046, + "ppl": 4.45, + "step": 4426 + }, + { + "epoch": 0.03, + "global_step": 4427, + "learning_rate": 0.0004823580968280468, + "loss": 1.4992, + "loss_base2": 2.1629, + "loss_pixel": 0.1883, + "loss_text": 1.311, + "ppl": 4.4781, + "step": 4427 + }, + { + "epoch": 0.03, + "global_step": 4428, + "learning_rate": 0.0004823539232053423, + "loss": 1.4902, + "loss_base2": 2.1499, + "loss_pixel": 0.1898, + "loss_text": 1.3005, + "ppl": 4.438, + "step": 4428 + }, + { + "epoch": 0.03, + "global_step": 4429, + "learning_rate": 0.00048234974958263774, + "loss": 1.5151, + "loss_base2": 2.1858, + "loss_pixel": 0.1885, + "loss_text": 1.3266, + "ppl": 4.5499, + "step": 4429 + }, + { + "epoch": 0.03, + "global_step": 4430, + "learning_rate": 0.00048234557595993325, + "loss": 1.6753, + "loss_base2": 2.4169, + "loss_pixel": 0.1892, + "loss_text": 1.4861, + "ppl": 5.3404, + "step": 4430 + }, + { + "epoch": 0.03, + "global_step": 4431, + "learning_rate": 0.00048234140233722875, + "loss": 1.8003, + "loss_base2": 2.5973, + "loss_pixel": 0.1888, + "loss_text": 1.6114, + "ppl": 6.0515, + "step": 4431 + }, + { + "epoch": 0.03, + "global_step": 4432, + "learning_rate": 0.0004823372287145242, + "loss": 1.792, + "loss_base2": 2.5853, + "loss_pixel": 0.1902, + "loss_text": 1.6018, + "ppl": 6.0014, + "step": 4432 + }, + { + "epoch": 0.03, + "global_step": 4433, + "learning_rate": 0.00048233305509181966, + "loss": 1.7858, + "loss_base2": 2.5764, + "loss_pixel": 0.1899, + "loss_text": 1.5959, + "ppl": 5.9643, + "step": 4433 + }, + { + "epoch": 0.03, + "global_step": 4434, + "learning_rate": 0.00048232888146911517, + "loss": 1.7662, + "loss_base2": 2.5481, + "loss_pixel": 0.1924, + "loss_text": 1.5738, + "ppl": 5.8486, + "step": 4434 + }, + { + "epoch": 0.03, + "global_step": 4435, + "learning_rate": 0.0004823247078464107, + "loss": 1.7825, + "loss_base2": 2.5716, + "loss_pixel": 0.1886, + "loss_text": 1.5939, + "ppl": 5.9447, + "step": 4435 + }, + { + "epoch": 0.03, + "global_step": 4436, + "learning_rate": 0.0004823205342237062, + "loss": 1.7918, + "loss_base2": 2.585, + "loss_pixel": 0.1887, + "loss_text": 1.6031, + "ppl": 6.0002, + "step": 4436 + }, + { + "epoch": 0.03, + "global_step": 4437, + "learning_rate": 0.0004823163606010017, + "loss": 1.741, + "loss_base2": 2.5117, + "loss_pixel": 0.1887, + "loss_text": 1.5523, + "ppl": 5.703, + "step": 4437 + }, + { + "epoch": 0.03, + "global_step": 4438, + "learning_rate": 0.00048231218697829714, + "loss": 1.7734, + "loss_base2": 2.5585, + "loss_pixel": 0.1883, + "loss_text": 1.5851, + "ppl": 5.8908, + "step": 4438 + }, + { + "epoch": 0.03, + "global_step": 4439, + "learning_rate": 0.00048230801335559265, + "loss": 1.7588, + "loss_base2": 2.5374, + "loss_pixel": 0.1893, + "loss_text": 1.5695, + "ppl": 5.8055, + "step": 4439 + }, + { + "epoch": 0.03, + "global_step": 4440, + "learning_rate": 0.00048230383973288816, + "loss": 1.7689, + "loss_base2": 2.552, + "loss_pixel": 0.1902, + "loss_text": 1.5788, + "ppl": 5.8644, + "step": 4440 + }, + { + "epoch": 0.03, + "global_step": 4441, + "learning_rate": 0.00048229966611018367, + "loss": 1.766, + "loss_base2": 2.5478, + "loss_pixel": 0.1882, + "loss_text": 1.5778, + "ppl": 5.8474, + "step": 4441 + }, + { + "epoch": 0.03, + "global_step": 4442, + "learning_rate": 0.0004822954924874791, + "loss": 1.7727, + "loss_base2": 2.5575, + "loss_pixel": 0.1881, + "loss_text": 1.5846, + "ppl": 5.8867, + "step": 4442 + }, + { + "epoch": 0.03, + "global_step": 4443, + "learning_rate": 0.0004822913188647746, + "loss": 1.7396, + "loss_base2": 2.5097, + "loss_pixel": 0.1878, + "loss_text": 1.5518, + "ppl": 5.6951, + "step": 4443 + }, + { + "epoch": 0.03, + "global_step": 4444, + "learning_rate": 0.00048228714524207013, + "loss": 1.7632, + "loss_base2": 2.5438, + "loss_pixel": 0.1884, + "loss_text": 1.5747, + "ppl": 5.8311, + "step": 4444 + }, + { + "epoch": 0.03, + "global_step": 4445, + "learning_rate": 0.00048228297161936564, + "loss": 1.7692, + "loss_base2": 2.5524, + "loss_pixel": 0.1884, + "loss_text": 1.5808, + "ppl": 5.8662, + "step": 4445 + }, + { + "epoch": 0.03, + "global_step": 4446, + "learning_rate": 0.00048227879799666115, + "loss": 1.7809, + "loss_base2": 2.5693, + "loss_pixel": 0.189, + "loss_text": 1.5919, + "ppl": 5.9352, + "step": 4446 + }, + { + "epoch": 0.03, + "global_step": 4447, + "learning_rate": 0.0004822746243739566, + "loss": 1.7474, + "loss_base2": 2.521, + "loss_pixel": 0.1903, + "loss_text": 1.5571, + "ppl": 5.7397, + "step": 4447 + }, + { + "epoch": 0.03, + "global_step": 4448, + "learning_rate": 0.0004822704507512521, + "loss": 1.7403, + "loss_base2": 2.5107, + "loss_pixel": 0.1891, + "loss_text": 1.5512, + "ppl": 5.6991, + "step": 4448 + }, + { + "epoch": 0.03, + "global_step": 4449, + "learning_rate": 0.0004822662771285476, + "loss": 1.7624, + "loss_base2": 2.5426, + "loss_pixel": 0.1885, + "loss_text": 1.5738, + "ppl": 5.8264, + "step": 4449 + }, + { + "epoch": 0.03, + "global_step": 4450, + "learning_rate": 0.0004822621035058431, + "loss": 1.755, + "loss_base2": 2.5319, + "loss_pixel": 0.1889, + "loss_text": 1.5662, + "ppl": 5.7834, + "step": 4450 + }, + { + "epoch": 0.03, + "global_step": 4451, + "learning_rate": 0.0004822579298831386, + "loss": 1.7623, + "loss_base2": 2.5425, + "loss_pixel": 0.1898, + "loss_text": 1.5726, + "ppl": 5.8258, + "step": 4451 + }, + { + "epoch": 0.03, + "global_step": 4452, + "learning_rate": 0.00048225375626043403, + "loss": 1.7644, + "loss_base2": 2.5455, + "loss_pixel": 0.189, + "loss_text": 1.5754, + "ppl": 5.8381, + "step": 4452 + }, + { + "epoch": 0.03, + "global_step": 4453, + "learning_rate": 0.00048224958263772954, + "loss": 1.7572, + "loss_base2": 2.5351, + "loss_pixel": 0.188, + "loss_text": 1.5692, + "ppl": 5.7962, + "step": 4453 + }, + { + "epoch": 0.03, + "global_step": 4454, + "learning_rate": 0.00048224540901502504, + "loss": 1.7706, + "loss_base2": 2.5544, + "loss_pixel": 0.1901, + "loss_text": 1.5804, + "ppl": 5.8744, + "step": 4454 + }, + { + "epoch": 0.03, + "global_step": 4455, + "learning_rate": 0.00048224123539232055, + "loss": 1.7395, + "loss_base2": 2.5096, + "loss_pixel": 0.19, + "loss_text": 1.5495, + "ppl": 5.6945, + "step": 4455 + }, + { + "epoch": 0.03, + "global_step": 4456, + "learning_rate": 0.000482237061769616, + "loss": 1.7564, + "loss_base2": 2.5339, + "loss_pixel": 0.188, + "loss_text": 1.5684, + "ppl": 5.7916, + "step": 4456 + }, + { + "epoch": 0.03, + "global_step": 4457, + "learning_rate": 0.0004822328881469115, + "loss": 1.7516, + "loss_base2": 2.527, + "loss_pixel": 0.1884, + "loss_text": 1.5632, + "ppl": 5.7638, + "step": 4457 + }, + { + "epoch": 0.03, + "global_step": 4458, + "learning_rate": 0.000482228714524207, + "loss": 1.7489, + "loss_base2": 2.5231, + "loss_pixel": 0.1884, + "loss_text": 1.5605, + "ppl": 5.7483, + "step": 4458 + }, + { + "epoch": 0.03, + "global_step": 4459, + "learning_rate": 0.0004822245409015025, + "loss": 1.7468, + "loss_base2": 2.5201, + "loss_pixel": 0.1874, + "loss_text": 1.5594, + "ppl": 5.7362, + "step": 4459 + }, + { + "epoch": 0.03, + "global_step": 4460, + "learning_rate": 0.00048222036727879803, + "loss": 1.745, + "loss_base2": 2.5175, + "loss_pixel": 0.1875, + "loss_text": 1.5575, + "ppl": 5.7259, + "step": 4460 + }, + { + "epoch": 0.03, + "global_step": 4461, + "learning_rate": 0.0004822161936560935, + "loss": 1.7596, + "loss_base2": 2.5386, + "loss_pixel": 0.1891, + "loss_text": 1.5705, + "ppl": 5.8101, + "step": 4461 + }, + { + "epoch": 0.03, + "global_step": 4462, + "learning_rate": 0.000482212020033389, + "loss": 1.7544, + "loss_base2": 2.5311, + "loss_pixel": 0.1891, + "loss_text": 1.5653, + "ppl": 5.78, + "step": 4462 + }, + { + "epoch": 0.03, + "global_step": 4463, + "learning_rate": 0.0004822078464106845, + "loss": 1.7559, + "loss_base2": 2.5332, + "loss_pixel": 0.1887, + "loss_text": 1.5672, + "ppl": 5.7887, + "step": 4463 + }, + { + "epoch": 0.03, + "global_step": 4464, + "learning_rate": 0.00048220367278798, + "loss": 1.7344, + "loss_base2": 2.5022, + "loss_pixel": 0.1885, + "loss_text": 1.5458, + "ppl": 5.6655, + "step": 4464 + }, + { + "epoch": 0.03, + "global_step": 4465, + "learning_rate": 0.00048219949916527546, + "loss": 1.7475, + "loss_base2": 2.5211, + "loss_pixel": 0.1866, + "loss_text": 1.5609, + "ppl": 5.7402, + "step": 4465 + }, + { + "epoch": 0.03, + "global_step": 4466, + "learning_rate": 0.00048219532554257097, + "loss": 1.7315, + "loss_base2": 2.498, + "loss_pixel": 0.1874, + "loss_text": 1.544, + "ppl": 5.6491, + "step": 4466 + }, + { + "epoch": 0.03, + "global_step": 4467, + "learning_rate": 0.0004821911519198665, + "loss": 1.7598, + "loss_base2": 2.5389, + "loss_pixel": 0.188, + "loss_text": 1.5718, + "ppl": 5.8113, + "step": 4467 + }, + { + "epoch": 0.03, + "global_step": 4468, + "learning_rate": 0.000482186978297162, + "loss": 1.7501, + "loss_base2": 2.5249, + "loss_pixel": 0.1893, + "loss_text": 1.5608, + "ppl": 5.7552, + "step": 4468 + }, + { + "epoch": 0.03, + "global_step": 4469, + "learning_rate": 0.0004821828046744575, + "loss": 1.7503, + "loss_base2": 2.5251, + "loss_pixel": 0.1882, + "loss_text": 1.5621, + "ppl": 5.7563, + "step": 4469 + }, + { + "epoch": 0.03, + "global_step": 4470, + "learning_rate": 0.0004821786310517529, + "loss": 1.7408, + "loss_base2": 2.5114, + "loss_pixel": 0.1866, + "loss_text": 1.5542, + "ppl": 5.7019, + "step": 4470 + }, + { + "epoch": 0.03, + "global_step": 4471, + "learning_rate": 0.0004821744574290484, + "loss": 1.7415, + "loss_base2": 2.5125, + "loss_pixel": 0.188, + "loss_text": 1.5534, + "ppl": 5.7059, + "step": 4471 + }, + { + "epoch": 0.03, + "global_step": 4472, + "learning_rate": 0.0004821702838063439, + "loss": 1.7464, + "loss_base2": 2.5195, + "loss_pixel": 0.1941, + "loss_text": 1.5523, + "ppl": 5.7339, + "step": 4472 + }, + { + "epoch": 0.03, + "global_step": 4473, + "learning_rate": 0.0004821661101836394, + "loss": 1.7547, + "loss_base2": 2.5315, + "loss_pixel": 0.1966, + "loss_text": 1.558, + "ppl": 5.7817, + "step": 4473 + }, + { + "epoch": 0.03, + "global_step": 4474, + "learning_rate": 0.00048216193656093486, + "loss": 1.7651, + "loss_base2": 2.5465, + "loss_pixel": 0.1958, + "loss_text": 1.5692, + "ppl": 5.8422, + "step": 4474 + }, + { + "epoch": 0.03, + "global_step": 4475, + "learning_rate": 0.00048215776293823037, + "loss": 1.758, + "loss_base2": 2.5363, + "loss_pixel": 0.188, + "loss_text": 1.5699, + "ppl": 5.8008, + "step": 4475 + }, + { + "epoch": 0.03, + "global_step": 4476, + "learning_rate": 0.0004821535893155259, + "loss": 1.737, + "loss_base2": 2.506, + "loss_pixel": 0.1894, + "loss_text": 1.5476, + "ppl": 5.6803, + "step": 4476 + }, + { + "epoch": 0.03, + "global_step": 4477, + "learning_rate": 0.0004821494156928214, + "loss": 1.7105, + "loss_base2": 2.4677, + "loss_pixel": 0.1885, + "loss_text": 1.5221, + "ppl": 5.5317, + "step": 4477 + }, + { + "epoch": 0.03, + "global_step": 4478, + "learning_rate": 0.0004821452420701169, + "loss": 1.6043, + "loss_base2": 2.3145, + "loss_pixel": 0.1898, + "loss_text": 1.4145, + "ppl": 4.9744, + "step": 4478 + }, + { + "epoch": 0.03, + "global_step": 4479, + "learning_rate": 0.00048214106844741235, + "loss": 1.5038, + "loss_base2": 2.1695, + "loss_pixel": 0.1863, + "loss_text": 1.3175, + "ppl": 4.4988, + "step": 4479 + }, + { + "epoch": 0.03, + "global_step": 4480, + "learning_rate": 0.00048213689482470785, + "loss": 1.4905, + "loss_base2": 2.1503, + "loss_pixel": 0.1873, + "loss_text": 1.3032, + "ppl": 4.4393, + "step": 4480 + }, + { + "epoch": 0.03, + "global_step": 4481, + "learning_rate": 0.00048213272120200336, + "loss": 1.5018, + "loss_base2": 2.1666, + "loss_pixel": 0.1845, + "loss_text": 1.3173, + "ppl": 4.4898, + "step": 4481 + }, + { + "epoch": 0.03, + "global_step": 4482, + "learning_rate": 0.00048212854757929887, + "loss": 1.4915, + "loss_base2": 2.1518, + "loss_pixel": 0.1867, + "loss_text": 1.3048, + "ppl": 4.4438, + "step": 4482 + }, + { + "epoch": 0.03, + "global_step": 4483, + "learning_rate": 0.0004821243739565943, + "loss": 1.4989, + "loss_base2": 2.1625, + "loss_pixel": 0.1866, + "loss_text": 1.3123, + "ppl": 4.4768, + "step": 4483 + }, + { + "epoch": 0.03, + "global_step": 4484, + "learning_rate": 0.00048212020033388983, + "loss": 1.5099, + "loss_base2": 2.1783, + "loss_pixel": 0.1843, + "loss_text": 1.3256, + "ppl": 4.5263, + "step": 4484 + }, + { + "epoch": 0.03, + "global_step": 4485, + "learning_rate": 0.00048211602671118534, + "loss": 1.4953, + "loss_base2": 2.1573, + "loss_pixel": 0.1869, + "loss_text": 1.3085, + "ppl": 4.4607, + "step": 4485 + }, + { + "epoch": 0.03, + "global_step": 4486, + "learning_rate": 0.00048211185308848084, + "loss": 1.4862, + "loss_base2": 2.1441, + "loss_pixel": 0.185, + "loss_text": 1.3012, + "ppl": 4.4203, + "step": 4486 + }, + { + "epoch": 0.03, + "global_step": 4487, + "learning_rate": 0.00048210767946577635, + "loss": 1.4933, + "loss_base2": 2.1544, + "loss_pixel": 0.1829, + "loss_text": 1.3104, + "ppl": 4.4518, + "step": 4487 + }, + { + "epoch": 0.03, + "global_step": 4488, + "learning_rate": 0.00048210350584307175, + "loss": 1.4895, + "loss_base2": 2.1489, + "loss_pixel": 0.1845, + "loss_text": 1.3051, + "ppl": 4.4349, + "step": 4488 + }, + { + "epoch": 0.03, + "global_step": 4489, + "learning_rate": 0.00048209933222036726, + "loss": 1.4852, + "loss_base2": 2.1427, + "loss_pixel": 0.1825, + "loss_text": 1.3027, + "ppl": 4.4158, + "step": 4489 + }, + { + "epoch": 0.03, + "global_step": 4490, + "learning_rate": 0.00048209515859766276, + "loss": 1.5027, + "loss_base2": 2.1679, + "loss_pixel": 0.1842, + "loss_text": 1.3184, + "ppl": 4.4938, + "step": 4490 + }, + { + "epoch": 0.03, + "global_step": 4491, + "learning_rate": 0.00048209098497495827, + "loss": 1.4981, + "loss_base2": 2.1613, + "loss_pixel": 0.1836, + "loss_text": 1.3145, + "ppl": 4.4732, + "step": 4491 + }, + { + "epoch": 0.03, + "global_step": 4492, + "learning_rate": 0.0004820868113522537, + "loss": 1.5144, + "loss_base2": 2.1848, + "loss_pixel": 0.1963, + "loss_text": 1.318, + "ppl": 4.5467, + "step": 4492 + }, + { + "epoch": 0.03, + "global_step": 4493, + "learning_rate": 0.00048208263772954923, + "loss": 1.5767, + "loss_base2": 2.2747, + "loss_pixel": 0.1999, + "loss_text": 1.3768, + "ppl": 4.839, + "step": 4493 + }, + { + "epoch": 0.03, + "global_step": 4494, + "learning_rate": 0.00048207846410684474, + "loss": 1.682, + "loss_base2": 2.4266, + "loss_pixel": 0.1975, + "loss_text": 1.4845, + "ppl": 5.3763, + "step": 4494 + }, + { + "epoch": 0.03, + "global_step": 4495, + "learning_rate": 0.00048207429048414025, + "loss": 1.6749, + "loss_base2": 2.4164, + "loss_pixel": 0.1931, + "loss_text": 1.4818, + "ppl": 5.3383, + "step": 4495 + }, + { + "epoch": 0.03, + "global_step": 4496, + "learning_rate": 0.00048207011686143575, + "loss": 1.5943, + "loss_base2": 2.3001, + "loss_pixel": 0.1915, + "loss_text": 1.4027, + "ppl": 4.9249, + "step": 4496 + }, + { + "epoch": 0.03, + "global_step": 4497, + "learning_rate": 0.0004820659432387312, + "loss": 1.5281, + "loss_base2": 2.2046, + "loss_pixel": 0.1918, + "loss_text": 1.3363, + "ppl": 4.6094, + "step": 4497 + }, + { + "epoch": 0.03, + "global_step": 4498, + "learning_rate": 0.0004820617696160267, + "loss": 1.4925, + "loss_base2": 2.1532, + "loss_pixel": 0.192, + "loss_text": 1.3004, + "ppl": 4.4482, + "step": 4498 + }, + { + "epoch": 0.03, + "global_step": 4499, + "learning_rate": 0.0004820575959933222, + "loss": 1.523, + "loss_base2": 2.1972, + "loss_pixel": 0.192, + "loss_text": 1.331, + "ppl": 4.586, + "step": 4499 + }, + { + "epoch": 0.03, + "global_step": 4500, + "learning_rate": 0.00048205342237061773, + "loss": 1.5027, + "loss_base2": 2.1679, + "loss_pixel": 0.1931, + "loss_text": 1.3096, + "ppl": 4.4938, + "step": 4500 + }, + { + "epoch": 0.03, + "global_step": 4501, + "learning_rate": 0.0004820492487479132, + "loss": 1.5146, + "loss_base2": 2.1851, + "loss_pixel": 0.1977, + "loss_text": 1.317, + "ppl": 4.5476, + "step": 4501 + }, + { + "epoch": 0.03, + "global_step": 4502, + "learning_rate": 0.0004820450751252087, + "loss": 1.5149, + "loss_base2": 2.1855, + "loss_pixel": 0.194, + "loss_text": 1.3209, + "ppl": 4.549, + "step": 4502 + }, + { + "epoch": 0.03, + "global_step": 4503, + "learning_rate": 0.0004820409015025042, + "loss": 1.5547, + "loss_base2": 2.243, + "loss_pixel": 0.1941, + "loss_text": 1.3606, + "ppl": 4.7337, + "step": 4503 + }, + { + "epoch": 0.03, + "global_step": 4504, + "learning_rate": 0.0004820367278797997, + "loss": 1.7788, + "loss_base2": 2.5663, + "loss_pixel": 0.1949, + "loss_text": 1.5839, + "ppl": 5.9227, + "step": 4504 + }, + { + "epoch": 0.03, + "global_step": 4505, + "learning_rate": 0.0004820325542570952, + "loss": 1.7949, + "loss_base2": 2.5895, + "loss_pixel": 0.1966, + "loss_text": 1.5983, + "ppl": 6.0189, + "step": 4505 + }, + { + "epoch": 0.03, + "global_step": 4506, + "learning_rate": 0.00048202838063439067, + "loss": 1.7694, + "loss_base2": 2.5527, + "loss_pixel": 0.1946, + "loss_text": 1.5747, + "ppl": 5.8673, + "step": 4506 + }, + { + "epoch": 0.03, + "global_step": 4507, + "learning_rate": 0.0004820242070116861, + "loss": 1.7834, + "loss_base2": 2.5729, + "loss_pixel": 0.2004, + "loss_text": 1.583, + "ppl": 5.9501, + "step": 4507 + }, + { + "epoch": 0.03, + "global_step": 4508, + "learning_rate": 0.0004820200333889816, + "loss": 1.7809, + "loss_base2": 2.5693, + "loss_pixel": 0.2053, + "loss_text": 1.5755, + "ppl": 5.9352, + "step": 4508 + }, + { + "epoch": 0.03, + "global_step": 4509, + "learning_rate": 0.00048201585976627713, + "loss": 1.7961, + "loss_base2": 2.5912, + "loss_pixel": 0.2057, + "loss_text": 1.5905, + "ppl": 6.0261, + "step": 4509 + }, + { + "epoch": 0.03, + "global_step": 4510, + "learning_rate": 0.00048201168614357264, + "loss": 1.7698, + "loss_base2": 2.5533, + "loss_pixel": 0.2074, + "loss_text": 1.5624, + "ppl": 5.8697, + "step": 4510 + }, + { + "epoch": 0.03, + "global_step": 4511, + "learning_rate": 0.0004820075125208681, + "loss": 1.7693, + "loss_base2": 2.5526, + "loss_pixel": 0.2009, + "loss_text": 1.5684, + "ppl": 5.8667, + "step": 4511 + }, + { + "epoch": 0.03, + "global_step": 4512, + "learning_rate": 0.0004820033388981636, + "loss": 1.7734, + "loss_base2": 2.5585, + "loss_pixel": 0.2013, + "loss_text": 1.5721, + "ppl": 5.8908, + "step": 4512 + }, + { + "epoch": 0.03, + "global_step": 4513, + "learning_rate": 0.0004819991652754591, + "loss": 1.7609, + "loss_base2": 2.5404, + "loss_pixel": 0.1983, + "loss_text": 1.5627, + "ppl": 5.8177, + "step": 4513 + }, + { + "epoch": 0.03, + "global_step": 4514, + "learning_rate": 0.0004819949916527546, + "loss": 1.7725, + "loss_base2": 2.5572, + "loss_pixel": 0.1978, + "loss_text": 1.5747, + "ppl": 5.8855, + "step": 4514 + }, + { + "epoch": 0.03, + "global_step": 4515, + "learning_rate": 0.00048199081803005007, + "loss": 1.7516, + "loss_base2": 2.527, + "loss_pixel": 0.1959, + "loss_text": 1.5557, + "ppl": 5.7638, + "step": 4515 + }, + { + "epoch": 0.03, + "global_step": 4516, + "learning_rate": 0.0004819866444073456, + "loss": 1.7644, + "loss_base2": 2.5455, + "loss_pixel": 0.1947, + "loss_text": 1.5696, + "ppl": 5.8381, + "step": 4516 + }, + { + "epoch": 0.03, + "global_step": 4517, + "learning_rate": 0.0004819824707846411, + "loss": 1.7727, + "loss_base2": 2.5575, + "loss_pixel": 0.195, + "loss_text": 1.5776, + "ppl": 5.8867, + "step": 4517 + }, + { + "epoch": 0.03, + "global_step": 4518, + "learning_rate": 0.0004819782971619366, + "loss": 1.7557, + "loss_base2": 2.5329, + "loss_pixel": 0.1949, + "loss_text": 1.5608, + "ppl": 5.7875, + "step": 4518 + }, + { + "epoch": 0.03, + "global_step": 4519, + "learning_rate": 0.0004819741235392321, + "loss": 1.8078, + "loss_base2": 2.6081, + "loss_pixel": 0.1946, + "loss_text": 1.6132, + "ppl": 6.097, + "step": 4519 + }, + { + "epoch": 0.03, + "global_step": 4520, + "learning_rate": 0.00048196994991652755, + "loss": 1.7733, + "loss_base2": 2.5583, + "loss_pixel": 0.1937, + "loss_text": 1.5796, + "ppl": 5.8903, + "step": 4520 + }, + { + "epoch": 0.03, + "global_step": 4521, + "learning_rate": 0.00048196577629382306, + "loss": 1.7564, + "loss_base2": 2.5339, + "loss_pixel": 0.1933, + "loss_text": 1.5631, + "ppl": 5.7916, + "step": 4521 + }, + { + "epoch": 0.03, + "global_step": 4522, + "learning_rate": 0.00048196160267111857, + "loss": 1.7392, + "loss_base2": 2.5091, + "loss_pixel": 0.1928, + "loss_text": 1.5464, + "ppl": 5.6928, + "step": 4522 + }, + { + "epoch": 0.03, + "global_step": 4523, + "learning_rate": 0.00048195742904841407, + "loss": 1.7635, + "loss_base2": 2.5442, + "loss_pixel": 0.1925, + "loss_text": 1.571, + "ppl": 5.8328, + "step": 4523 + }, + { + "epoch": 0.03, + "global_step": 4524, + "learning_rate": 0.0004819532554257095, + "loss": 1.7416, + "loss_base2": 2.5126, + "loss_pixel": 0.192, + "loss_text": 1.5496, + "ppl": 5.7065, + "step": 4524 + }, + { + "epoch": 0.03, + "global_step": 4525, + "learning_rate": 0.00048194908180300503, + "loss": 1.7541, + "loss_base2": 2.5306, + "loss_pixel": 0.1919, + "loss_text": 1.5621, + "ppl": 5.7782, + "step": 4525 + }, + { + "epoch": 0.03, + "global_step": 4526, + "learning_rate": 0.0004819449081803005, + "loss": 1.7517, + "loss_base2": 2.5272, + "loss_pixel": 0.192, + "loss_text": 1.5597, + "ppl": 5.7644, + "step": 4526 + }, + { + "epoch": 0.03, + "global_step": 4527, + "learning_rate": 0.000481940734557596, + "loss": 1.7412, + "loss_base2": 2.512, + "loss_pixel": 0.1899, + "loss_text": 1.5513, + "ppl": 5.7042, + "step": 4527 + }, + { + "epoch": 0.03, + "global_step": 4528, + "learning_rate": 0.0004819365609348915, + "loss": 1.7486, + "loss_base2": 2.5227, + "loss_pixel": 0.1921, + "loss_text": 1.5565, + "ppl": 5.7466, + "step": 4528 + }, + { + "epoch": 0.03, + "global_step": 4529, + "learning_rate": 0.00048193238731218695, + "loss": 1.7485, + "loss_base2": 2.5226, + "loss_pixel": 0.1887, + "loss_text": 1.5598, + "ppl": 5.746, + "step": 4529 + }, + { + "epoch": 0.03, + "global_step": 4530, + "learning_rate": 0.00048192821368948246, + "loss": 1.7436, + "loss_base2": 2.5155, + "loss_pixel": 0.1912, + "loss_text": 1.5524, + "ppl": 5.7179, + "step": 4530 + }, + { + "epoch": 0.03, + "global_step": 4531, + "learning_rate": 0.00048192404006677797, + "loss": 1.756, + "loss_base2": 2.5334, + "loss_pixel": 0.1911, + "loss_text": 1.565, + "ppl": 5.7892, + "step": 4531 + }, + { + "epoch": 0.03, + "global_step": 4532, + "learning_rate": 0.0004819198664440735, + "loss": 1.7491, + "loss_base2": 2.5234, + "loss_pixel": 0.1898, + "loss_text": 1.5593, + "ppl": 5.7494, + "step": 4532 + }, + { + "epoch": 0.03, + "global_step": 4533, + "learning_rate": 0.00048191569282136893, + "loss": 1.7547, + "loss_base2": 2.5315, + "loss_pixel": 0.1892, + "loss_text": 1.5655, + "ppl": 5.7817, + "step": 4533 + }, + { + "epoch": 0.03, + "global_step": 4534, + "learning_rate": 0.00048191151919866444, + "loss": 1.7432, + "loss_base2": 2.5149, + "loss_pixel": 0.1902, + "loss_text": 1.553, + "ppl": 5.7156, + "step": 4534 + }, + { + "epoch": 0.03, + "global_step": 4535, + "learning_rate": 0.00048190734557595994, + "loss": 1.7699, + "loss_base2": 2.5534, + "loss_pixel": 0.1889, + "loss_text": 1.581, + "ppl": 5.8703, + "step": 4535 + }, + { + "epoch": 0.03, + "global_step": 4536, + "learning_rate": 0.00048190317195325545, + "loss": 1.7639, + "loss_base2": 2.5448, + "loss_pixel": 0.191, + "loss_text": 1.5729, + "ppl": 5.8352, + "step": 4536 + }, + { + "epoch": 0.03, + "global_step": 4537, + "learning_rate": 0.00048189899833055096, + "loss": 1.7292, + "loss_base2": 2.4947, + "loss_pixel": 0.1883, + "loss_text": 1.5409, + "ppl": 5.6361, + "step": 4537 + }, + { + "epoch": 0.03, + "global_step": 4538, + "learning_rate": 0.0004818948247078464, + "loss": 1.7263, + "loss_base2": 2.4905, + "loss_pixel": 0.1872, + "loss_text": 1.5391, + "ppl": 5.6198, + "step": 4538 + }, + { + "epoch": 0.03, + "global_step": 4539, + "learning_rate": 0.0004818906510851419, + "loss": 1.7333, + "loss_base2": 2.5006, + "loss_pixel": 0.1887, + "loss_text": 1.5446, + "ppl": 5.6593, + "step": 4539 + }, + { + "epoch": 0.03, + "global_step": 4540, + "learning_rate": 0.0004818864774624374, + "loss": 1.7425, + "loss_base2": 2.5139, + "loss_pixel": 0.1886, + "loss_text": 1.554, + "ppl": 5.7116, + "step": 4540 + }, + { + "epoch": 0.03, + "global_step": 4541, + "learning_rate": 0.00048188230383973293, + "loss": 1.7507, + "loss_base2": 2.5257, + "loss_pixel": 0.1895, + "loss_text": 1.5612, + "ppl": 5.7586, + "step": 4541 + }, + { + "epoch": 0.03, + "global_step": 4542, + "learning_rate": 0.0004818781302170284, + "loss": 1.7566, + "loss_base2": 2.5342, + "loss_pixel": 0.1892, + "loss_text": 1.5675, + "ppl": 5.7927, + "step": 4542 + }, + { + "epoch": 0.03, + "global_step": 4543, + "learning_rate": 0.0004818739565943239, + "loss": 1.7382, + "loss_base2": 2.5077, + "loss_pixel": 0.1882, + "loss_text": 1.5501, + "ppl": 5.6871, + "step": 4543 + }, + { + "epoch": 0.03, + "global_step": 4544, + "learning_rate": 0.0004818697829716194, + "loss": 1.7533, + "loss_base2": 2.5295, + "loss_pixel": 0.1878, + "loss_text": 1.5655, + "ppl": 5.7736, + "step": 4544 + }, + { + "epoch": 0.03, + "global_step": 4545, + "learning_rate": 0.00048186560934891485, + "loss": 1.75, + "loss_base2": 2.5247, + "loss_pixel": 0.189, + "loss_text": 1.561, + "ppl": 5.7546, + "step": 4545 + }, + { + "epoch": 0.03, + "global_step": 4546, + "learning_rate": 0.00048186143572621036, + "loss": 1.7531, + "loss_base2": 2.5292, + "loss_pixel": 0.1873, + "loss_text": 1.5657, + "ppl": 5.7725, + "step": 4546 + }, + { + "epoch": 0.03, + "global_step": 4547, + "learning_rate": 0.0004818572621035058, + "loss": 1.7604, + "loss_base2": 2.5397, + "loss_pixel": 0.1879, + "loss_text": 1.5725, + "ppl": 5.8148, + "step": 4547 + }, + { + "epoch": 0.03, + "global_step": 4548, + "learning_rate": 0.0004818530884808013, + "loss": 1.7488, + "loss_base2": 2.523, + "loss_pixel": 0.1872, + "loss_text": 1.5616, + "ppl": 5.7477, + "step": 4548 + }, + { + "epoch": 0.03, + "global_step": 4549, + "learning_rate": 0.00048184891485809683, + "loss": 1.7367, + "loss_base2": 2.5055, + "loss_pixel": 0.1881, + "loss_text": 1.5486, + "ppl": 5.6786, + "step": 4549 + }, + { + "epoch": 0.03, + "global_step": 4550, + "learning_rate": 0.00048184474123539234, + "loss": 1.7354, + "loss_base2": 2.5037, + "loss_pixel": 0.1871, + "loss_text": 1.5483, + "ppl": 5.6712, + "step": 4550 + }, + { + "epoch": 0.03, + "global_step": 4551, + "learning_rate": 0.0004818405676126878, + "loss": 1.728, + "loss_base2": 2.493, + "loss_pixel": 0.188, + "loss_text": 1.54, + "ppl": 5.6294, + "step": 4551 + }, + { + "epoch": 0.03, + "global_step": 4552, + "learning_rate": 0.0004818363939899833, + "loss": 1.7458, + "loss_base2": 2.5187, + "loss_pixel": 0.1888, + "loss_text": 1.557, + "ppl": 5.7305, + "step": 4552 + }, + { + "epoch": 0.03, + "global_step": 4553, + "learning_rate": 0.0004818322203672788, + "loss": 1.7283, + "loss_base2": 2.4934, + "loss_pixel": 0.1867, + "loss_text": 1.5416, + "ppl": 5.6311, + "step": 4553 + }, + { + "epoch": 0.03, + "global_step": 4554, + "learning_rate": 0.0004818280467445743, + "loss": 1.5135, + "loss_base2": 2.1835, + "loss_pixel": 0.1888, + "loss_text": 1.3247, + "ppl": 4.5426, + "step": 4554 + }, + { + "epoch": 0.03, + "global_step": 4555, + "learning_rate": 0.0004818238731218698, + "loss": 1.5104, + "loss_base2": 2.179, + "loss_pixel": 0.1923, + "loss_text": 1.3181, + "ppl": 4.5285, + "step": 4555 + }, + { + "epoch": 0.03, + "global_step": 4556, + "learning_rate": 0.00048181969949916527, + "loss": 1.5222, + "loss_base2": 2.1961, + "loss_pixel": 0.1931, + "loss_text": 1.3292, + "ppl": 4.5823, + "step": 4556 + }, + { + "epoch": 0.03, + "global_step": 4557, + "learning_rate": 0.0004818155258764608, + "loss": 1.5067, + "loss_base2": 2.1737, + "loss_pixel": 0.1895, + "loss_text": 1.3171, + "ppl": 4.5118, + "step": 4557 + }, + { + "epoch": 0.03, + "global_step": 4558, + "learning_rate": 0.0004818113522537563, + "loss": 1.4828, + "loss_base2": 2.1392, + "loss_pixel": 0.1905, + "loss_text": 1.2923, + "ppl": 4.4053, + "step": 4558 + }, + { + "epoch": 0.03, + "global_step": 4559, + "learning_rate": 0.0004818071786310518, + "loss": 1.5014, + "loss_base2": 2.1661, + "loss_pixel": 0.1919, + "loss_text": 1.3095, + "ppl": 4.488, + "step": 4559 + }, + { + "epoch": 0.03, + "global_step": 4560, + "learning_rate": 0.00048180300500834725, + "loss": 1.4822, + "loss_base2": 2.1384, + "loss_pixel": 0.1919, + "loss_text": 1.2902, + "ppl": 4.4026, + "step": 4560 + }, + { + "epoch": 0.03, + "global_step": 4561, + "learning_rate": 0.00048179883138564275, + "loss": 1.6693, + "loss_base2": 2.4083, + "loss_pixel": 0.1945, + "loss_text": 1.4748, + "ppl": 5.3085, + "step": 4561 + }, + { + "epoch": 0.03, + "global_step": 4562, + "learning_rate": 0.00048179465776293826, + "loss": 1.7638, + "loss_base2": 2.5446, + "loss_pixel": 0.1926, + "loss_text": 1.5712, + "ppl": 5.8346, + "step": 4562 + }, + { + "epoch": 0.03, + "global_step": 4563, + "learning_rate": 0.00048179048414023377, + "loss": 1.766, + "loss_base2": 2.5478, + "loss_pixel": 0.192, + "loss_text": 1.574, + "ppl": 5.8474, + "step": 4563 + }, + { + "epoch": 0.03, + "global_step": 4564, + "learning_rate": 0.0004817863105175292, + "loss": 1.7418, + "loss_base2": 2.5129, + "loss_pixel": 0.1929, + "loss_text": 1.5489, + "ppl": 5.7076, + "step": 4564 + }, + { + "epoch": 0.03, + "global_step": 4565, + "learning_rate": 0.0004817821368948247, + "loss": 1.7504, + "loss_base2": 2.5253, + "loss_pixel": 0.1929, + "loss_text": 1.5575, + "ppl": 5.7569, + "step": 4565 + }, + { + "epoch": 0.03, + "global_step": 4566, + "learning_rate": 0.0004817779632721202, + "loss": 1.7415, + "loss_base2": 2.5125, + "loss_pixel": 0.1911, + "loss_text": 1.5504, + "ppl": 5.7059, + "step": 4566 + }, + { + "epoch": 0.03, + "global_step": 4567, + "learning_rate": 0.0004817737896494157, + "loss": 1.7561, + "loss_base2": 2.5335, + "loss_pixel": 0.1897, + "loss_text": 1.5664, + "ppl": 5.7898, + "step": 4567 + }, + { + "epoch": 0.03, + "global_step": 4568, + "learning_rate": 0.0004817696160267112, + "loss": 1.7763, + "loss_base2": 2.5627, + "loss_pixel": 0.1896, + "loss_text": 1.5867, + "ppl": 5.908, + "step": 4568 + }, + { + "epoch": 0.03, + "global_step": 4569, + "learning_rate": 0.0004817654424040067, + "loss": 1.7616, + "loss_base2": 2.5415, + "loss_pixel": 0.1905, + "loss_text": 1.5711, + "ppl": 5.8217, + "step": 4569 + }, + { + "epoch": 0.03, + "global_step": 4570, + "learning_rate": 0.00048176126878130216, + "loss": 1.7384, + "loss_base2": 2.508, + "loss_pixel": 0.1888, + "loss_text": 1.5496, + "ppl": 5.6882, + "step": 4570 + }, + { + "epoch": 0.03, + "global_step": 4571, + "learning_rate": 0.00048175709515859767, + "loss": 1.7568, + "loss_base2": 2.5345, + "loss_pixel": 0.1895, + "loss_text": 1.5673, + "ppl": 5.7939, + "step": 4571 + }, + { + "epoch": 0.03, + "global_step": 4572, + "learning_rate": 0.00048175292153589317, + "loss": 1.7341, + "loss_base2": 2.5018, + "loss_pixel": 0.1895, + "loss_text": 1.5446, + "ppl": 5.6638, + "step": 4572 + }, + { + "epoch": 0.03, + "global_step": 4573, + "learning_rate": 0.0004817487479131887, + "loss": 1.7402, + "loss_base2": 2.5106, + "loss_pixel": 0.189, + "loss_text": 1.5513, + "ppl": 5.6985, + "step": 4573 + }, + { + "epoch": 0.03, + "global_step": 4574, + "learning_rate": 0.00048174457429048413, + "loss": 1.74, + "loss_base2": 2.5103, + "loss_pixel": 0.1887, + "loss_text": 1.5513, + "ppl": 5.6973, + "step": 4574 + }, + { + "epoch": 0.03, + "global_step": 4575, + "learning_rate": 0.00048174040066777964, + "loss": 1.7408, + "loss_base2": 2.5114, + "loss_pixel": 0.1892, + "loss_text": 1.5515, + "ppl": 5.7019, + "step": 4575 + }, + { + "epoch": 0.03, + "global_step": 4576, + "learning_rate": 0.00048173622704507515, + "loss": 1.7357, + "loss_base2": 2.5041, + "loss_pixel": 0.1887, + "loss_text": 1.547, + "ppl": 5.6729, + "step": 4576 + }, + { + "epoch": 0.03, + "global_step": 4577, + "learning_rate": 0.00048173205342237065, + "loss": 1.7503, + "loss_base2": 2.5251, + "loss_pixel": 0.1885, + "loss_text": 1.5618, + "ppl": 5.7563, + "step": 4577 + }, + { + "epoch": 0.03, + "global_step": 4578, + "learning_rate": 0.00048172787979966616, + "loss": 1.7401, + "loss_base2": 2.5104, + "loss_pixel": 0.188, + "loss_text": 1.5521, + "ppl": 5.6979, + "step": 4578 + }, + { + "epoch": 0.03, + "global_step": 4579, + "learning_rate": 0.0004817237061769616, + "loss": 1.7497, + "loss_base2": 2.5243, + "loss_pixel": 0.188, + "loss_text": 1.5617, + "ppl": 5.7529, + "step": 4579 + }, + { + "epoch": 0.03, + "global_step": 4580, + "learning_rate": 0.0004817195325542571, + "loss": 1.741, + "loss_base2": 2.5117, + "loss_pixel": 0.1872, + "loss_text": 1.5538, + "ppl": 5.703, + "step": 4580 + }, + { + "epoch": 0.03, + "global_step": 4581, + "learning_rate": 0.00048171535893155263, + "loss": 1.7386, + "loss_base2": 2.5083, + "loss_pixel": 0.1887, + "loss_text": 1.5499, + "ppl": 5.6894, + "step": 4581 + }, + { + "epoch": 0.03, + "global_step": 4582, + "learning_rate": 0.0004817111853088481, + "loss": 1.7314, + "loss_base2": 2.4979, + "loss_pixel": 0.1882, + "loss_text": 1.5431, + "ppl": 5.6486, + "step": 4582 + }, + { + "epoch": 0.03, + "global_step": 4583, + "learning_rate": 0.00048170701168614354, + "loss": 1.6802, + "loss_base2": 2.424, + "loss_pixel": 0.1883, + "loss_text": 1.4919, + "ppl": 5.3666, + "step": 4583 + }, + { + "epoch": 0.03, + "global_step": 4584, + "learning_rate": 0.00048170283806343904, + "loss": 1.7437, + "loss_base2": 2.5156, + "loss_pixel": 0.1875, + "loss_text": 1.5561, + "ppl": 5.7185, + "step": 4584 + }, + { + "epoch": 0.03, + "global_step": 4585, + "learning_rate": 0.00048169866444073455, + "loss": 1.7567, + "loss_base2": 2.5344, + "loss_pixel": 0.1881, + "loss_text": 1.5686, + "ppl": 5.7933, + "step": 4585 + }, + { + "epoch": 0.03, + "global_step": 4586, + "learning_rate": 0.00048169449081803006, + "loss": 1.7361, + "loss_base2": 2.5047, + "loss_pixel": 0.1877, + "loss_text": 1.5483, + "ppl": 5.6752, + "step": 4586 + }, + { + "epoch": 0.03, + "global_step": 4587, + "learning_rate": 0.00048169031719532557, + "loss": 1.7237, + "loss_base2": 2.4868, + "loss_pixel": 0.1864, + "loss_text": 1.5372, + "ppl": 5.6052, + "step": 4587 + }, + { + "epoch": 0.03, + "global_step": 4588, + "learning_rate": 0.000481686143572621, + "loss": 1.7651, + "loss_base2": 2.5465, + "loss_pixel": 0.1876, + "loss_text": 1.5775, + "ppl": 5.8422, + "step": 4588 + }, + { + "epoch": 0.03, + "global_step": 4589, + "learning_rate": 0.0004816819699499165, + "loss": 1.7472, + "loss_base2": 2.5207, + "loss_pixel": 0.1869, + "loss_text": 1.5603, + "ppl": 5.7385, + "step": 4589 + }, + { + "epoch": 0.03, + "global_step": 4590, + "learning_rate": 0.00048167779632721203, + "loss": 1.7415, + "loss_base2": 2.5125, + "loss_pixel": 0.188, + "loss_text": 1.5535, + "ppl": 5.7059, + "step": 4590 + }, + { + "epoch": 0.03, + "global_step": 4591, + "learning_rate": 0.00048167362270450754, + "loss": 1.7361, + "loss_base2": 2.5047, + "loss_pixel": 0.1874, + "loss_text": 1.5487, + "ppl": 5.6752, + "step": 4591 + }, + { + "epoch": 0.03, + "global_step": 4592, + "learning_rate": 0.000481669449081803, + "loss": 1.7308, + "loss_base2": 2.497, + "loss_pixel": 0.187, + "loss_text": 1.5438, + "ppl": 5.6452, + "step": 4592 + }, + { + "epoch": 0.03, + "global_step": 4593, + "learning_rate": 0.0004816652754590985, + "loss": 1.7404, + "loss_base2": 2.5109, + "loss_pixel": 0.1869, + "loss_text": 1.5535, + "ppl": 5.6996, + "step": 4593 + }, + { + "epoch": 0.03, + "global_step": 4594, + "learning_rate": 0.000481661101836394, + "loss": 1.748, + "loss_base2": 2.5218, + "loss_pixel": 0.1875, + "loss_text": 1.5605, + "ppl": 5.7431, + "step": 4594 + }, + { + "epoch": 0.03, + "global_step": 4595, + "learning_rate": 0.0004816569282136895, + "loss": 1.7418, + "loss_base2": 2.5129, + "loss_pixel": 0.1859, + "loss_text": 1.5559, + "ppl": 5.7076, + "step": 4595 + }, + { + "epoch": 0.03, + "global_step": 4596, + "learning_rate": 0.000481652754590985, + "loss": 1.7501, + "loss_base2": 2.5249, + "loss_pixel": 0.1877, + "loss_text": 1.5624, + "ppl": 5.7552, + "step": 4596 + }, + { + "epoch": 0.03, + "global_step": 4597, + "learning_rate": 0.0004816485809682805, + "loss": 1.7489, + "loss_base2": 2.5231, + "loss_pixel": 0.188, + "loss_text": 1.5608, + "ppl": 5.7483, + "step": 4597 + }, + { + "epoch": 0.03, + "global_step": 4598, + "learning_rate": 0.000481644407345576, + "loss": 1.7468, + "loss_base2": 2.5201, + "loss_pixel": 0.1859, + "loss_text": 1.5609, + "ppl": 5.7362, + "step": 4598 + }, + { + "epoch": 0.03, + "global_step": 4599, + "learning_rate": 0.0004816402337228715, + "loss": 1.7291, + "loss_base2": 2.4946, + "loss_pixel": 0.1872, + "loss_text": 1.5418, + "ppl": 5.6356, + "step": 4599 + }, + { + "epoch": 0.03, + "global_step": 4600, + "learning_rate": 0.000481636060100167, + "loss": 1.7244, + "loss_base2": 2.4878, + "loss_pixel": 0.1865, + "loss_text": 1.5379, + "ppl": 5.6092, + "step": 4600 + }, + { + "epoch": 0.03, + "global_step": 4601, + "learning_rate": 0.0004816318864774624, + "loss": 1.7466, + "loss_base2": 2.5198, + "loss_pixel": 0.1878, + "loss_text": 1.5588, + "ppl": 5.7351, + "step": 4601 + }, + { + "epoch": 0.03, + "global_step": 4602, + "learning_rate": 0.0004816277128547579, + "loss": 1.7073, + "loss_base2": 2.4631, + "loss_pixel": 0.1873, + "loss_text": 1.52, + "ppl": 5.5141, + "step": 4602 + }, + { + "epoch": 0.03, + "global_step": 4603, + "learning_rate": 0.0004816235392320534, + "loss": 1.7486, + "loss_base2": 2.5227, + "loss_pixel": 0.1865, + "loss_text": 1.5621, + "ppl": 5.7466, + "step": 4603 + }, + { + "epoch": 0.03, + "global_step": 4604, + "learning_rate": 0.0004816193656093489, + "loss": 1.7521, + "loss_base2": 2.5277, + "loss_pixel": 0.1899, + "loss_text": 1.5622, + "ppl": 5.7667, + "step": 4604 + }, + { + "epoch": 0.03, + "global_step": 4605, + "learning_rate": 0.0004816151919866444, + "loss": 1.7105, + "loss_base2": 2.4677, + "loss_pixel": 0.1869, + "loss_text": 1.5236, + "ppl": 5.5317, + "step": 4605 + }, + { + "epoch": 0.03, + "global_step": 4606, + "learning_rate": 0.0004816110183639399, + "loss": 1.7507, + "loss_base2": 2.5257, + "loss_pixel": 0.1875, + "loss_text": 1.5632, + "ppl": 5.7586, + "step": 4606 + }, + { + "epoch": 0.03, + "global_step": 4607, + "learning_rate": 0.0004816068447412354, + "loss": 1.7441, + "loss_base2": 2.5162, + "loss_pixel": 0.1868, + "loss_text": 1.5573, + "ppl": 5.7208, + "step": 4607 + }, + { + "epoch": 0.03, + "global_step": 4608, + "learning_rate": 0.0004816026711185309, + "loss": 1.7194, + "loss_base2": 2.4806, + "loss_pixel": 0.1861, + "loss_text": 1.5333, + "ppl": 5.5812, + "step": 4608 + }, + { + "epoch": 0.03, + "global_step": 4609, + "learning_rate": 0.0004815984974958264, + "loss": 1.7441, + "loss_base2": 2.5162, + "loss_pixel": 0.185, + "loss_text": 1.5591, + "ppl": 5.7208, + "step": 4609 + }, + { + "epoch": 0.03, + "global_step": 4610, + "learning_rate": 0.00048159432387312185, + "loss": 1.7285, + "loss_base2": 2.4937, + "loss_pixel": 0.1855, + "loss_text": 1.543, + "ppl": 5.6322, + "step": 4610 + }, + { + "epoch": 0.03, + "global_step": 4611, + "learning_rate": 0.00048159015025041736, + "loss": 1.7407, + "loss_base2": 2.5113, + "loss_pixel": 0.1875, + "loss_text": 1.5532, + "ppl": 5.7013, + "step": 4611 + }, + { + "epoch": 0.03, + "global_step": 4612, + "learning_rate": 0.00048158597662771287, + "loss": 1.7278, + "loss_base2": 2.4927, + "loss_pixel": 0.1884, + "loss_text": 1.5394, + "ppl": 5.6283, + "step": 4612 + }, + { + "epoch": 0.03, + "global_step": 4613, + "learning_rate": 0.0004815818030050084, + "loss": 1.7284, + "loss_base2": 2.4936, + "loss_pixel": 0.1859, + "loss_text": 1.5426, + "ppl": 5.6316, + "step": 4613 + }, + { + "epoch": 0.03, + "global_step": 4614, + "learning_rate": 0.0004815776293823039, + "loss": 1.7354, + "loss_base2": 2.5037, + "loss_pixel": 0.1855, + "loss_text": 1.5499, + "ppl": 5.6712, + "step": 4614 + }, + { + "epoch": 0.03, + "global_step": 4615, + "learning_rate": 0.00048157345575959934, + "loss": 1.7311, + "loss_base2": 2.4974, + "loss_pixel": 0.1873, + "loss_text": 1.5439, + "ppl": 5.6469, + "step": 4615 + }, + { + "epoch": 0.03, + "global_step": 4616, + "learning_rate": 0.00048156928213689484, + "loss": 1.7573, + "loss_base2": 2.5352, + "loss_pixel": 0.1867, + "loss_text": 1.5706, + "ppl": 5.7968, + "step": 4616 + }, + { + "epoch": 0.03, + "global_step": 4617, + "learning_rate": 0.00048156510851419035, + "loss": 1.7358, + "loss_base2": 2.5042, + "loss_pixel": 0.1866, + "loss_text": 1.5492, + "ppl": 5.6735, + "step": 4617 + }, + { + "epoch": 0.03, + "global_step": 4618, + "learning_rate": 0.00048156093489148586, + "loss": 1.7369, + "loss_base2": 2.5058, + "loss_pixel": 0.1866, + "loss_text": 1.5503, + "ppl": 5.6797, + "step": 4618 + }, + { + "epoch": 0.03, + "global_step": 4619, + "learning_rate": 0.0004815567612687813, + "loss": 1.7235, + "loss_base2": 2.4865, + "loss_pixel": 0.1865, + "loss_text": 1.537, + "ppl": 5.6041, + "step": 4619 + }, + { + "epoch": 0.03, + "global_step": 4620, + "learning_rate": 0.00048155258764607676, + "loss": 1.7392, + "loss_base2": 2.5091, + "loss_pixel": 0.1859, + "loss_text": 1.5532, + "ppl": 5.6928, + "step": 4620 + }, + { + "epoch": 0.03, + "global_step": 4621, + "learning_rate": 0.00048154841402337227, + "loss": 1.7496, + "loss_base2": 2.5241, + "loss_pixel": 0.1862, + "loss_text": 1.5635, + "ppl": 5.7523, + "step": 4621 + }, + { + "epoch": 0.03, + "global_step": 4622, + "learning_rate": 0.0004815442404006678, + "loss": 1.7479, + "loss_base2": 2.5217, + "loss_pixel": 0.1864, + "loss_text": 1.5616, + "ppl": 5.7425, + "step": 4622 + }, + { + "epoch": 0.03, + "global_step": 4623, + "learning_rate": 0.0004815400667779633, + "loss": 1.7269, + "loss_base2": 2.4914, + "loss_pixel": 0.1862, + "loss_text": 1.5407, + "ppl": 5.6232, + "step": 4623 + }, + { + "epoch": 0.03, + "global_step": 4624, + "learning_rate": 0.00048153589315525874, + "loss": 1.7297, + "loss_base2": 2.4954, + "loss_pixel": 0.1857, + "loss_text": 1.544, + "ppl": 5.639, + "step": 4624 + }, + { + "epoch": 0.03, + "global_step": 4625, + "learning_rate": 0.00048153171953255425, + "loss": 1.7433, + "loss_base2": 2.5151, + "loss_pixel": 0.1858, + "loss_text": 1.5575, + "ppl": 5.7162, + "step": 4625 + }, + { + "epoch": 0.03, + "global_step": 4626, + "learning_rate": 0.00048152754590984975, + "loss": 1.7381, + "loss_base2": 2.5075, + "loss_pixel": 0.1873, + "loss_text": 1.5508, + "ppl": 5.6865, + "step": 4626 + }, + { + "epoch": 0.03, + "global_step": 4627, + "learning_rate": 0.00048152337228714526, + "loss": 1.7318, + "loss_base2": 2.4985, + "loss_pixel": 0.1865, + "loss_text": 1.5453, + "ppl": 5.6508, + "step": 4627 + }, + { + "epoch": 0.03, + "global_step": 4628, + "learning_rate": 0.00048151919866444077, + "loss": 1.7326, + "loss_base2": 2.4996, + "loss_pixel": 0.1878, + "loss_text": 1.5448, + "ppl": 5.6553, + "step": 4628 + }, + { + "epoch": 0.03, + "global_step": 4629, + "learning_rate": 0.0004815150250417362, + "loss": 1.7459, + "loss_base2": 2.5188, + "loss_pixel": 0.1852, + "loss_text": 1.5607, + "ppl": 5.7311, + "step": 4629 + }, + { + "epoch": 0.03, + "global_step": 4630, + "learning_rate": 0.00048151085141903173, + "loss": 1.7231, + "loss_base2": 2.4859, + "loss_pixel": 0.1856, + "loss_text": 1.5375, + "ppl": 5.6019, + "step": 4630 + }, + { + "epoch": 0.03, + "global_step": 4631, + "learning_rate": 0.00048150667779632724, + "loss": 1.7356, + "loss_base2": 2.5039, + "loss_pixel": 0.1857, + "loss_text": 1.5499, + "ppl": 5.6723, + "step": 4631 + }, + { + "epoch": 0.03, + "global_step": 4632, + "learning_rate": 0.00048150250417362274, + "loss": 1.7406, + "loss_base2": 2.5112, + "loss_pixel": 0.1857, + "loss_text": 1.5549, + "ppl": 5.7008, + "step": 4632 + }, + { + "epoch": 0.03, + "global_step": 4633, + "learning_rate": 0.0004814983305509182, + "loss": 1.7522, + "loss_base2": 2.5279, + "loss_pixel": 0.1952, + "loss_text": 1.5571, + "ppl": 5.7673, + "step": 4633 + }, + { + "epoch": 0.03, + "global_step": 4634, + "learning_rate": 0.0004814941569282137, + "loss": 1.7497, + "loss_base2": 2.5243, + "loss_pixel": 0.1971, + "loss_text": 1.5527, + "ppl": 5.7529, + "step": 4634 + }, + { + "epoch": 0.03, + "global_step": 4635, + "learning_rate": 0.0004814899833055092, + "loss": 1.7376, + "loss_base2": 2.5068, + "loss_pixel": 0.1946, + "loss_text": 1.543, + "ppl": 5.6837, + "step": 4635 + }, + { + "epoch": 0.03, + "global_step": 4636, + "learning_rate": 0.0004814858096828047, + "loss": 1.7426, + "loss_base2": 2.514, + "loss_pixel": 0.1939, + "loss_text": 1.5487, + "ppl": 5.7122, + "step": 4636 + }, + { + "epoch": 0.03, + "global_step": 4637, + "learning_rate": 0.0004814816360601002, + "loss": 1.7422, + "loss_base2": 2.5135, + "loss_pixel": 0.1931, + "loss_text": 1.5491, + "ppl": 5.7099, + "step": 4637 + }, + { + "epoch": 0.03, + "global_step": 4638, + "learning_rate": 0.0004814774624373956, + "loss": 1.7356, + "loss_base2": 2.5039, + "loss_pixel": 0.1894, + "loss_text": 1.5462, + "ppl": 5.6723, + "step": 4638 + }, + { + "epoch": 0.03, + "global_step": 4639, + "learning_rate": 0.00048147328881469113, + "loss": 1.743, + "loss_base2": 2.5146, + "loss_pixel": 0.1872, + "loss_text": 1.5558, + "ppl": 5.7145, + "step": 4639 + }, + { + "epoch": 0.03, + "global_step": 4640, + "learning_rate": 0.00048146911519198664, + "loss": 1.7288, + "loss_base2": 2.4941, + "loss_pixel": 0.1886, + "loss_text": 1.5402, + "ppl": 5.6339, + "step": 4640 + }, + { + "epoch": 0.03, + "global_step": 4641, + "learning_rate": 0.00048146494156928215, + "loss": 1.7284, + "loss_base2": 2.4936, + "loss_pixel": 0.1864, + "loss_text": 1.542, + "ppl": 5.6316, + "step": 4641 + }, + { + "epoch": 0.03, + "global_step": 4642, + "learning_rate": 0.0004814607679465776, + "loss": 1.7131, + "loss_base2": 2.4715, + "loss_pixel": 0.1865, + "loss_text": 1.5267, + "ppl": 5.5461, + "step": 4642 + }, + { + "epoch": 0.03, + "global_step": 4643, + "learning_rate": 0.0004814565943238731, + "loss": 1.7294, + "loss_base2": 2.495, + "loss_pixel": 0.1871, + "loss_text": 1.5423, + "ppl": 5.6373, + "step": 4643 + }, + { + "epoch": 0.03, + "global_step": 4644, + "learning_rate": 0.0004814524207011686, + "loss": 1.7203, + "loss_base2": 2.4819, + "loss_pixel": 0.1869, + "loss_text": 1.5334, + "ppl": 5.5862, + "step": 4644 + }, + { + "epoch": 0.03, + "global_step": 4645, + "learning_rate": 0.0004814482470784641, + "loss": 1.7251, + "loss_base2": 2.4888, + "loss_pixel": 0.1856, + "loss_text": 1.5395, + "ppl": 5.6131, + "step": 4645 + }, + { + "epoch": 0.03, + "global_step": 4646, + "learning_rate": 0.00048144407345575963, + "loss": 1.73, + "loss_base2": 2.4959, + "loss_pixel": 0.185, + "loss_text": 1.5451, + "ppl": 5.6407, + "step": 4646 + }, + { + "epoch": 0.03, + "global_step": 4647, + "learning_rate": 0.0004814398998330551, + "loss": 1.7183, + "loss_base2": 2.479, + "loss_pixel": 0.1843, + "loss_text": 1.534, + "ppl": 5.575, + "step": 4647 + }, + { + "epoch": 0.03, + "global_step": 4648, + "learning_rate": 0.0004814357262103506, + "loss": 1.7235, + "loss_base2": 2.4865, + "loss_pixel": 0.1854, + "loss_text": 1.5381, + "ppl": 5.6041, + "step": 4648 + }, + { + "epoch": 0.03, + "global_step": 4649, + "learning_rate": 0.0004814315525876461, + "loss": 1.7208, + "loss_base2": 2.4826, + "loss_pixel": 0.1862, + "loss_text": 1.5346, + "ppl": 5.589, + "step": 4649 + }, + { + "epoch": 0.03, + "global_step": 4650, + "learning_rate": 0.0004814273789649416, + "loss": 1.6644, + "loss_base2": 2.4012, + "loss_pixel": 0.1876, + "loss_text": 1.4768, + "ppl": 5.2825, + "step": 4650 + }, + { + "epoch": 0.03, + "global_step": 4651, + "learning_rate": 0.00048142320534223706, + "loss": 1.6855, + "loss_base2": 2.4317, + "loss_pixel": 0.1857, + "loss_text": 1.4998, + "ppl": 5.3951, + "step": 4651 + }, + { + "epoch": 0.03, + "global_step": 4652, + "learning_rate": 0.00048141903171953257, + "loss": 1.7368, + "loss_base2": 2.5057, + "loss_pixel": 0.1855, + "loss_text": 1.5513, + "ppl": 5.6791, + "step": 4652 + }, + { + "epoch": 0.03, + "global_step": 4653, + "learning_rate": 0.00048141485809682807, + "loss": 1.7293, + "loss_base2": 2.4949, + "loss_pixel": 0.1867, + "loss_text": 1.5426, + "ppl": 5.6367, + "step": 4653 + }, + { + "epoch": 0.03, + "global_step": 4654, + "learning_rate": 0.0004814106844741236, + "loss": 1.7467, + "loss_base2": 2.52, + "loss_pixel": 0.1851, + "loss_text": 1.5616, + "ppl": 5.7356, + "step": 4654 + }, + { + "epoch": 0.03, + "global_step": 4655, + "learning_rate": 0.0004814065108514191, + "loss": 1.7445, + "loss_base2": 2.5168, + "loss_pixel": 0.1852, + "loss_text": 1.5593, + "ppl": 5.723, + "step": 4655 + }, + { + "epoch": 0.03, + "global_step": 4656, + "learning_rate": 0.00048140233722871454, + "loss": 1.7408, + "loss_base2": 2.5114, + "loss_pixel": 0.1851, + "loss_text": 1.5557, + "ppl": 5.7019, + "step": 4656 + }, + { + "epoch": 0.03, + "global_step": 4657, + "learning_rate": 0.00048139816360601, + "loss": 1.7397, + "loss_base2": 2.5099, + "loss_pixel": 0.1869, + "loss_text": 1.5528, + "ppl": 5.6956, + "step": 4657 + }, + { + "epoch": 0.03, + "global_step": 4658, + "learning_rate": 0.0004813939899833055, + "loss": 1.748, + "loss_base2": 2.5218, + "loss_pixel": 0.1859, + "loss_text": 1.5621, + "ppl": 5.7431, + "step": 4658 + }, + { + "epoch": 0.03, + "global_step": 4659, + "learning_rate": 0.000481389816360601, + "loss": 1.7487, + "loss_base2": 2.5228, + "loss_pixel": 0.1869, + "loss_text": 1.5618, + "ppl": 5.7471, + "step": 4659 + }, + { + "epoch": 0.03, + "global_step": 4660, + "learning_rate": 0.00048138564273789646, + "loss": 1.7452, + "loss_base2": 2.5178, + "loss_pixel": 0.1869, + "loss_text": 1.5583, + "ppl": 5.727, + "step": 4660 + }, + { + "epoch": 0.03, + "global_step": 4661, + "learning_rate": 0.00048138146911519197, + "loss": 1.7419, + "loss_base2": 2.513, + "loss_pixel": 0.1861, + "loss_text": 1.5558, + "ppl": 5.7082, + "step": 4661 + }, + { + "epoch": 0.03, + "global_step": 4662, + "learning_rate": 0.0004813772954924875, + "loss": 1.7477, + "loss_base2": 2.5214, + "loss_pixel": 0.1857, + "loss_text": 1.562, + "ppl": 5.7414, + "step": 4662 + }, + { + "epoch": 0.03, + "global_step": 4663, + "learning_rate": 0.000481373121869783, + "loss": 1.7501, + "loss_base2": 2.5249, + "loss_pixel": 0.1853, + "loss_text": 1.5649, + "ppl": 5.7552, + "step": 4663 + }, + { + "epoch": 0.03, + "global_step": 4664, + "learning_rate": 0.0004813689482470785, + "loss": 1.7224, + "loss_base2": 2.4849, + "loss_pixel": 0.1864, + "loss_text": 1.536, + "ppl": 5.5979, + "step": 4664 + }, + { + "epoch": 0.03, + "global_step": 4665, + "learning_rate": 0.00048136477462437394, + "loss": 1.7411, + "loss_base2": 2.5119, + "loss_pixel": 0.1864, + "loss_text": 1.5547, + "ppl": 5.7036, + "step": 4665 + }, + { + "epoch": 0.03, + "global_step": 4666, + "learning_rate": 0.00048136060100166945, + "loss": 1.7262, + "loss_base2": 2.4904, + "loss_pixel": 0.185, + "loss_text": 1.5412, + "ppl": 5.6193, + "step": 4666 + }, + { + "epoch": 0.03, + "global_step": 4667, + "learning_rate": 0.00048135642737896496, + "loss": 1.7341, + "loss_base2": 2.5018, + "loss_pixel": 0.1853, + "loss_text": 1.5488, + "ppl": 5.6638, + "step": 4667 + }, + { + "epoch": 0.03, + "global_step": 4668, + "learning_rate": 0.00048135225375626047, + "loss": 1.7164, + "loss_base2": 2.4762, + "loss_pixel": 0.1868, + "loss_text": 1.5296, + "ppl": 5.5645, + "step": 4668 + }, + { + "epoch": 0.03, + "global_step": 4669, + "learning_rate": 0.0004813480801335559, + "loss": 1.738, + "loss_base2": 2.5074, + "loss_pixel": 0.1865, + "loss_text": 1.5515, + "ppl": 5.686, + "step": 4669 + }, + { + "epoch": 0.03, + "global_step": 4670, + "learning_rate": 0.0004813439065108514, + "loss": 1.7406, + "loss_base2": 2.5112, + "loss_pixel": 0.1856, + "loss_text": 1.555, + "ppl": 5.7008, + "step": 4670 + }, + { + "epoch": 0.03, + "global_step": 4671, + "learning_rate": 0.00048133973288814693, + "loss": 1.7338, + "loss_base2": 2.5013, + "loss_pixel": 0.1892, + "loss_text": 1.5447, + "ppl": 5.6621, + "step": 4671 + }, + { + "epoch": 0.03, + "global_step": 4672, + "learning_rate": 0.00048133555926544244, + "loss": 1.7461, + "loss_base2": 2.5191, + "loss_pixel": 0.1857, + "loss_text": 1.5604, + "ppl": 5.7322, + "step": 4672 + }, + { + "epoch": 0.03, + "global_step": 4673, + "learning_rate": 0.00048133138564273795, + "loss": 1.7225, + "loss_base2": 2.485, + "loss_pixel": 0.1862, + "loss_text": 1.5364, + "ppl": 5.5985, + "step": 4673 + }, + { + "epoch": 0.03, + "global_step": 4674, + "learning_rate": 0.0004813272120200334, + "loss": 1.6829, + "loss_base2": 2.4279, + "loss_pixel": 0.1861, + "loss_text": 1.4968, + "ppl": 5.3811, + "step": 4674 + }, + { + "epoch": 0.03, + "global_step": 4675, + "learning_rate": 0.0004813230383973289, + "loss": 1.5966, + "loss_base2": 2.3034, + "loss_pixel": 0.1855, + "loss_text": 1.4111, + "ppl": 4.9362, + "step": 4675 + }, + { + "epoch": 0.03, + "global_step": 4676, + "learning_rate": 0.00048131886477462436, + "loss": 1.5103, + "loss_base2": 2.1789, + "loss_pixel": 0.1862, + "loss_text": 1.324, + "ppl": 4.5281, + "step": 4676 + }, + { + "epoch": 0.03, + "global_step": 4677, + "learning_rate": 0.00048131469115191987, + "loss": 1.5055, + "loss_base2": 2.172, + "loss_pixel": 0.1857, + "loss_text": 1.3198, + "ppl": 4.5064, + "step": 4677 + }, + { + "epoch": 0.03, + "global_step": 4678, + "learning_rate": 0.0004813105175292153, + "loss": 1.4942, + "loss_base2": 2.1557, + "loss_pixel": 0.1857, + "loss_text": 1.3085, + "ppl": 4.4558, + "step": 4678 + }, + { + "epoch": 0.03, + "global_step": 4679, + "learning_rate": 0.00048130634390651083, + "loss": 1.4967, + "loss_base2": 2.1593, + "loss_pixel": 0.1854, + "loss_text": 1.3113, + "ppl": 4.4669, + "step": 4679 + }, + { + "epoch": 0.03, + "global_step": 4680, + "learning_rate": 0.00048130217028380634, + "loss": 1.5055, + "loss_base2": 2.172, + "loss_pixel": 0.1862, + "loss_text": 1.3194, + "ppl": 4.5064, + "step": 4680 + }, + { + "epoch": 0.03, + "global_step": 4681, + "learning_rate": 0.00048129799666110184, + "loss": 1.5069, + "loss_base2": 2.174, + "loss_pixel": 0.1879, + "loss_text": 1.3191, + "ppl": 4.5127, + "step": 4681 + }, + { + "epoch": 0.03, + "global_step": 4682, + "learning_rate": 0.00048129382303839735, + "loss": 1.4979, + "loss_base2": 2.161, + "loss_pixel": 0.1855, + "loss_text": 1.3124, + "ppl": 4.4723, + "step": 4682 + }, + { + "epoch": 0.03, + "global_step": 4683, + "learning_rate": 0.0004812896494156928, + "loss": 1.5031, + "loss_base2": 2.1685, + "loss_pixel": 0.1855, + "loss_text": 1.3176, + "ppl": 4.4956, + "step": 4683 + }, + { + "epoch": 0.03, + "global_step": 4684, + "learning_rate": 0.0004812854757929883, + "loss": 1.7148, + "loss_base2": 2.4739, + "loss_pixel": 0.1848, + "loss_text": 1.53, + "ppl": 5.5556, + "step": 4684 + }, + { + "epoch": 0.03, + "global_step": 4685, + "learning_rate": 0.0004812813021702838, + "loss": 1.7607, + "loss_base2": 2.5402, + "loss_pixel": 0.1861, + "loss_text": 1.5746, + "ppl": 5.8165, + "step": 4685 + }, + { + "epoch": 0.03, + "global_step": 4686, + "learning_rate": 0.0004812771285475793, + "loss": 1.7513, + "loss_base2": 2.5266, + "loss_pixel": 0.1852, + "loss_text": 1.5661, + "ppl": 5.7621, + "step": 4686 + }, + { + "epoch": 0.03, + "global_step": 4687, + "learning_rate": 0.00048127295492487483, + "loss": 1.7536, + "loss_base2": 2.5299, + "loss_pixel": 0.1867, + "loss_text": 1.5669, + "ppl": 5.7754, + "step": 4687 + }, + { + "epoch": 0.03, + "global_step": 4688, + "learning_rate": 0.0004812687813021703, + "loss": 1.7359, + "loss_base2": 2.5044, + "loss_pixel": 0.1864, + "loss_text": 1.5495, + "ppl": 5.674, + "step": 4688 + }, + { + "epoch": 0.03, + "global_step": 4689, + "learning_rate": 0.0004812646076794658, + "loss": 1.7488, + "loss_base2": 2.523, + "loss_pixel": 0.1854, + "loss_text": 1.5634, + "ppl": 5.7477, + "step": 4689 + }, + { + "epoch": 0.03, + "global_step": 4690, + "learning_rate": 0.0004812604340567613, + "loss": 1.7484, + "loss_base2": 2.5224, + "loss_pixel": 0.184, + "loss_text": 1.5643, + "ppl": 5.7454, + "step": 4690 + }, + { + "epoch": 0.03, + "global_step": 4691, + "learning_rate": 0.0004812562604340568, + "loss": 1.7398, + "loss_base2": 2.51, + "loss_pixel": 0.1846, + "loss_text": 1.5552, + "ppl": 5.6962, + "step": 4691 + }, + { + "epoch": 0.03, + "global_step": 4692, + "learning_rate": 0.00048125208681135226, + "loss": 1.7442, + "loss_base2": 2.5163, + "loss_pixel": 0.1853, + "loss_text": 1.5588, + "ppl": 5.7213, + "step": 4692 + }, + { + "epoch": 0.03, + "global_step": 4693, + "learning_rate": 0.00048124791318864777, + "loss": 1.7399, + "loss_base2": 2.5101, + "loss_pixel": 0.1869, + "loss_text": 1.553, + "ppl": 5.6968, + "step": 4693 + }, + { + "epoch": 0.03, + "global_step": 4694, + "learning_rate": 0.0004812437395659433, + "loss": 1.7456, + "loss_base2": 2.5184, + "loss_pixel": 0.1841, + "loss_text": 1.5615, + "ppl": 5.7293, + "step": 4694 + }, + { + "epoch": 0.03, + "global_step": 4695, + "learning_rate": 0.00048123956594323873, + "loss": 1.7398, + "loss_base2": 2.51, + "loss_pixel": 0.1851, + "loss_text": 1.5547, + "ppl": 5.6962, + "step": 4695 + }, + { + "epoch": 0.03, + "global_step": 4696, + "learning_rate": 0.00048123539232053424, + "loss": 1.7504, + "loss_base2": 2.5253, + "loss_pixel": 0.1848, + "loss_text": 1.5656, + "ppl": 5.7569, + "step": 4696 + }, + { + "epoch": 0.03, + "global_step": 4697, + "learning_rate": 0.0004812312186978297, + "loss": 1.7347, + "loss_base2": 2.5026, + "loss_pixel": 0.1831, + "loss_text": 1.5516, + "ppl": 5.6672, + "step": 4697 + }, + { + "epoch": 0.03, + "global_step": 4698, + "learning_rate": 0.0004812270450751252, + "loss": 1.7324, + "loss_base2": 2.4993, + "loss_pixel": 0.1839, + "loss_text": 1.5485, + "ppl": 5.6542, + "step": 4698 + }, + { + "epoch": 0.03, + "global_step": 4699, + "learning_rate": 0.0004812228714524207, + "loss": 1.7465, + "loss_base2": 2.5197, + "loss_pixel": 0.1838, + "loss_text": 1.5628, + "ppl": 5.7345, + "step": 4699 + }, + { + "epoch": 0.03, + "global_step": 4700, + "learning_rate": 0.0004812186978297162, + "loss": 1.7406, + "loss_base2": 2.5112, + "loss_pixel": 0.1852, + "loss_text": 1.5554, + "ppl": 5.7008, + "step": 4700 + }, + { + "epoch": 0.03, + "global_step": 4701, + "learning_rate": 0.00048121452420701167, + "loss": 1.7563, + "loss_base2": 2.5338, + "loss_pixel": 0.1856, + "loss_text": 1.5707, + "ppl": 5.791, + "step": 4701 + }, + { + "epoch": 0.03, + "global_step": 4702, + "learning_rate": 0.00048121035058430717, + "loss": 1.7222, + "loss_base2": 2.4846, + "loss_pixel": 0.1846, + "loss_text": 1.5376, + "ppl": 5.5968, + "step": 4702 + }, + { + "epoch": 0.03, + "global_step": 4703, + "learning_rate": 0.0004812061769616027, + "loss": 1.7417, + "loss_base2": 2.5127, + "loss_pixel": 0.184, + "loss_text": 1.5577, + "ppl": 5.707, + "step": 4703 + }, + { + "epoch": 0.03, + "global_step": 4704, + "learning_rate": 0.0004812020033388982, + "loss": 1.7404, + "loss_base2": 2.5109, + "loss_pixel": 0.1865, + "loss_text": 1.5539, + "ppl": 5.6996, + "step": 4704 + }, + { + "epoch": 0.03, + "global_step": 4705, + "learning_rate": 0.0004811978297161937, + "loss": 1.7289, + "loss_base2": 2.4943, + "loss_pixel": 0.1841, + "loss_text": 1.5449, + "ppl": 5.6345, + "step": 4705 + }, + { + "epoch": 0.03, + "global_step": 4706, + "learning_rate": 0.00048119365609348915, + "loss": 1.7528, + "loss_base2": 2.5288, + "loss_pixel": 0.1851, + "loss_text": 1.5677, + "ppl": 5.7707, + "step": 4706 + }, + { + "epoch": 0.03, + "global_step": 4707, + "learning_rate": 0.00048118948247078465, + "loss": 1.6275, + "loss_base2": 2.348, + "loss_pixel": 0.1855, + "loss_text": 1.442, + "ppl": 5.0911, + "step": 4707 + }, + { + "epoch": 0.03, + "global_step": 4708, + "learning_rate": 0.00048118530884808016, + "loss": 1.5227, + "loss_base2": 2.1968, + "loss_pixel": 0.1837, + "loss_text": 1.3391, + "ppl": 4.5846, + "step": 4708 + }, + { + "epoch": 0.03, + "global_step": 4709, + "learning_rate": 0.00048118113522537567, + "loss": 1.5268, + "loss_base2": 2.2027, + "loss_pixel": 0.1857, + "loss_text": 1.341, + "ppl": 4.6034, + "step": 4709 + }, + { + "epoch": 0.03, + "global_step": 4710, + "learning_rate": 0.0004811769616026711, + "loss": 1.4974, + "loss_base2": 2.1603, + "loss_pixel": 0.1849, + "loss_text": 1.3125, + "ppl": 4.4701, + "step": 4710 + }, + { + "epoch": 0.03, + "global_step": 4711, + "learning_rate": 0.00048117278797996663, + "loss": 1.493, + "loss_base2": 2.1539, + "loss_pixel": 0.1852, + "loss_text": 1.3078, + "ppl": 4.4504, + "step": 4711 + }, + { + "epoch": 0.03, + "global_step": 4712, + "learning_rate": 0.00048116861435726214, + "loss": 1.5084, + "loss_base2": 2.1762, + "loss_pixel": 0.1848, + "loss_text": 1.3236, + "ppl": 4.5195, + "step": 4712 + }, + { + "epoch": 0.03, + "global_step": 4713, + "learning_rate": 0.00048116444073455764, + "loss": 1.4928, + "loss_base2": 2.1537, + "loss_pixel": 0.1845, + "loss_text": 1.3084, + "ppl": 4.4495, + "step": 4713 + }, + { + "epoch": 0.03, + "global_step": 4714, + "learning_rate": 0.0004811602671118531, + "loss": 1.5101, + "loss_base2": 2.1786, + "loss_pixel": 0.1835, + "loss_text": 1.3267, + "ppl": 4.5272, + "step": 4714 + }, + { + "epoch": 0.03, + "global_step": 4715, + "learning_rate": 0.00048115609348914855, + "loss": 1.5286, + "loss_base2": 2.2053, + "loss_pixel": 0.1843, + "loss_text": 1.3443, + "ppl": 4.6117, + "step": 4715 + }, + { + "epoch": 0.03, + "global_step": 4716, + "learning_rate": 0.00048115191986644406, + "loss": 1.7658, + "loss_base2": 2.5475, + "loss_pixel": 0.1834, + "loss_text": 1.5823, + "ppl": 5.8462, + "step": 4716 + }, + { + "epoch": 0.03, + "global_step": 4717, + "learning_rate": 0.00048114774624373957, + "loss": 1.7591, + "loss_base2": 2.5378, + "loss_pixel": 0.1837, + "loss_text": 1.5754, + "ppl": 5.8072, + "step": 4717 + }, + { + "epoch": 0.03, + "global_step": 4718, + "learning_rate": 0.00048114357262103507, + "loss": 1.7396, + "loss_base2": 2.5097, + "loss_pixel": 0.1852, + "loss_text": 1.5544, + "ppl": 5.6951, + "step": 4718 + }, + { + "epoch": 0.03, + "global_step": 4719, + "learning_rate": 0.0004811393989983305, + "loss": 1.7445, + "loss_base2": 2.5168, + "loss_pixel": 0.1854, + "loss_text": 1.5591, + "ppl": 5.723, + "step": 4719 + }, + { + "epoch": 0.03, + "global_step": 4720, + "learning_rate": 0.00048113522537562603, + "loss": 1.7498, + "loss_base2": 2.5244, + "loss_pixel": 0.1842, + "loss_text": 1.5656, + "ppl": 5.7535, + "step": 4720 + }, + { + "epoch": 0.03, + "global_step": 4721, + "learning_rate": 0.00048113105175292154, + "loss": 1.7621, + "loss_base2": 2.5422, + "loss_pixel": 0.1842, + "loss_text": 1.5779, + "ppl": 5.8247, + "step": 4721 + }, + { + "epoch": 0.03, + "global_step": 4722, + "learning_rate": 0.00048112687813021705, + "loss": 1.7309, + "loss_base2": 2.4972, + "loss_pixel": 0.1845, + "loss_text": 1.5464, + "ppl": 5.6457, + "step": 4722 + }, + { + "epoch": 0.03, + "global_step": 4723, + "learning_rate": 0.00048112270450751255, + "loss": 1.7372, + "loss_base2": 2.5062, + "loss_pixel": 0.1843, + "loss_text": 1.5529, + "ppl": 5.6814, + "step": 4723 + }, + { + "epoch": 0.03, + "global_step": 4724, + "learning_rate": 0.000481118530884808, + "loss": 1.7257, + "loss_base2": 2.4897, + "loss_pixel": 0.1838, + "loss_text": 1.5419, + "ppl": 5.6165, + "step": 4724 + }, + { + "epoch": 0.03, + "global_step": 4725, + "learning_rate": 0.0004811143572621035, + "loss": 1.7411, + "loss_base2": 2.5119, + "loss_pixel": 0.1837, + "loss_text": 1.5575, + "ppl": 5.7036, + "step": 4725 + }, + { + "epoch": 0.03, + "global_step": 4726, + "learning_rate": 0.000481110183639399, + "loss": 1.7347, + "loss_base2": 2.5026, + "loss_pixel": 0.1849, + "loss_text": 1.5498, + "ppl": 5.6672, + "step": 4726 + }, + { + "epoch": 0.03, + "global_step": 4727, + "learning_rate": 0.00048110601001669453, + "loss": 1.741, + "loss_base2": 2.5117, + "loss_pixel": 0.1854, + "loss_text": 1.5556, + "ppl": 5.703, + "step": 4727 + }, + { + "epoch": 0.03, + "global_step": 4728, + "learning_rate": 0.00048110183639399, + "loss": 1.7288, + "loss_base2": 2.4941, + "loss_pixel": 0.1841, + "loss_text": 1.5447, + "ppl": 5.6339, + "step": 4728 + }, + { + "epoch": 0.03, + "global_step": 4729, + "learning_rate": 0.0004810976627712855, + "loss": 1.7434, + "loss_base2": 2.5152, + "loss_pixel": 0.1848, + "loss_text": 1.5586, + "ppl": 5.7167, + "step": 4729 + }, + { + "epoch": 0.03, + "global_step": 4730, + "learning_rate": 0.000481093489148581, + "loss": 1.7342, + "loss_base2": 2.5019, + "loss_pixel": 0.1837, + "loss_text": 1.5504, + "ppl": 5.6644, + "step": 4730 + }, + { + "epoch": 0.03, + "global_step": 4731, + "learning_rate": 0.0004810893155258765, + "loss": 1.7548, + "loss_base2": 2.5316, + "loss_pixel": 0.1844, + "loss_text": 1.5704, + "ppl": 5.7823, + "step": 4731 + }, + { + "epoch": 0.03, + "global_step": 4732, + "learning_rate": 0.000481085141903172, + "loss": 1.7378, + "loss_base2": 2.5071, + "loss_pixel": 0.1845, + "loss_text": 1.5533, + "ppl": 5.6848, + "step": 4732 + }, + { + "epoch": 0.03, + "global_step": 4733, + "learning_rate": 0.0004810809682804674, + "loss": 1.7139, + "loss_base2": 2.4726, + "loss_pixel": 0.187, + "loss_text": 1.5269, + "ppl": 5.5506, + "step": 4733 + }, + { + "epoch": 0.03, + "global_step": 4734, + "learning_rate": 0.0004810767946577629, + "loss": 1.746, + "loss_base2": 2.5189, + "loss_pixel": 0.1839, + "loss_text": 1.5621, + "ppl": 5.7316, + "step": 4734 + }, + { + "epoch": 0.03, + "global_step": 4735, + "learning_rate": 0.0004810726210350584, + "loss": 1.7396, + "loss_base2": 2.5097, + "loss_pixel": 0.1845, + "loss_text": 1.5551, + "ppl": 5.6951, + "step": 4735 + }, + { + "epoch": 0.03, + "global_step": 4736, + "learning_rate": 0.00048106844741235393, + "loss": 1.7326, + "loss_base2": 2.4996, + "loss_pixel": 0.1846, + "loss_text": 1.5479, + "ppl": 5.6553, + "step": 4736 + }, + { + "epoch": 0.03, + "global_step": 4737, + "learning_rate": 0.0004810642737896494, + "loss": 1.5642, + "loss_base2": 2.2567, + "loss_pixel": 0.1841, + "loss_text": 1.38, + "ppl": 4.7789, + "step": 4737 + }, + { + "epoch": 0.03, + "global_step": 4738, + "learning_rate": 0.0004810601001669449, + "loss": 1.5371, + "loss_base2": 2.2176, + "loss_pixel": 0.1849, + "loss_text": 1.3522, + "ppl": 4.6511, + "step": 4738 + }, + { + "epoch": 0.03, + "global_step": 4739, + "learning_rate": 0.0004810559265442404, + "loss": 1.5141, + "loss_base2": 2.1844, + "loss_pixel": 0.1852, + "loss_text": 1.3289, + "ppl": 4.5453, + "step": 4739 + }, + { + "epoch": 0.03, + "global_step": 4740, + "learning_rate": 0.0004810517529215359, + "loss": 1.5139, + "loss_base2": 2.1841, + "loss_pixel": 0.1848, + "loss_text": 1.3292, + "ppl": 4.5444, + "step": 4740 + }, + { + "epoch": 0.03, + "global_step": 4741, + "learning_rate": 0.0004810475792988314, + "loss": 1.4728, + "loss_base2": 2.1248, + "loss_pixel": 0.1842, + "loss_text": 1.2885, + "ppl": 4.3614, + "step": 4741 + }, + { + "epoch": 0.03, + "global_step": 4742, + "learning_rate": 0.00048104340567612687, + "loss": 1.4781, + "loss_base2": 2.1324, + "loss_pixel": 0.1838, + "loss_text": 1.2943, + "ppl": 4.3846, + "step": 4742 + }, + { + "epoch": 0.03, + "global_step": 4743, + "learning_rate": 0.0004810392320534224, + "loss": 1.4811, + "loss_base2": 2.1368, + "loss_pixel": 0.1834, + "loss_text": 1.2977, + "ppl": 4.3978, + "step": 4743 + }, + { + "epoch": 0.03, + "global_step": 4744, + "learning_rate": 0.0004810350584307179, + "loss": 1.5862, + "loss_base2": 2.2884, + "loss_pixel": 0.1834, + "loss_text": 1.4028, + "ppl": 4.8852, + "step": 4744 + }, + { + "epoch": 0.03, + "global_step": 4745, + "learning_rate": 0.0004810308848080134, + "loss": 1.7604, + "loss_base2": 2.5397, + "loss_pixel": 0.1841, + "loss_text": 1.5763, + "ppl": 5.8148, + "step": 4745 + }, + { + "epoch": 0.03, + "global_step": 4746, + "learning_rate": 0.0004810267111853089, + "loss": 1.7484, + "loss_base2": 2.5224, + "loss_pixel": 0.1851, + "loss_text": 1.5633, + "ppl": 5.7454, + "step": 4746 + }, + { + "epoch": 0.03, + "global_step": 4747, + "learning_rate": 0.00048102253756260435, + "loss": 1.7499, + "loss_base2": 2.5246, + "loss_pixel": 0.1852, + "loss_text": 1.5647, + "ppl": 5.754, + "step": 4747 + }, + { + "epoch": 0.03, + "global_step": 4748, + "learning_rate": 0.00048101836393989986, + "loss": 1.7602, + "loss_base2": 2.5394, + "loss_pixel": 0.184, + "loss_text": 1.5762, + "ppl": 5.8136, + "step": 4748 + }, + { + "epoch": 0.03, + "global_step": 4749, + "learning_rate": 0.00048101419031719537, + "loss": 1.7442, + "loss_base2": 2.5163, + "loss_pixel": 0.1843, + "loss_text": 1.5598, + "ppl": 5.7213, + "step": 4749 + }, + { + "epoch": 0.03, + "global_step": 4750, + "learning_rate": 0.0004810100166944909, + "loss": 1.7367, + "loss_base2": 2.5055, + "loss_pixel": 0.1837, + "loss_text": 1.553, + "ppl": 5.6786, + "step": 4750 + }, + { + "epoch": 0.03, + "global_step": 4751, + "learning_rate": 0.00048100584307178627, + "loss": 1.7257, + "loss_base2": 2.4897, + "loss_pixel": 0.1851, + "loss_text": 1.5405, + "ppl": 5.6165, + "step": 4751 + }, + { + "epoch": 0.03, + "global_step": 4752, + "learning_rate": 0.0004810016694490818, + "loss": 1.742, + "loss_base2": 2.5132, + "loss_pixel": 0.1843, + "loss_text": 1.5577, + "ppl": 5.7087, + "step": 4752 + }, + { + "epoch": 0.03, + "global_step": 4753, + "learning_rate": 0.0004809974958263773, + "loss": 1.7416, + "loss_base2": 2.5126, + "loss_pixel": 0.1841, + "loss_text": 1.5575, + "ppl": 5.7065, + "step": 4753 + }, + { + "epoch": 0.03, + "global_step": 4754, + "learning_rate": 0.0004809933222036728, + "loss": 1.7407, + "loss_base2": 2.5113, + "loss_pixel": 0.184, + "loss_text": 1.5568, + "ppl": 5.7013, + "step": 4754 + }, + { + "epoch": 0.03, + "global_step": 4755, + "learning_rate": 0.0004809891485809683, + "loss": 1.7468, + "loss_base2": 2.5201, + "loss_pixel": 0.1842, + "loss_text": 1.5626, + "ppl": 5.7362, + "step": 4755 + }, + { + "epoch": 0.03, + "global_step": 4756, + "learning_rate": 0.00048098497495826375, + "loss": 1.7287, + "loss_base2": 2.494, + "loss_pixel": 0.1851, + "loss_text": 1.5436, + "ppl": 5.6333, + "step": 4756 + }, + { + "epoch": 0.03, + "global_step": 4757, + "learning_rate": 0.00048098080133555926, + "loss": 1.7499, + "loss_base2": 2.5246, + "loss_pixel": 0.1849, + "loss_text": 1.5651, + "ppl": 5.754, + "step": 4757 + }, + { + "epoch": 0.03, + "global_step": 4758, + "learning_rate": 0.00048097662771285477, + "loss": 1.7293, + "loss_base2": 2.4949, + "loss_pixel": 0.1843, + "loss_text": 1.545, + "ppl": 5.6367, + "step": 4758 + }, + { + "epoch": 0.03, + "global_step": 4759, + "learning_rate": 0.0004809724540901503, + "loss": 1.7338, + "loss_base2": 2.5013, + "loss_pixel": 0.1847, + "loss_text": 1.5492, + "ppl": 5.6621, + "step": 4759 + }, + { + "epoch": 0.03, + "global_step": 4760, + "learning_rate": 0.00048096828046744573, + "loss": 1.7213, + "loss_base2": 2.4833, + "loss_pixel": 0.1838, + "loss_text": 1.5374, + "ppl": 5.5918, + "step": 4760 + }, + { + "epoch": 0.03, + "global_step": 4761, + "learning_rate": 0.00048096410684474124, + "loss": 1.722, + "loss_base2": 2.4843, + "loss_pixel": 0.1831, + "loss_text": 1.5389, + "ppl": 5.5957, + "step": 4761 + }, + { + "epoch": 0.03, + "global_step": 4762, + "learning_rate": 0.00048095993322203674, + "loss": 1.7483, + "loss_base2": 2.5223, + "loss_pixel": 0.1835, + "loss_text": 1.5648, + "ppl": 5.7448, + "step": 4762 + }, + { + "epoch": 0.03, + "global_step": 4763, + "learning_rate": 0.00048095575959933225, + "loss": 1.7287, + "loss_base2": 2.494, + "loss_pixel": 0.1837, + "loss_text": 1.5449, + "ppl": 5.6333, + "step": 4763 + }, + { + "epoch": 0.03, + "global_step": 4764, + "learning_rate": 0.00048095158597662776, + "loss": 1.7247, + "loss_base2": 2.4882, + "loss_pixel": 0.183, + "loss_text": 1.5417, + "ppl": 5.6108, + "step": 4764 + }, + { + "epoch": 0.03, + "global_step": 4765, + "learning_rate": 0.0004809474123539232, + "loss": 1.7591, + "loss_base2": 2.5378, + "loss_pixel": 0.1833, + "loss_text": 1.5758, + "ppl": 5.8072, + "step": 4765 + }, + { + "epoch": 0.03, + "global_step": 4766, + "learning_rate": 0.0004809432387312187, + "loss": 1.7322, + "loss_base2": 2.499, + "loss_pixel": 0.1838, + "loss_text": 1.5484, + "ppl": 5.6531, + "step": 4766 + }, + { + "epoch": 0.03, + "global_step": 4767, + "learning_rate": 0.0004809390651085142, + "loss": 1.7174, + "loss_base2": 2.4777, + "loss_pixel": 0.1839, + "loss_text": 1.5335, + "ppl": 5.57, + "step": 4767 + }, + { + "epoch": 0.03, + "global_step": 4768, + "learning_rate": 0.00048093489148580973, + "loss": 1.7287, + "loss_base2": 2.494, + "loss_pixel": 0.1832, + "loss_text": 1.5455, + "ppl": 5.6333, + "step": 4768 + }, + { + "epoch": 0.03, + "global_step": 4769, + "learning_rate": 0.0004809307178631052, + "loss": 1.7338, + "loss_base2": 2.5013, + "loss_pixel": 0.1844, + "loss_text": 1.5494, + "ppl": 5.6621, + "step": 4769 + }, + { + "epoch": 0.03, + "global_step": 4770, + "learning_rate": 0.00048092654424040064, + "loss": 1.746, + "loss_base2": 2.5189, + "loss_pixel": 0.1842, + "loss_text": 1.5618, + "ppl": 5.7316, + "step": 4770 + }, + { + "epoch": 0.03, + "global_step": 4771, + "learning_rate": 0.00048092237061769615, + "loss": 1.7288, + "loss_base2": 2.4941, + "loss_pixel": 0.1884, + "loss_text": 1.5404, + "ppl": 5.6339, + "step": 4771 + }, + { + "epoch": 0.03, + "global_step": 4772, + "learning_rate": 0.00048091819699499165, + "loss": 1.7221, + "loss_base2": 2.4845, + "loss_pixel": 0.1852, + "loss_text": 1.5369, + "ppl": 5.5963, + "step": 4772 + }, + { + "epoch": 0.03, + "global_step": 4773, + "learning_rate": 0.00048091402337228716, + "loss": 1.7346, + "loss_base2": 2.5025, + "loss_pixel": 0.1834, + "loss_text": 1.5512, + "ppl": 5.6667, + "step": 4773 + }, + { + "epoch": 0.03, + "global_step": 4774, + "learning_rate": 0.0004809098497495826, + "loss": 1.727, + "loss_base2": 2.4915, + "loss_pixel": 0.1823, + "loss_text": 1.5447, + "ppl": 5.6238, + "step": 4774 + }, + { + "epoch": 0.03, + "global_step": 4775, + "learning_rate": 0.0004809056761268781, + "loss": 1.7087, + "loss_base2": 2.4651, + "loss_pixel": 0.1852, + "loss_text": 1.5235, + "ppl": 5.5218, + "step": 4775 + }, + { + "epoch": 0.03, + "global_step": 4776, + "learning_rate": 0.00048090150250417363, + "loss": 1.7268, + "loss_base2": 2.4912, + "loss_pixel": 0.183, + "loss_text": 1.5439, + "ppl": 5.6226, + "step": 4776 + }, + { + "epoch": 0.03, + "global_step": 4777, + "learning_rate": 0.00048089732888146914, + "loss": 1.7215, + "loss_base2": 2.4836, + "loss_pixel": 0.1831, + "loss_text": 1.5384, + "ppl": 5.5929, + "step": 4777 + }, + { + "epoch": 0.03, + "global_step": 4778, + "learning_rate": 0.0004808931552587646, + "loss": 1.718, + "loss_base2": 2.4786, + "loss_pixel": 0.1808, + "loss_text": 1.5372, + "ppl": 5.5734, + "step": 4778 + }, + { + "epoch": 0.03, + "global_step": 4779, + "learning_rate": 0.0004808889816360601, + "loss": 1.7168, + "loss_base2": 2.4768, + "loss_pixel": 0.183, + "loss_text": 1.5337, + "ppl": 5.5667, + "step": 4779 + }, + { + "epoch": 0.03, + "global_step": 4780, + "learning_rate": 0.0004808848080133556, + "loss": 1.7257, + "loss_base2": 2.4897, + "loss_pixel": 0.1814, + "loss_text": 1.5443, + "ppl": 5.6165, + "step": 4780 + }, + { + "epoch": 0.03, + "global_step": 4781, + "learning_rate": 0.0004808806343906511, + "loss": 1.7271, + "loss_base2": 2.4917, + "loss_pixel": 0.1828, + "loss_text": 1.5443, + "ppl": 5.6243, + "step": 4781 + }, + { + "epoch": 0.03, + "global_step": 4782, + "learning_rate": 0.0004808764607679466, + "loss": 1.7143, + "loss_base2": 2.4732, + "loss_pixel": 0.1835, + "loss_text": 1.5308, + "ppl": 5.5528, + "step": 4782 + }, + { + "epoch": 0.03, + "global_step": 4783, + "learning_rate": 0.00048087228714524207, + "loss": 1.719, + "loss_base2": 2.48, + "loss_pixel": 0.182, + "loss_text": 1.537, + "ppl": 5.5789, + "step": 4783 + }, + { + "epoch": 0.03, + "global_step": 4784, + "learning_rate": 0.0004808681135225376, + "loss": 1.731, + "loss_base2": 2.4973, + "loss_pixel": 0.1826, + "loss_text": 1.5484, + "ppl": 5.6463, + "step": 4784 + }, + { + "epoch": 0.03, + "global_step": 4785, + "learning_rate": 0.0004808639398998331, + "loss": 1.7421, + "loss_base2": 2.5133, + "loss_pixel": 0.1838, + "loss_text": 1.5583, + "ppl": 5.7093, + "step": 4785 + }, + { + "epoch": 0.03, + "global_step": 4786, + "learning_rate": 0.0004808597662771286, + "loss": 1.712, + "loss_base2": 2.4699, + "loss_pixel": 0.1808, + "loss_text": 1.5312, + "ppl": 5.54, + "step": 4786 + }, + { + "epoch": 0.03, + "global_step": 4787, + "learning_rate": 0.00048085559265442405, + "loss": 1.6933, + "loss_base2": 2.4429, + "loss_pixel": 0.1825, + "loss_text": 1.5108, + "ppl": 5.4374, + "step": 4787 + }, + { + "epoch": 0.03, + "global_step": 4788, + "learning_rate": 0.00048085141903171955, + "loss": 1.7316, + "loss_base2": 2.4982, + "loss_pixel": 0.1848, + "loss_text": 1.5468, + "ppl": 5.6497, + "step": 4788 + }, + { + "epoch": 0.03, + "global_step": 4789, + "learning_rate": 0.000480847245409015, + "loss": 1.721, + "loss_base2": 2.4829, + "loss_pixel": 0.1876, + "loss_text": 1.5334, + "ppl": 5.5901, + "step": 4789 + }, + { + "epoch": 0.03, + "global_step": 4790, + "learning_rate": 0.0004808430717863105, + "loss": 1.7457, + "loss_base2": 2.5185, + "loss_pixel": 0.1905, + "loss_text": 1.5553, + "ppl": 5.7299, + "step": 4790 + }, + { + "epoch": 0.03, + "global_step": 4791, + "learning_rate": 0.000480838898163606, + "loss": 1.7153, + "loss_base2": 2.4747, + "loss_pixel": 0.1889, + "loss_text": 1.5264, + "ppl": 5.5583, + "step": 4791 + }, + { + "epoch": 0.03, + "global_step": 4792, + "learning_rate": 0.0004808347245409015, + "loss": 1.719, + "loss_base2": 2.48, + "loss_pixel": 0.1872, + "loss_text": 1.5318, + "ppl": 5.5789, + "step": 4792 + }, + { + "epoch": 0.03, + "global_step": 4793, + "learning_rate": 0.000480830550918197, + "loss": 1.7272, + "loss_base2": 2.4918, + "loss_pixel": 0.189, + "loss_text": 1.5382, + "ppl": 5.6249, + "step": 4793 + }, + { + "epoch": 0.03, + "global_step": 4794, + "learning_rate": 0.0004808263772954925, + "loss": 1.7396, + "loss_base2": 2.5097, + "loss_pixel": 0.1875, + "loss_text": 1.5521, + "ppl": 5.6951, + "step": 4794 + }, + { + "epoch": 0.03, + "global_step": 4795, + "learning_rate": 0.000480822203672788, + "loss": 1.7247, + "loss_base2": 2.4882, + "loss_pixel": 0.1866, + "loss_text": 1.5382, + "ppl": 5.6108, + "step": 4795 + }, + { + "epoch": 0.03, + "global_step": 4796, + "learning_rate": 0.00048081803005008345, + "loss": 1.7162, + "loss_base2": 2.476, + "loss_pixel": 0.1863, + "loss_text": 1.5299, + "ppl": 5.5633, + "step": 4796 + }, + { + "epoch": 0.03, + "global_step": 4797, + "learning_rate": 0.00048081385642737896, + "loss": 1.7422, + "loss_base2": 2.5135, + "loss_pixel": 0.1848, + "loss_text": 1.5573, + "ppl": 5.7099, + "step": 4797 + }, + { + "epoch": 0.03, + "global_step": 4798, + "learning_rate": 0.00048080968280467447, + "loss": 1.7442, + "loss_base2": 2.5163, + "loss_pixel": 0.1847, + "loss_text": 1.5595, + "ppl": 5.7213, + "step": 4798 + }, + { + "epoch": 0.03, + "global_step": 4799, + "learning_rate": 0.00048080550918196997, + "loss": 1.7253, + "loss_base2": 2.4891, + "loss_pixel": 0.186, + "loss_text": 1.5393, + "ppl": 5.6142, + "step": 4799 + }, + { + "epoch": 0.03, + "global_step": 4800, + "learning_rate": 0.0004808013355592655, + "loss": 1.733, + "loss_base2": 2.5002, + "loss_pixel": 0.186, + "loss_text": 1.547, + "ppl": 5.6576, + "step": 4800 + }, + { + "epoch": 0.03, + "global_step": 4801, + "learning_rate": 0.00048079716193656093, + "loss": 1.7246, + "loss_base2": 2.4881, + "loss_pixel": 0.1858, + "loss_text": 1.5388, + "ppl": 5.6103, + "step": 4801 + }, + { + "epoch": 0.03, + "global_step": 4802, + "learning_rate": 0.00048079298831385644, + "loss": 1.7436, + "loss_base2": 2.5155, + "loss_pixel": 0.1847, + "loss_text": 1.559, + "ppl": 5.7179, + "step": 4802 + }, + { + "epoch": 0.03, + "global_step": 4803, + "learning_rate": 0.00048078881469115195, + "loss": 1.7162, + "loss_base2": 2.476, + "loss_pixel": 0.1882, + "loss_text": 1.5279, + "ppl": 5.5633, + "step": 4803 + }, + { + "epoch": 0.03, + "global_step": 4804, + "learning_rate": 0.00048078464106844746, + "loss": 1.725, + "loss_base2": 2.4886, + "loss_pixel": 0.1843, + "loss_text": 1.5407, + "ppl": 5.6125, + "step": 4804 + }, + { + "epoch": 0.03, + "global_step": 4805, + "learning_rate": 0.00048078046744574296, + "loss": 1.7337, + "loss_base2": 2.5012, + "loss_pixel": 0.1857, + "loss_text": 1.548, + "ppl": 5.6616, + "step": 4805 + }, + { + "epoch": 0.03, + "global_step": 4806, + "learning_rate": 0.0004807762938230384, + "loss": 1.7261, + "loss_base2": 2.4902, + "loss_pixel": 0.185, + "loss_text": 1.5411, + "ppl": 5.6187, + "step": 4806 + }, + { + "epoch": 0.03, + "global_step": 4807, + "learning_rate": 0.00048077212020033387, + "loss": 1.7156, + "loss_base2": 2.4751, + "loss_pixel": 0.1852, + "loss_text": 1.5304, + "ppl": 5.56, + "step": 4807 + }, + { + "epoch": 0.03, + "global_step": 4808, + "learning_rate": 0.0004807679465776294, + "loss": 1.7345, + "loss_base2": 2.5024, + "loss_pixel": 0.1844, + "loss_text": 1.5501, + "ppl": 5.6661, + "step": 4808 + }, + { + "epoch": 0.03, + "global_step": 4809, + "learning_rate": 0.0004807637729549249, + "loss": 1.7338, + "loss_base2": 2.5013, + "loss_pixel": 0.1842, + "loss_text": 1.5496, + "ppl": 5.6621, + "step": 4809 + }, + { + "epoch": 0.03, + "global_step": 4810, + "learning_rate": 0.00048075959933222034, + "loss": 1.7168, + "loss_base2": 2.4768, + "loss_pixel": 0.1838, + "loss_text": 1.533, + "ppl": 5.5667, + "step": 4810 + }, + { + "epoch": 0.03, + "global_step": 4811, + "learning_rate": 0.00048075542570951584, + "loss": 1.7202, + "loss_base2": 2.4817, + "loss_pixel": 0.1831, + "loss_text": 1.537, + "ppl": 5.5856, + "step": 4811 + }, + { + "epoch": 0.03, + "global_step": 4812, + "learning_rate": 0.00048075125208681135, + "loss": 1.7151, + "loss_base2": 2.4744, + "loss_pixel": 0.1844, + "loss_text": 1.5307, + "ppl": 5.5572, + "step": 4812 + }, + { + "epoch": 0.03, + "global_step": 4813, + "learning_rate": 0.00048074707846410686, + "loss": 1.7367, + "loss_base2": 2.5055, + "loss_pixel": 0.185, + "loss_text": 1.5516, + "ppl": 5.6786, + "step": 4813 + }, + { + "epoch": 0.03, + "global_step": 4814, + "learning_rate": 0.00048074290484140237, + "loss": 1.7344, + "loss_base2": 2.5022, + "loss_pixel": 0.1847, + "loss_text": 1.5496, + "ppl": 5.6655, + "step": 4814 + }, + { + "epoch": 0.03, + "global_step": 4815, + "learning_rate": 0.0004807387312186978, + "loss": 1.7176, + "loss_base2": 2.478, + "loss_pixel": 0.1836, + "loss_text": 1.534, + "ppl": 5.5711, + "step": 4815 + }, + { + "epoch": 0.03, + "global_step": 4816, + "learning_rate": 0.0004807345575959933, + "loss": 1.7235, + "loss_base2": 2.4865, + "loss_pixel": 0.1839, + "loss_text": 1.5396, + "ppl": 5.6041, + "step": 4816 + }, + { + "epoch": 0.03, + "global_step": 4817, + "learning_rate": 0.00048073038397328883, + "loss": 1.7265, + "loss_base2": 2.4908, + "loss_pixel": 0.1832, + "loss_text": 1.5433, + "ppl": 5.6209, + "step": 4817 + }, + { + "epoch": 0.03, + "global_step": 4818, + "learning_rate": 0.00048072621035058434, + "loss": 1.7091, + "loss_base2": 2.4657, + "loss_pixel": 0.1842, + "loss_text": 1.5249, + "ppl": 5.524, + "step": 4818 + }, + { + "epoch": 0.03, + "global_step": 4819, + "learning_rate": 0.0004807220367278798, + "loss": 1.7331, + "loss_base2": 2.5003, + "loss_pixel": 0.1818, + "loss_text": 1.5513, + "ppl": 5.6582, + "step": 4819 + }, + { + "epoch": 0.03, + "global_step": 4820, + "learning_rate": 0.0004807178631051753, + "loss": 1.6894, + "loss_base2": 2.4373, + "loss_pixel": 0.1838, + "loss_text": 1.5057, + "ppl": 5.4162, + "step": 4820 + }, + { + "epoch": 0.03, + "global_step": 4821, + "learning_rate": 0.0004807136894824708, + "loss": 1.7168, + "loss_base2": 2.4768, + "loss_pixel": 0.1847, + "loss_text": 1.5321, + "ppl": 5.5667, + "step": 4821 + }, + { + "epoch": 0.03, + "global_step": 4822, + "learning_rate": 0.0004807095158597663, + "loss": 1.7307, + "loss_base2": 2.4969, + "loss_pixel": 0.1836, + "loss_text": 1.5471, + "ppl": 5.6446, + "step": 4822 + }, + { + "epoch": 0.03, + "global_step": 4823, + "learning_rate": 0.0004807053422370618, + "loss": 1.7205, + "loss_base2": 2.4822, + "loss_pixel": 0.1832, + "loss_text": 1.5373, + "ppl": 5.5873, + "step": 4823 + }, + { + "epoch": 0.03, + "global_step": 4824, + "learning_rate": 0.0004807011686143573, + "loss": 1.7119, + "loss_base2": 2.4697, + "loss_pixel": 0.1831, + "loss_text": 1.5288, + "ppl": 5.5395, + "step": 4824 + }, + { + "epoch": 0.03, + "global_step": 4825, + "learning_rate": 0.0004806969949916528, + "loss": 1.7021, + "loss_base2": 2.4556, + "loss_pixel": 0.1848, + "loss_text": 1.5174, + "ppl": 5.4855, + "step": 4825 + }, + { + "epoch": 0.03, + "global_step": 4826, + "learning_rate": 0.00048069282136894824, + "loss": 1.7178, + "loss_base2": 2.4783, + "loss_pixel": 0.1833, + "loss_text": 1.5345, + "ppl": 5.5723, + "step": 4826 + }, + { + "epoch": 0.03, + "global_step": 4827, + "learning_rate": 0.00048068864774624374, + "loss": 1.7161, + "loss_base2": 2.4758, + "loss_pixel": 0.1841, + "loss_text": 1.532, + "ppl": 5.5628, + "step": 4827 + }, + { + "epoch": 0.03, + "global_step": 4828, + "learning_rate": 0.0004806844741235392, + "loss": 1.7073, + "loss_base2": 2.4631, + "loss_pixel": 0.1841, + "loss_text": 1.5232, + "ppl": 5.5141, + "step": 4828 + }, + { + "epoch": 0.03, + "global_step": 4829, + "learning_rate": 0.0004806803005008347, + "loss": 1.7063, + "loss_base2": 2.4617, + "loss_pixel": 0.1854, + "loss_text": 1.5209, + "ppl": 5.5085, + "step": 4829 + }, + { + "epoch": 0.03, + "global_step": 4830, + "learning_rate": 0.0004806761268781302, + "loss": 1.7288, + "loss_base2": 2.4941, + "loss_pixel": 0.1853, + "loss_text": 1.5435, + "ppl": 5.6339, + "step": 4830 + }, + { + "epoch": 0.03, + "global_step": 4831, + "learning_rate": 0.0004806719532554257, + "loss": 1.7297, + "loss_base2": 2.4954, + "loss_pixel": 0.1839, + "loss_text": 1.5458, + "ppl": 5.639, + "step": 4831 + }, + { + "epoch": 0.03, + "global_step": 4832, + "learning_rate": 0.0004806677796327212, + "loss": 1.741, + "loss_base2": 2.5117, + "loss_pixel": 0.1849, + "loss_text": 1.5561, + "ppl": 5.703, + "step": 4832 + }, + { + "epoch": 0.03, + "global_step": 4833, + "learning_rate": 0.0004806636060100167, + "loss": 1.7126, + "loss_base2": 2.4708, + "loss_pixel": 0.184, + "loss_text": 1.5286, + "ppl": 5.5434, + "step": 4833 + }, + { + "epoch": 0.03, + "global_step": 4834, + "learning_rate": 0.0004806594323873122, + "loss": 1.6656, + "loss_base2": 2.403, + "loss_pixel": 0.1828, + "loss_text": 1.4829, + "ppl": 5.2888, + "step": 4834 + }, + { + "epoch": 0.03, + "global_step": 4835, + "learning_rate": 0.0004806552587646077, + "loss": 1.7222, + "loss_base2": 2.4846, + "loss_pixel": 0.1829, + "loss_text": 1.5394, + "ppl": 5.5968, + "step": 4835 + }, + { + "epoch": 0.03, + "global_step": 4836, + "learning_rate": 0.0004806510851419032, + "loss": 1.7189, + "loss_base2": 2.4798, + "loss_pixel": 0.1835, + "loss_text": 1.5354, + "ppl": 5.5784, + "step": 4836 + }, + { + "epoch": 0.03, + "global_step": 4837, + "learning_rate": 0.00048064691151919865, + "loss": 1.7322, + "loss_base2": 2.499, + "loss_pixel": 0.184, + "loss_text": 1.5482, + "ppl": 5.6531, + "step": 4837 + }, + { + "epoch": 0.03, + "global_step": 4838, + "learning_rate": 0.00048064273789649416, + "loss": 1.7232, + "loss_base2": 2.4861, + "loss_pixel": 0.1843, + "loss_text": 1.5389, + "ppl": 5.6024, + "step": 4838 + }, + { + "epoch": 0.03, + "global_step": 4839, + "learning_rate": 0.00048063856427378967, + "loss": 1.7127, + "loss_base2": 2.4709, + "loss_pixel": 0.1842, + "loss_text": 1.5285, + "ppl": 5.5439, + "step": 4839 + }, + { + "epoch": 0.03, + "global_step": 4840, + "learning_rate": 0.0004806343906510852, + "loss": 1.7173, + "loss_base2": 2.4775, + "loss_pixel": 0.1855, + "loss_text": 1.5318, + "ppl": 5.5695, + "step": 4840 + }, + { + "epoch": 0.03, + "global_step": 4841, + "learning_rate": 0.0004806302170283807, + "loss": 1.7421, + "loss_base2": 2.5133, + "loss_pixel": 0.1838, + "loss_text": 1.5583, + "ppl": 5.7093, + "step": 4841 + }, + { + "epoch": 0.03, + "global_step": 4842, + "learning_rate": 0.00048062604340567614, + "loss": 1.7436, + "loss_base2": 2.5155, + "loss_pixel": 0.1833, + "loss_text": 1.5603, + "ppl": 5.7179, + "step": 4842 + }, + { + "epoch": 0.03, + "global_step": 4843, + "learning_rate": 0.00048062186978297164, + "loss": 1.7155, + "loss_base2": 2.4749, + "loss_pixel": 0.1829, + "loss_text": 1.5326, + "ppl": 5.5595, + "step": 4843 + }, + { + "epoch": 0.03, + "global_step": 4844, + "learning_rate": 0.00048061769616026715, + "loss": 1.7149, + "loss_base2": 2.4741, + "loss_pixel": 0.1834, + "loss_text": 1.5316, + "ppl": 5.5561, + "step": 4844 + }, + { + "epoch": 0.03, + "global_step": 4845, + "learning_rate": 0.0004806135225375626, + "loss": 1.7063, + "loss_base2": 2.4617, + "loss_pixel": 0.1843, + "loss_text": 1.5219, + "ppl": 5.5085, + "step": 4845 + }, + { + "epoch": 0.03, + "global_step": 4846, + "learning_rate": 0.00048060934891485806, + "loss": 1.7196, + "loss_base2": 2.4809, + "loss_pixel": 0.1852, + "loss_text": 1.5344, + "ppl": 5.5823, + "step": 4846 + }, + { + "epoch": 0.03, + "global_step": 4847, + "learning_rate": 0.00048060517529215357, + "loss": 1.7043, + "loss_base2": 2.4588, + "loss_pixel": 0.1839, + "loss_text": 1.5204, + "ppl": 5.4975, + "step": 4847 + }, + { + "epoch": 0.03, + "global_step": 4848, + "learning_rate": 0.00048060100166944907, + "loss": 1.7127, + "loss_base2": 2.4709, + "loss_pixel": 0.1842, + "loss_text": 1.5284, + "ppl": 5.5439, + "step": 4848 + }, + { + "epoch": 0.03, + "global_step": 4849, + "learning_rate": 0.0004805968280467446, + "loss": 1.7075, + "loss_base2": 2.4634, + "loss_pixel": 0.1829, + "loss_text": 1.5246, + "ppl": 5.5152, + "step": 4849 + }, + { + "epoch": 0.03, + "global_step": 4850, + "learning_rate": 0.0004805926544240401, + "loss": 1.719, + "loss_base2": 2.48, + "loss_pixel": 0.1833, + "loss_text": 1.5358, + "ppl": 5.5789, + "step": 4850 + }, + { + "epoch": 0.03, + "global_step": 4851, + "learning_rate": 0.00048058848080133554, + "loss": 1.7123, + "loss_base2": 2.4703, + "loss_pixel": 0.1847, + "loss_text": 1.5276, + "ppl": 5.5417, + "step": 4851 + }, + { + "epoch": 0.03, + "global_step": 4852, + "learning_rate": 0.00048058430717863105, + "loss": 1.7161, + "loss_base2": 2.4758, + "loss_pixel": 0.1824, + "loss_text": 1.5338, + "ppl": 5.5628, + "step": 4852 + }, + { + "epoch": 0.03, + "global_step": 4853, + "learning_rate": 0.00048058013355592655, + "loss": 1.7063, + "loss_base2": 2.4617, + "loss_pixel": 0.1826, + "loss_text": 1.5237, + "ppl": 5.5085, + "step": 4853 + }, + { + "epoch": 0.03, + "global_step": 4854, + "learning_rate": 0.00048057595993322206, + "loss": 1.7247, + "loss_base2": 2.4882, + "loss_pixel": 0.185, + "loss_text": 1.5397, + "ppl": 5.6108, + "step": 4854 + }, + { + "epoch": 0.03, + "global_step": 4855, + "learning_rate": 0.00048057178631051757, + "loss": 1.7376, + "loss_base2": 2.5068, + "loss_pixel": 0.1939, + "loss_text": 1.5436, + "ppl": 5.6837, + "step": 4855 + }, + { + "epoch": 0.03, + "global_step": 4856, + "learning_rate": 0.000480567612687813, + "loss": 1.7333, + "loss_base2": 2.5006, + "loss_pixel": 0.192, + "loss_text": 1.5413, + "ppl": 5.6593, + "step": 4856 + }, + { + "epoch": 0.03, + "global_step": 4857, + "learning_rate": 0.00048056343906510853, + "loss": 1.7252, + "loss_base2": 2.4889, + "loss_pixel": 0.1883, + "loss_text": 1.5368, + "ppl": 5.6136, + "step": 4857 + }, + { + "epoch": 0.03, + "global_step": 4858, + "learning_rate": 0.00048055926544240404, + "loss": 1.7246, + "loss_base2": 2.4881, + "loss_pixel": 0.1835, + "loss_text": 1.5412, + "ppl": 5.6103, + "step": 4858 + }, + { + "epoch": 0.03, + "global_step": 4859, + "learning_rate": 0.00048055509181969954, + "loss": 1.7368, + "loss_base2": 2.5057, + "loss_pixel": 0.1842, + "loss_text": 1.5526, + "ppl": 5.6791, + "step": 4859 + }, + { + "epoch": 0.03, + "global_step": 4860, + "learning_rate": 0.000480550918196995, + "loss": 1.735, + "loss_base2": 2.5031, + "loss_pixel": 0.1833, + "loss_text": 1.5517, + "ppl": 5.6689, + "step": 4860 + }, + { + "epoch": 0.03, + "global_step": 4861, + "learning_rate": 0.0004805467445742905, + "loss": 1.7285, + "loss_base2": 2.4937, + "loss_pixel": 0.1843, + "loss_text": 1.5442, + "ppl": 5.6322, + "step": 4861 + }, + { + "epoch": 0.03, + "global_step": 4862, + "learning_rate": 0.000480542570951586, + "loss": 1.7399, + "loss_base2": 2.5101, + "loss_pixel": 0.1828, + "loss_text": 1.5572, + "ppl": 5.6968, + "step": 4862 + }, + { + "epoch": 0.03, + "global_step": 4863, + "learning_rate": 0.0004805383973288815, + "loss": 1.689, + "loss_base2": 2.4367, + "loss_pixel": 0.1837, + "loss_text": 1.5053, + "ppl": 5.4141, + "step": 4863 + }, + { + "epoch": 0.03, + "global_step": 4864, + "learning_rate": 0.00048053422370617697, + "loss": 1.7469, + "loss_base2": 2.5202, + "loss_pixel": 0.1841, + "loss_text": 1.5628, + "ppl": 5.7368, + "step": 4864 + }, + { + "epoch": 0.03, + "global_step": 4865, + "learning_rate": 0.0004805300500834724, + "loss": 1.7132, + "loss_base2": 2.4716, + "loss_pixel": 0.1827, + "loss_text": 1.5305, + "ppl": 5.5467, + "step": 4865 + }, + { + "epoch": 0.03, + "global_step": 4866, + "learning_rate": 0.00048052587646076793, + "loss": 1.727, + "loss_base2": 2.4915, + "loss_pixel": 0.1834, + "loss_text": 1.5436, + "ppl": 5.6238, + "step": 4866 + }, + { + "epoch": 0.03, + "global_step": 4867, + "learning_rate": 0.00048052170283806344, + "loss": 1.7247, + "loss_base2": 2.4882, + "loss_pixel": 0.1844, + "loss_text": 1.5403, + "ppl": 5.6108, + "step": 4867 + }, + { + "epoch": 0.03, + "global_step": 4868, + "learning_rate": 0.00048051752921535895, + "loss": 1.685, + "loss_base2": 2.4309, + "loss_pixel": 0.1838, + "loss_text": 1.5011, + "ppl": 5.3925, + "step": 4868 + }, + { + "epoch": 0.03, + "global_step": 4869, + "learning_rate": 0.0004805133555926544, + "loss": 1.725, + "loss_base2": 2.4886, + "loss_pixel": 0.1835, + "loss_text": 1.5415, + "ppl": 5.6125, + "step": 4869 + }, + { + "epoch": 0.03, + "global_step": 4870, + "learning_rate": 0.0004805091819699499, + "loss": 1.7002, + "loss_base2": 2.4529, + "loss_pixel": 0.1839, + "loss_text": 1.5163, + "ppl": 5.475, + "step": 4870 + }, + { + "epoch": 0.03, + "global_step": 4871, + "learning_rate": 0.0004805050083472454, + "loss": 1.7159, + "loss_base2": 2.4755, + "loss_pixel": 0.1847, + "loss_text": 1.5312, + "ppl": 5.5617, + "step": 4871 + }, + { + "epoch": 0.03, + "global_step": 4872, + "learning_rate": 0.0004805008347245409, + "loss": 1.7247, + "loss_base2": 2.4882, + "loss_pixel": 0.185, + "loss_text": 1.5397, + "ppl": 5.6108, + "step": 4872 + }, + { + "epoch": 0.03, + "global_step": 4873, + "learning_rate": 0.00048049666110183643, + "loss": 1.7135, + "loss_base2": 2.4721, + "loss_pixel": 0.183, + "loss_text": 1.5305, + "ppl": 5.5483, + "step": 4873 + }, + { + "epoch": 0.03, + "global_step": 4874, + "learning_rate": 0.0004804924874791319, + "loss": 1.7142, + "loss_base2": 2.4731, + "loss_pixel": 0.1837, + "loss_text": 1.5305, + "ppl": 5.5522, + "step": 4874 + }, + { + "epoch": 0.03, + "global_step": 4875, + "learning_rate": 0.0004804883138564274, + "loss": 1.7279, + "loss_base2": 2.4928, + "loss_pixel": 0.1844, + "loss_text": 1.5435, + "ppl": 5.6288, + "step": 4875 + }, + { + "epoch": 0.03, + "global_step": 4876, + "learning_rate": 0.0004804841402337229, + "loss": 1.7355, + "loss_base2": 2.5038, + "loss_pixel": 0.1834, + "loss_text": 1.5521, + "ppl": 5.6718, + "step": 4876 + }, + { + "epoch": 0.03, + "global_step": 4877, + "learning_rate": 0.0004804799666110184, + "loss": 1.7344, + "loss_base2": 2.5022, + "loss_pixel": 0.1849, + "loss_text": 1.5495, + "ppl": 5.6655, + "step": 4877 + }, + { + "epoch": 0.03, + "global_step": 4878, + "learning_rate": 0.00048047579298831386, + "loss": 1.7021, + "loss_base2": 2.4556, + "loss_pixel": 0.184, + "loss_text": 1.5181, + "ppl": 5.4855, + "step": 4878 + }, + { + "epoch": 0.03, + "global_step": 4879, + "learning_rate": 0.00048047161936560937, + "loss": 1.7262, + "loss_base2": 2.4904, + "loss_pixel": 0.1843, + "loss_text": 1.5419, + "ppl": 5.6193, + "step": 4879 + }, + { + "epoch": 0.03, + "global_step": 4880, + "learning_rate": 0.0004804674457429049, + "loss": 1.704, + "loss_base2": 2.4584, + "loss_pixel": 0.1841, + "loss_text": 1.5199, + "ppl": 5.4959, + "step": 4880 + }, + { + "epoch": 0.03, + "global_step": 4881, + "learning_rate": 0.0004804632721202004, + "loss": 1.7161, + "loss_base2": 2.4758, + "loss_pixel": 0.1832, + "loss_text": 1.533, + "ppl": 5.5628, + "step": 4881 + }, + { + "epoch": 0.03, + "global_step": 4882, + "learning_rate": 0.0004804590984974959, + "loss": 1.7118, + "loss_base2": 2.4696, + "loss_pixel": 0.1829, + "loss_text": 1.5289, + "ppl": 5.5389, + "step": 4882 + }, + { + "epoch": 0.03, + "global_step": 4883, + "learning_rate": 0.0004804549248747913, + "loss": 1.7288, + "loss_base2": 2.4941, + "loss_pixel": 0.183, + "loss_text": 1.5458, + "ppl": 5.6339, + "step": 4883 + }, + { + "epoch": 0.03, + "global_step": 4884, + "learning_rate": 0.0004804507512520868, + "loss": 1.7292, + "loss_base2": 2.4947, + "loss_pixel": 0.1826, + "loss_text": 1.5465, + "ppl": 5.6361, + "step": 4884 + }, + { + "epoch": 0.03, + "global_step": 4885, + "learning_rate": 0.0004804465776293823, + "loss": 1.7255, + "loss_base2": 2.4894, + "loss_pixel": 0.185, + "loss_text": 1.5405, + "ppl": 5.6153, + "step": 4885 + }, + { + "epoch": 0.03, + "global_step": 4886, + "learning_rate": 0.0004804424040066778, + "loss": 1.7185, + "loss_base2": 2.4793, + "loss_pixel": 0.1826, + "loss_text": 1.5359, + "ppl": 5.5762, + "step": 4886 + }, + { + "epoch": 0.03, + "global_step": 4887, + "learning_rate": 0.00048043823038397326, + "loss": 1.7112, + "loss_base2": 2.4687, + "loss_pixel": 0.1823, + "loss_text": 1.5289, + "ppl": 5.5356, + "step": 4887 + }, + { + "epoch": 0.03, + "global_step": 4888, + "learning_rate": 0.00048043405676126877, + "loss": 1.7363, + "loss_base2": 2.505, + "loss_pixel": 0.1825, + "loss_text": 1.5538, + "ppl": 5.6763, + "step": 4888 + }, + { + "epoch": 0.03, + "global_step": 4889, + "learning_rate": 0.0004804298831385643, + "loss": 1.7176, + "loss_base2": 2.478, + "loss_pixel": 0.1835, + "loss_text": 1.5341, + "ppl": 5.5711, + "step": 4889 + }, + { + "epoch": 0.03, + "global_step": 4890, + "learning_rate": 0.0004804257095158598, + "loss": 1.7363, + "loss_base2": 2.505, + "loss_pixel": 0.1847, + "loss_text": 1.5517, + "ppl": 5.6763, + "step": 4890 + }, + { + "epoch": 0.03, + "global_step": 4891, + "learning_rate": 0.0004804215358931553, + "loss": 1.6972, + "loss_base2": 2.4485, + "loss_pixel": 0.1835, + "loss_text": 1.5137, + "ppl": 5.4586, + "step": 4891 + }, + { + "epoch": 0.03, + "global_step": 4892, + "learning_rate": 0.00048041736227045074, + "loss": 1.6948, + "loss_base2": 2.4451, + "loss_pixel": 0.1859, + "loss_text": 1.509, + "ppl": 5.4456, + "step": 4892 + }, + { + "epoch": 0.03, + "global_step": 4893, + "learning_rate": 0.00048041318864774625, + "loss": 1.7304, + "loss_base2": 2.4964, + "loss_pixel": 0.1887, + "loss_text": 1.5417, + "ppl": 5.6429, + "step": 4893 + }, + { + "epoch": 0.03, + "global_step": 4894, + "learning_rate": 0.00048040901502504176, + "loss": 1.728, + "loss_base2": 2.493, + "loss_pixel": 0.1903, + "loss_text": 1.5378, + "ppl": 5.6294, + "step": 4894 + }, + { + "epoch": 0.03, + "global_step": 4895, + "learning_rate": 0.00048040484140233727, + "loss": 1.7406, + "loss_base2": 2.5112, + "loss_pixel": 0.1906, + "loss_text": 1.55, + "ppl": 5.7008, + "step": 4895 + }, + { + "epoch": 0.03, + "global_step": 4896, + "learning_rate": 0.0004804006677796327, + "loss": 1.7196, + "loss_base2": 2.4809, + "loss_pixel": 0.1915, + "loss_text": 1.5282, + "ppl": 5.5823, + "step": 4896 + }, + { + "epoch": 0.03, + "global_step": 4897, + "learning_rate": 0.0004803964941569282, + "loss": 1.7311, + "loss_base2": 2.4974, + "loss_pixel": 0.1921, + "loss_text": 1.539, + "ppl": 5.6469, + "step": 4897 + }, + { + "epoch": 0.03, + "global_step": 4898, + "learning_rate": 0.00048039232053422373, + "loss": 1.7318, + "loss_base2": 2.4985, + "loss_pixel": 0.1909, + "loss_text": 1.5409, + "ppl": 5.6508, + "step": 4898 + }, + { + "epoch": 0.03, + "global_step": 4899, + "learning_rate": 0.00048038814691151924, + "loss": 1.5155, + "loss_base2": 2.1864, + "loss_pixel": 0.189, + "loss_text": 1.3266, + "ppl": 4.5517, + "step": 4899 + }, + { + "epoch": 0.03, + "global_step": 4900, + "learning_rate": 0.00048038397328881475, + "loss": 1.4987, + "loss_base2": 2.1622, + "loss_pixel": 0.1885, + "loss_text": 1.3102, + "ppl": 4.4759, + "step": 4900 + }, + { + "epoch": 0.03, + "global_step": 4901, + "learning_rate": 0.00048037979966611015, + "loss": 1.526, + "loss_base2": 2.2016, + "loss_pixel": 0.1879, + "loss_text": 1.3381, + "ppl": 4.5997, + "step": 4901 + }, + { + "epoch": 0.03, + "global_step": 4902, + "learning_rate": 0.00048037562604340565, + "loss": 1.5084, + "loss_base2": 2.1762, + "loss_pixel": 0.1885, + "loss_text": 1.3199, + "ppl": 4.5195, + "step": 4902 + }, + { + "epoch": 0.03, + "global_step": 4903, + "learning_rate": 0.00048037145242070116, + "loss": 1.5223, + "loss_base2": 2.1962, + "loss_pixel": 0.1862, + "loss_text": 1.3362, + "ppl": 4.5828, + "step": 4903 + }, + { + "epoch": 0.03, + "global_step": 4904, + "learning_rate": 0.00048036727879799667, + "loss": 1.5082, + "loss_base2": 2.1759, + "loss_pixel": 0.1873, + "loss_text": 1.3209, + "ppl": 4.5186, + "step": 4904 + }, + { + "epoch": 0.03, + "global_step": 4905, + "learning_rate": 0.0004803631051752921, + "loss": 1.5122, + "loss_base2": 2.1816, + "loss_pixel": 0.1873, + "loss_text": 1.3249, + "ppl": 4.5367, + "step": 4905 + }, + { + "epoch": 0.03, + "global_step": 4906, + "learning_rate": 0.00048035893155258763, + "loss": 1.5082, + "loss_base2": 2.1759, + "loss_pixel": 0.185, + "loss_text": 1.3232, + "ppl": 4.5186, + "step": 4906 + }, + { + "epoch": 0.03, + "global_step": 4907, + "learning_rate": 0.00048035475792988314, + "loss": 1.5095, + "loss_base2": 2.1777, + "loss_pixel": 0.1866, + "loss_text": 1.3229, + "ppl": 4.5245, + "step": 4907 + }, + { + "epoch": 0.03, + "global_step": 4908, + "learning_rate": 0.00048035058430717864, + "loss": 1.5282, + "loss_base2": 2.2047, + "loss_pixel": 0.1851, + "loss_text": 1.3431, + "ppl": 4.6099, + "step": 4908 + }, + { + "epoch": 0.03, + "global_step": 4909, + "learning_rate": 0.00048034641068447415, + "loss": 1.5154, + "loss_base2": 2.1863, + "loss_pixel": 0.1859, + "loss_text": 1.3295, + "ppl": 4.5512, + "step": 4909 + }, + { + "epoch": 0.03, + "global_step": 4910, + "learning_rate": 0.0004803422370617696, + "loss": 1.513, + "loss_base2": 2.1828, + "loss_pixel": 0.1861, + "loss_text": 1.3269, + "ppl": 4.5403, + "step": 4910 + }, + { + "epoch": 0.03, + "global_step": 4911, + "learning_rate": 0.0004803380634390651, + "loss": 1.5128, + "loss_base2": 2.1825, + "loss_pixel": 0.186, + "loss_text": 1.3268, + "ppl": 4.5394, + "step": 4911 + }, + { + "epoch": 0.03, + "global_step": 4912, + "learning_rate": 0.0004803338898163606, + "loss": 1.5284, + "loss_base2": 2.205, + "loss_pixel": 0.186, + "loss_text": 1.3424, + "ppl": 4.6108, + "step": 4912 + }, + { + "epoch": 0.03, + "global_step": 4913, + "learning_rate": 0.0004803297161936561, + "loss": 1.4922, + "loss_base2": 2.1528, + "loss_pixel": 0.184, + "loss_text": 1.3082, + "ppl": 4.4469, + "step": 4913 + }, + { + "epoch": 0.03, + "global_step": 4914, + "learning_rate": 0.00048032554257095163, + "loss": 1.6598, + "loss_base2": 2.3946, + "loss_pixel": 0.1852, + "loss_text": 1.4746, + "ppl": 5.2583, + "step": 4914 + }, + { + "epoch": 0.03, + "global_step": 4915, + "learning_rate": 0.0004803213689482471, + "loss": 1.7442, + "loss_base2": 2.5163, + "loss_pixel": 0.1847, + "loss_text": 1.5595, + "ppl": 5.7213, + "step": 4915 + }, + { + "epoch": 0.03, + "global_step": 4916, + "learning_rate": 0.0004803171953255426, + "loss": 1.7321, + "loss_base2": 2.4989, + "loss_pixel": 0.1836, + "loss_text": 1.5485, + "ppl": 5.6525, + "step": 4916 + }, + { + "epoch": 0.03, + "global_step": 4917, + "learning_rate": 0.0004803130217028381, + "loss": 1.7398, + "loss_base2": 2.51, + "loss_pixel": 0.1859, + "loss_text": 1.5539, + "ppl": 5.6962, + "step": 4917 + }, + { + "epoch": 0.03, + "global_step": 4918, + "learning_rate": 0.0004803088480801336, + "loss": 1.7433, + "loss_base2": 2.5151, + "loss_pixel": 0.1845, + "loss_text": 1.5588, + "ppl": 5.7162, + "step": 4918 + }, + { + "epoch": 0.03, + "global_step": 4919, + "learning_rate": 0.00048030467445742906, + "loss": 1.7326, + "loss_base2": 2.4996, + "loss_pixel": 0.1837, + "loss_text": 1.5489, + "ppl": 5.6553, + "step": 4919 + }, + { + "epoch": 0.03, + "global_step": 4920, + "learning_rate": 0.0004803005008347245, + "loss": 1.7438, + "loss_base2": 2.5158, + "loss_pixel": 0.1837, + "loss_text": 1.5601, + "ppl": 5.719, + "step": 4920 + }, + { + "epoch": 0.03, + "global_step": 4921, + "learning_rate": 0.00048029632721202, + "loss": 1.7375, + "loss_base2": 2.5067, + "loss_pixel": 0.1843, + "loss_text": 1.5531, + "ppl": 5.6831, + "step": 4921 + }, + { + "epoch": 0.03, + "global_step": 4922, + "learning_rate": 0.00048029215358931553, + "loss": 1.7365, + "loss_base2": 2.5052, + "loss_pixel": 0.1876, + "loss_text": 1.5488, + "ppl": 5.6774, + "step": 4922 + }, + { + "epoch": 0.03, + "global_step": 4923, + "learning_rate": 0.00048028797996661104, + "loss": 1.7382, + "loss_base2": 2.5077, + "loss_pixel": 0.1923, + "loss_text": 1.5459, + "ppl": 5.6871, + "step": 4923 + }, + { + "epoch": 0.03, + "global_step": 4924, + "learning_rate": 0.0004802838063439065, + "loss": 1.7329, + "loss_base2": 2.5, + "loss_pixel": 0.1929, + "loss_text": 1.5399, + "ppl": 5.657, + "step": 4924 + }, + { + "epoch": 0.03, + "global_step": 4925, + "learning_rate": 0.000480279632721202, + "loss": 1.7474, + "loss_base2": 2.521, + "loss_pixel": 0.1925, + "loss_text": 1.5549, + "ppl": 5.7397, + "step": 4925 + }, + { + "epoch": 0.03, + "global_step": 4926, + "learning_rate": 0.0004802754590984975, + "loss": 1.744, + "loss_base2": 2.5161, + "loss_pixel": 0.1929, + "loss_text": 1.5511, + "ppl": 5.7202, + "step": 4926 + }, + { + "epoch": 0.03, + "global_step": 4927, + "learning_rate": 0.000480271285475793, + "loss": 1.7519, + "loss_base2": 2.5275, + "loss_pixel": 0.1922, + "loss_text": 1.5597, + "ppl": 5.7655, + "step": 4927 + }, + { + "epoch": 0.03, + "global_step": 4928, + "learning_rate": 0.00048026711185308847, + "loss": 1.7506, + "loss_base2": 2.5256, + "loss_pixel": 0.1927, + "loss_text": 1.5579, + "ppl": 5.7581, + "step": 4928 + }, + { + "epoch": 0.03, + "global_step": 4929, + "learning_rate": 0.00048026293823038397, + "loss": 1.7316, + "loss_base2": 2.4982, + "loss_pixel": 0.1937, + "loss_text": 1.5379, + "ppl": 5.6497, + "step": 4929 + }, + { + "epoch": 0.03, + "global_step": 4930, + "learning_rate": 0.0004802587646076795, + "loss": 1.7331, + "loss_base2": 2.5003, + "loss_pixel": 0.1887, + "loss_text": 1.5444, + "ppl": 5.6582, + "step": 4930 + }, + { + "epoch": 0.03, + "global_step": 4931, + "learning_rate": 0.000480254590984975, + "loss": 1.7376, + "loss_base2": 2.5068, + "loss_pixel": 0.1857, + "loss_text": 1.5519, + "ppl": 5.6837, + "step": 4931 + }, + { + "epoch": 0.03, + "global_step": 4932, + "learning_rate": 0.0004802504173622705, + "loss": 1.7087, + "loss_base2": 2.4651, + "loss_pixel": 0.1861, + "loss_text": 1.5226, + "ppl": 5.5218, + "step": 4932 + }, + { + "epoch": 0.03, + "global_step": 4933, + "learning_rate": 0.00048024624373956595, + "loss": 1.7202, + "loss_base2": 2.4817, + "loss_pixel": 0.1862, + "loss_text": 1.534, + "ppl": 5.5856, + "step": 4933 + }, + { + "epoch": 0.03, + "global_step": 4934, + "learning_rate": 0.00048024207011686146, + "loss": 1.731, + "loss_base2": 2.4973, + "loss_pixel": 0.1888, + "loss_text": 1.5422, + "ppl": 5.6463, + "step": 4934 + }, + { + "epoch": 0.03, + "global_step": 4935, + "learning_rate": 0.00048023789649415696, + "loss": 1.7311, + "loss_base2": 2.4974, + "loss_pixel": 0.1868, + "loss_text": 1.5444, + "ppl": 5.6469, + "step": 4935 + }, + { + "epoch": 0.03, + "global_step": 4936, + "learning_rate": 0.00048023372287145247, + "loss": 1.556, + "loss_base2": 2.2448, + "loss_pixel": 0.1876, + "loss_text": 1.3685, + "ppl": 4.7398, + "step": 4936 + }, + { + "epoch": 0.03, + "global_step": 4937, + "learning_rate": 0.0004802295492487479, + "loss": 1.5079, + "loss_base2": 2.1754, + "loss_pixel": 0.1876, + "loss_text": 1.3203, + "ppl": 4.5172, + "step": 4937 + }, + { + "epoch": 0.03, + "global_step": 4938, + "learning_rate": 0.00048022537562604343, + "loss": 1.5093, + "loss_base2": 2.1775, + "loss_pixel": 0.1864, + "loss_text": 1.3229, + "ppl": 4.5236, + "step": 4938 + }, + { + "epoch": 0.03, + "global_step": 4939, + "learning_rate": 0.0004802212020033389, + "loss": 1.5149, + "loss_base2": 2.1855, + "loss_pixel": 0.1855, + "loss_text": 1.3294, + "ppl": 4.549, + "step": 4939 + }, + { + "epoch": 0.03, + "global_step": 4940, + "learning_rate": 0.0004802170283806344, + "loss": 1.4827, + "loss_base2": 2.1391, + "loss_pixel": 0.1858, + "loss_text": 1.2969, + "ppl": 4.4048, + "step": 4940 + }, + { + "epoch": 0.03, + "global_step": 4941, + "learning_rate": 0.0004802128547579299, + "loss": 1.501, + "loss_base2": 2.1655, + "loss_pixel": 0.1859, + "loss_text": 1.3151, + "ppl": 4.4862, + "step": 4941 + }, + { + "epoch": 0.03, + "global_step": 4942, + "learning_rate": 0.00048020868113522535, + "loss": 1.4981, + "loss_base2": 2.1613, + "loss_pixel": 0.1852, + "loss_text": 1.3129, + "ppl": 4.4732, + "step": 4942 + }, + { + "epoch": 0.03, + "global_step": 4943, + "learning_rate": 0.00048020450751252086, + "loss": 1.487, + "loss_base2": 2.1453, + "loss_pixel": 0.1857, + "loss_text": 1.3013, + "ppl": 4.4238, + "step": 4943 + }, + { + "epoch": 0.03, + "global_step": 4944, + "learning_rate": 0.00048020033388981637, + "loss": 1.4893, + "loss_base2": 2.1486, + "loss_pixel": 0.1852, + "loss_text": 1.3041, + "ppl": 4.434, + "step": 4944 + }, + { + "epoch": 0.03, + "global_step": 4945, + "learning_rate": 0.0004801961602671119, + "loss": 1.5157, + "loss_base2": 2.1867, + "loss_pixel": 0.1845, + "loss_text": 1.3311, + "ppl": 4.5526, + "step": 4945 + }, + { + "epoch": 0.03, + "global_step": 4946, + "learning_rate": 0.0004801919866444073, + "loss": 1.4897, + "loss_base2": 2.1492, + "loss_pixel": 0.1848, + "loss_text": 1.3049, + "ppl": 4.4358, + "step": 4946 + }, + { + "epoch": 0.03, + "global_step": 4947, + "learning_rate": 0.00048018781302170283, + "loss": 1.4932, + "loss_base2": 2.1542, + "loss_pixel": 0.1856, + "loss_text": 1.3076, + "ppl": 4.4513, + "step": 4947 + }, + { + "epoch": 0.03, + "global_step": 4948, + "learning_rate": 0.00048018363939899834, + "loss": 1.4811, + "loss_base2": 2.1368, + "loss_pixel": 0.185, + "loss_text": 1.2961, + "ppl": 4.3978, + "step": 4948 + }, + { + "epoch": 0.03, + "global_step": 4949, + "learning_rate": 0.00048017946577629385, + "loss": 1.5067, + "loss_base2": 2.1737, + "loss_pixel": 0.184, + "loss_text": 1.3227, + "ppl": 4.5118, + "step": 4949 + }, + { + "epoch": 0.03, + "global_step": 4950, + "learning_rate": 0.00048017529215358936, + "loss": 1.479, + "loss_base2": 2.1337, + "loss_pixel": 0.1836, + "loss_text": 1.2954, + "ppl": 4.3886, + "step": 4950 + }, + { + "epoch": 0.03, + "global_step": 4951, + "learning_rate": 0.0004801711185308848, + "loss": 1.5017, + "loss_base2": 2.1665, + "loss_pixel": 0.1844, + "loss_text": 1.3173, + "ppl": 4.4893, + "step": 4951 + }, + { + "epoch": 0.03, + "global_step": 4952, + "learning_rate": 0.0004801669449081803, + "loss": 1.735, + "loss_base2": 2.5031, + "loss_pixel": 0.1836, + "loss_text": 1.5514, + "ppl": 5.6689, + "step": 4952 + }, + { + "epoch": 0.03, + "global_step": 4953, + "learning_rate": 0.0004801627712854758, + "loss": 1.7392, + "loss_base2": 2.5091, + "loss_pixel": 0.1865, + "loss_text": 1.5527, + "ppl": 5.6928, + "step": 4953 + }, + { + "epoch": 0.03, + "global_step": 4954, + "learning_rate": 0.00048015859766277133, + "loss": 1.7435, + "loss_base2": 2.5153, + "loss_pixel": 0.1838, + "loss_text": 1.5597, + "ppl": 5.7173, + "step": 4954 + }, + { + "epoch": 0.03, + "global_step": 4955, + "learning_rate": 0.0004801544240400668, + "loss": 1.7114, + "loss_base2": 2.469, + "loss_pixel": 0.1829, + "loss_text": 1.5285, + "ppl": 5.5367, + "step": 4955 + }, + { + "epoch": 0.03, + "global_step": 4956, + "learning_rate": 0.0004801502504173623, + "loss": 1.7292, + "loss_base2": 2.4947, + "loss_pixel": 0.1839, + "loss_text": 1.5453, + "ppl": 5.6361, + "step": 4956 + }, + { + "epoch": 0.03, + "global_step": 4957, + "learning_rate": 0.0004801460767946578, + "loss": 1.7311, + "loss_base2": 2.4974, + "loss_pixel": 0.1828, + "loss_text": 1.5483, + "ppl": 5.6469, + "step": 4957 + }, + { + "epoch": 0.03, + "global_step": 4958, + "learning_rate": 0.00048014190317195325, + "loss": 1.7329, + "loss_base2": 2.5, + "loss_pixel": 0.183, + "loss_text": 1.5499, + "ppl": 5.657, + "step": 4958 + }, + { + "epoch": 0.03, + "global_step": 4959, + "learning_rate": 0.00048013772954924876, + "loss": 1.7376, + "loss_base2": 2.5068, + "loss_pixel": 0.1824, + "loss_text": 1.5552, + "ppl": 5.6837, + "step": 4959 + }, + { + "epoch": 0.03, + "global_step": 4960, + "learning_rate": 0.0004801335559265442, + "loss": 1.7424, + "loss_base2": 2.5138, + "loss_pixel": 0.1833, + "loss_text": 1.5591, + "ppl": 5.711, + "step": 4960 + }, + { + "epoch": 0.03, + "global_step": 4961, + "learning_rate": 0.0004801293823038397, + "loss": 1.7102, + "loss_base2": 2.4673, + "loss_pixel": 0.1852, + "loss_text": 1.5249, + "ppl": 5.5301, + "step": 4961 + }, + { + "epoch": 0.03, + "global_step": 4962, + "learning_rate": 0.0004801252086811352, + "loss": 1.7332, + "loss_base2": 2.5005, + "loss_pixel": 0.1828, + "loss_text": 1.5503, + "ppl": 5.6587, + "step": 4962 + }, + { + "epoch": 0.03, + "global_step": 4963, + "learning_rate": 0.00048012103505843073, + "loss": 1.7313, + "loss_base2": 2.4977, + "loss_pixel": 0.1825, + "loss_text": 1.5489, + "ppl": 5.648, + "step": 4963 + }, + { + "epoch": 0.03, + "global_step": 4964, + "learning_rate": 0.0004801168614357262, + "loss": 1.6979, + "loss_base2": 2.4496, + "loss_pixel": 0.1829, + "loss_text": 1.515, + "ppl": 5.4625, + "step": 4964 + }, + { + "epoch": 0.03, + "global_step": 4965, + "learning_rate": 0.0004801126878130217, + "loss": 1.7162, + "loss_base2": 2.476, + "loss_pixel": 0.183, + "loss_text": 1.5331, + "ppl": 5.5633, + "step": 4965 + }, + { + "epoch": 0.03, + "global_step": 4966, + "learning_rate": 0.0004801085141903172, + "loss": 1.7243, + "loss_base2": 2.4876, + "loss_pixel": 0.1838, + "loss_text": 1.5405, + "ppl": 5.6086, + "step": 4966 + }, + { + "epoch": 0.03, + "global_step": 4967, + "learning_rate": 0.0004801043405676127, + "loss": 1.7233, + "loss_base2": 2.4862, + "loss_pixel": 0.1832, + "loss_text": 1.5401, + "ppl": 5.603, + "step": 4967 + }, + { + "epoch": 0.03, + "global_step": 4968, + "learning_rate": 0.0004801001669449082, + "loss": 1.7226, + "loss_base2": 2.4852, + "loss_pixel": 0.1814, + "loss_text": 1.5413, + "ppl": 5.5991, + "step": 4968 + }, + { + "epoch": 0.03, + "global_step": 4969, + "learning_rate": 0.00048009599332220367, + "loss": 1.731, + "loss_base2": 2.4973, + "loss_pixel": 0.1827, + "loss_text": 1.5483, + "ppl": 5.6463, + "step": 4969 + }, + { + "epoch": 0.03, + "global_step": 4970, + "learning_rate": 0.0004800918196994992, + "loss": 1.7279, + "loss_base2": 2.4928, + "loss_pixel": 0.1831, + "loss_text": 1.5448, + "ppl": 5.6288, + "step": 4970 + }, + { + "epoch": 0.03, + "global_step": 4971, + "learning_rate": 0.0004800876460767947, + "loss": 1.7216, + "loss_base2": 2.4837, + "loss_pixel": 0.1833, + "loss_text": 1.5383, + "ppl": 5.5935, + "step": 4971 + }, + { + "epoch": 0.03, + "global_step": 4972, + "learning_rate": 0.0004800834724540902, + "loss": 1.719, + "loss_base2": 2.48, + "loss_pixel": 0.1828, + "loss_text": 1.5361, + "ppl": 5.5789, + "step": 4972 + }, + { + "epoch": 0.03, + "global_step": 4973, + "learning_rate": 0.0004800792988313857, + "loss": 1.7267, + "loss_base2": 2.4911, + "loss_pixel": 0.1831, + "loss_text": 1.5436, + "ppl": 5.6221, + "step": 4973 + }, + { + "epoch": 0.03, + "global_step": 4974, + "learning_rate": 0.00048007512520868115, + "loss": 1.735, + "loss_base2": 2.5031, + "loss_pixel": 0.183, + "loss_text": 1.5519, + "ppl": 5.6689, + "step": 4974 + }, + { + "epoch": 0.03, + "global_step": 4975, + "learning_rate": 0.00048007095158597666, + "loss": 1.7186, + "loss_base2": 2.4794, + "loss_pixel": 0.1817, + "loss_text": 1.5368, + "ppl": 5.5767, + "step": 4975 + }, + { + "epoch": 0.03, + "global_step": 4976, + "learning_rate": 0.0004800667779632721, + "loss": 1.6817, + "loss_base2": 2.4262, + "loss_pixel": 0.1829, + "loss_text": 1.4987, + "ppl": 5.3747, + "step": 4976 + }, + { + "epoch": 0.03, + "global_step": 4977, + "learning_rate": 0.0004800626043405676, + "loss": 1.5222, + "loss_base2": 2.1961, + "loss_pixel": 0.183, + "loss_text": 1.3392, + "ppl": 4.5823, + "step": 4977 + }, + { + "epoch": 0.03, + "global_step": 4978, + "learning_rate": 0.00048005843071786307, + "loss": 1.4943, + "loss_base2": 2.1558, + "loss_pixel": 0.1843, + "loss_text": 1.3101, + "ppl": 4.4562, + "step": 4978 + }, + { + "epoch": 0.03, + "global_step": 4979, + "learning_rate": 0.0004800542570951586, + "loss": 1.4925, + "loss_base2": 2.1532, + "loss_pixel": 0.1831, + "loss_text": 1.3094, + "ppl": 4.4482, + "step": 4979 + }, + { + "epoch": 0.03, + "global_step": 4980, + "learning_rate": 0.0004800500834724541, + "loss": 1.4883, + "loss_base2": 2.1472, + "loss_pixel": 0.1827, + "loss_text": 1.3056, + "ppl": 4.4296, + "step": 4980 + }, + { + "epoch": 0.03, + "global_step": 4981, + "learning_rate": 0.0004800459098497496, + "loss": 1.4788, + "loss_base2": 2.1335, + "loss_pixel": 0.1846, + "loss_text": 1.2942, + "ppl": 4.3877, + "step": 4981 + }, + { + "epoch": 0.03, + "global_step": 4982, + "learning_rate": 0.0004800417362270451, + "loss": 1.4889, + "loss_base2": 2.148, + "loss_pixel": 0.1831, + "loss_text": 1.3058, + "ppl": 4.4322, + "step": 4982 + }, + { + "epoch": 0.03, + "global_step": 4983, + "learning_rate": 0.00048003756260434055, + "loss": 1.4766, + "loss_base2": 2.1303, + "loss_pixel": 0.182, + "loss_text": 1.2946, + "ppl": 4.378, + "step": 4983 + }, + { + "epoch": 0.03, + "global_step": 4984, + "learning_rate": 0.00048003338898163606, + "loss": 1.4921, + "loss_base2": 2.1526, + "loss_pixel": 0.1834, + "loss_text": 1.3086, + "ppl": 4.4464, + "step": 4984 + }, + { + "epoch": 0.03, + "global_step": 4985, + "learning_rate": 0.00048002921535893157, + "loss": 1.4994, + "loss_base2": 2.1632, + "loss_pixel": 0.1829, + "loss_text": 1.3165, + "ppl": 4.479, + "step": 4985 + }, + { + "epoch": 0.03, + "global_step": 4986, + "learning_rate": 0.0004800250417362271, + "loss": 1.4763, + "loss_base2": 2.1299, + "loss_pixel": 0.1812, + "loss_text": 1.2951, + "ppl": 4.3767, + "step": 4986 + }, + { + "epoch": 0.03, + "global_step": 4987, + "learning_rate": 0.00048002086811352253, + "loss": 1.4939, + "loss_base2": 2.1552, + "loss_pixel": 0.1827, + "loss_text": 1.3112, + "ppl": 4.4544, + "step": 4987 + }, + { + "epoch": 0.03, + "global_step": 4988, + "learning_rate": 0.00048001669449081804, + "loss": 1.4849, + "loss_base2": 2.1423, + "loss_pixel": 0.1831, + "loss_text": 1.3018, + "ppl": 4.4145, + "step": 4988 + }, + { + "epoch": 0.03, + "global_step": 4989, + "learning_rate": 0.00048001252086811354, + "loss": 1.4867, + "loss_base2": 2.1449, + "loss_pixel": 0.1821, + "loss_text": 1.3046, + "ppl": 4.4225, + "step": 4989 + }, + { + "epoch": 0.03, + "global_step": 4990, + "learning_rate": 0.00048000834724540905, + "loss": 1.4971, + "loss_base2": 2.1599, + "loss_pixel": 0.1833, + "loss_text": 1.3139, + "ppl": 4.4687, + "step": 4990 + }, + { + "epoch": 0.03, + "global_step": 4991, + "learning_rate": 0.00048000417362270456, + "loss": 1.4979, + "loss_base2": 2.161, + "loss_pixel": 0.1813, + "loss_text": 1.3166, + "ppl": 4.4723, + "step": 4991 + }, + { + "epoch": 0.03, + "global_step": 4992, + "learning_rate": 0.00048, + "loss": 1.5032, + "loss_base2": 2.1687, + "loss_pixel": 0.1825, + "loss_text": 1.3207, + "ppl": 4.4961, + "step": 4992 + }, + { + "epoch": 0.03, + "global_step": 4993, + "learning_rate": 0.0004799958263772955, + "loss": 1.4874, + "loss_base2": 2.1459, + "loss_pixel": 0.183, + "loss_text": 1.3044, + "ppl": 4.4256, + "step": 4993 + }, + { + "epoch": 0.03, + "global_step": 4994, + "learning_rate": 0.000479991652754591, + "loss": 1.4836, + "loss_base2": 2.1404, + "loss_pixel": 0.1833, + "loss_text": 1.3003, + "ppl": 4.4088, + "step": 4994 + }, + { + "epoch": 0.03, + "global_step": 4995, + "learning_rate": 0.0004799874791318865, + "loss": 1.4831, + "loss_base2": 2.1397, + "loss_pixel": 0.1813, + "loss_text": 1.3018, + "ppl": 4.4066, + "step": 4995 + }, + { + "epoch": 0.03, + "global_step": 4996, + "learning_rate": 0.00047998330550918193, + "loss": 1.4919, + "loss_base2": 2.1524, + "loss_pixel": 0.1828, + "loss_text": 1.3091, + "ppl": 4.4455, + "step": 4996 + }, + { + "epoch": 0.03, + "global_step": 4997, + "learning_rate": 0.00047997913188647744, + "loss": 1.4727, + "loss_base2": 2.1247, + "loss_pixel": 0.1814, + "loss_text": 1.2913, + "ppl": 4.361, + "step": 4997 + }, + { + "epoch": 0.03, + "global_step": 4998, + "learning_rate": 0.00047997495826377295, + "loss": 1.4809, + "loss_base2": 2.1365, + "loss_pixel": 0.1819, + "loss_text": 1.299, + "ppl": 4.3969, + "step": 4998 + }, + { + "epoch": 0.03, + "global_step": 4999, + "learning_rate": 0.00047997078464106845, + "loss": 1.4799, + "loss_base2": 2.135, + "loss_pixel": 0.1825, + "loss_text": 1.2974, + "ppl": 4.3925, + "step": 4999 + }, + { + "epoch": 0.03, + "global_step": 5000, + "learning_rate": 0.00047996661101836396, + "loss": 1.4847, + "loss_base2": 2.142, + "loss_pixel": 0.1825, + "loss_text": 1.3022, + "ppl": 4.4136, + "step": 5000 + }, + { + "epoch": 0.03, + "global_step": 5001, + "learning_rate": 0.0004799624373956594, + "loss": 1.7647, + "loss_base2": 2.5459, + "loss_pixel": 0.1827, + "loss_text": 1.582, + "ppl": 5.8398, + "step": 5001 + }, + { + "epoch": 0.03, + "global_step": 5002, + "learning_rate": 0.0004799582637729549, + "loss": 1.7469, + "loss_base2": 2.5202, + "loss_pixel": 0.1824, + "loss_text": 1.5644, + "ppl": 5.7368, + "step": 5002 + }, + { + "epoch": 0.03, + "global_step": 5003, + "learning_rate": 0.00047995409015025043, + "loss": 1.7516, + "loss_base2": 2.527, + "loss_pixel": 0.1826, + "loss_text": 1.5691, + "ppl": 5.7638, + "step": 5003 + }, + { + "epoch": 0.03, + "global_step": 5004, + "learning_rate": 0.00047994991652754594, + "loss": 1.7252, + "loss_base2": 2.4889, + "loss_pixel": 0.1825, + "loss_text": 1.5427, + "ppl": 5.6136, + "step": 5004 + }, + { + "epoch": 0.03, + "global_step": 5005, + "learning_rate": 0.0004799457429048414, + "loss": 1.7408, + "loss_base2": 2.5114, + "loss_pixel": 0.1811, + "loss_text": 1.5596, + "ppl": 5.7019, + "step": 5005 + }, + { + "epoch": 0.03, + "global_step": 5006, + "learning_rate": 0.0004799415692821369, + "loss": 1.7319, + "loss_base2": 2.4986, + "loss_pixel": 0.1822, + "loss_text": 1.5497, + "ppl": 5.6514, + "step": 5006 + }, + { + "epoch": 0.03, + "global_step": 5007, + "learning_rate": 0.0004799373956594324, + "loss": 1.7301, + "loss_base2": 2.496, + "loss_pixel": 0.1823, + "loss_text": 1.5478, + "ppl": 5.6412, + "step": 5007 + }, + { + "epoch": 0.03, + "global_step": 5008, + "learning_rate": 0.0004799332220367279, + "loss": 1.7364, + "loss_base2": 2.5051, + "loss_pixel": 0.1825, + "loss_text": 1.5539, + "ppl": 5.6769, + "step": 5008 + }, + { + "epoch": 0.03, + "global_step": 5009, + "learning_rate": 0.0004799290484140234, + "loss": 1.7314, + "loss_base2": 2.4979, + "loss_pixel": 0.1823, + "loss_text": 1.5492, + "ppl": 5.6486, + "step": 5009 + }, + { + "epoch": 0.03, + "global_step": 5010, + "learning_rate": 0.00047992487479131887, + "loss": 1.7234, + "loss_base2": 2.4863, + "loss_pixel": 0.183, + "loss_text": 1.5405, + "ppl": 5.6035, + "step": 5010 + }, + { + "epoch": 0.03, + "global_step": 5011, + "learning_rate": 0.0004799207011686144, + "loss": 1.7165, + "loss_base2": 2.4764, + "loss_pixel": 0.182, + "loss_text": 1.5344, + "ppl": 5.565, + "step": 5011 + }, + { + "epoch": 0.03, + "global_step": 5012, + "learning_rate": 0.0004799165275459099, + "loss": 1.7337, + "loss_base2": 2.5012, + "loss_pixel": 0.1842, + "loss_text": 1.5496, + "ppl": 5.6616, + "step": 5012 + }, + { + "epoch": 0.03, + "global_step": 5013, + "learning_rate": 0.0004799123539232054, + "loss": 1.7284, + "loss_base2": 2.4936, + "loss_pixel": 0.1827, + "loss_text": 1.5457, + "ppl": 5.6316, + "step": 5013 + }, + { + "epoch": 0.03, + "global_step": 5014, + "learning_rate": 0.0004799081803005008, + "loss": 1.7182, + "loss_base2": 2.4788, + "loss_pixel": 0.184, + "loss_text": 1.5342, + "ppl": 5.5745, + "step": 5014 + }, + { + "epoch": 0.03, + "global_step": 5015, + "learning_rate": 0.0004799040066777963, + "loss": 1.7305, + "loss_base2": 2.4966, + "loss_pixel": 0.1834, + "loss_text": 1.5471, + "ppl": 5.6435, + "step": 5015 + }, + { + "epoch": 0.03, + "global_step": 5016, + "learning_rate": 0.0004798998330550918, + "loss": 1.7402, + "loss_base2": 2.5106, + "loss_pixel": 0.1817, + "loss_text": 1.5585, + "ppl": 5.6985, + "step": 5016 + }, + { + "epoch": 0.03, + "global_step": 5017, + "learning_rate": 0.0004798956594323873, + "loss": 1.7245, + "loss_base2": 2.4879, + "loss_pixel": 0.1831, + "loss_text": 1.5414, + "ppl": 5.6097, + "step": 5017 + }, + { + "epoch": 0.03, + "global_step": 5018, + "learning_rate": 0.0004798914858096828, + "loss": 1.7226, + "loss_base2": 2.4852, + "loss_pixel": 0.182, + "loss_text": 1.5406, + "ppl": 5.5991, + "step": 5018 + }, + { + "epoch": 0.03, + "global_step": 5019, + "learning_rate": 0.0004798873121869783, + "loss": 1.7258, + "loss_base2": 2.4898, + "loss_pixel": 0.1812, + "loss_text": 1.5445, + "ppl": 5.617, + "step": 5019 + }, + { + "epoch": 0.03, + "global_step": 5020, + "learning_rate": 0.0004798831385642738, + "loss": 1.7223, + "loss_base2": 2.4848, + "loss_pixel": 0.1814, + "loss_text": 1.5409, + "ppl": 5.5974, + "step": 5020 + }, + { + "epoch": 0.03, + "global_step": 5021, + "learning_rate": 0.0004798789649415693, + "loss": 1.7245, + "loss_base2": 2.4879, + "loss_pixel": 0.1808, + "loss_text": 1.5437, + "ppl": 5.6097, + "step": 5021 + }, + { + "epoch": 0.03, + "global_step": 5022, + "learning_rate": 0.0004798747913188648, + "loss": 1.6997, + "loss_base2": 2.4521, + "loss_pixel": 0.1814, + "loss_text": 1.5183, + "ppl": 5.4723, + "step": 5022 + }, + { + "epoch": 0.03, + "global_step": 5023, + "learning_rate": 0.00047987061769616025, + "loss": 1.73, + "loss_base2": 2.4959, + "loss_pixel": 0.1815, + "loss_text": 1.5485, + "ppl": 5.6407, + "step": 5023 + }, + { + "epoch": 0.03, + "global_step": 5024, + "learning_rate": 0.00047986644407345576, + "loss": 1.7207, + "loss_base2": 2.4824, + "loss_pixel": 0.1818, + "loss_text": 1.5389, + "ppl": 5.5884, + "step": 5024 + }, + { + "epoch": 0.03, + "global_step": 5025, + "learning_rate": 0.00047986227045075127, + "loss": 1.7376, + "loss_base2": 2.5068, + "loss_pixel": 0.1823, + "loss_text": 1.5553, + "ppl": 5.6837, + "step": 5025 + }, + { + "epoch": 0.03, + "global_step": 5026, + "learning_rate": 0.0004798580968280468, + "loss": 1.7294, + "loss_base2": 2.495, + "loss_pixel": 0.1829, + "loss_text": 1.5465, + "ppl": 5.6373, + "step": 5026 + }, + { + "epoch": 0.03, + "global_step": 5027, + "learning_rate": 0.0004798539232053423, + "loss": 1.7279, + "loss_base2": 2.4928, + "loss_pixel": 0.1812, + "loss_text": 1.5467, + "ppl": 5.6288, + "step": 5027 + }, + { + "epoch": 0.03, + "global_step": 5028, + "learning_rate": 0.00047984974958263773, + "loss": 1.7406, + "loss_base2": 2.5112, + "loss_pixel": 0.1823, + "loss_text": 1.5584, + "ppl": 5.7008, + "step": 5028 + }, + { + "epoch": 0.03, + "global_step": 5029, + "learning_rate": 0.00047984557595993324, + "loss": 1.7354, + "loss_base2": 2.5037, + "loss_pixel": 0.1814, + "loss_text": 1.5539, + "ppl": 5.6712, + "step": 5029 + }, + { + "epoch": 0.03, + "global_step": 5030, + "learning_rate": 0.00047984140233722875, + "loss": 1.7198, + "loss_base2": 2.4811, + "loss_pixel": 0.1823, + "loss_text": 1.5375, + "ppl": 5.5834, + "step": 5030 + }, + { + "epoch": 0.03, + "global_step": 5031, + "learning_rate": 0.00047983722871452426, + "loss": 1.7181, + "loss_base2": 2.4787, + "loss_pixel": 0.182, + "loss_text": 1.5361, + "ppl": 5.5739, + "step": 5031 + }, + { + "epoch": 0.03, + "global_step": 5032, + "learning_rate": 0.00047983305509181976, + "loss": 1.7213, + "loss_base2": 2.4833, + "loss_pixel": 0.1809, + "loss_text": 1.5404, + "ppl": 5.5918, + "step": 5032 + }, + { + "epoch": 0.03, + "global_step": 5033, + "learning_rate": 0.00047982888146911516, + "loss": 1.7267, + "loss_base2": 2.4911, + "loss_pixel": 0.1817, + "loss_text": 1.545, + "ppl": 5.6221, + "step": 5033 + }, + { + "epoch": 0.03, + "global_step": 5034, + "learning_rate": 0.00047982470784641067, + "loss": 1.7117, + "loss_base2": 2.4695, + "loss_pixel": 0.1817, + "loss_text": 1.53, + "ppl": 5.5384, + "step": 5034 + }, + { + "epoch": 0.03, + "global_step": 5035, + "learning_rate": 0.0004798205342237062, + "loss": 1.7102, + "loss_base2": 2.4673, + "loss_pixel": 0.182, + "loss_text": 1.5282, + "ppl": 5.5301, + "step": 5035 + }, + { + "epoch": 0.03, + "global_step": 5036, + "learning_rate": 0.0004798163606010017, + "loss": 1.7203, + "loss_base2": 2.4819, + "loss_pixel": 0.1824, + "loss_text": 1.5379, + "ppl": 5.5862, + "step": 5036 + }, + { + "epoch": 0.03, + "global_step": 5037, + "learning_rate": 0.00047981218697829714, + "loss": 1.7105, + "loss_base2": 2.4677, + "loss_pixel": 0.1811, + "loss_text": 1.5294, + "ppl": 5.5317, + "step": 5037 + }, + { + "epoch": 0.03, + "global_step": 5038, + "learning_rate": 0.00047980801335559264, + "loss": 1.7316, + "loss_base2": 2.4982, + "loss_pixel": 0.1822, + "loss_text": 1.5494, + "ppl": 5.6497, + "step": 5038 + }, + { + "epoch": 0.03, + "global_step": 5039, + "learning_rate": 0.00047980383973288815, + "loss": 1.7061, + "loss_base2": 2.4614, + "loss_pixel": 0.1809, + "loss_text": 1.5252, + "ppl": 5.5074, + "step": 5039 + }, + { + "epoch": 0.03, + "global_step": 5040, + "learning_rate": 0.00047979966611018366, + "loss": 1.7239, + "loss_base2": 2.4871, + "loss_pixel": 0.1818, + "loss_text": 1.5421, + "ppl": 5.6064, + "step": 5040 + }, + { + "epoch": 0.03, + "global_step": 5041, + "learning_rate": 0.00047979549248747917, + "loss": 1.7104, + "loss_base2": 2.4676, + "loss_pixel": 0.1817, + "loss_text": 1.5287, + "ppl": 5.5312, + "step": 5041 + }, + { + "epoch": 0.03, + "global_step": 5042, + "learning_rate": 0.0004797913188647746, + "loss": 1.722, + "loss_base2": 2.4843, + "loss_pixel": 0.1801, + "loss_text": 1.5419, + "ppl": 5.5957, + "step": 5042 + }, + { + "epoch": 0.03, + "global_step": 5043, + "learning_rate": 0.0004797871452420701, + "loss": 1.7211, + "loss_base2": 2.483, + "loss_pixel": 0.1811, + "loss_text": 1.54, + "ppl": 5.5907, + "step": 5043 + }, + { + "epoch": 0.03, + "global_step": 5044, + "learning_rate": 0.00047978297161936563, + "loss": 1.7174, + "loss_base2": 2.4777, + "loss_pixel": 0.1803, + "loss_text": 1.5371, + "ppl": 5.57, + "step": 5044 + }, + { + "epoch": 0.03, + "global_step": 5045, + "learning_rate": 0.00047977879799666114, + "loss": 1.7104, + "loss_base2": 2.4676, + "loss_pixel": 0.1814, + "loss_text": 1.529, + "ppl": 5.5312, + "step": 5045 + }, + { + "epoch": 0.03, + "global_step": 5046, + "learning_rate": 0.0004797746243739566, + "loss": 1.7167, + "loss_base2": 2.4767, + "loss_pixel": 0.1826, + "loss_text": 1.5342, + "ppl": 5.5661, + "step": 5046 + }, + { + "epoch": 0.03, + "global_step": 5047, + "learning_rate": 0.0004797704507512521, + "loss": 1.7219, + "loss_base2": 2.4842, + "loss_pixel": 0.1804, + "loss_text": 1.5415, + "ppl": 5.5951, + "step": 5047 + }, + { + "epoch": 0.03, + "global_step": 5048, + "learning_rate": 0.0004797662771285476, + "loss": 1.7158, + "loss_base2": 2.4754, + "loss_pixel": 0.1838, + "loss_text": 1.5321, + "ppl": 5.5611, + "step": 5048 + }, + { + "epoch": 0.03, + "global_step": 5049, + "learning_rate": 0.0004797621035058431, + "loss": 1.7143, + "loss_base2": 2.4732, + "loss_pixel": 0.1811, + "loss_text": 1.5332, + "ppl": 5.5528, + "step": 5049 + }, + { + "epoch": 0.03, + "global_step": 5050, + "learning_rate": 0.0004797579298831386, + "loss": 1.7116, + "loss_base2": 2.4693, + "loss_pixel": 0.183, + "loss_text": 1.5286, + "ppl": 5.5378, + "step": 5050 + }, + { + "epoch": 0.03, + "global_step": 5051, + "learning_rate": 0.000479753756260434, + "loss": 1.708, + "loss_base2": 2.4641, + "loss_pixel": 0.1807, + "loss_text": 1.5273, + "ppl": 5.5179, + "step": 5051 + }, + { + "epoch": 0.03, + "global_step": 5052, + "learning_rate": 0.00047974958263772953, + "loss": 1.7221, + "loss_base2": 2.4845, + "loss_pixel": 0.1822, + "loss_text": 1.5398, + "ppl": 5.5963, + "step": 5052 + }, + { + "epoch": 0.03, + "global_step": 5053, + "learning_rate": 0.00047974540901502504, + "loss": 1.7012, + "loss_base2": 2.4543, + "loss_pixel": 0.1811, + "loss_text": 1.5202, + "ppl": 5.4805, + "step": 5053 + }, + { + "epoch": 0.03, + "global_step": 5054, + "learning_rate": 0.00047974123539232054, + "loss": 1.7366, + "loss_base2": 2.5054, + "loss_pixel": 0.1841, + "loss_text": 1.5525, + "ppl": 5.678, + "step": 5054 + }, + { + "epoch": 0.03, + "global_step": 5055, + "learning_rate": 0.000479737061769616, + "loss": 1.7146, + "loss_base2": 2.4736, + "loss_pixel": 0.183, + "loss_text": 1.5316, + "ppl": 5.5545, + "step": 5055 + }, + { + "epoch": 0.03, + "global_step": 5056, + "learning_rate": 0.0004797328881469115, + "loss": 1.7186, + "loss_base2": 2.4794, + "loss_pixel": 0.1828, + "loss_text": 1.5358, + "ppl": 5.5767, + "step": 5056 + }, + { + "epoch": 0.03, + "global_step": 5057, + "learning_rate": 0.000479728714524207, + "loss": 1.7119, + "loss_base2": 2.4697, + "loss_pixel": 0.1838, + "loss_text": 1.5281, + "ppl": 5.5395, + "step": 5057 + }, + { + "epoch": 0.03, + "global_step": 5058, + "learning_rate": 0.0004797245409015025, + "loss": 1.7136, + "loss_base2": 2.4722, + "loss_pixel": 0.1831, + "loss_text": 1.5306, + "ppl": 5.5489, + "step": 5058 + }, + { + "epoch": 0.03, + "global_step": 5059, + "learning_rate": 0.000479720367278798, + "loss": 1.7131, + "loss_base2": 2.4715, + "loss_pixel": 0.1821, + "loss_text": 1.5309, + "ppl": 5.5461, + "step": 5059 + }, + { + "epoch": 0.03, + "global_step": 5060, + "learning_rate": 0.0004797161936560935, + "loss": 1.7141, + "loss_base2": 2.4729, + "loss_pixel": 0.1819, + "loss_text": 1.5322, + "ppl": 5.5517, + "step": 5060 + }, + { + "epoch": 0.03, + "global_step": 5061, + "learning_rate": 0.000479712020033389, + "loss": 1.7279, + "loss_base2": 2.4928, + "loss_pixel": 0.1847, + "loss_text": 1.5433, + "ppl": 5.6288, + "step": 5061 + }, + { + "epoch": 0.03, + "global_step": 5062, + "learning_rate": 0.0004797078464106845, + "loss": 1.7141, + "loss_base2": 2.4729, + "loss_pixel": 0.1821, + "loss_text": 1.532, + "ppl": 5.5517, + "step": 5062 + }, + { + "epoch": 0.03, + "global_step": 5063, + "learning_rate": 0.00047970367278798, + "loss": 1.7111, + "loss_base2": 2.4686, + "loss_pixel": 0.1859, + "loss_text": 1.5252, + "ppl": 5.535, + "step": 5063 + }, + { + "epoch": 0.03, + "global_step": 5064, + "learning_rate": 0.00047969949916527545, + "loss": 1.7052, + "loss_base2": 2.4601, + "loss_pixel": 0.1826, + "loss_text": 1.5227, + "ppl": 5.5025, + "step": 5064 + }, + { + "epoch": 0.03, + "global_step": 5065, + "learning_rate": 0.00047969532554257096, + "loss": 1.7195, + "loss_base2": 2.4807, + "loss_pixel": 0.1809, + "loss_text": 1.5386, + "ppl": 5.5817, + "step": 5065 + }, + { + "epoch": 0.03, + "global_step": 5066, + "learning_rate": 0.00047969115191986647, + "loss": 1.7169, + "loss_base2": 2.477, + "loss_pixel": 0.1831, + "loss_text": 1.5338, + "ppl": 5.5672, + "step": 5066 + }, + { + "epoch": 0.03, + "global_step": 5067, + "learning_rate": 0.000479686978297162, + "loss": 1.7215, + "loss_base2": 2.4836, + "loss_pixel": 0.1823, + "loss_text": 1.5392, + "ppl": 5.5929, + "step": 5067 + }, + { + "epoch": 0.03, + "global_step": 5068, + "learning_rate": 0.0004796828046744575, + "loss": 1.7202, + "loss_base2": 2.4817, + "loss_pixel": 0.1802, + "loss_text": 1.5401, + "ppl": 5.5856, + "step": 5068 + }, + { + "epoch": 0.03, + "global_step": 5069, + "learning_rate": 0.00047967863105175294, + "loss": 1.7193, + "loss_base2": 2.4804, + "loss_pixel": 0.1805, + "loss_text": 1.5388, + "ppl": 5.5806, + "step": 5069 + }, + { + "epoch": 0.03, + "global_step": 5070, + "learning_rate": 0.0004796744574290484, + "loss": 1.7216, + "loss_base2": 2.4837, + "loss_pixel": 0.1778, + "loss_text": 1.5438, + "ppl": 5.5935, + "step": 5070 + }, + { + "epoch": 0.03, + "global_step": 5071, + "learning_rate": 0.0004796702838063439, + "loss": 1.7172, + "loss_base2": 2.4774, + "loss_pixel": 0.1854, + "loss_text": 1.5318, + "ppl": 5.5689, + "step": 5071 + }, + { + "epoch": 0.03, + "global_step": 5072, + "learning_rate": 0.0004796661101836394, + "loss": 1.7004, + "loss_base2": 2.4532, + "loss_pixel": 0.1802, + "loss_text": 1.5202, + "ppl": 5.4761, + "step": 5072 + }, + { + "epoch": 0.03, + "global_step": 5073, + "learning_rate": 0.00047966193656093486, + "loss": 1.7093, + "loss_base2": 2.466, + "loss_pixel": 0.1804, + "loss_text": 1.5288, + "ppl": 5.5251, + "step": 5073 + }, + { + "epoch": 0.03, + "global_step": 5074, + "learning_rate": 0.00047965776293823037, + "loss": 1.7243, + "loss_base2": 2.4876, + "loss_pixel": 0.1815, + "loss_text": 1.5428, + "ppl": 5.6086, + "step": 5074 + }, + { + "epoch": 0.03, + "global_step": 5075, + "learning_rate": 0.00047965358931552587, + "loss": 1.7169, + "loss_base2": 2.477, + "loss_pixel": 0.179, + "loss_text": 1.5379, + "ppl": 5.5672, + "step": 5075 + }, + { + "epoch": 0.03, + "global_step": 5076, + "learning_rate": 0.0004796494156928214, + "loss": 1.7112, + "loss_base2": 2.4687, + "loss_pixel": 0.1796, + "loss_text": 1.5316, + "ppl": 5.5356, + "step": 5076 + }, + { + "epoch": 0.03, + "global_step": 5077, + "learning_rate": 0.0004796452420701169, + "loss": 1.7078, + "loss_base2": 2.4638, + "loss_pixel": 0.178, + "loss_text": 1.5298, + "ppl": 5.5168, + "step": 5077 + }, + { + "epoch": 0.03, + "global_step": 5078, + "learning_rate": 0.00047964106844741234, + "loss": 1.6936, + "loss_base2": 2.4433, + "loss_pixel": 0.1781, + "loss_text": 1.5155, + "ppl": 5.439, + "step": 5078 + }, + { + "epoch": 0.03, + "global_step": 5079, + "learning_rate": 0.00047963689482470785, + "loss": 1.7184, + "loss_base2": 2.4791, + "loss_pixel": 0.178, + "loss_text": 1.5404, + "ppl": 5.5756, + "step": 5079 + }, + { + "epoch": 0.03, + "global_step": 5080, + "learning_rate": 0.00047963272120200336, + "loss": 1.6985, + "loss_base2": 2.4504, + "loss_pixel": 0.179, + "loss_text": 1.5195, + "ppl": 5.4657, + "step": 5080 + }, + { + "epoch": 0.03, + "global_step": 5081, + "learning_rate": 0.00047962854757929886, + "loss": 1.6873, + "loss_base2": 2.4343, + "loss_pixel": 0.1776, + "loss_text": 1.5098, + "ppl": 5.4049, + "step": 5081 + }, + { + "epoch": 0.03, + "global_step": 5082, + "learning_rate": 0.0004796243739565943, + "loss": 1.7003, + "loss_base2": 2.453, + "loss_pixel": 0.1797, + "loss_text": 1.5206, + "ppl": 5.4756, + "step": 5082 + }, + { + "epoch": 0.03, + "global_step": 5083, + "learning_rate": 0.0004796202003338898, + "loss": 1.7128, + "loss_base2": 2.471, + "loss_pixel": 0.1766, + "loss_text": 1.5362, + "ppl": 5.5445, + "step": 5083 + }, + { + "epoch": 0.03, + "global_step": 5084, + "learning_rate": 0.00047961602671118533, + "loss": 1.7109, + "loss_base2": 2.4683, + "loss_pixel": 0.1777, + "loss_text": 1.5333, + "ppl": 5.5339, + "step": 5084 + }, + { + "epoch": 0.03, + "global_step": 5085, + "learning_rate": 0.00047961185308848084, + "loss": 1.7195, + "loss_base2": 2.4807, + "loss_pixel": 0.1755, + "loss_text": 1.544, + "ppl": 5.5817, + "step": 5085 + }, + { + "epoch": 0.03, + "global_step": 5086, + "learning_rate": 0.00047960767946577634, + "loss": 1.7063, + "loss_base2": 2.4617, + "loss_pixel": 0.176, + "loss_text": 1.5303, + "ppl": 5.5085, + "step": 5086 + }, + { + "epoch": 0.03, + "global_step": 5087, + "learning_rate": 0.0004796035058430718, + "loss": 1.7027, + "loss_base2": 2.4565, + "loss_pixel": 0.1769, + "loss_text": 1.5257, + "ppl": 5.4887, + "step": 5087 + }, + { + "epoch": 0.03, + "global_step": 5088, + "learning_rate": 0.0004795993322203673, + "loss": 1.7217, + "loss_base2": 2.4839, + "loss_pixel": 0.1788, + "loss_text": 1.5429, + "ppl": 5.594, + "step": 5088 + }, + { + "epoch": 0.03, + "global_step": 5089, + "learning_rate": 0.00047959515859766276, + "loss": 1.7051, + "loss_base2": 2.4599, + "loss_pixel": 0.1789, + "loss_text": 1.5262, + "ppl": 5.5019, + "step": 5089 + }, + { + "epoch": 0.03, + "global_step": 5090, + "learning_rate": 0.00047959098497495827, + "loss": 1.5792, + "loss_base2": 2.2783, + "loss_pixel": 0.1776, + "loss_text": 1.4016, + "ppl": 4.8511, + "step": 5090 + }, + { + "epoch": 0.03, + "global_step": 5091, + "learning_rate": 0.0004795868113522538, + "loss": 1.4977, + "loss_base2": 2.1607, + "loss_pixel": 0.1762, + "loss_text": 1.3216, + "ppl": 4.4714, + "step": 5091 + }, + { + "epoch": 0.03, + "global_step": 5092, + "learning_rate": 0.0004795826377295492, + "loss": 1.4915, + "loss_base2": 2.1518, + "loss_pixel": 0.1758, + "loss_text": 1.3157, + "ppl": 4.4438, + "step": 5092 + }, + { + "epoch": 0.03, + "global_step": 5093, + "learning_rate": 0.00047957846410684473, + "loss": 1.4873, + "loss_base2": 2.1457, + "loss_pixel": 0.1767, + "loss_text": 1.3106, + "ppl": 4.4251, + "step": 5093 + }, + { + "epoch": 0.03, + "global_step": 5094, + "learning_rate": 0.00047957429048414024, + "loss": 1.4912, + "loss_base2": 2.1513, + "loss_pixel": 0.1761, + "loss_text": 1.3151, + "ppl": 4.4424, + "step": 5094 + }, + { + "epoch": 0.03, + "global_step": 5095, + "learning_rate": 0.00047957011686143575, + "loss": 1.5017, + "loss_base2": 2.1665, + "loss_pixel": 0.1769, + "loss_text": 1.3247, + "ppl": 4.4893, + "step": 5095 + }, + { + "epoch": 0.03, + "global_step": 5096, + "learning_rate": 0.0004795659432387312, + "loss": 1.4939, + "loss_base2": 2.1552, + "loss_pixel": 0.1966, + "loss_text": 1.2973, + "ppl": 4.4544, + "step": 5096 + }, + { + "epoch": 0.03, + "global_step": 5097, + "learning_rate": 0.0004795617696160267, + "loss": 1.4925, + "loss_base2": 2.1532, + "loss_pixel": 0.1946, + "loss_text": 1.2979, + "ppl": 4.4482, + "step": 5097 + }, + { + "epoch": 0.03, + "global_step": 5098, + "learning_rate": 0.0004795575959933222, + "loss": 1.497, + "loss_base2": 2.1597, + "loss_pixel": 0.1932, + "loss_text": 1.3038, + "ppl": 4.4683, + "step": 5098 + }, + { + "epoch": 0.03, + "global_step": 5099, + "learning_rate": 0.0004795534223706177, + "loss": 1.4809, + "loss_base2": 2.1365, + "loss_pixel": 0.1929, + "loss_text": 1.2881, + "ppl": 4.3969, + "step": 5099 + }, + { + "epoch": 0.03, + "global_step": 5100, + "learning_rate": 0.00047954924874791323, + "loss": 1.4794, + "loss_base2": 2.1343, + "loss_pixel": 0.1924, + "loss_text": 1.2871, + "ppl": 4.3903, + "step": 5100 + }, + { + "epoch": 0.03, + "global_step": 5101, + "learning_rate": 0.0004795450751252087, + "loss": 1.477, + "loss_base2": 2.1309, + "loss_pixel": 0.1861, + "loss_text": 1.291, + "ppl": 4.3798, + "step": 5101 + }, + { + "epoch": 0.03, + "global_step": 5102, + "learning_rate": 0.0004795409015025042, + "loss": 1.5033, + "loss_base2": 2.1688, + "loss_pixel": 0.1859, + "loss_text": 1.3174, + "ppl": 4.4965, + "step": 5102 + }, + { + "epoch": 0.03, + "global_step": 5103, + "learning_rate": 0.0004795367278797997, + "loss": 1.4859, + "loss_base2": 2.1437, + "loss_pixel": 0.1844, + "loss_text": 1.3015, + "ppl": 4.4189, + "step": 5103 + }, + { + "epoch": 0.03, + "global_step": 5104, + "learning_rate": 0.0004795325542570952, + "loss": 1.4967, + "loss_base2": 2.1593, + "loss_pixel": 0.188, + "loss_text": 1.3087, + "ppl": 4.4669, + "step": 5104 + }, + { + "epoch": 0.03, + "global_step": 5105, + "learning_rate": 0.00047952838063439066, + "loss": 1.4824, + "loss_base2": 2.1387, + "loss_pixel": 0.1849, + "loss_text": 1.2975, + "ppl": 4.4035, + "step": 5105 + }, + { + "epoch": 0.03, + "global_step": 5106, + "learning_rate": 0.00047952420701168617, + "loss": 1.5131, + "loss_base2": 2.1829, + "loss_pixel": 0.1838, + "loss_text": 1.3294, + "ppl": 4.5408, + "step": 5106 + }, + { + "epoch": 0.03, + "global_step": 5107, + "learning_rate": 0.0004795200333889817, + "loss": 1.4734, + "loss_base2": 2.1257, + "loss_pixel": 0.1846, + "loss_text": 1.2889, + "ppl": 4.364, + "step": 5107 + }, + { + "epoch": 0.03, + "global_step": 5108, + "learning_rate": 0.0004795158597662771, + "loss": 1.4701, + "loss_base2": 2.1209, + "loss_pixel": 0.1829, + "loss_text": 1.2873, + "ppl": 4.3497, + "step": 5108 + }, + { + "epoch": 0.03, + "global_step": 5109, + "learning_rate": 0.00047951168614357263, + "loss": 1.5143, + "loss_base2": 2.1847, + "loss_pixel": 0.1844, + "loss_text": 1.3298, + "ppl": 4.5462, + "step": 5109 + }, + { + "epoch": 0.03, + "global_step": 5110, + "learning_rate": 0.0004795075125208681, + "loss": 1.4788, + "loss_base2": 2.1335, + "loss_pixel": 0.1846, + "loss_text": 1.2942, + "ppl": 4.3877, + "step": 5110 + }, + { + "epoch": 0.03, + "global_step": 5111, + "learning_rate": 0.0004795033388981636, + "loss": 1.4778, + "loss_base2": 2.132, + "loss_pixel": 0.1827, + "loss_text": 1.2951, + "ppl": 4.3833, + "step": 5111 + }, + { + "epoch": 0.03, + "global_step": 5112, + "learning_rate": 0.0004794991652754591, + "loss": 1.4891, + "loss_base2": 2.1483, + "loss_pixel": 0.1845, + "loss_text": 1.3046, + "ppl": 4.4331, + "step": 5112 + }, + { + "epoch": 0.03, + "global_step": 5113, + "learning_rate": 0.0004794949916527546, + "loss": 1.4757, + "loss_base2": 2.129, + "loss_pixel": 0.1831, + "loss_text": 1.2926, + "ppl": 4.3741, + "step": 5113 + }, + { + "epoch": 0.03, + "global_step": 5114, + "learning_rate": 0.00047949081803005006, + "loss": 1.4862, + "loss_base2": 2.1441, + "loss_pixel": 0.1824, + "loss_text": 1.3038, + "ppl": 4.4203, + "step": 5114 + }, + { + "epoch": 0.03, + "global_step": 5115, + "learning_rate": 0.00047948664440734557, + "loss": 1.6427, + "loss_base2": 2.3699, + "loss_pixel": 0.1824, + "loss_text": 1.4603, + "ppl": 5.1691, + "step": 5115 + }, + { + "epoch": 0.03, + "global_step": 5116, + "learning_rate": 0.0004794824707846411, + "loss": 1.4852, + "loss_base2": 2.1427, + "loss_pixel": 0.1826, + "loss_text": 1.3025, + "ppl": 4.4158, + "step": 5116 + }, + { + "epoch": 0.03, + "global_step": 5117, + "learning_rate": 0.0004794782971619366, + "loss": 1.4865, + "loss_base2": 2.1446, + "loss_pixel": 0.1827, + "loss_text": 1.3038, + "ppl": 4.4216, + "step": 5117 + }, + { + "epoch": 0.03, + "global_step": 5118, + "learning_rate": 0.0004794741235392321, + "loss": 1.4718, + "loss_base2": 2.1234, + "loss_pixel": 0.1814, + "loss_text": 1.2903, + "ppl": 4.3571, + "step": 5118 + }, + { + "epoch": 0.03, + "global_step": 5119, + "learning_rate": 0.00047946994991652754, + "loss": 1.4661, + "loss_base2": 2.1151, + "loss_pixel": 0.1835, + "loss_text": 1.2825, + "ppl": 4.3323, + "step": 5119 + }, + { + "epoch": 0.03, + "global_step": 5120, + "learning_rate": 0.00047946577629382305, + "loss": 1.4965, + "loss_base2": 2.159, + "loss_pixel": 0.1827, + "loss_text": 1.3138, + "ppl": 4.466, + "step": 5120 + }, + { + "epoch": 0.03, + "global_step": 5121, + "learning_rate": 0.00047946160267111856, + "loss": 1.4803, + "loss_base2": 2.1356, + "loss_pixel": 0.1819, + "loss_text": 1.2983, + "ppl": 4.3943, + "step": 5121 + }, + { + "epoch": 0.03, + "global_step": 5122, + "learning_rate": 0.00047945742904841407, + "loss": 1.4848, + "loss_base2": 2.1421, + "loss_pixel": 0.1822, + "loss_text": 1.3025, + "ppl": 4.4141, + "step": 5122 + }, + { + "epoch": 0.03, + "global_step": 5123, + "learning_rate": 0.0004794532554257095, + "loss": 1.4892, + "loss_base2": 2.1485, + "loss_pixel": 0.1822, + "loss_text": 1.307, + "ppl": 4.4335, + "step": 5123 + }, + { + "epoch": 0.03, + "global_step": 5124, + "learning_rate": 0.000479449081803005, + "loss": 1.5935, + "loss_base2": 2.2989, + "loss_pixel": 0.182, + "loss_text": 1.4115, + "ppl": 4.9209, + "step": 5124 + }, + { + "epoch": 0.03, + "global_step": 5125, + "learning_rate": 0.00047944490818030053, + "loss": 1.5684, + "loss_base2": 2.2627, + "loss_pixel": 0.1822, + "loss_text": 1.3862, + "ppl": 4.799, + "step": 5125 + }, + { + "epoch": 0.03, + "global_step": 5126, + "learning_rate": 0.00047944073455759604, + "loss": 1.4691, + "loss_base2": 2.1195, + "loss_pixel": 0.1818, + "loss_text": 1.2873, + "ppl": 4.3453, + "step": 5126 + }, + { + "epoch": 0.03, + "global_step": 5127, + "learning_rate": 0.0004794365609348915, + "loss": 1.4621, + "loss_base2": 2.1094, + "loss_pixel": 0.1815, + "loss_text": 1.2806, + "ppl": 4.315, + "step": 5127 + }, + { + "epoch": 0.03, + "global_step": 5128, + "learning_rate": 0.00047943238731218695, + "loss": 1.4851, + "loss_base2": 2.1425, + "loss_pixel": 0.1827, + "loss_text": 1.3024, + "ppl": 4.4154, + "step": 5128 + }, + { + "epoch": 0.03, + "global_step": 5129, + "learning_rate": 0.00047942821368948245, + "loss": 1.4931, + "loss_base2": 2.1541, + "loss_pixel": 0.1823, + "loss_text": 1.3108, + "ppl": 4.4509, + "step": 5129 + }, + { + "epoch": 0.03, + "global_step": 5130, + "learning_rate": 0.00047942404006677796, + "loss": 1.484, + "loss_base2": 2.141, + "loss_pixel": 0.1815, + "loss_text": 1.3025, + "ppl": 4.4106, + "step": 5130 + }, + { + "epoch": 0.03, + "global_step": 5131, + "learning_rate": 0.00047941986644407347, + "loss": 1.4856, + "loss_base2": 2.1433, + "loss_pixel": 0.1827, + "loss_text": 1.3029, + "ppl": 4.4176, + "step": 5131 + }, + { + "epoch": 0.03, + "global_step": 5132, + "learning_rate": 0.0004794156928213689, + "loss": 1.4908, + "loss_base2": 2.1508, + "loss_pixel": 0.1817, + "loss_text": 1.309, + "ppl": 4.4406, + "step": 5132 + }, + { + "epoch": 0.03, + "global_step": 5133, + "learning_rate": 0.00047941151919866443, + "loss": 1.549, + "loss_base2": 2.2347, + "loss_pixel": 0.1818, + "loss_text": 1.3673, + "ppl": 4.7068, + "step": 5133 + }, + { + "epoch": 0.03, + "global_step": 5134, + "learning_rate": 0.00047940734557595994, + "loss": 1.7655, + "loss_base2": 2.5471, + "loss_pixel": 0.181, + "loss_text": 1.5845, + "ppl": 5.8445, + "step": 5134 + }, + { + "epoch": 0.03, + "global_step": 5135, + "learning_rate": 0.00047940317195325544, + "loss": 1.7598, + "loss_base2": 2.5389, + "loss_pixel": 0.1825, + "loss_text": 1.5773, + "ppl": 5.8113, + "step": 5135 + }, + { + "epoch": 0.03, + "global_step": 5136, + "learning_rate": 0.00047939899833055095, + "loss": 1.7589, + "loss_base2": 2.5376, + "loss_pixel": 0.1825, + "loss_text": 1.5764, + "ppl": 5.806, + "step": 5136 + }, + { + "epoch": 0.03, + "global_step": 5137, + "learning_rate": 0.0004793948247078464, + "loss": 1.7389, + "loss_base2": 2.5087, + "loss_pixel": 0.1813, + "loss_text": 1.5576, + "ppl": 5.6911, + "step": 5137 + }, + { + "epoch": 0.03, + "global_step": 5138, + "learning_rate": 0.0004793906510851419, + "loss": 1.7282, + "loss_base2": 2.4933, + "loss_pixel": 0.1808, + "loss_text": 1.5474, + "ppl": 5.6305, + "step": 5138 + }, + { + "epoch": 0.03, + "global_step": 5139, + "learning_rate": 0.0004793864774624374, + "loss": 1.7425, + "loss_base2": 2.5139, + "loss_pixel": 0.1814, + "loss_text": 1.561, + "ppl": 5.7116, + "step": 5139 + }, + { + "epoch": 0.03, + "global_step": 5140, + "learning_rate": 0.0004793823038397329, + "loss": 1.7532, + "loss_base2": 2.5293, + "loss_pixel": 0.181, + "loss_text": 1.5723, + "ppl": 5.773, + "step": 5140 + }, + { + "epoch": 0.03, + "global_step": 5141, + "learning_rate": 0.0004793781302170284, + "loss": 1.7379, + "loss_base2": 2.5073, + "loss_pixel": 0.1822, + "loss_text": 1.5558, + "ppl": 5.6854, + "step": 5141 + }, + { + "epoch": 0.03, + "global_step": 5142, + "learning_rate": 0.0004793739565943239, + "loss": 1.7356, + "loss_base2": 2.5039, + "loss_pixel": 0.1818, + "loss_text": 1.5538, + "ppl": 5.6723, + "step": 5142 + }, + { + "epoch": 0.03, + "global_step": 5143, + "learning_rate": 0.0004793697829716194, + "loss": 1.7566, + "loss_base2": 2.5342, + "loss_pixel": 0.1822, + "loss_text": 1.5744, + "ppl": 5.7927, + "step": 5143 + }, + { + "epoch": 0.03, + "global_step": 5144, + "learning_rate": 0.0004793656093489149, + "loss": 1.7324, + "loss_base2": 2.4993, + "loss_pixel": 0.181, + "loss_text": 1.5514, + "ppl": 5.6542, + "step": 5144 + }, + { + "epoch": 0.03, + "global_step": 5145, + "learning_rate": 0.00047936143572621036, + "loss": 1.7222, + "loss_base2": 2.4846, + "loss_pixel": 0.1815, + "loss_text": 1.5407, + "ppl": 5.5968, + "step": 5145 + }, + { + "epoch": 0.03, + "global_step": 5146, + "learning_rate": 0.0004793572621035058, + "loss": 1.7249, + "loss_base2": 2.4885, + "loss_pixel": 0.1819, + "loss_text": 1.543, + "ppl": 5.612, + "step": 5146 + }, + { + "epoch": 0.03, + "global_step": 5147, + "learning_rate": 0.0004793530884808013, + "loss": 1.7252, + "loss_base2": 2.4889, + "loss_pixel": 0.1824, + "loss_text": 1.5428, + "ppl": 5.6136, + "step": 5147 + }, + { + "epoch": 0.03, + "global_step": 5148, + "learning_rate": 0.0004793489148580968, + "loss": 1.721, + "loss_base2": 2.4829, + "loss_pixel": 0.181, + "loss_text": 1.54, + "ppl": 5.5901, + "step": 5148 + }, + { + "epoch": 0.03, + "global_step": 5149, + "learning_rate": 0.00047934474123539233, + "loss": 1.7269, + "loss_base2": 2.4914, + "loss_pixel": 0.1819, + "loss_text": 1.545, + "ppl": 5.6232, + "step": 5149 + }, + { + "epoch": 0.03, + "global_step": 5150, + "learning_rate": 0.00047934056761268784, + "loss": 1.714, + "loss_base2": 2.4728, + "loss_pixel": 0.183, + "loss_text": 1.531, + "ppl": 5.5511, + "step": 5150 + }, + { + "epoch": 0.03, + "global_step": 5151, + "learning_rate": 0.0004793363939899833, + "loss": 1.7283, + "loss_base2": 2.4934, + "loss_pixel": 0.1829, + "loss_text": 1.5454, + "ppl": 5.6311, + "step": 5151 + }, + { + "epoch": 0.03, + "global_step": 5152, + "learning_rate": 0.0004793322203672788, + "loss": 1.7259, + "loss_base2": 2.4899, + "loss_pixel": 0.1803, + "loss_text": 1.5456, + "ppl": 5.6176, + "step": 5152 + }, + { + "epoch": 0.03, + "global_step": 5153, + "learning_rate": 0.0004793280467445743, + "loss": 1.7292, + "loss_base2": 2.4947, + "loss_pixel": 0.1819, + "loss_text": 1.5473, + "ppl": 5.6361, + "step": 5153 + }, + { + "epoch": 0.03, + "global_step": 5154, + "learning_rate": 0.0004793238731218698, + "loss": 1.7375, + "loss_base2": 2.5067, + "loss_pixel": 0.1801, + "loss_text": 1.5575, + "ppl": 5.6831, + "step": 5154 + }, + { + "epoch": 0.03, + "global_step": 5155, + "learning_rate": 0.00047931969949916527, + "loss": 1.7141, + "loss_base2": 2.4729, + "loss_pixel": 0.1812, + "loss_text": 1.5329, + "ppl": 5.5517, + "step": 5155 + }, + { + "epoch": 0.03, + "global_step": 5156, + "learning_rate": 0.0004793155258764608, + "loss": 1.737, + "loss_base2": 2.506, + "loss_pixel": 0.1812, + "loss_text": 1.5558, + "ppl": 5.6803, + "step": 5156 + }, + { + "epoch": 0.03, + "global_step": 5157, + "learning_rate": 0.0004793113522537563, + "loss": 1.7142, + "loss_base2": 2.4731, + "loss_pixel": 0.18, + "loss_text": 1.5342, + "ppl": 5.5522, + "step": 5157 + }, + { + "epoch": 0.03, + "global_step": 5158, + "learning_rate": 0.0004793071786310518, + "loss": 1.7268, + "loss_base2": 2.4912, + "loss_pixel": 0.1818, + "loss_text": 1.5451, + "ppl": 5.6226, + "step": 5158 + }, + { + "epoch": 0.03, + "global_step": 5159, + "learning_rate": 0.0004793030050083473, + "loss": 1.7071, + "loss_base2": 2.4628, + "loss_pixel": 0.1815, + "loss_text": 1.5256, + "ppl": 5.513, + "step": 5159 + }, + { + "epoch": 0.03, + "global_step": 5160, + "learning_rate": 0.00047929883138564275, + "loss": 1.7239, + "loss_base2": 2.4871, + "loss_pixel": 0.1822, + "loss_text": 1.5417, + "ppl": 5.6064, + "step": 5160 + }, + { + "epoch": 0.03, + "global_step": 5161, + "learning_rate": 0.00047929465776293826, + "loss": 1.7252, + "loss_base2": 2.4889, + "loss_pixel": 0.1816, + "loss_text": 1.5436, + "ppl": 5.6136, + "step": 5161 + }, + { + "epoch": 0.03, + "global_step": 5162, + "learning_rate": 0.00047929048414023376, + "loss": 1.712, + "loss_base2": 2.4699, + "loss_pixel": 0.1814, + "loss_text": 1.5306, + "ppl": 5.54, + "step": 5162 + }, + { + "epoch": 0.03, + "global_step": 5163, + "learning_rate": 0.00047928631051752927, + "loss": 1.716, + "loss_base2": 2.4757, + "loss_pixel": 0.1828, + "loss_text": 1.5332, + "ppl": 5.5622, + "step": 5163 + }, + { + "epoch": 0.03, + "global_step": 5164, + "learning_rate": 0.00047928213689482467, + "loss": 1.7187, + "loss_base2": 2.4796, + "loss_pixel": 0.181, + "loss_text": 1.5377, + "ppl": 5.5773, + "step": 5164 + }, + { + "epoch": 0.03, + "global_step": 5165, + "learning_rate": 0.0004792779632721202, + "loss": 1.7128, + "loss_base2": 2.471, + "loss_pixel": 0.1812, + "loss_text": 1.5316, + "ppl": 5.5445, + "step": 5165 + }, + { + "epoch": 0.03, + "global_step": 5166, + "learning_rate": 0.0004792737896494157, + "loss": 1.711, + "loss_base2": 2.4685, + "loss_pixel": 0.1811, + "loss_text": 1.5298, + "ppl": 5.5345, + "step": 5166 + }, + { + "epoch": 0.03, + "global_step": 5167, + "learning_rate": 0.0004792696160267112, + "loss": 1.7302, + "loss_base2": 2.4962, + "loss_pixel": 0.1815, + "loss_text": 1.5487, + "ppl": 5.6418, + "step": 5167 + }, + { + "epoch": 0.03, + "global_step": 5168, + "learning_rate": 0.0004792654424040067, + "loss": 1.7233, + "loss_base2": 2.4862, + "loss_pixel": 0.1798, + "loss_text": 1.5435, + "ppl": 5.603, + "step": 5168 + }, + { + "epoch": 0.03, + "global_step": 5169, + "learning_rate": 0.00047926126878130215, + "loss": 1.7087, + "loss_base2": 2.4651, + "loss_pixel": 0.1817, + "loss_text": 1.527, + "ppl": 5.5218, + "step": 5169 + }, + { + "epoch": 0.03, + "global_step": 5170, + "learning_rate": 0.00047925709515859766, + "loss": 1.713, + "loss_base2": 2.4713, + "loss_pixel": 0.1806, + "loss_text": 1.5324, + "ppl": 5.5456, + "step": 5170 + }, + { + "epoch": 0.03, + "global_step": 5171, + "learning_rate": 0.00047925292153589317, + "loss": 1.7191, + "loss_base2": 2.4801, + "loss_pixel": 0.1811, + "loss_text": 1.5381, + "ppl": 5.5795, + "step": 5171 + }, + { + "epoch": 0.03, + "global_step": 5172, + "learning_rate": 0.0004792487479131887, + "loss": 1.7071, + "loss_base2": 2.4628, + "loss_pixel": 0.1816, + "loss_text": 1.5255, + "ppl": 5.513, + "step": 5172 + }, + { + "epoch": 0.03, + "global_step": 5173, + "learning_rate": 0.0004792445742904841, + "loss": 1.7268, + "loss_base2": 2.4912, + "loss_pixel": 0.1827, + "loss_text": 1.5441, + "ppl": 5.6226, + "step": 5173 + }, + { + "epoch": 0.03, + "global_step": 5174, + "learning_rate": 0.00047924040066777963, + "loss": 1.7089, + "loss_base2": 2.4654, + "loss_pixel": 0.1816, + "loss_text": 1.5273, + "ppl": 5.5229, + "step": 5174 + }, + { + "epoch": 0.03, + "global_step": 5175, + "learning_rate": 0.00047923622704507514, + "loss": 1.735, + "loss_base2": 2.5031, + "loss_pixel": 0.181, + "loss_text": 1.554, + "ppl": 5.6689, + "step": 5175 + }, + { + "epoch": 0.03, + "global_step": 5176, + "learning_rate": 0.00047923205342237065, + "loss": 1.7166, + "loss_base2": 2.4765, + "loss_pixel": 0.1765, + "loss_text": 1.5402, + "ppl": 5.5656, + "step": 5176 + }, + { + "epoch": 0.03, + "global_step": 5177, + "learning_rate": 0.00047922787979966616, + "loss": 1.6978, + "loss_base2": 2.4494, + "loss_pixel": 0.1767, + "loss_text": 1.5211, + "ppl": 5.4619, + "step": 5177 + }, + { + "epoch": 0.03, + "global_step": 5178, + "learning_rate": 0.0004792237061769616, + "loss": 1.7012, + "loss_base2": 2.4543, + "loss_pixel": 0.1791, + "loss_text": 1.5222, + "ppl": 5.4805, + "step": 5178 + }, + { + "epoch": 0.03, + "global_step": 5179, + "learning_rate": 0.0004792195325542571, + "loss": 1.5234, + "loss_base2": 2.1978, + "loss_pixel": 0.1756, + "loss_text": 1.3478, + "ppl": 4.5878, + "step": 5179 + }, + { + "epoch": 0.03, + "global_step": 5180, + "learning_rate": 0.0004792153589315526, + "loss": 1.4915, + "loss_base2": 2.1518, + "loss_pixel": 0.1782, + "loss_text": 1.3133, + "ppl": 4.4438, + "step": 5180 + }, + { + "epoch": 0.03, + "global_step": 5181, + "learning_rate": 0.00047921118530884813, + "loss": 1.4724, + "loss_base2": 2.1242, + "loss_pixel": 0.1757, + "loss_text": 1.2967, + "ppl": 4.3597, + "step": 5181 + }, + { + "epoch": 0.03, + "global_step": 5182, + "learning_rate": 0.0004792070116861436, + "loss": 1.4542, + "loss_base2": 2.098, + "loss_pixel": 0.1765, + "loss_text": 1.2777, + "ppl": 4.2811, + "step": 5182 + }, + { + "epoch": 0.03, + "global_step": 5183, + "learning_rate": 0.00047920283806343904, + "loss": 1.4628, + "loss_base2": 2.1104, + "loss_pixel": 0.1782, + "loss_text": 1.2847, + "ppl": 4.318, + "step": 5183 + }, + { + "epoch": 0.03, + "global_step": 5184, + "learning_rate": 0.00047919866444073454, + "loss": 1.4671, + "loss_base2": 2.1166, + "loss_pixel": 0.1784, + "loss_text": 1.2886, + "ppl": 4.3366, + "step": 5184 + }, + { + "epoch": 0.03, + "global_step": 5185, + "learning_rate": 0.00047919449081803005, + "loss": 1.4649, + "loss_base2": 2.1134, + "loss_pixel": 0.1794, + "loss_text": 1.2855, + "ppl": 4.3271, + "step": 5185 + }, + { + "epoch": 0.03, + "global_step": 5186, + "learning_rate": 0.00047919031719532556, + "loss": 1.5509, + "loss_base2": 2.2375, + "loss_pixel": 0.1761, + "loss_text": 1.3749, + "ppl": 4.7157, + "step": 5186 + }, + { + "epoch": 0.03, + "global_step": 5187, + "learning_rate": 0.000479186143572621, + "loss": 1.7298, + "loss_base2": 2.4956, + "loss_pixel": 0.1759, + "loss_text": 1.5539, + "ppl": 5.6395, + "step": 5187 + }, + { + "epoch": 0.03, + "global_step": 5188, + "learning_rate": 0.0004791819699499165, + "loss": 1.7253, + "loss_base2": 2.4891, + "loss_pixel": 0.1748, + "loss_text": 1.5505, + "ppl": 5.6142, + "step": 5188 + }, + { + "epoch": 0.03, + "global_step": 5189, + "learning_rate": 0.000479177796327212, + "loss": 1.7316, + "loss_base2": 2.4982, + "loss_pixel": 0.1757, + "loss_text": 1.5559, + "ppl": 5.6497, + "step": 5189 + }, + { + "epoch": 0.03, + "global_step": 5190, + "learning_rate": 0.00047917362270450753, + "loss": 1.6843, + "loss_base2": 2.4299, + "loss_pixel": 0.1766, + "loss_text": 1.5077, + "ppl": 5.3887, + "step": 5190 + }, + { + "epoch": 0.03, + "global_step": 5191, + "learning_rate": 0.000479169449081803, + "loss": 1.7022, + "loss_base2": 2.4558, + "loss_pixel": 0.1766, + "loss_text": 1.5256, + "ppl": 5.486, + "step": 5191 + }, + { + "epoch": 0.03, + "global_step": 5192, + "learning_rate": 0.0004791652754590985, + "loss": 1.6908, + "loss_base2": 2.4393, + "loss_pixel": 0.1752, + "loss_text": 1.5155, + "ppl": 5.4238, + "step": 5192 + }, + { + "epoch": 0.03, + "global_step": 5193, + "learning_rate": 0.000479161101836394, + "loss": 1.7224, + "loss_base2": 2.4849, + "loss_pixel": 0.1739, + "loss_text": 1.5484, + "ppl": 5.5979, + "step": 5193 + }, + { + "epoch": 0.03, + "global_step": 5194, + "learning_rate": 0.0004791569282136895, + "loss": 1.7273, + "loss_base2": 2.492, + "loss_pixel": 0.1769, + "loss_text": 1.5504, + "ppl": 5.6254, + "step": 5194 + }, + { + "epoch": 0.03, + "global_step": 5195, + "learning_rate": 0.000479152754590985, + "loss": 1.6994, + "loss_base2": 2.4517, + "loss_pixel": 0.1746, + "loss_text": 1.5247, + "ppl": 5.4707, + "step": 5195 + }, + { + "epoch": 0.03, + "global_step": 5196, + "learning_rate": 0.00047914858096828047, + "loss": 1.7106, + "loss_base2": 2.4679, + "loss_pixel": 0.1757, + "loss_text": 1.5349, + "ppl": 5.5323, + "step": 5196 + }, + { + "epoch": 0.03, + "global_step": 5197, + "learning_rate": 0.000479144407345576, + "loss": 1.7247, + "loss_base2": 2.4882, + "loss_pixel": 0.1766, + "loss_text": 1.5481, + "ppl": 5.6108, + "step": 5197 + }, + { + "epoch": 0.03, + "global_step": 5198, + "learning_rate": 0.0004791402337228715, + "loss": 1.7044, + "loss_base2": 2.4589, + "loss_pixel": 0.1762, + "loss_text": 1.5282, + "ppl": 5.4981, + "step": 5198 + }, + { + "epoch": 0.03, + "global_step": 5199, + "learning_rate": 0.000479136060100167, + "loss": 1.7011, + "loss_base2": 2.4542, + "loss_pixel": 0.176, + "loss_text": 1.5251, + "ppl": 5.48, + "step": 5199 + }, + { + "epoch": 0.03, + "global_step": 5200, + "learning_rate": 0.00047913188647746244, + "loss": 1.7119, + "loss_base2": 2.4697, + "loss_pixel": 0.1754, + "loss_text": 1.5366, + "ppl": 5.5395, + "step": 5200 + }, + { + "epoch": 0.03, + "global_step": 5201, + "learning_rate": 0.0004791277128547579, + "loss": 1.6787, + "loss_base2": 2.4219, + "loss_pixel": 0.1756, + "loss_text": 1.5032, + "ppl": 5.3586, + "step": 5201 + }, + { + "epoch": 0.03, + "global_step": 5202, + "learning_rate": 0.0004791235392320534, + "loss": 1.7079, + "loss_base2": 2.464, + "loss_pixel": 0.1745, + "loss_text": 1.5335, + "ppl": 5.5174, + "step": 5202 + }, + { + "epoch": 0.03, + "global_step": 5203, + "learning_rate": 0.0004791193656093489, + "loss": 1.7213, + "loss_base2": 2.4833, + "loss_pixel": 0.1928, + "loss_text": 1.5284, + "ppl": 5.5918, + "step": 5203 + }, + { + "epoch": 0.03, + "global_step": 5204, + "learning_rate": 0.0004791151919866444, + "loss": 1.6971, + "loss_base2": 2.4484, + "loss_pixel": 0.1933, + "loss_text": 1.5038, + "ppl": 5.4581, + "step": 5204 + }, + { + "epoch": 0.03, + "global_step": 5205, + "learning_rate": 0.00047911101836393987, + "loss": 1.7359, + "loss_base2": 2.5044, + "loss_pixel": 0.1956, + "loss_text": 1.5403, + "ppl": 5.674, + "step": 5205 + }, + { + "epoch": 0.03, + "global_step": 5206, + "learning_rate": 0.0004791068447412354, + "loss": 1.7152, + "loss_base2": 2.4745, + "loss_pixel": 0.1932, + "loss_text": 1.522, + "ppl": 5.5578, + "step": 5206 + }, + { + "epoch": 0.03, + "global_step": 5207, + "learning_rate": 0.0004791026711185309, + "loss": 1.7474, + "loss_base2": 2.521, + "loss_pixel": 0.1896, + "loss_text": 1.5578, + "ppl": 5.7397, + "step": 5207 + }, + { + "epoch": 0.03, + "global_step": 5208, + "learning_rate": 0.0004790984974958264, + "loss": 1.6958, + "loss_base2": 2.4465, + "loss_pixel": 0.1782, + "loss_text": 1.5176, + "ppl": 5.451, + "step": 5208 + }, + { + "epoch": 0.03, + "global_step": 5209, + "learning_rate": 0.0004790943238731219, + "loss": 1.7013, + "loss_base2": 2.4545, + "loss_pixel": 0.1786, + "loss_text": 1.5228, + "ppl": 5.4811, + "step": 5209 + }, + { + "epoch": 0.03, + "global_step": 5210, + "learning_rate": 0.00047909015025041736, + "loss": 1.7235, + "loss_base2": 2.4865, + "loss_pixel": 0.1782, + "loss_text": 1.5453, + "ppl": 5.6041, + "step": 5210 + }, + { + "epoch": 0.03, + "global_step": 5211, + "learning_rate": 0.00047908597662771286, + "loss": 1.5585, + "loss_base2": 2.2484, + "loss_pixel": 0.1772, + "loss_text": 1.3813, + "ppl": 4.7517, + "step": 5211 + }, + { + "epoch": 0.03, + "global_step": 5212, + "learning_rate": 0.00047908180300500837, + "loss": 1.465, + "loss_base2": 2.1135, + "loss_pixel": 0.1736, + "loss_text": 1.2914, + "ppl": 4.3275, + "step": 5212 + }, + { + "epoch": 0.03, + "global_step": 5213, + "learning_rate": 0.0004790776293823039, + "loss": 1.4568, + "loss_base2": 2.1017, + "loss_pixel": 0.1749, + "loss_text": 1.282, + "ppl": 4.2922, + "step": 5213 + }, + { + "epoch": 0.03, + "global_step": 5214, + "learning_rate": 0.00047907345575959933, + "loss": 1.483, + "loss_base2": 2.1395, + "loss_pixel": 0.1764, + "loss_text": 1.3066, + "ppl": 4.4061, + "step": 5214 + }, + { + "epoch": 0.03, + "global_step": 5215, + "learning_rate": 0.00047906928213689484, + "loss": 1.4674, + "loss_base2": 2.117, + "loss_pixel": 0.1753, + "loss_text": 1.2921, + "ppl": 4.3379, + "step": 5215 + }, + { + "epoch": 0.03, + "global_step": 5216, + "learning_rate": 0.00047906510851419034, + "loss": 1.4846, + "loss_base2": 2.1418, + "loss_pixel": 0.1765, + "loss_text": 1.3082, + "ppl": 4.4132, + "step": 5216 + }, + { + "epoch": 0.03, + "global_step": 5217, + "learning_rate": 0.00047906093489148585, + "loss": 1.4875, + "loss_base2": 2.146, + "loss_pixel": 0.1737, + "loss_text": 1.3138, + "ppl": 4.426, + "step": 5217 + }, + { + "epoch": 0.03, + "global_step": 5218, + "learning_rate": 0.00047905676126878136, + "loss": 1.5991, + "loss_base2": 2.307, + "loss_pixel": 0.1754, + "loss_text": 1.4238, + "ppl": 4.9486, + "step": 5218 + }, + { + "epoch": 0.03, + "global_step": 5219, + "learning_rate": 0.0004790525876460768, + "loss": 1.7154, + "loss_base2": 2.4748, + "loss_pixel": 0.174, + "loss_text": 1.5413, + "ppl": 5.5589, + "step": 5219 + }, + { + "epoch": 0.03, + "global_step": 5220, + "learning_rate": 0.00047904841402337227, + "loss": 1.7271, + "loss_base2": 2.4917, + "loss_pixel": 0.1744, + "loss_text": 1.5527, + "ppl": 5.6243, + "step": 5220 + }, + { + "epoch": 0.03, + "global_step": 5221, + "learning_rate": 0.0004790442404006678, + "loss": 1.708, + "loss_base2": 2.4641, + "loss_pixel": 0.1746, + "loss_text": 1.5335, + "ppl": 5.5179, + "step": 5221 + }, + { + "epoch": 0.03, + "global_step": 5222, + "learning_rate": 0.0004790400667779633, + "loss": 1.7317, + "loss_base2": 2.4983, + "loss_pixel": 0.1793, + "loss_text": 1.5524, + "ppl": 5.6503, + "step": 5222 + }, + { + "epoch": 0.03, + "global_step": 5223, + "learning_rate": 0.00047903589315525873, + "loss": 1.7292, + "loss_base2": 2.4947, + "loss_pixel": 0.1921, + "loss_text": 1.5371, + "ppl": 5.6361, + "step": 5223 + }, + { + "epoch": 0.03, + "global_step": 5224, + "learning_rate": 0.00047903171953255424, + "loss": 1.7355, + "loss_base2": 2.5038, + "loss_pixel": 0.1915, + "loss_text": 1.544, + "ppl": 5.6718, + "step": 5224 + }, + { + "epoch": 0.03, + "global_step": 5225, + "learning_rate": 0.00047902754590984975, + "loss": 1.7275, + "loss_base2": 2.4923, + "loss_pixel": 0.1826, + "loss_text": 1.5449, + "ppl": 5.6266, + "step": 5225 + }, + { + "epoch": 0.03, + "global_step": 5226, + "learning_rate": 0.00047902337228714526, + "loss": 1.7303, + "loss_base2": 2.4963, + "loss_pixel": 0.1791, + "loss_text": 1.5512, + "ppl": 5.6423, + "step": 5226 + }, + { + "epoch": 0.03, + "global_step": 5227, + "learning_rate": 0.00047901919866444076, + "loss": 1.7187, + "loss_base2": 2.4796, + "loss_pixel": 0.1752, + "loss_text": 1.5435, + "ppl": 5.5773, + "step": 5227 + }, + { + "epoch": 0.03, + "global_step": 5228, + "learning_rate": 0.0004790150250417362, + "loss": 1.7141, + "loss_base2": 2.4729, + "loss_pixel": 0.1772, + "loss_text": 1.5368, + "ppl": 5.5517, + "step": 5228 + }, + { + "epoch": 0.03, + "global_step": 5229, + "learning_rate": 0.0004790108514190317, + "loss": 1.6929, + "loss_base2": 2.4423, + "loss_pixel": 0.1762, + "loss_text": 1.5167, + "ppl": 5.4352, + "step": 5229 + }, + { + "epoch": 0.03, + "global_step": 5230, + "learning_rate": 0.00047900667779632723, + "loss": 1.7117, + "loss_base2": 2.4695, + "loss_pixel": 0.1755, + "loss_text": 1.5362, + "ppl": 5.5384, + "step": 5230 + }, + { + "epoch": 0.03, + "global_step": 5231, + "learning_rate": 0.00047900250417362274, + "loss": 1.7188, + "loss_base2": 2.4797, + "loss_pixel": 0.1742, + "loss_text": 1.5446, + "ppl": 5.5778, + "step": 5231 + }, + { + "epoch": 0.03, + "global_step": 5232, + "learning_rate": 0.0004789983305509182, + "loss": 1.7297, + "loss_base2": 2.4954, + "loss_pixel": 0.1791, + "loss_text": 1.5506, + "ppl": 5.639, + "step": 5232 + }, + { + "epoch": 0.03, + "global_step": 5233, + "learning_rate": 0.0004789941569282137, + "loss": 1.6957, + "loss_base2": 2.4464, + "loss_pixel": 0.1754, + "loss_text": 1.5203, + "ppl": 5.4505, + "step": 5233 + }, + { + "epoch": 0.03, + "global_step": 5234, + "learning_rate": 0.0004789899833055092, + "loss": 1.7132, + "loss_base2": 2.4716, + "loss_pixel": 0.1761, + "loss_text": 1.5371, + "ppl": 5.5467, + "step": 5234 + }, + { + "epoch": 0.03, + "global_step": 5235, + "learning_rate": 0.0004789858096828047, + "loss": 1.6948, + "loss_base2": 2.4451, + "loss_pixel": 0.1773, + "loss_text": 1.5175, + "ppl": 5.4456, + "step": 5235 + }, + { + "epoch": 0.03, + "global_step": 5236, + "learning_rate": 0.0004789816360601002, + "loss": 1.7002, + "loss_base2": 2.4529, + "loss_pixel": 0.1759, + "loss_text": 1.5243, + "ppl": 5.475, + "step": 5236 + }, + { + "epoch": 0.03, + "global_step": 5237, + "learning_rate": 0.0004789774624373957, + "loss": 1.7172, + "loss_base2": 2.4774, + "loss_pixel": 0.1746, + "loss_text": 1.5426, + "ppl": 5.5689, + "step": 5237 + }, + { + "epoch": 0.03, + "global_step": 5238, + "learning_rate": 0.0004789732888146912, + "loss": 1.7058, + "loss_base2": 2.4609, + "loss_pixel": 0.1751, + "loss_text": 1.5307, + "ppl": 5.5058, + "step": 5238 + }, + { + "epoch": 0.03, + "global_step": 5239, + "learning_rate": 0.00047896911519198663, + "loss": 1.717, + "loss_base2": 2.4771, + "loss_pixel": 0.1755, + "loss_text": 1.5415, + "ppl": 5.5678, + "step": 5239 + }, + { + "epoch": 0.03, + "global_step": 5240, + "learning_rate": 0.00047896494156928214, + "loss": 1.5183, + "loss_base2": 2.1904, + "loss_pixel": 0.1742, + "loss_text": 1.3441, + "ppl": 4.5645, + "step": 5240 + }, + { + "epoch": 0.03, + "global_step": 5241, + "learning_rate": 0.0004789607679465776, + "loss": 1.4793, + "loss_base2": 2.1342, + "loss_pixel": 0.1882, + "loss_text": 1.2911, + "ppl": 4.3899, + "step": 5241 + }, + { + "epoch": 0.03, + "global_step": 5242, + "learning_rate": 0.0004789565943238731, + "loss": 1.4817, + "loss_base2": 2.1376, + "loss_pixel": 0.1946, + "loss_text": 1.2871, + "ppl": 4.4004, + "step": 5242 + }, + { + "epoch": 0.03, + "global_step": 5243, + "learning_rate": 0.0004789524207011686, + "loss": 1.4843, + "loss_base2": 2.1414, + "loss_pixel": 0.1887, + "loss_text": 1.2957, + "ppl": 4.4119, + "step": 5243 + }, + { + "epoch": 0.03, + "global_step": 5244, + "learning_rate": 0.0004789482470784641, + "loss": 1.4549, + "loss_base2": 2.099, + "loss_pixel": 0.1764, + "loss_text": 1.2784, + "ppl": 4.2841, + "step": 5244 + }, + { + "epoch": 0.03, + "global_step": 5245, + "learning_rate": 0.0004789440734557596, + "loss": 1.4869, + "loss_base2": 2.1451, + "loss_pixel": 0.1761, + "loss_text": 1.3108, + "ppl": 4.4234, + "step": 5245 + }, + { + "epoch": 0.03, + "global_step": 5246, + "learning_rate": 0.0004789398998330551, + "loss": 1.4717, + "loss_base2": 2.1232, + "loss_pixel": 0.1747, + "loss_text": 1.2969, + "ppl": 4.3566, + "step": 5246 + }, + { + "epoch": 0.03, + "global_step": 5247, + "learning_rate": 0.0004789357262103506, + "loss": 1.4789, + "loss_base2": 2.1336, + "loss_pixel": 0.1746, + "loss_text": 1.3043, + "ppl": 4.3881, + "step": 5247 + }, + { + "epoch": 0.03, + "global_step": 5248, + "learning_rate": 0.0004789315525876461, + "loss": 1.7227, + "loss_base2": 2.4853, + "loss_pixel": 0.1755, + "loss_text": 1.5471, + "ppl": 5.5996, + "step": 5248 + }, + { + "epoch": 0.03, + "global_step": 5249, + "learning_rate": 0.0004789273789649416, + "loss": 1.7274, + "loss_base2": 2.4921, + "loss_pixel": 0.1747, + "loss_text": 1.5527, + "ppl": 5.626, + "step": 5249 + }, + { + "epoch": 0.03, + "global_step": 5250, + "learning_rate": 0.00047892320534223705, + "loss": 1.7384, + "loss_base2": 2.508, + "loss_pixel": 0.1735, + "loss_text": 1.5649, + "ppl": 5.6882, + "step": 5250 + }, + { + "epoch": 0.03, + "global_step": 5251, + "learning_rate": 0.00047891903171953256, + "loss": 1.7033, + "loss_base2": 2.4573, + "loss_pixel": 0.1751, + "loss_text": 1.5282, + "ppl": 5.492, + "step": 5251 + }, + { + "epoch": 0.03, + "global_step": 5252, + "learning_rate": 0.00047891485809682807, + "loss": 1.7148, + "loss_base2": 2.4739, + "loss_pixel": 0.1721, + "loss_text": 1.5427, + "ppl": 5.5556, + "step": 5252 + }, + { + "epoch": 0.03, + "global_step": 5253, + "learning_rate": 0.0004789106844741236, + "loss": 1.7149, + "loss_base2": 2.4741, + "loss_pixel": 0.1756, + "loss_text": 1.5394, + "ppl": 5.5561, + "step": 5253 + }, + { + "epoch": 0.03, + "global_step": 5254, + "learning_rate": 0.0004789065108514191, + "loss": 1.7143, + "loss_base2": 2.4732, + "loss_pixel": 0.1741, + "loss_text": 1.5401, + "ppl": 5.5528, + "step": 5254 + }, + { + "epoch": 0.03, + "global_step": 5255, + "learning_rate": 0.00047890233722871453, + "loss": 1.7239, + "loss_base2": 2.4871, + "loss_pixel": 0.1736, + "loss_text": 1.5503, + "ppl": 5.6064, + "step": 5255 + }, + { + "epoch": 0.03, + "global_step": 5256, + "learning_rate": 0.00047889816360601004, + "loss": 1.7332, + "loss_base2": 2.5005, + "loss_pixel": 0.1766, + "loss_text": 1.5566, + "ppl": 5.6587, + "step": 5256 + }, + { + "epoch": 0.03, + "global_step": 5257, + "learning_rate": 0.00047889398998330555, + "loss": 1.72, + "loss_base2": 2.4814, + "loss_pixel": 0.1735, + "loss_text": 1.5465, + "ppl": 5.5845, + "step": 5257 + }, + { + "epoch": 0.03, + "global_step": 5258, + "learning_rate": 0.000478889816360601, + "loss": 1.7193, + "loss_base2": 2.4804, + "loss_pixel": 0.1752, + "loss_text": 1.5441, + "ppl": 5.5806, + "step": 5258 + }, + { + "epoch": 0.03, + "global_step": 5259, + "learning_rate": 0.00047888564273789645, + "loss": 1.7185, + "loss_base2": 2.4793, + "loss_pixel": 0.1749, + "loss_text": 1.5436, + "ppl": 5.5762, + "step": 5259 + }, + { + "epoch": 0.03, + "global_step": 5260, + "learning_rate": 0.00047888146911519196, + "loss": 1.7026, + "loss_base2": 2.4563, + "loss_pixel": 0.1731, + "loss_text": 1.5295, + "ppl": 5.4882, + "step": 5260 + }, + { + "epoch": 0.03, + "global_step": 5261, + "learning_rate": 0.00047887729549248747, + "loss": 1.7121, + "loss_base2": 2.47, + "loss_pixel": 0.1752, + "loss_text": 1.5369, + "ppl": 5.5406, + "step": 5261 + }, + { + "epoch": 0.03, + "global_step": 5262, + "learning_rate": 0.000478873121869783, + "loss": 1.7102, + "loss_base2": 2.4673, + "loss_pixel": 0.1747, + "loss_text": 1.5355, + "ppl": 5.5301, + "step": 5262 + }, + { + "epoch": 0.03, + "global_step": 5263, + "learning_rate": 0.0004788689482470785, + "loss": 1.7075, + "loss_base2": 2.4634, + "loss_pixel": 0.1727, + "loss_text": 1.5347, + "ppl": 5.5152, + "step": 5263 + }, + { + "epoch": 0.03, + "global_step": 5264, + "learning_rate": 0.00047886477462437394, + "loss": 1.7175, + "loss_base2": 2.4778, + "loss_pixel": 0.1748, + "loss_text": 1.5428, + "ppl": 5.5706, + "step": 5264 + }, + { + "epoch": 0.03, + "global_step": 5265, + "learning_rate": 0.00047886060100166944, + "loss": 1.7118, + "loss_base2": 2.4696, + "loss_pixel": 0.1732, + "loss_text": 1.5386, + "ppl": 5.5389, + "step": 5265 + }, + { + "epoch": 0.03, + "global_step": 5266, + "learning_rate": 0.00047885642737896495, + "loss": 1.7066, + "loss_base2": 2.4621, + "loss_pixel": 0.1737, + "loss_text": 1.5329, + "ppl": 5.5102, + "step": 5266 + }, + { + "epoch": 0.03, + "global_step": 5267, + "learning_rate": 0.00047885225375626046, + "loss": 1.7049, + "loss_base2": 2.4597, + "loss_pixel": 0.1727, + "loss_text": 1.5322, + "ppl": 5.5008, + "step": 5267 + }, + { + "epoch": 0.03, + "global_step": 5268, + "learning_rate": 0.00047884808013355597, + "loss": 1.7103, + "loss_base2": 2.4674, + "loss_pixel": 0.1728, + "loss_text": 1.5376, + "ppl": 5.5306, + "step": 5268 + }, + { + "epoch": 0.03, + "global_step": 5269, + "learning_rate": 0.0004788439065108514, + "loss": 1.6881, + "loss_base2": 2.4354, + "loss_pixel": 0.1751, + "loss_text": 1.5129, + "ppl": 5.4092, + "step": 5269 + }, + { + "epoch": 0.03, + "global_step": 5270, + "learning_rate": 0.0004788397328881469, + "loss": 1.6884, + "loss_base2": 2.4358, + "loss_pixel": 0.1723, + "loss_text": 1.5161, + "ppl": 5.4108, + "step": 5270 + }, + { + "epoch": 0.03, + "global_step": 5271, + "learning_rate": 0.00047883555926544243, + "loss": 1.6053, + "loss_base2": 2.316, + "loss_pixel": 0.1761, + "loss_text": 1.4293, + "ppl": 4.9794, + "step": 5271 + }, + { + "epoch": 0.03, + "global_step": 5272, + "learning_rate": 0.00047883138564273794, + "loss": 1.4906, + "loss_base2": 2.1505, + "loss_pixel": 0.1721, + "loss_text": 1.3184, + "ppl": 4.4398, + "step": 5272 + }, + { + "epoch": 0.03, + "global_step": 5273, + "learning_rate": 0.0004788272120200334, + "loss": 1.4861, + "loss_base2": 2.144, + "loss_pixel": 0.1719, + "loss_text": 1.3142, + "ppl": 4.4198, + "step": 5273 + }, + { + "epoch": 0.03, + "global_step": 5274, + "learning_rate": 0.0004788230383973289, + "loss": 1.4766, + "loss_base2": 2.1303, + "loss_pixel": 0.174, + "loss_text": 1.3025, + "ppl": 4.378, + "step": 5274 + }, + { + "epoch": 0.03, + "global_step": 5275, + "learning_rate": 0.0004788188647746244, + "loss": 1.4832, + "loss_base2": 2.1398, + "loss_pixel": 0.171, + "loss_text": 1.3123, + "ppl": 4.407, + "step": 5275 + }, + { + "epoch": 0.03, + "global_step": 5276, + "learning_rate": 0.0004788146911519199, + "loss": 1.461, + "loss_base2": 2.1078, + "loss_pixel": 0.1744, + "loss_text": 1.2866, + "ppl": 4.3103, + "step": 5276 + }, + { + "epoch": 0.03, + "global_step": 5277, + "learning_rate": 0.00047881051752921537, + "loss": 1.4906, + "loss_base2": 2.1505, + "loss_pixel": 0.1724, + "loss_text": 1.3181, + "ppl": 4.4398, + "step": 5277 + }, + { + "epoch": 0.03, + "global_step": 5278, + "learning_rate": 0.0004788063439065108, + "loss": 1.4733, + "loss_base2": 2.1255, + "loss_pixel": 0.1738, + "loss_text": 1.2996, + "ppl": 4.3636, + "step": 5278 + }, + { + "epoch": 0.03, + "global_step": 5279, + "learning_rate": 0.00047880217028380633, + "loss": 1.5465, + "loss_base2": 2.2311, + "loss_pixel": 0.1726, + "loss_text": 1.3739, + "ppl": 4.695, + "step": 5279 + }, + { + "epoch": 0.03, + "global_step": 5280, + "learning_rate": 0.00047879799666110184, + "loss": 1.6834, + "loss_base2": 2.4286, + "loss_pixel": 0.1719, + "loss_text": 1.5115, + "ppl": 5.3838, + "step": 5280 + }, + { + "epoch": 0.03, + "global_step": 5281, + "learning_rate": 0.00047879382303839734, + "loss": 1.6928, + "loss_base2": 2.4422, + "loss_pixel": 0.1713, + "loss_text": 1.5215, + "ppl": 5.4347, + "step": 5281 + }, + { + "epoch": 0.03, + "global_step": 5282, + "learning_rate": 0.0004787896494156928, + "loss": 1.7161, + "loss_base2": 2.4758, + "loss_pixel": 0.1723, + "loss_text": 1.5438, + "ppl": 5.5628, + "step": 5282 + }, + { + "epoch": 0.03, + "global_step": 5283, + "learning_rate": 0.0004787854757929883, + "loss": 1.7227, + "loss_base2": 2.4853, + "loss_pixel": 0.1735, + "loss_text": 1.5491, + "ppl": 5.5996, + "step": 5283 + }, + { + "epoch": 0.03, + "global_step": 5284, + "learning_rate": 0.0004787813021702838, + "loss": 1.7134, + "loss_base2": 2.4719, + "loss_pixel": 0.1732, + "loss_text": 1.5403, + "ppl": 5.5478, + "step": 5284 + }, + { + "epoch": 0.03, + "global_step": 5285, + "learning_rate": 0.0004787771285475793, + "loss": 1.7147, + "loss_base2": 2.4738, + "loss_pixel": 0.1722, + "loss_text": 1.5425, + "ppl": 5.555, + "step": 5285 + }, + { + "epoch": 0.03, + "global_step": 5286, + "learning_rate": 0.0004787729549248748, + "loss": 1.6985, + "loss_base2": 2.4504, + "loss_pixel": 0.1709, + "loss_text": 1.5276, + "ppl": 5.4657, + "step": 5286 + }, + { + "epoch": 0.03, + "global_step": 5287, + "learning_rate": 0.0004787687813021703, + "loss": 1.6923, + "loss_base2": 2.4415, + "loss_pixel": 0.1735, + "loss_text": 1.5188, + "ppl": 5.432, + "step": 5287 + }, + { + "epoch": 0.03, + "global_step": 5288, + "learning_rate": 0.0004787646076794658, + "loss": 1.717, + "loss_base2": 2.4771, + "loss_pixel": 0.1725, + "loss_text": 1.5445, + "ppl": 5.5678, + "step": 5288 + }, + { + "epoch": 0.03, + "global_step": 5289, + "learning_rate": 0.0004787604340567613, + "loss": 1.7015, + "loss_base2": 2.4547, + "loss_pixel": 0.1716, + "loss_text": 1.5299, + "ppl": 5.4822, + "step": 5289 + }, + { + "epoch": 0.03, + "global_step": 5290, + "learning_rate": 0.0004787562604340568, + "loss": 1.7144, + "loss_base2": 2.4734, + "loss_pixel": 0.1717, + "loss_text": 1.5428, + "ppl": 5.5533, + "step": 5290 + }, + { + "epoch": 0.03, + "global_step": 5291, + "learning_rate": 0.00047875208681135226, + "loss": 1.7049, + "loss_base2": 2.4597, + "loss_pixel": 0.1725, + "loss_text": 1.5324, + "ppl": 5.5008, + "step": 5291 + }, + { + "epoch": 0.03, + "global_step": 5292, + "learning_rate": 0.00047874791318864776, + "loss": 1.7087, + "loss_base2": 2.4651, + "loss_pixel": 0.1706, + "loss_text": 1.5381, + "ppl": 5.5218, + "step": 5292 + }, + { + "epoch": 0.03, + "global_step": 5293, + "learning_rate": 0.00047874373956594327, + "loss": 1.7283, + "loss_base2": 2.4934, + "loss_pixel": 0.1802, + "loss_text": 1.5481, + "ppl": 5.6311, + "step": 5293 + }, + { + "epoch": 0.03, + "global_step": 5294, + "learning_rate": 0.0004787395659432388, + "loss": 1.726, + "loss_base2": 2.4901, + "loss_pixel": 0.1851, + "loss_text": 1.5408, + "ppl": 5.6181, + "step": 5294 + }, + { + "epoch": 0.03, + "global_step": 5295, + "learning_rate": 0.0004787353923205343, + "loss": 1.7092, + "loss_base2": 2.4659, + "loss_pixel": 0.1857, + "loss_text": 1.5235, + "ppl": 5.5245, + "step": 5295 + }, + { + "epoch": 0.03, + "global_step": 5296, + "learning_rate": 0.0004787312186978297, + "loss": 1.7177, + "loss_base2": 2.4781, + "loss_pixel": 0.1848, + "loss_text": 1.5329, + "ppl": 5.5717, + "step": 5296 + }, + { + "epoch": 0.03, + "global_step": 5297, + "learning_rate": 0.0004787270450751252, + "loss": 1.7032, + "loss_base2": 2.4572, + "loss_pixel": 0.1844, + "loss_text": 1.5188, + "ppl": 5.4915, + "step": 5297 + }, + { + "epoch": 0.03, + "global_step": 5298, + "learning_rate": 0.0004787228714524207, + "loss": 1.7242, + "loss_base2": 2.4875, + "loss_pixel": 0.1842, + "loss_text": 1.5399, + "ppl": 5.608, + "step": 5298 + }, + { + "epoch": 0.03, + "global_step": 5299, + "learning_rate": 0.0004787186978297162, + "loss": 1.7191, + "loss_base2": 2.4801, + "loss_pixel": 0.1854, + "loss_text": 1.5338, + "ppl": 5.5795, + "step": 5299 + }, + { + "epoch": 0.03, + "global_step": 5300, + "learning_rate": 0.00047871452420701166, + "loss": 1.734, + "loss_base2": 2.5016, + "loss_pixel": 0.1854, + "loss_text": 1.5486, + "ppl": 5.6633, + "step": 5300 + }, + { + "epoch": 0.03, + "global_step": 5301, + "learning_rate": 0.00047871035058430717, + "loss": 1.7295, + "loss_base2": 2.4951, + "loss_pixel": 0.1829, + "loss_text": 1.5465, + "ppl": 5.6378, + "step": 5301 + }, + { + "epoch": 0.03, + "global_step": 5302, + "learning_rate": 0.0004787061769616027, + "loss": 1.718, + "loss_base2": 2.4786, + "loss_pixel": 0.1833, + "loss_text": 1.5346, + "ppl": 5.5734, + "step": 5302 + }, + { + "epoch": 0.03, + "global_step": 5303, + "learning_rate": 0.0004787020033388982, + "loss": 1.7262, + "loss_base2": 2.4904, + "loss_pixel": 0.1843, + "loss_text": 1.5419, + "ppl": 5.6193, + "step": 5303 + }, + { + "epoch": 0.03, + "global_step": 5304, + "learning_rate": 0.0004786978297161937, + "loss": 1.6969, + "loss_base2": 2.4481, + "loss_pixel": 0.1822, + "loss_text": 1.5147, + "ppl": 5.457, + "step": 5304 + }, + { + "epoch": 0.03, + "global_step": 5305, + "learning_rate": 0.00047869365609348914, + "loss": 1.7002, + "loss_base2": 2.4529, + "loss_pixel": 0.1833, + "loss_text": 1.5169, + "ppl": 5.475, + "step": 5305 + }, + { + "epoch": 0.03, + "global_step": 5306, + "learning_rate": 0.00047868948247078465, + "loss": 1.7246, + "loss_base2": 2.4881, + "loss_pixel": 0.1832, + "loss_text": 1.5414, + "ppl": 5.6103, + "step": 5306 + }, + { + "epoch": 0.03, + "global_step": 5307, + "learning_rate": 0.00047868530884808016, + "loss": 1.6844, + "loss_base2": 2.4301, + "loss_pixel": 0.1827, + "loss_text": 1.5017, + "ppl": 5.3892, + "step": 5307 + }, + { + "epoch": 0.03, + "global_step": 5308, + "learning_rate": 0.00047868113522537566, + "loss": 1.708, + "loss_base2": 2.4641, + "loss_pixel": 0.1832, + "loss_text": 1.5247, + "ppl": 5.5179, + "step": 5308 + }, + { + "epoch": 0.03, + "global_step": 5309, + "learning_rate": 0.0004786769616026711, + "loss": 1.7304, + "loss_base2": 2.4964, + "loss_pixel": 0.1824, + "loss_text": 1.548, + "ppl": 5.6429, + "step": 5309 + }, + { + "epoch": 0.03, + "global_step": 5310, + "learning_rate": 0.0004786727879799666, + "loss": 1.7276, + "loss_base2": 2.4924, + "loss_pixel": 0.1814, + "loss_text": 1.5461, + "ppl": 5.6271, + "step": 5310 + }, + { + "epoch": 0.03, + "global_step": 5311, + "learning_rate": 0.00047866861435726213, + "loss": 1.7157, + "loss_base2": 2.4752, + "loss_pixel": 0.1822, + "loss_text": 1.5335, + "ppl": 5.5606, + "step": 5311 + }, + { + "epoch": 0.03, + "global_step": 5312, + "learning_rate": 0.00047866444073455764, + "loss": 1.7193, + "loss_base2": 2.4804, + "loss_pixel": 0.1827, + "loss_text": 1.5366, + "ppl": 5.5806, + "step": 5312 + }, + { + "epoch": 0.03, + "global_step": 5313, + "learning_rate": 0.00047866026711185315, + "loss": 1.7232, + "loss_base2": 2.4861, + "loss_pixel": 0.183, + "loss_text": 1.5402, + "ppl": 5.6024, + "step": 5313 + }, + { + "epoch": 0.03, + "global_step": 5314, + "learning_rate": 0.00047865609348914854, + "loss": 1.7006, + "loss_base2": 2.4534, + "loss_pixel": 0.1812, + "loss_text": 1.5195, + "ppl": 5.4772, + "step": 5314 + }, + { + "epoch": 0.03, + "global_step": 5315, + "learning_rate": 0.00047865191986644405, + "loss": 1.7043, + "loss_base2": 2.4588, + "loss_pixel": 0.1814, + "loss_text": 1.5228, + "ppl": 5.4975, + "step": 5315 + }, + { + "epoch": 0.03, + "global_step": 5316, + "learning_rate": 0.00047864774624373956, + "loss": 1.7243, + "loss_base2": 2.4876, + "loss_pixel": 0.1823, + "loss_text": 1.5421, + "ppl": 5.6086, + "step": 5316 + }, + { + "epoch": 0.03, + "global_step": 5317, + "learning_rate": 0.00047864357262103507, + "loss": 1.7095, + "loss_base2": 2.4663, + "loss_pixel": 0.1819, + "loss_text": 1.5275, + "ppl": 5.5262, + "step": 5317 + }, + { + "epoch": 0.03, + "global_step": 5318, + "learning_rate": 0.0004786393989983306, + "loss": 1.7049, + "loss_base2": 2.4597, + "loss_pixel": 0.182, + "loss_text": 1.5229, + "ppl": 5.5008, + "step": 5318 + }, + { + "epoch": 0.03, + "global_step": 5319, + "learning_rate": 0.000478635225375626, + "loss": 1.6925, + "loss_base2": 2.4418, + "loss_pixel": 0.1819, + "loss_text": 1.5106, + "ppl": 5.433, + "step": 5319 + }, + { + "epoch": 0.03, + "global_step": 5320, + "learning_rate": 0.00047863105175292153, + "loss": 1.719, + "loss_base2": 2.48, + "loss_pixel": 0.1817, + "loss_text": 1.5373, + "ppl": 5.5789, + "step": 5320 + }, + { + "epoch": 0.03, + "global_step": 5321, + "learning_rate": 0.00047862687813021704, + "loss": 1.7011, + "loss_base2": 2.4542, + "loss_pixel": 0.1839, + "loss_text": 1.5171, + "ppl": 5.48, + "step": 5321 + }, + { + "epoch": 0.03, + "global_step": 5322, + "learning_rate": 0.00047862270450751255, + "loss": 1.7167, + "loss_base2": 2.4767, + "loss_pixel": 0.1866, + "loss_text": 1.5301, + "ppl": 5.5661, + "step": 5322 + }, + { + "epoch": 0.03, + "global_step": 5323, + "learning_rate": 0.000478618530884808, + "loss": 1.7094, + "loss_base2": 2.4661, + "loss_pixel": 0.192, + "loss_text": 1.5173, + "ppl": 5.5256, + "step": 5323 + }, + { + "epoch": 0.03, + "global_step": 5324, + "learning_rate": 0.0004786143572621035, + "loss": 1.7326, + "loss_base2": 2.4996, + "loss_pixel": 0.1917, + "loss_text": 1.5409, + "ppl": 5.6553, + "step": 5324 + }, + { + "epoch": 0.03, + "global_step": 5325, + "learning_rate": 0.000478610183639399, + "loss": 1.7262, + "loss_base2": 2.4904, + "loss_pixel": 0.1909, + "loss_text": 1.5353, + "ppl": 5.6193, + "step": 5325 + }, + { + "epoch": 0.03, + "global_step": 5326, + "learning_rate": 0.0004786060100166945, + "loss": 1.719, + "loss_base2": 2.48, + "loss_pixel": 0.1974, + "loss_text": 1.5216, + "ppl": 5.5789, + "step": 5326 + }, + { + "epoch": 0.03, + "global_step": 5327, + "learning_rate": 0.00047860183639399003, + "loss": 1.7064, + "loss_base2": 2.4618, + "loss_pixel": 0.1966, + "loss_text": 1.5099, + "ppl": 5.5091, + "step": 5327 + }, + { + "epoch": 0.03, + "global_step": 5328, + "learning_rate": 0.0004785976627712855, + "loss": 1.5493, + "loss_base2": 2.2352, + "loss_pixel": 0.194, + "loss_text": 1.3553, + "ppl": 4.7082, + "step": 5328 + }, + { + "epoch": 0.03, + "global_step": 5329, + "learning_rate": 0.000478593489148581, + "loss": 1.5015, + "loss_base2": 2.1662, + "loss_pixel": 0.1929, + "loss_text": 1.3085, + "ppl": 4.4884, + "step": 5329 + }, + { + "epoch": 0.03, + "global_step": 5330, + "learning_rate": 0.0004785893155258765, + "loss": 1.4929, + "loss_base2": 2.1538, + "loss_pixel": 0.1928, + "loss_text": 1.3001, + "ppl": 4.45, + "step": 5330 + }, + { + "epoch": 0.03, + "global_step": 5331, + "learning_rate": 0.000478585141903172, + "loss": 1.4794, + "loss_base2": 2.1343, + "loss_pixel": 0.192, + "loss_text": 1.2874, + "ppl": 4.3903, + "step": 5331 + }, + { + "epoch": 0.03, + "global_step": 5332, + "learning_rate": 0.00047858096828046746, + "loss": 1.4927, + "loss_base2": 2.1535, + "loss_pixel": 0.1901, + "loss_text": 1.3026, + "ppl": 4.4491, + "step": 5332 + }, + { + "epoch": 0.03, + "global_step": 5333, + "learning_rate": 0.0004785767946577629, + "loss": 1.4845, + "loss_base2": 2.1417, + "loss_pixel": 0.1913, + "loss_text": 1.2932, + "ppl": 4.4128, + "step": 5333 + }, + { + "epoch": 0.03, + "global_step": 5334, + "learning_rate": 0.0004785726210350584, + "loss": 1.4792, + "loss_base2": 2.134, + "loss_pixel": 0.1896, + "loss_text": 1.2895, + "ppl": 4.3894, + "step": 5334 + }, + { + "epoch": 0.03, + "global_step": 5335, + "learning_rate": 0.0004785684474123539, + "loss": 1.5703, + "loss_base2": 2.2655, + "loss_pixel": 0.1895, + "loss_text": 1.3808, + "ppl": 4.8081, + "step": 5335 + }, + { + "epoch": 0.03, + "global_step": 5336, + "learning_rate": 0.00047856427378964943, + "loss": 1.5507, + "loss_base2": 2.2372, + "loss_pixel": 0.1873, + "loss_text": 1.3634, + "ppl": 4.7148, + "step": 5336 + }, + { + "epoch": 0.03, + "global_step": 5337, + "learning_rate": 0.0004785601001669449, + "loss": 1.4804, + "loss_base2": 2.1358, + "loss_pixel": 0.1873, + "loss_text": 1.2931, + "ppl": 4.3947, + "step": 5337 + }, + { + "epoch": 0.03, + "global_step": 5338, + "learning_rate": 0.0004785559265442404, + "loss": 1.5088, + "loss_base2": 2.1767, + "loss_pixel": 0.187, + "loss_text": 1.3218, + "ppl": 4.5213, + "step": 5338 + }, + { + "epoch": 0.03, + "global_step": 5339, + "learning_rate": 0.0004785517529215359, + "loss": 1.4941, + "loss_base2": 2.1555, + "loss_pixel": 0.1853, + "loss_text": 1.3088, + "ppl": 4.4553, + "step": 5339 + }, + { + "epoch": 0.03, + "global_step": 5340, + "learning_rate": 0.0004785475792988314, + "loss": 1.5086, + "loss_base2": 2.1764, + "loss_pixel": 0.1855, + "loss_text": 1.3231, + "ppl": 4.5204, + "step": 5340 + }, + { + "epoch": 0.03, + "global_step": 5341, + "learning_rate": 0.00047854340567612686, + "loss": 1.4774, + "loss_base2": 2.1314, + "loss_pixel": 0.1863, + "loss_text": 1.2911, + "ppl": 4.3815, + "step": 5341 + }, + { + "epoch": 0.03, + "global_step": 5342, + "learning_rate": 0.00047853923205342237, + "loss": 1.5073, + "loss_base2": 2.1746, + "loss_pixel": 0.1853, + "loss_text": 1.322, + "ppl": 4.5145, + "step": 5342 + }, + { + "epoch": 0.03, + "global_step": 5343, + "learning_rate": 0.0004785350584307179, + "loss": 1.4856, + "loss_base2": 2.1433, + "loss_pixel": 0.1859, + "loss_text": 1.2998, + "ppl": 4.4176, + "step": 5343 + }, + { + "epoch": 0.03, + "global_step": 5344, + "learning_rate": 0.0004785308848080134, + "loss": 1.6199, + "loss_base2": 2.337, + "loss_pixel": 0.1846, + "loss_text": 1.4353, + "ppl": 5.0526, + "step": 5344 + }, + { + "epoch": 0.03, + "global_step": 5345, + "learning_rate": 0.0004785267111853089, + "loss": 1.73, + "loss_base2": 2.4959, + "loss_pixel": 0.1842, + "loss_text": 1.5459, + "ppl": 5.6407, + "step": 5345 + }, + { + "epoch": 0.03, + "global_step": 5346, + "learning_rate": 0.00047852253756260434, + "loss": 1.7226, + "loss_base2": 2.4852, + "loss_pixel": 0.1849, + "loss_text": 1.5377, + "ppl": 5.5991, + "step": 5346 + }, + { + "epoch": 0.03, + "global_step": 5347, + "learning_rate": 0.00047851836393989985, + "loss": 1.7195, + "loss_base2": 2.4807, + "loss_pixel": 0.1845, + "loss_text": 1.535, + "ppl": 5.5817, + "step": 5347 + }, + { + "epoch": 0.03, + "global_step": 5348, + "learning_rate": 0.00047851419031719536, + "loss": 1.7185, + "loss_base2": 2.4793, + "loss_pixel": 0.1839, + "loss_text": 1.5346, + "ppl": 5.5762, + "step": 5348 + }, + { + "epoch": 0.03, + "global_step": 5349, + "learning_rate": 0.00047851001669449087, + "loss": 1.7245, + "loss_base2": 2.4879, + "loss_pixel": 0.1846, + "loss_text": 1.5399, + "ppl": 5.6097, + "step": 5349 + }, + { + "epoch": 0.03, + "global_step": 5350, + "learning_rate": 0.0004785058430717863, + "loss": 1.7243, + "loss_base2": 2.4876, + "loss_pixel": 0.184, + "loss_text": 1.5403, + "ppl": 5.6086, + "step": 5350 + }, + { + "epoch": 0.03, + "global_step": 5351, + "learning_rate": 0.0004785016694490818, + "loss": 1.7213, + "loss_base2": 2.4833, + "loss_pixel": 0.1827, + "loss_text": 1.5386, + "ppl": 5.5918, + "step": 5351 + }, + { + "epoch": 0.03, + "global_step": 5352, + "learning_rate": 0.0004784974958263773, + "loss": 1.7062, + "loss_base2": 2.4615, + "loss_pixel": 0.1828, + "loss_text": 1.5234, + "ppl": 5.508, + "step": 5352 + }, + { + "epoch": 0.03, + "global_step": 5353, + "learning_rate": 0.0004784933222036728, + "loss": 1.7153, + "loss_base2": 2.4747, + "loss_pixel": 0.1827, + "loss_text": 1.5326, + "ppl": 5.5583, + "step": 5353 + }, + { + "epoch": 0.03, + "global_step": 5354, + "learning_rate": 0.0004784891485809683, + "loss": 1.7278, + "loss_base2": 2.4927, + "loss_pixel": 0.1824, + "loss_text": 1.5454, + "ppl": 5.6283, + "step": 5354 + }, + { + "epoch": 0.03, + "global_step": 5355, + "learning_rate": 0.00047848497495826375, + "loss": 1.7105, + "loss_base2": 2.4677, + "loss_pixel": 0.183, + "loss_text": 1.5274, + "ppl": 5.5317, + "step": 5355 + }, + { + "epoch": 0.03, + "global_step": 5356, + "learning_rate": 0.00047848080133555926, + "loss": 1.7098, + "loss_base2": 2.4667, + "loss_pixel": 0.1831, + "loss_text": 1.5267, + "ppl": 5.5279, + "step": 5356 + }, + { + "epoch": 0.03, + "global_step": 5357, + "learning_rate": 0.00047847662771285476, + "loss": 1.7066, + "loss_base2": 2.4621, + "loss_pixel": 0.1832, + "loss_text": 1.5234, + "ppl": 5.5102, + "step": 5357 + }, + { + "epoch": 0.03, + "global_step": 5358, + "learning_rate": 0.00047847245409015027, + "loss": 1.6912, + "loss_base2": 2.4399, + "loss_pixel": 0.1832, + "loss_text": 1.508, + "ppl": 5.426, + "step": 5358 + }, + { + "epoch": 0.03, + "global_step": 5359, + "learning_rate": 0.0004784682804674457, + "loss": 1.7182, + "loss_base2": 2.4788, + "loss_pixel": 0.1814, + "loss_text": 1.5368, + "ppl": 5.5745, + "step": 5359 + }, + { + "epoch": 0.03, + "global_step": 5360, + "learning_rate": 0.00047846410684474123, + "loss": 1.7125, + "loss_base2": 2.4706, + "loss_pixel": 0.1821, + "loss_text": 1.5304, + "ppl": 5.5428, + "step": 5360 + }, + { + "epoch": 0.03, + "global_step": 5361, + "learning_rate": 0.00047845993322203674, + "loss": 1.6954, + "loss_base2": 2.4459, + "loss_pixel": 0.1825, + "loss_text": 1.5129, + "ppl": 5.4488, + "step": 5361 + }, + { + "epoch": 0.03, + "global_step": 5362, + "learning_rate": 0.00047845575959933224, + "loss": 1.7162, + "loss_base2": 2.476, + "loss_pixel": 0.1815, + "loss_text": 1.5346, + "ppl": 5.5633, + "step": 5362 + }, + { + "epoch": 0.03, + "global_step": 5363, + "learning_rate": 0.00047845158597662775, + "loss": 1.7158, + "loss_base2": 2.4754, + "loss_pixel": 0.1824, + "loss_text": 1.5334, + "ppl": 5.5611, + "step": 5363 + }, + { + "epoch": 0.03, + "global_step": 5364, + "learning_rate": 0.0004784474123539232, + "loss": 1.7173, + "loss_base2": 2.4775, + "loss_pixel": 0.1769, + "loss_text": 1.5404, + "ppl": 5.5695, + "step": 5364 + }, + { + "epoch": 0.03, + "global_step": 5365, + "learning_rate": 0.0004784432387312187, + "loss": 1.6834, + "loss_base2": 2.4286, + "loss_pixel": 0.1778, + "loss_text": 1.5056, + "ppl": 5.3838, + "step": 5365 + }, + { + "epoch": 0.03, + "global_step": 5366, + "learning_rate": 0.0004784390651085142, + "loss": 1.6882, + "loss_base2": 2.4356, + "loss_pixel": 0.1744, + "loss_text": 1.5138, + "ppl": 5.4097, + "step": 5366 + }, + { + "epoch": 0.03, + "global_step": 5367, + "learning_rate": 0.00047843489148580973, + "loss": 1.7028, + "loss_base2": 2.4566, + "loss_pixel": 0.1739, + "loss_text": 1.5289, + "ppl": 5.4893, + "step": 5367 + }, + { + "epoch": 0.03, + "global_step": 5368, + "learning_rate": 0.0004784307178631052, + "loss": 1.7103, + "loss_base2": 2.4674, + "loss_pixel": 0.1762, + "loss_text": 1.5341, + "ppl": 5.5306, + "step": 5368 + }, + { + "epoch": 0.03, + "global_step": 5369, + "learning_rate": 0.0004784265442404007, + "loss": 1.6935, + "loss_base2": 2.4432, + "loss_pixel": 0.1732, + "loss_text": 1.5203, + "ppl": 5.4385, + "step": 5369 + }, + { + "epoch": 0.03, + "global_step": 5370, + "learning_rate": 0.00047842237061769614, + "loss": 1.7056, + "loss_base2": 2.4607, + "loss_pixel": 0.1753, + "loss_text": 1.5303, + "ppl": 5.5047, + "step": 5370 + }, + { + "epoch": 0.03, + "global_step": 5371, + "learning_rate": 0.00047841819699499165, + "loss": 1.6931, + "loss_base2": 2.4426, + "loss_pixel": 0.1743, + "loss_text": 1.5188, + "ppl": 5.4363, + "step": 5371 + }, + { + "epoch": 0.03, + "global_step": 5372, + "learning_rate": 0.00047841402337228716, + "loss": 1.7066, + "loss_base2": 2.4621, + "loss_pixel": 0.1732, + "loss_text": 1.5335, + "ppl": 5.5102, + "step": 5372 + }, + { + "epoch": 0.03, + "global_step": 5373, + "learning_rate": 0.0004784098497495826, + "loss": 1.7103, + "loss_base2": 2.4674, + "loss_pixel": 0.1743, + "loss_text": 1.536, + "ppl": 5.5306, + "step": 5373 + }, + { + "epoch": 0.03, + "global_step": 5374, + "learning_rate": 0.0004784056761268781, + "loss": 1.6984, + "loss_base2": 2.4503, + "loss_pixel": 0.1756, + "loss_text": 1.5228, + "ppl": 5.4652, + "step": 5374 + }, + { + "epoch": 0.03, + "global_step": 5375, + "learning_rate": 0.0004784015025041736, + "loss": 1.7005, + "loss_base2": 2.4533, + "loss_pixel": 0.1742, + "loss_text": 1.5262, + "ppl": 5.4767, + "step": 5375 + }, + { + "epoch": 0.03, + "global_step": 5376, + "learning_rate": 0.00047839732888146913, + "loss": 1.6999, + "loss_base2": 2.4524, + "loss_pixel": 0.1733, + "loss_text": 1.5265, + "ppl": 5.4734, + "step": 5376 + }, + { + "epoch": 0.03, + "global_step": 5377, + "learning_rate": 0.00047839315525876464, + "loss": 1.6945, + "loss_base2": 2.4446, + "loss_pixel": 0.174, + "loss_text": 1.5205, + "ppl": 5.4439, + "step": 5377 + }, + { + "epoch": 0.03, + "global_step": 5378, + "learning_rate": 0.0004783889816360601, + "loss": 1.6942, + "loss_base2": 2.4442, + "loss_pixel": 0.1754, + "loss_text": 1.5189, + "ppl": 5.4423, + "step": 5378 + }, + { + "epoch": 0.03, + "global_step": 5379, + "learning_rate": 0.0004783848080133556, + "loss": 1.7154, + "loss_base2": 2.4748, + "loss_pixel": 0.1721, + "loss_text": 1.5433, + "ppl": 5.5589, + "step": 5379 + }, + { + "epoch": 0.03, + "global_step": 5380, + "learning_rate": 0.0004783806343906511, + "loss": 1.6943, + "loss_base2": 2.4444, + "loss_pixel": 0.1731, + "loss_text": 1.5213, + "ppl": 5.4428, + "step": 5380 + }, + { + "epoch": 0.03, + "global_step": 5381, + "learning_rate": 0.0004783764607679466, + "loss": 1.7, + "loss_base2": 2.4526, + "loss_pixel": 0.1737, + "loss_text": 1.5263, + "ppl": 5.4739, + "step": 5381 + }, + { + "epoch": 0.03, + "global_step": 5382, + "learning_rate": 0.00047837228714524207, + "loss": 1.7007, + "loss_base2": 2.4536, + "loss_pixel": 0.172, + "loss_text": 1.5286, + "ppl": 5.4778, + "step": 5382 + }, + { + "epoch": 0.03, + "global_step": 5383, + "learning_rate": 0.0004783681135225376, + "loss": 1.6812, + "loss_base2": 2.4255, + "loss_pixel": 0.1719, + "loss_text": 1.5094, + "ppl": 5.372, + "step": 5383 + }, + { + "epoch": 0.03, + "global_step": 5384, + "learning_rate": 0.0004783639398998331, + "loss": 1.7128, + "loss_base2": 2.471, + "loss_pixel": 0.1719, + "loss_text": 1.5409, + "ppl": 5.5445, + "step": 5384 + }, + { + "epoch": 0.03, + "global_step": 5385, + "learning_rate": 0.0004783597662771286, + "loss": 1.6868, + "loss_base2": 2.4335, + "loss_pixel": 0.1727, + "loss_text": 1.5141, + "ppl": 5.4022, + "step": 5385 + }, + { + "epoch": 0.03, + "global_step": 5386, + "learning_rate": 0.0004783555926544241, + "loss": 1.697, + "loss_base2": 2.4483, + "loss_pixel": 0.1718, + "loss_text": 1.5251, + "ppl": 5.4576, + "step": 5386 + }, + { + "epoch": 0.03, + "global_step": 5387, + "learning_rate": 0.00047835141903171955, + "loss": 1.6728, + "loss_base2": 2.4133, + "loss_pixel": 0.1727, + "loss_text": 1.5001, + "ppl": 5.3271, + "step": 5387 + }, + { + "epoch": 0.03, + "global_step": 5388, + "learning_rate": 0.00047834724540901506, + "loss": 1.5053, + "loss_base2": 2.1717, + "loss_pixel": 0.171, + "loss_text": 1.3343, + "ppl": 4.5055, + "step": 5388 + }, + { + "epoch": 0.03, + "global_step": 5389, + "learning_rate": 0.0004783430717863105, + "loss": 1.4641, + "loss_base2": 2.1122, + "loss_pixel": 0.1735, + "loss_text": 1.2906, + "ppl": 4.3237, + "step": 5389 + }, + { + "epoch": 0.03, + "global_step": 5390, + "learning_rate": 0.000478338898163606, + "loss": 1.4644, + "loss_base2": 2.1127, + "loss_pixel": 0.1727, + "loss_text": 1.2917, + "ppl": 4.3249, + "step": 5390 + }, + { + "epoch": 0.03, + "global_step": 5391, + "learning_rate": 0.00047833472454090147, + "loss": 1.4871, + "loss_base2": 2.1454, + "loss_pixel": 0.1719, + "loss_text": 1.3152, + "ppl": 4.4242, + "step": 5391 + }, + { + "epoch": 0.03, + "global_step": 5392, + "learning_rate": 0.000478330550918197, + "loss": 1.4516, + "loss_base2": 2.0942, + "loss_pixel": 0.1718, + "loss_text": 1.2798, + "ppl": 4.2699, + "step": 5392 + }, + { + "epoch": 0.03, + "global_step": 5393, + "learning_rate": 0.0004783263772954925, + "loss": 1.4598, + "loss_base2": 2.106, + "loss_pixel": 0.1699, + "loss_text": 1.2899, + "ppl": 4.3051, + "step": 5393 + }, + { + "epoch": 0.03, + "global_step": 5394, + "learning_rate": 0.000478322203672788, + "loss": 1.4562, + "loss_base2": 2.1009, + "loss_pixel": 0.1721, + "loss_text": 1.2841, + "ppl": 4.2896, + "step": 5394 + }, + { + "epoch": 0.03, + "global_step": 5395, + "learning_rate": 0.0004783180300500835, + "loss": 1.4603, + "loss_base2": 2.1068, + "loss_pixel": 0.1726, + "loss_text": 1.2878, + "ppl": 4.3073, + "step": 5395 + }, + { + "epoch": 0.03, + "global_step": 5396, + "learning_rate": 0.00047831385642737895, + "loss": 1.5953, + "loss_base2": 2.3015, + "loss_pixel": 0.1712, + "loss_text": 1.4241, + "ppl": 4.9298, + "step": 5396 + }, + { + "epoch": 0.03, + "global_step": 5397, + "learning_rate": 0.00047830968280467446, + "loss": 1.5015, + "loss_base2": 2.1662, + "loss_pixel": 0.1829, + "loss_text": 1.3187, + "ppl": 4.4884, + "step": 5397 + }, + { + "epoch": 0.03, + "global_step": 5398, + "learning_rate": 0.00047830550918196997, + "loss": 1.4912, + "loss_base2": 2.1513, + "loss_pixel": 0.1917, + "loss_text": 1.2994, + "ppl": 4.4424, + "step": 5398 + }, + { + "epoch": 0.03, + "global_step": 5399, + "learning_rate": 0.0004783013355592655, + "loss": 1.481, + "loss_base2": 2.1366, + "loss_pixel": 0.1919, + "loss_text": 1.289, + "ppl": 4.3973, + "step": 5399 + }, + { + "epoch": 0.03, + "global_step": 5400, + "learning_rate": 0.0004782971619365609, + "loss": 1.4925, + "loss_base2": 2.1532, + "loss_pixel": 0.1906, + "loss_text": 1.3019, + "ppl": 4.4482, + "step": 5400 + }, + { + "epoch": 0.03, + "global_step": 5401, + "learning_rate": 0.00047829298831385643, + "loss": 1.4633, + "loss_base2": 2.1111, + "loss_pixel": 0.1895, + "loss_text": 1.2737, + "ppl": 4.3202, + "step": 5401 + }, + { + "epoch": 0.03, + "global_step": 5402, + "learning_rate": 0.00047828881469115194, + "loss": 1.4956, + "loss_base2": 2.1577, + "loss_pixel": 0.1843, + "loss_text": 1.3113, + "ppl": 4.462, + "step": 5402 + }, + { + "epoch": 0.03, + "global_step": 5403, + "learning_rate": 0.00047828464106844745, + "loss": 1.4773, + "loss_base2": 2.1313, + "loss_pixel": 0.1768, + "loss_text": 1.3006, + "ppl": 4.3811, + "step": 5403 + }, + { + "epoch": 0.03, + "global_step": 5404, + "learning_rate": 0.00047828046744574296, + "loss": 1.4726, + "loss_base2": 2.1245, + "loss_pixel": 0.1753, + "loss_text": 1.2974, + "ppl": 4.3606, + "step": 5404 + }, + { + "epoch": 0.03, + "global_step": 5405, + "learning_rate": 0.0004782762938230384, + "loss": 1.638, + "loss_base2": 2.3631, + "loss_pixel": 0.176, + "loss_text": 1.462, + "ppl": 5.1449, + "step": 5405 + }, + { + "epoch": 0.03, + "global_step": 5406, + "learning_rate": 0.0004782721202003339, + "loss": 1.7264, + "loss_base2": 2.4907, + "loss_pixel": 0.1732, + "loss_text": 1.5532, + "ppl": 5.6204, + "step": 5406 + }, + { + "epoch": 0.03, + "global_step": 5407, + "learning_rate": 0.0004782679465776294, + "loss": 1.7224, + "loss_base2": 2.4849, + "loss_pixel": 0.1742, + "loss_text": 1.5483, + "ppl": 5.5979, + "step": 5407 + }, + { + "epoch": 0.03, + "global_step": 5408, + "learning_rate": 0.0004782637729549249, + "loss": 1.7219, + "loss_base2": 2.4842, + "loss_pixel": 0.1729, + "loss_text": 1.549, + "ppl": 5.5951, + "step": 5408 + }, + { + "epoch": 0.03, + "global_step": 5409, + "learning_rate": 0.00047825959933222033, + "loss": 1.7171, + "loss_base2": 2.4773, + "loss_pixel": 0.1756, + "loss_text": 1.5416, + "ppl": 5.5684, + "step": 5409 + }, + { + "epoch": 0.03, + "global_step": 5410, + "learning_rate": 0.00047825542570951584, + "loss": 1.7095, + "loss_base2": 2.4663, + "loss_pixel": 0.171, + "loss_text": 1.5385, + "ppl": 5.5262, + "step": 5410 + }, + { + "epoch": 0.03, + "global_step": 5411, + "learning_rate": 0.00047825125208681134, + "loss": 1.719, + "loss_base2": 2.48, + "loss_pixel": 0.1709, + "loss_text": 1.5481, + "ppl": 5.5789, + "step": 5411 + }, + { + "epoch": 0.03, + "global_step": 5412, + "learning_rate": 0.00047824707846410685, + "loss": 1.6945, + "loss_base2": 2.4446, + "loss_pixel": 0.1742, + "loss_text": 1.5202, + "ppl": 5.4439, + "step": 5412 + }, + { + "epoch": 0.03, + "global_step": 5413, + "learning_rate": 0.00047824290484140236, + "loss": 1.7047, + "loss_base2": 2.4594, + "loss_pixel": 0.1721, + "loss_text": 1.5326, + "ppl": 5.4997, + "step": 5413 + }, + { + "epoch": 0.03, + "global_step": 5414, + "learning_rate": 0.0004782387312186978, + "loss": 1.7072, + "loss_base2": 2.463, + "loss_pixel": 0.1735, + "loss_text": 1.5337, + "ppl": 5.5135, + "step": 5414 + }, + { + "epoch": 0.03, + "global_step": 5415, + "learning_rate": 0.0004782345575959933, + "loss": 1.7163, + "loss_base2": 2.4761, + "loss_pixel": 0.1718, + "loss_text": 1.5445, + "ppl": 5.5639, + "step": 5415 + }, + { + "epoch": 0.03, + "global_step": 5416, + "learning_rate": 0.0004782303839732888, + "loss": 1.7069, + "loss_base2": 2.4625, + "loss_pixel": 0.17, + "loss_text": 1.5369, + "ppl": 5.5118, + "step": 5416 + }, + { + "epoch": 0.03, + "global_step": 5417, + "learning_rate": 0.00047822621035058433, + "loss": 1.6913, + "loss_base2": 2.44, + "loss_pixel": 0.1729, + "loss_text": 1.5183, + "ppl": 5.4265, + "step": 5417 + }, + { + "epoch": 0.03, + "global_step": 5418, + "learning_rate": 0.0004782220367278798, + "loss": 1.7076, + "loss_base2": 2.4635, + "loss_pixel": 0.1717, + "loss_text": 1.5359, + "ppl": 5.5157, + "step": 5418 + }, + { + "epoch": 0.03, + "global_step": 5419, + "learning_rate": 0.0004782178631051753, + "loss": 1.6997, + "loss_base2": 2.4521, + "loss_pixel": 0.1729, + "loss_text": 1.5268, + "ppl": 5.4723, + "step": 5419 + }, + { + "epoch": 0.03, + "global_step": 5420, + "learning_rate": 0.0004782136894824708, + "loss": 1.6929, + "loss_base2": 2.4423, + "loss_pixel": 0.1706, + "loss_text": 1.5223, + "ppl": 5.4352, + "step": 5420 + }, + { + "epoch": 0.03, + "global_step": 5421, + "learning_rate": 0.0004782095158597663, + "loss": 1.7269, + "loss_base2": 2.4914, + "loss_pixel": 0.1739, + "loss_text": 1.553, + "ppl": 5.6232, + "step": 5421 + }, + { + "epoch": 0.03, + "global_step": 5422, + "learning_rate": 0.0004782053422370618, + "loss": 1.7061, + "loss_base2": 2.4614, + "loss_pixel": 0.1724, + "loss_text": 1.5337, + "ppl": 5.5074, + "step": 5422 + }, + { + "epoch": 0.03, + "global_step": 5423, + "learning_rate": 0.00047820116861435727, + "loss": 1.6875, + "loss_base2": 2.4345, + "loss_pixel": 0.1723, + "loss_text": 1.5152, + "ppl": 5.4059, + "step": 5423 + }, + { + "epoch": 0.03, + "global_step": 5424, + "learning_rate": 0.0004781969949916528, + "loss": 1.7266, + "loss_base2": 2.491, + "loss_pixel": 0.1721, + "loss_text": 1.5545, + "ppl": 5.6215, + "step": 5424 + }, + { + "epoch": 0.03, + "global_step": 5425, + "learning_rate": 0.0004781928213689483, + "loss": 1.7065, + "loss_base2": 2.462, + "loss_pixel": 0.1718, + "loss_text": 1.5346, + "ppl": 5.5096, + "step": 5425 + }, + { + "epoch": 0.03, + "global_step": 5426, + "learning_rate": 0.0004781886477462438, + "loss": 1.5974, + "loss_base2": 2.3046, + "loss_pixel": 0.1729, + "loss_text": 1.4245, + "ppl": 4.9402, + "step": 5426 + }, + { + "epoch": 0.03, + "global_step": 5427, + "learning_rate": 0.0004781844741235392, + "loss": 1.4781, + "loss_base2": 2.1324, + "loss_pixel": 0.174, + "loss_text": 1.3041, + "ppl": 4.3846, + "step": 5427 + }, + { + "epoch": 0.03, + "global_step": 5428, + "learning_rate": 0.0004781803005008347, + "loss": 1.5025, + "loss_base2": 2.1676, + "loss_pixel": 0.1703, + "loss_text": 1.3322, + "ppl": 4.4929, + "step": 5428 + }, + { + "epoch": 0.03, + "global_step": 5429, + "learning_rate": 0.0004781761268781302, + "loss": 1.4691, + "loss_base2": 2.1195, + "loss_pixel": 0.1706, + "loss_text": 1.2984, + "ppl": 4.3453, + "step": 5429 + }, + { + "epoch": 0.03, + "global_step": 5430, + "learning_rate": 0.0004781719532554257, + "loss": 1.4859, + "loss_base2": 2.1437, + "loss_pixel": 0.1711, + "loss_text": 1.3149, + "ppl": 4.4189, + "step": 5430 + }, + { + "epoch": 0.03, + "global_step": 5431, + "learning_rate": 0.0004781677796327212, + "loss": 1.4897, + "loss_base2": 2.1492, + "loss_pixel": 0.1722, + "loss_text": 1.3175, + "ppl": 4.4358, + "step": 5431 + }, + { + "epoch": 0.03, + "global_step": 5432, + "learning_rate": 0.0004781636060100167, + "loss": 1.4539, + "loss_base2": 2.0975, + "loss_pixel": 0.172, + "loss_text": 1.2819, + "ppl": 4.2798, + "step": 5432 + }, + { + "epoch": 0.03, + "global_step": 5433, + "learning_rate": 0.0004781594323873122, + "loss": 1.4388, + "loss_base2": 2.0757, + "loss_pixel": 0.1712, + "loss_text": 1.2677, + "ppl": 4.2156, + "step": 5433 + }, + { + "epoch": 0.03, + "global_step": 5434, + "learning_rate": 0.0004781552587646077, + "loss": 1.5622, + "loss_base2": 2.2538, + "loss_pixel": 0.1709, + "loss_text": 1.3913, + "ppl": 4.7693, + "step": 5434 + }, + { + "epoch": 0.03, + "global_step": 5435, + "learning_rate": 0.0004781510851419032, + "loss": 1.7303, + "loss_base2": 2.4963, + "loss_pixel": 0.1703, + "loss_text": 1.56, + "ppl": 5.6423, + "step": 5435 + }, + { + "epoch": 0.03, + "global_step": 5436, + "learning_rate": 0.0004781469115191987, + "loss": 1.6829, + "loss_base2": 2.4279, + "loss_pixel": 0.1712, + "loss_text": 1.5117, + "ppl": 5.3811, + "step": 5436 + }, + { + "epoch": 0.03, + "global_step": 5437, + "learning_rate": 0.00047814273789649416, + "loss": 1.7007, + "loss_base2": 2.4536, + "loss_pixel": 0.1843, + "loss_text": 1.5165, + "ppl": 5.4778, + "step": 5437 + }, + { + "epoch": 0.03, + "global_step": 5438, + "learning_rate": 0.00047813856427378966, + "loss": 1.7285, + "loss_base2": 2.4937, + "loss_pixel": 0.1868, + "loss_text": 1.5417, + "ppl": 5.6322, + "step": 5438 + }, + { + "epoch": 0.03, + "global_step": 5439, + "learning_rate": 0.00047813439065108517, + "loss": 1.709, + "loss_base2": 2.4656, + "loss_pixel": 0.1846, + "loss_text": 1.5244, + "ppl": 5.5234, + "step": 5439 + }, + { + "epoch": 0.03, + "global_step": 5440, + "learning_rate": 0.0004781302170283807, + "loss": 1.7164, + "loss_base2": 2.4762, + "loss_pixel": 0.1844, + "loss_text": 1.532, + "ppl": 5.5645, + "step": 5440 + }, + { + "epoch": 0.03, + "global_step": 5441, + "learning_rate": 0.00047812604340567613, + "loss": 1.7321, + "loss_base2": 2.4989, + "loss_pixel": 0.1842, + "loss_text": 1.5478, + "ppl": 5.6525, + "step": 5441 + }, + { + "epoch": 0.03, + "global_step": 5442, + "learning_rate": 0.00047812186978297164, + "loss": 1.7115, + "loss_base2": 2.4692, + "loss_pixel": 0.1825, + "loss_text": 1.529, + "ppl": 5.5373, + "step": 5442 + }, + { + "epoch": 0.03, + "global_step": 5443, + "learning_rate": 0.00047811769616026715, + "loss": 1.7235, + "loss_base2": 2.4865, + "loss_pixel": 0.1828, + "loss_text": 1.5406, + "ppl": 5.6041, + "step": 5443 + }, + { + "epoch": 0.03, + "global_step": 5444, + "learning_rate": 0.00047811352253756265, + "loss": 1.7115, + "loss_base2": 2.4692, + "loss_pixel": 0.1827, + "loss_text": 1.5287, + "ppl": 5.5373, + "step": 5444 + }, + { + "epoch": 0.03, + "global_step": 5445, + "learning_rate": 0.00047810934891485816, + "loss": 1.7039, + "loss_base2": 2.4582, + "loss_pixel": 0.1834, + "loss_text": 1.5205, + "ppl": 5.4953, + "step": 5445 + }, + { + "epoch": 0.03, + "global_step": 5446, + "learning_rate": 0.00047810517529215356, + "loss": 1.7172, + "loss_base2": 2.4774, + "loss_pixel": 0.1826, + "loss_text": 1.5346, + "ppl": 5.5689, + "step": 5446 + }, + { + "epoch": 0.03, + "global_step": 5447, + "learning_rate": 0.00047810100166944907, + "loss": 1.7198, + "loss_base2": 2.4811, + "loss_pixel": 0.1829, + "loss_text": 1.5369, + "ppl": 5.5834, + "step": 5447 + }, + { + "epoch": 0.03, + "global_step": 5448, + "learning_rate": 0.0004780968280467446, + "loss": 1.7185, + "loss_base2": 2.4793, + "loss_pixel": 0.184, + "loss_text": 1.5344, + "ppl": 5.5762, + "step": 5448 + }, + { + "epoch": 0.03, + "global_step": 5449, + "learning_rate": 0.0004780926544240401, + "loss": 1.7178, + "loss_base2": 2.4783, + "loss_pixel": 0.1825, + "loss_text": 1.5353, + "ppl": 5.5723, + "step": 5449 + }, + { + "epoch": 0.03, + "global_step": 5450, + "learning_rate": 0.00047808848080133553, + "loss": 1.7057, + "loss_base2": 2.4608, + "loss_pixel": 0.1818, + "loss_text": 1.524, + "ppl": 5.5052, + "step": 5450 + }, + { + "epoch": 0.03, + "global_step": 5451, + "learning_rate": 0.00047808430717863104, + "loss": 1.7212, + "loss_base2": 2.4832, + "loss_pixel": 0.1828, + "loss_text": 1.5385, + "ppl": 5.5912, + "step": 5451 + }, + { + "epoch": 0.03, + "global_step": 5452, + "learning_rate": 0.00047808013355592655, + "loss": 1.7308, + "loss_base2": 2.497, + "loss_pixel": 0.1831, + "loss_text": 1.5477, + "ppl": 5.6452, + "step": 5452 + }, + { + "epoch": 0.03, + "global_step": 5453, + "learning_rate": 0.00047807595993322206, + "loss": 1.7069, + "loss_base2": 2.4625, + "loss_pixel": 0.182, + "loss_text": 1.5249, + "ppl": 5.5118, + "step": 5453 + }, + { + "epoch": 0.03, + "global_step": 5454, + "learning_rate": 0.00047807178631051756, + "loss": 1.7243, + "loss_base2": 2.4876, + "loss_pixel": 0.1821, + "loss_text": 1.5422, + "ppl": 5.6086, + "step": 5454 + }, + { + "epoch": 0.03, + "global_step": 5455, + "learning_rate": 0.000478067612687813, + "loss": 1.7015, + "loss_base2": 2.4547, + "loss_pixel": 0.1816, + "loss_text": 1.5199, + "ppl": 5.4822, + "step": 5455 + }, + { + "epoch": 0.03, + "global_step": 5456, + "learning_rate": 0.0004780634390651085, + "loss": 1.6269, + "loss_base2": 2.3471, + "loss_pixel": 0.182, + "loss_text": 1.445, + "ppl": 5.0881, + "step": 5456 + }, + { + "epoch": 0.03, + "global_step": 5457, + "learning_rate": 0.00047805926544240403, + "loss": 1.4879, + "loss_base2": 2.1466, + "loss_pixel": 0.1813, + "loss_text": 1.3066, + "ppl": 4.4278, + "step": 5457 + }, + { + "epoch": 0.03, + "global_step": 5458, + "learning_rate": 0.00047805509181969954, + "loss": 1.5063, + "loss_base2": 2.1731, + "loss_pixel": 0.181, + "loss_text": 1.3253, + "ppl": 4.51, + "step": 5458 + }, + { + "epoch": 0.03, + "global_step": 5459, + "learning_rate": 0.000478050918196995, + "loss": 1.49, + "loss_base2": 2.1496, + "loss_pixel": 0.1812, + "loss_text": 1.3088, + "ppl": 4.4371, + "step": 5459 + }, + { + "epoch": 0.03, + "global_step": 5460, + "learning_rate": 0.0004780467445742905, + "loss": 1.4767, + "loss_base2": 2.1304, + "loss_pixel": 0.1806, + "loss_text": 1.296, + "ppl": 4.3785, + "step": 5460 + }, + { + "epoch": 0.03, + "global_step": 5461, + "learning_rate": 0.000478042570951586, + "loss": 1.4764, + "loss_base2": 2.13, + "loss_pixel": 0.1819, + "loss_text": 1.2946, + "ppl": 4.3772, + "step": 5461 + }, + { + "epoch": 0.03, + "global_step": 5462, + "learning_rate": 0.0004780383973288815, + "loss": 1.4704, + "loss_base2": 2.1213, + "loss_pixel": 0.1821, + "loss_text": 1.2884, + "ppl": 4.351, + "step": 5462 + }, + { + "epoch": 0.03, + "global_step": 5463, + "learning_rate": 0.000478034223706177, + "loss": 1.4999, + "loss_base2": 2.1639, + "loss_pixel": 0.1828, + "loss_text": 1.317, + "ppl": 4.4812, + "step": 5463 + }, + { + "epoch": 0.03, + "global_step": 5464, + "learning_rate": 0.0004780300500834724, + "loss": 1.4748, + "loss_base2": 2.1277, + "loss_pixel": 0.1796, + "loss_text": 1.2952, + "ppl": 4.3702, + "step": 5464 + }, + { + "epoch": 0.03, + "global_step": 5465, + "learning_rate": 0.0004780258764607679, + "loss": 1.4635, + "loss_base2": 2.1114, + "loss_pixel": 0.1809, + "loss_text": 1.2826, + "ppl": 4.3211, + "step": 5465 + }, + { + "epoch": 0.03, + "global_step": 5466, + "learning_rate": 0.00047802170283806343, + "loss": 1.4781, + "loss_base2": 2.1324, + "loss_pixel": 0.1816, + "loss_text": 1.2965, + "ppl": 4.3846, + "step": 5466 + }, + { + "epoch": 0.03, + "global_step": 5467, + "learning_rate": 0.00047801752921535894, + "loss": 1.4805, + "loss_base2": 2.1359, + "loss_pixel": 0.1806, + "loss_text": 1.3, + "ppl": 4.3951, + "step": 5467 + }, + { + "epoch": 0.03, + "global_step": 5468, + "learning_rate": 0.0004780133555926544, + "loss": 1.4791, + "loss_base2": 2.1339, + "loss_pixel": 0.1792, + "loss_text": 1.2999, + "ppl": 4.389, + "step": 5468 + }, + { + "epoch": 0.03, + "global_step": 5469, + "learning_rate": 0.0004780091819699499, + "loss": 1.4796, + "loss_base2": 2.1346, + "loss_pixel": 0.1796, + "loss_text": 1.3, + "ppl": 4.3912, + "step": 5469 + }, + { + "epoch": 0.03, + "global_step": 5470, + "learning_rate": 0.0004780050083472454, + "loss": 1.4901, + "loss_base2": 2.1498, + "loss_pixel": 0.1813, + "loss_text": 1.3088, + "ppl": 4.4375, + "step": 5470 + }, + { + "epoch": 0.03, + "global_step": 5471, + "learning_rate": 0.0004780008347245409, + "loss": 1.4932, + "loss_base2": 2.1542, + "loss_pixel": 0.1817, + "loss_text": 1.3114, + "ppl": 4.4513, + "step": 5471 + }, + { + "epoch": 0.03, + "global_step": 5472, + "learning_rate": 0.0004779966611018364, + "loss": 1.473, + "loss_base2": 2.1251, + "loss_pixel": 0.1812, + "loss_text": 1.2918, + "ppl": 4.3623, + "step": 5472 + }, + { + "epoch": 0.03, + "global_step": 5473, + "learning_rate": 0.0004779924874791319, + "loss": 1.5426, + "loss_base2": 2.2255, + "loss_pixel": 0.1813, + "loss_text": 1.3613, + "ppl": 4.6767, + "step": 5473 + }, + { + "epoch": 0.03, + "global_step": 5474, + "learning_rate": 0.0004779883138564274, + "loss": 1.7434, + "loss_base2": 2.5152, + "loss_pixel": 0.1801, + "loss_text": 1.5633, + "ppl": 5.7167, + "step": 5474 + }, + { + "epoch": 0.03, + "global_step": 5475, + "learning_rate": 0.0004779841402337229, + "loss": 1.7352, + "loss_base2": 2.5034, + "loss_pixel": 0.1802, + "loss_text": 1.5549, + "ppl": 5.6701, + "step": 5475 + }, + { + "epoch": 0.03, + "global_step": 5476, + "learning_rate": 0.0004779799666110184, + "loss": 1.7293, + "loss_base2": 2.4949, + "loss_pixel": 0.182, + "loss_text": 1.5473, + "ppl": 5.6367, + "step": 5476 + }, + { + "epoch": 0.03, + "global_step": 5477, + "learning_rate": 0.00047797579298831385, + "loss": 1.7197, + "loss_base2": 2.481, + "loss_pixel": 0.1827, + "loss_text": 1.5369, + "ppl": 5.5829, + "step": 5477 + }, + { + "epoch": 0.03, + "global_step": 5478, + "learning_rate": 0.00047797161936560936, + "loss": 1.7097, + "loss_base2": 2.4666, + "loss_pixel": 0.1823, + "loss_text": 1.5274, + "ppl": 5.5273, + "step": 5478 + }, + { + "epoch": 0.03, + "global_step": 5479, + "learning_rate": 0.00047796744574290487, + "loss": 1.7268, + "loss_base2": 2.4912, + "loss_pixel": 0.1824, + "loss_text": 1.5444, + "ppl": 5.6226, + "step": 5479 + }, + { + "epoch": 0.03, + "global_step": 5480, + "learning_rate": 0.0004779632721202004, + "loss": 1.7013, + "loss_base2": 2.4545, + "loss_pixel": 0.182, + "loss_text": 1.5192, + "ppl": 5.4811, + "step": 5480 + }, + { + "epoch": 0.03, + "global_step": 5481, + "learning_rate": 0.0004779590984974959, + "loss": 1.7243, + "loss_base2": 2.4876, + "loss_pixel": 0.1805, + "loss_text": 1.5438, + "ppl": 5.6086, + "step": 5481 + }, + { + "epoch": 0.03, + "global_step": 5482, + "learning_rate": 0.00047795492487479133, + "loss": 1.7171, + "loss_base2": 2.4773, + "loss_pixel": 0.1811, + "loss_text": 1.536, + "ppl": 5.5684, + "step": 5482 + }, + { + "epoch": 0.03, + "global_step": 5483, + "learning_rate": 0.0004779507512520868, + "loss": 1.7173, + "loss_base2": 2.4775, + "loss_pixel": 0.1806, + "loss_text": 1.5367, + "ppl": 5.5695, + "step": 5483 + }, + { + "epoch": 0.03, + "global_step": 5484, + "learning_rate": 0.0004779465776293823, + "loss": 1.7134, + "loss_base2": 2.4719, + "loss_pixel": 0.1806, + "loss_text": 1.5328, + "ppl": 5.5478, + "step": 5484 + }, + { + "epoch": 0.03, + "global_step": 5485, + "learning_rate": 0.0004779424040066778, + "loss": 1.7161, + "loss_base2": 2.4758, + "loss_pixel": 0.1808, + "loss_text": 1.5353, + "ppl": 5.5628, + "step": 5485 + }, + { + "epoch": 0.03, + "global_step": 5486, + "learning_rate": 0.00047793823038397326, + "loss": 1.7237, + "loss_base2": 2.4868, + "loss_pixel": 0.1806, + "loss_text": 1.5432, + "ppl": 5.6052, + "step": 5486 + }, + { + "epoch": 0.03, + "global_step": 5487, + "learning_rate": 0.00047793405676126876, + "loss": 1.7001, + "loss_base2": 2.4527, + "loss_pixel": 0.1805, + "loss_text": 1.5196, + "ppl": 5.4745, + "step": 5487 + }, + { + "epoch": 0.03, + "global_step": 5488, + "learning_rate": 0.00047792988313856427, + "loss": 1.722, + "loss_base2": 2.4843, + "loss_pixel": 0.1811, + "loss_text": 1.5409, + "ppl": 5.5957, + "step": 5488 + }, + { + "epoch": 0.03, + "global_step": 5489, + "learning_rate": 0.0004779257095158598, + "loss": 1.698, + "loss_base2": 2.4497, + "loss_pixel": 0.1802, + "loss_text": 1.5178, + "ppl": 5.463, + "step": 5489 + }, + { + "epoch": 0.03, + "global_step": 5490, + "learning_rate": 0.0004779215358931553, + "loss": 1.7277, + "loss_base2": 2.4925, + "loss_pixel": 0.181, + "loss_text": 1.5467, + "ppl": 5.6277, + "step": 5490 + }, + { + "epoch": 0.03, + "global_step": 5491, + "learning_rate": 0.00047791736227045074, + "loss": 1.73, + "loss_base2": 2.4959, + "loss_pixel": 0.1837, + "loss_text": 1.5463, + "ppl": 5.6407, + "step": 5491 + }, + { + "epoch": 0.03, + "global_step": 5492, + "learning_rate": 0.00047791318864774624, + "loss": 1.7039, + "loss_base2": 2.4582, + "loss_pixel": 0.1816, + "loss_text": 1.5223, + "ppl": 5.4953, + "step": 5492 + }, + { + "epoch": 0.03, + "global_step": 5493, + "learning_rate": 0.00047790901502504175, + "loss": 1.7323, + "loss_base2": 2.4992, + "loss_pixel": 0.1817, + "loss_text": 1.5506, + "ppl": 5.6536, + "step": 5493 + }, + { + "epoch": 0.03, + "global_step": 5494, + "learning_rate": 0.00047790484140233726, + "loss": 1.7066, + "loss_base2": 2.4621, + "loss_pixel": 0.1817, + "loss_text": 1.5249, + "ppl": 5.5102, + "step": 5494 + }, + { + "epoch": 0.03, + "global_step": 5495, + "learning_rate": 0.00047790066777963277, + "loss": 1.7091, + "loss_base2": 2.4657, + "loss_pixel": 0.1804, + "loss_text": 1.5288, + "ppl": 5.524, + "step": 5495 + }, + { + "epoch": 0.03, + "global_step": 5496, + "learning_rate": 0.0004778964941569282, + "loss": 1.7165, + "loss_base2": 2.4764, + "loss_pixel": 0.1796, + "loss_text": 1.5369, + "ppl": 5.565, + "step": 5496 + }, + { + "epoch": 0.03, + "global_step": 5497, + "learning_rate": 0.00047789232053422373, + "loss": 1.7191, + "loss_base2": 2.4801, + "loss_pixel": 0.1803, + "loss_text": 1.5389, + "ppl": 5.5795, + "step": 5497 + }, + { + "epoch": 0.03, + "global_step": 5498, + "learning_rate": 0.00047788814691151923, + "loss": 1.6892, + "loss_base2": 2.437, + "loss_pixel": 0.1812, + "loss_text": 1.508, + "ppl": 5.4151, + "step": 5498 + }, + { + "epoch": 0.03, + "global_step": 5499, + "learning_rate": 0.00047788397328881474, + "loss": 1.7142, + "loss_base2": 2.4731, + "loss_pixel": 0.1812, + "loss_text": 1.533, + "ppl": 5.5522, + "step": 5499 + }, + { + "epoch": 0.03, + "global_step": 5500, + "learning_rate": 0.0004778797996661102, + "loss": 1.7135, + "loss_base2": 2.4721, + "loss_pixel": 0.181, + "loss_text": 1.5325, + "ppl": 5.5483, + "step": 5500 + }, + { + "epoch": 0.03, + "global_step": 5501, + "learning_rate": 0.0004778756260434057, + "loss": 1.698, + "loss_base2": 2.4497, + "loss_pixel": 0.1797, + "loss_text": 1.5183, + "ppl": 5.463, + "step": 5501 + }, + { + "epoch": 0.03, + "global_step": 5502, + "learning_rate": 0.00047787145242070116, + "loss": 1.7132, + "loss_base2": 2.4716, + "loss_pixel": 0.1809, + "loss_text": 1.5323, + "ppl": 5.5467, + "step": 5502 + }, + { + "epoch": 0.03, + "global_step": 5503, + "learning_rate": 0.00047786727879799666, + "loss": 1.7002, + "loss_base2": 2.4529, + "loss_pixel": 0.1799, + "loss_text": 1.5203, + "ppl": 5.475, + "step": 5503 + }, + { + "epoch": 0.03, + "global_step": 5504, + "learning_rate": 0.00047786310517529217, + "loss": 1.6982, + "loss_base2": 2.45, + "loss_pixel": 0.1799, + "loss_text": 1.5183, + "ppl": 5.4641, + "step": 5504 + }, + { + "epoch": 0.03, + "global_step": 5505, + "learning_rate": 0.0004778589315525876, + "loss": 1.7009, + "loss_base2": 2.4539, + "loss_pixel": 0.1807, + "loss_text": 1.5201, + "ppl": 5.4789, + "step": 5505 + }, + { + "epoch": 0.03, + "global_step": 5506, + "learning_rate": 0.00047785475792988313, + "loss": 1.7035, + "loss_base2": 2.4576, + "loss_pixel": 0.1809, + "loss_text": 1.5226, + "ppl": 5.4931, + "step": 5506 + }, + { + "epoch": 0.03, + "global_step": 5507, + "learning_rate": 0.00047785058430717864, + "loss": 1.7031, + "loss_base2": 2.4571, + "loss_pixel": 0.1796, + "loss_text": 1.5235, + "ppl": 5.4909, + "step": 5507 + }, + { + "epoch": 0.03, + "global_step": 5508, + "learning_rate": 0.00047784641068447414, + "loss": 1.7209, + "loss_base2": 2.4827, + "loss_pixel": 0.1791, + "loss_text": 1.5418, + "ppl": 5.5896, + "step": 5508 + }, + { + "epoch": 0.03, + "global_step": 5509, + "learning_rate": 0.0004778422370617696, + "loss": 1.7087, + "loss_base2": 2.4651, + "loss_pixel": 0.1821, + "loss_text": 1.5266, + "ppl": 5.5218, + "step": 5509 + }, + { + "epoch": 0.03, + "global_step": 5510, + "learning_rate": 0.0004778380634390651, + "loss": 1.7047, + "loss_base2": 2.4594, + "loss_pixel": 0.1809, + "loss_text": 1.5238, + "ppl": 5.4997, + "step": 5510 + }, + { + "epoch": 0.03, + "global_step": 5511, + "learning_rate": 0.0004778338898163606, + "loss": 1.6875, + "loss_base2": 2.4345, + "loss_pixel": 0.1804, + "loss_text": 1.5071, + "ppl": 5.4059, + "step": 5511 + }, + { + "epoch": 0.03, + "global_step": 5512, + "learning_rate": 0.0004778297161936561, + "loss": 1.6894, + "loss_base2": 2.4373, + "loss_pixel": 0.1799, + "loss_text": 1.5095, + "ppl": 5.4162, + "step": 5512 + }, + { + "epoch": 0.03, + "global_step": 5513, + "learning_rate": 0.00047782554257095163, + "loss": 1.7008, + "loss_base2": 2.4537, + "loss_pixel": 0.1801, + "loss_text": 1.5207, + "ppl": 5.4783, + "step": 5513 + }, + { + "epoch": 0.03, + "global_step": 5514, + "learning_rate": 0.0004778213689482471, + "loss": 1.7146, + "loss_base2": 2.4736, + "loss_pixel": 0.1798, + "loss_text": 1.5348, + "ppl": 5.5545, + "step": 5514 + }, + { + "epoch": 0.03, + "global_step": 5515, + "learning_rate": 0.0004778171953255426, + "loss": 1.731, + "loss_base2": 2.4973, + "loss_pixel": 0.1809, + "loss_text": 1.5501, + "ppl": 5.6463, + "step": 5515 + }, + { + "epoch": 0.03, + "global_step": 5516, + "learning_rate": 0.0004778130217028381, + "loss": 1.7036, + "loss_base2": 2.4578, + "loss_pixel": 0.1794, + "loss_text": 1.5242, + "ppl": 5.4937, + "step": 5516 + }, + { + "epoch": 0.03, + "global_step": 5517, + "learning_rate": 0.0004778088480801336, + "loss": 1.7114, + "loss_base2": 2.469, + "loss_pixel": 0.1789, + "loss_text": 1.5325, + "ppl": 5.5367, + "step": 5517 + }, + { + "epoch": 0.03, + "global_step": 5518, + "learning_rate": 0.00047780467445742906, + "loss": 1.7069, + "loss_base2": 2.4625, + "loss_pixel": 0.18, + "loss_text": 1.5269, + "ppl": 5.5118, + "step": 5518 + }, + { + "epoch": 0.03, + "global_step": 5519, + "learning_rate": 0.00047780050083472456, + "loss": 1.7039, + "loss_base2": 2.4582, + "loss_pixel": 0.1809, + "loss_text": 1.5229, + "ppl": 5.4953, + "step": 5519 + }, + { + "epoch": 0.03, + "global_step": 5520, + "learning_rate": 0.00047779632721202007, + "loss": 1.7079, + "loss_base2": 2.464, + "loss_pixel": 0.1805, + "loss_text": 1.5274, + "ppl": 5.5174, + "step": 5520 + }, + { + "epoch": 0.03, + "global_step": 5521, + "learning_rate": 0.0004777921535893155, + "loss": 1.6883, + "loss_base2": 2.4357, + "loss_pixel": 0.1803, + "loss_text": 1.508, + "ppl": 5.4103, + "step": 5521 + }, + { + "epoch": 0.03, + "global_step": 5522, + "learning_rate": 0.00047778797996661103, + "loss": 1.7139, + "loss_base2": 2.4726, + "loss_pixel": 0.1821, + "loss_text": 1.5319, + "ppl": 5.5506, + "step": 5522 + }, + { + "epoch": 0.03, + "global_step": 5523, + "learning_rate": 0.0004777838063439065, + "loss": 1.7227, + "loss_base2": 2.4853, + "loss_pixel": 0.1794, + "loss_text": 1.5433, + "ppl": 5.5996, + "step": 5523 + }, + { + "epoch": 0.03, + "global_step": 5524, + "learning_rate": 0.000477779632721202, + "loss": 1.6964, + "loss_base2": 2.4474, + "loss_pixel": 0.1798, + "loss_text": 1.5166, + "ppl": 5.4543, + "step": 5524 + }, + { + "epoch": 0.03, + "global_step": 5525, + "learning_rate": 0.0004777754590984975, + "loss": 1.7054, + "loss_base2": 2.4604, + "loss_pixel": 0.18, + "loss_text": 1.5254, + "ppl": 5.5036, + "step": 5525 + }, + { + "epoch": 0.03, + "global_step": 5526, + "learning_rate": 0.000477771285475793, + "loss": 1.7039, + "loss_base2": 2.4582, + "loss_pixel": 0.1807, + "loss_text": 1.5233, + "ppl": 5.4953, + "step": 5526 + }, + { + "epoch": 0.03, + "global_step": 5527, + "learning_rate": 0.00047776711185308846, + "loss": 1.7019, + "loss_base2": 2.4553, + "loss_pixel": 0.1787, + "loss_text": 1.5232, + "ppl": 5.4844, + "step": 5527 + }, + { + "epoch": 0.03, + "global_step": 5528, + "learning_rate": 0.00047776293823038397, + "loss": 1.728, + "loss_base2": 2.493, + "loss_pixel": 0.1779, + "loss_text": 1.5501, + "ppl": 5.6294, + "step": 5528 + }, + { + "epoch": 0.03, + "global_step": 5529, + "learning_rate": 0.0004777587646076795, + "loss": 1.7051, + "loss_base2": 2.4599, + "loss_pixel": 0.1795, + "loss_text": 1.5257, + "ppl": 5.5019, + "step": 5529 + }, + { + "epoch": 0.03, + "global_step": 5530, + "learning_rate": 0.000477754590984975, + "loss": 1.7055, + "loss_base2": 2.4605, + "loss_pixel": 0.1791, + "loss_text": 1.5264, + "ppl": 5.5041, + "step": 5530 + }, + { + "epoch": 0.03, + "global_step": 5531, + "learning_rate": 0.0004777504173622705, + "loss": 1.6843, + "loss_base2": 2.4299, + "loss_pixel": 0.1792, + "loss_text": 1.5051, + "ppl": 5.3887, + "step": 5531 + }, + { + "epoch": 0.03, + "global_step": 5532, + "learning_rate": 0.00047774624373956594, + "loss": 1.6807, + "loss_base2": 2.4247, + "loss_pixel": 0.1796, + "loss_text": 1.501, + "ppl": 5.3693, + "step": 5532 + }, + { + "epoch": 0.03, + "global_step": 5533, + "learning_rate": 0.00047774207011686145, + "loss": 1.6913, + "loss_base2": 2.44, + "loss_pixel": 0.1799, + "loss_text": 1.5115, + "ppl": 5.4265, + "step": 5533 + }, + { + "epoch": 0.03, + "global_step": 5534, + "learning_rate": 0.00047773789649415696, + "loss": 1.7159, + "loss_base2": 2.4755, + "loss_pixel": 0.18, + "loss_text": 1.5359, + "ppl": 5.5617, + "step": 5534 + }, + { + "epoch": 0.03, + "global_step": 5535, + "learning_rate": 0.00047773372287145246, + "loss": 1.7094, + "loss_base2": 2.4661, + "loss_pixel": 0.1791, + "loss_text": 1.5303, + "ppl": 5.5256, + "step": 5535 + }, + { + "epoch": 0.03, + "global_step": 5536, + "learning_rate": 0.0004777295492487479, + "loss": 1.7041, + "loss_base2": 2.4585, + "loss_pixel": 0.1793, + "loss_text": 1.5248, + "ppl": 5.4964, + "step": 5536 + }, + { + "epoch": 0.03, + "global_step": 5537, + "learning_rate": 0.0004777253756260434, + "loss": 1.6939, + "loss_base2": 2.4438, + "loss_pixel": 0.1796, + "loss_text": 1.5143, + "ppl": 5.4407, + "step": 5537 + }, + { + "epoch": 0.03, + "global_step": 5538, + "learning_rate": 0.00047772120200333893, + "loss": 1.694, + "loss_base2": 2.4439, + "loss_pixel": 0.1782, + "loss_text": 1.5159, + "ppl": 5.4412, + "step": 5538 + }, + { + "epoch": 0.03, + "global_step": 5539, + "learning_rate": 0.0004777170283806344, + "loss": 1.7143, + "loss_base2": 2.4732, + "loss_pixel": 0.1795, + "loss_text": 1.5348, + "ppl": 5.5528, + "step": 5539 + }, + { + "epoch": 0.03, + "global_step": 5540, + "learning_rate": 0.0004777128547579299, + "loss": 1.6893, + "loss_base2": 2.4371, + "loss_pixel": 0.1795, + "loss_text": 1.5097, + "ppl": 5.4157, + "step": 5540 + }, + { + "epoch": 0.03, + "global_step": 5541, + "learning_rate": 0.00047770868113522534, + "loss": 1.701, + "loss_base2": 2.454, + "loss_pixel": 0.1796, + "loss_text": 1.5213, + "ppl": 5.4794, + "step": 5541 + }, + { + "epoch": 0.03, + "global_step": 5542, + "learning_rate": 0.00047770450751252085, + "loss": 1.7015, + "loss_base2": 2.4547, + "loss_pixel": 0.18, + "loss_text": 1.5215, + "ppl": 5.4822, + "step": 5542 + }, + { + "epoch": 0.03, + "global_step": 5543, + "learning_rate": 0.00047770033388981636, + "loss": 1.699, + "loss_base2": 2.4511, + "loss_pixel": 0.1791, + "loss_text": 1.5198, + "ppl": 5.4685, + "step": 5543 + }, + { + "epoch": 0.03, + "global_step": 5544, + "learning_rate": 0.00047769616026711187, + "loss": 1.6999, + "loss_base2": 2.4524, + "loss_pixel": 0.1798, + "loss_text": 1.5201, + "ppl": 5.4734, + "step": 5544 + }, + { + "epoch": 0.03, + "global_step": 5545, + "learning_rate": 0.0004776919866444073, + "loss": 1.687, + "loss_base2": 2.4338, + "loss_pixel": 0.1786, + "loss_text": 1.5084, + "ppl": 5.4032, + "step": 5545 + }, + { + "epoch": 0.03, + "global_step": 5546, + "learning_rate": 0.0004776878130217028, + "loss": 1.6759, + "loss_base2": 2.4178, + "loss_pixel": 0.1779, + "loss_text": 1.498, + "ppl": 5.3436, + "step": 5546 + }, + { + "epoch": 0.03, + "global_step": 5547, + "learning_rate": 0.00047768363939899833, + "loss": 1.7062, + "loss_base2": 2.4615, + "loss_pixel": 0.1795, + "loss_text": 1.5267, + "ppl": 5.508, + "step": 5547 + }, + { + "epoch": 0.03, + "global_step": 5548, + "learning_rate": 0.00047767946577629384, + "loss": 1.6608, + "loss_base2": 2.396, + "loss_pixel": 0.1801, + "loss_text": 1.4807, + "ppl": 5.2635, + "step": 5548 + }, + { + "epoch": 0.03, + "global_step": 5549, + "learning_rate": 0.00047767529215358935, + "loss": 1.6274, + "loss_base2": 2.3478, + "loss_pixel": 0.1793, + "loss_text": 1.4481, + "ppl": 5.0906, + "step": 5549 + }, + { + "epoch": 0.03, + "global_step": 5550, + "learning_rate": 0.0004776711185308848, + "loss": 1.6817, + "loss_base2": 2.4262, + "loss_pixel": 0.1797, + "loss_text": 1.502, + "ppl": 5.3747, + "step": 5550 + }, + { + "epoch": 0.03, + "global_step": 5551, + "learning_rate": 0.0004776669449081803, + "loss": 1.7007, + "loss_base2": 2.4536, + "loss_pixel": 0.1787, + "loss_text": 1.522, + "ppl": 5.4778, + "step": 5551 + }, + { + "epoch": 0.03, + "global_step": 5552, + "learning_rate": 0.0004776627712854758, + "loss": 1.7034, + "loss_base2": 2.4575, + "loss_pixel": 0.1802, + "loss_text": 1.5232, + "ppl": 5.4926, + "step": 5552 + }, + { + "epoch": 0.03, + "global_step": 5553, + "learning_rate": 0.0004776585976627713, + "loss": 1.7045, + "loss_base2": 2.4591, + "loss_pixel": 0.1798, + "loss_text": 1.5247, + "ppl": 5.4986, + "step": 5553 + }, + { + "epoch": 0.03, + "global_step": 5554, + "learning_rate": 0.00047765442404006683, + "loss": 1.7018, + "loss_base2": 2.4552, + "loss_pixel": 0.1795, + "loss_text": 1.5223, + "ppl": 5.4838, + "step": 5554 + }, + { + "epoch": 0.03, + "global_step": 5555, + "learning_rate": 0.0004776502504173623, + "loss": 1.7096, + "loss_base2": 2.4664, + "loss_pixel": 0.1805, + "loss_text": 1.5291, + "ppl": 5.5268, + "step": 5555 + }, + { + "epoch": 0.03, + "global_step": 5556, + "learning_rate": 0.0004776460767946578, + "loss": 1.714, + "loss_base2": 2.4728, + "loss_pixel": 0.1813, + "loss_text": 1.5327, + "ppl": 5.5511, + "step": 5556 + }, + { + "epoch": 0.03, + "global_step": 5557, + "learning_rate": 0.0004776419031719533, + "loss": 1.7095, + "loss_base2": 2.4663, + "loss_pixel": 0.1851, + "loss_text": 1.5243, + "ppl": 5.5262, + "step": 5557 + }, + { + "epoch": 0.03, + "global_step": 5558, + "learning_rate": 0.00047763772954924875, + "loss": 1.7129, + "loss_base2": 2.4712, + "loss_pixel": 0.184, + "loss_text": 1.5289, + "ppl": 5.545, + "step": 5558 + }, + { + "epoch": 0.03, + "global_step": 5559, + "learning_rate": 0.0004776335559265442, + "loss": 1.705, + "loss_base2": 2.4598, + "loss_pixel": 0.1855, + "loss_text": 1.5195, + "ppl": 5.5014, + "step": 5559 + }, + { + "epoch": 0.03, + "global_step": 5560, + "learning_rate": 0.0004776293823038397, + "loss": 1.7079, + "loss_base2": 2.464, + "loss_pixel": 0.1875, + "loss_text": 1.5204, + "ppl": 5.5174, + "step": 5560 + }, + { + "epoch": 0.03, + "global_step": 5561, + "learning_rate": 0.0004776252086811352, + "loss": 1.6983, + "loss_base2": 2.4501, + "loss_pixel": 0.1858, + "loss_text": 1.5125, + "ppl": 5.4646, + "step": 5561 + }, + { + "epoch": 0.03, + "global_step": 5562, + "learning_rate": 0.0004776210350584307, + "loss": 1.7123, + "loss_base2": 2.4703, + "loss_pixel": 0.1876, + "loss_text": 1.5247, + "ppl": 5.5417, + "step": 5562 + }, + { + "epoch": 0.03, + "global_step": 5563, + "learning_rate": 0.00047761686143572623, + "loss": 1.7047, + "loss_base2": 2.4594, + "loss_pixel": 0.1839, + "loss_text": 1.5208, + "ppl": 5.4997, + "step": 5563 + }, + { + "epoch": 0.03, + "global_step": 5564, + "learning_rate": 0.0004776126878130217, + "loss": 1.6931, + "loss_base2": 2.4426, + "loss_pixel": 0.1863, + "loss_text": 1.5068, + "ppl": 5.4363, + "step": 5564 + }, + { + "epoch": 0.03, + "global_step": 5565, + "learning_rate": 0.0004776085141903172, + "loss": 1.7071, + "loss_base2": 2.4628, + "loss_pixel": 0.183, + "loss_text": 1.5241, + "ppl": 5.513, + "step": 5565 + }, + { + "epoch": 0.03, + "global_step": 5566, + "learning_rate": 0.0004776043405676127, + "loss": 1.7266, + "loss_base2": 2.491, + "loss_pixel": 0.182, + "loss_text": 1.5446, + "ppl": 5.6215, + "step": 5566 + }, + { + "epoch": 0.03, + "global_step": 5567, + "learning_rate": 0.0004776001669449082, + "loss": 1.6989, + "loss_base2": 2.451, + "loss_pixel": 0.1817, + "loss_text": 1.5172, + "ppl": 5.4679, + "step": 5567 + }, + { + "epoch": 0.03, + "global_step": 5568, + "learning_rate": 0.00047759599332220366, + "loss": 1.6971, + "loss_base2": 2.4484, + "loss_pixel": 0.1782, + "loss_text": 1.5189, + "ppl": 5.4581, + "step": 5568 + }, + { + "epoch": 0.03, + "global_step": 5569, + "learning_rate": 0.00047759181969949917, + "loss": 1.6878, + "loss_base2": 2.435, + "loss_pixel": 0.1812, + "loss_text": 1.5065, + "ppl": 5.4076, + "step": 5569 + }, + { + "epoch": 0.03, + "global_step": 5570, + "learning_rate": 0.0004775876460767947, + "loss": 1.7073, + "loss_base2": 2.4631, + "loss_pixel": 0.1796, + "loss_text": 1.5277, + "ppl": 5.5141, + "step": 5570 + }, + { + "epoch": 0.03, + "global_step": 5571, + "learning_rate": 0.0004775834724540902, + "loss": 1.7131, + "loss_base2": 2.4715, + "loss_pixel": 0.181, + "loss_text": 1.532, + "ppl": 5.5461, + "step": 5571 + }, + { + "epoch": 0.03, + "global_step": 5572, + "learning_rate": 0.0004775792988313857, + "loss": 1.7187, + "loss_base2": 2.4796, + "loss_pixel": 0.1783, + "loss_text": 1.5405, + "ppl": 5.5773, + "step": 5572 + }, + { + "epoch": 0.03, + "global_step": 5573, + "learning_rate": 0.00047757512520868114, + "loss": 1.6933, + "loss_base2": 2.4429, + "loss_pixel": 0.1773, + "loss_text": 1.516, + "ppl": 5.4374, + "step": 5573 + }, + { + "epoch": 0.03, + "global_step": 5574, + "learning_rate": 0.00047757095158597665, + "loss": 1.7067, + "loss_base2": 2.4622, + "loss_pixel": 0.176, + "loss_text": 1.5307, + "ppl": 5.5107, + "step": 5574 + }, + { + "epoch": 0.03, + "global_step": 5575, + "learning_rate": 0.00047756677796327216, + "loss": 1.6892, + "loss_base2": 2.437, + "loss_pixel": 0.1769, + "loss_text": 1.5123, + "ppl": 5.4151, + "step": 5575 + }, + { + "epoch": 0.03, + "global_step": 5576, + "learning_rate": 0.00047756260434056767, + "loss": 1.7043, + "loss_base2": 2.4588, + "loss_pixel": 0.1774, + "loss_text": 1.5268, + "ppl": 5.4975, + "step": 5576 + }, + { + "epoch": 0.03, + "global_step": 5577, + "learning_rate": 0.00047755843071786307, + "loss": 1.6968, + "loss_base2": 2.448, + "loss_pixel": 0.1761, + "loss_text": 1.5207, + "ppl": 5.4565, + "step": 5577 + }, + { + "epoch": 0.03, + "global_step": 5578, + "learning_rate": 0.0004775542570951586, + "loss": 1.6922, + "loss_base2": 2.4413, + "loss_pixel": 0.1754, + "loss_text": 1.5168, + "ppl": 5.4314, + "step": 5578 + }, + { + "epoch": 0.03, + "global_step": 5579, + "learning_rate": 0.0004775500834724541, + "loss": 1.6968, + "loss_base2": 2.448, + "loss_pixel": 0.1733, + "loss_text": 1.5235, + "ppl": 5.4565, + "step": 5579 + }, + { + "epoch": 0.03, + "global_step": 5580, + "learning_rate": 0.0004775459098497496, + "loss": 1.6829, + "loss_base2": 2.4279, + "loss_pixel": 0.1729, + "loss_text": 1.51, + "ppl": 5.3811, + "step": 5580 + }, + { + "epoch": 0.03, + "global_step": 5581, + "learning_rate": 0.0004775417362270451, + "loss": 1.7066, + "loss_base2": 2.4621, + "loss_pixel": 0.1744, + "loss_text": 1.5322, + "ppl": 5.5102, + "step": 5581 + }, + { + "epoch": 0.03, + "global_step": 5582, + "learning_rate": 0.00047753756260434055, + "loss": 1.7172, + "loss_base2": 2.4774, + "loss_pixel": 0.1734, + "loss_text": 1.5438, + "ppl": 5.5689, + "step": 5582 + }, + { + "epoch": 0.03, + "global_step": 5583, + "learning_rate": 0.00047753338898163606, + "loss": 1.7047, + "loss_base2": 2.4594, + "loss_pixel": 0.1771, + "loss_text": 1.5276, + "ppl": 5.4997, + "step": 5583 + }, + { + "epoch": 0.03, + "global_step": 5584, + "learning_rate": 0.00047752921535893156, + "loss": 1.6944, + "loss_base2": 2.4445, + "loss_pixel": 0.193, + "loss_text": 1.5014, + "ppl": 5.4434, + "step": 5584 + }, + { + "epoch": 0.03, + "global_step": 5585, + "learning_rate": 0.00047752504173622707, + "loss": 1.7056, + "loss_base2": 2.4607, + "loss_pixel": 0.1908, + "loss_text": 1.5149, + "ppl": 5.5047, + "step": 5585 + }, + { + "epoch": 0.03, + "global_step": 5586, + "learning_rate": 0.0004775208681135225, + "loss": 1.6826, + "loss_base2": 2.4275, + "loss_pixel": 0.1779, + "loss_text": 1.5048, + "ppl": 5.3795, + "step": 5586 + }, + { + "epoch": 0.03, + "global_step": 5587, + "learning_rate": 0.00047751669449081803, + "loss": 1.6826, + "loss_base2": 2.4275, + "loss_pixel": 0.1744, + "loss_text": 1.5082, + "ppl": 5.3795, + "step": 5587 + }, + { + "epoch": 0.03, + "global_step": 5588, + "learning_rate": 0.00047751252086811354, + "loss": 1.6884, + "loss_base2": 2.4358, + "loss_pixel": 0.1758, + "loss_text": 1.5126, + "ppl": 5.4108, + "step": 5588 + }, + { + "epoch": 0.03, + "global_step": 5589, + "learning_rate": 0.00047750834724540905, + "loss": 1.7033, + "loss_base2": 2.4573, + "loss_pixel": 0.1734, + "loss_text": 1.53, + "ppl": 5.492, + "step": 5589 + }, + { + "epoch": 0.03, + "global_step": 5590, + "learning_rate": 0.00047750417362270455, + "loss": 1.6759, + "loss_base2": 2.4178, + "loss_pixel": 0.1723, + "loss_text": 1.5036, + "ppl": 5.3436, + "step": 5590 + }, + { + "epoch": 0.03, + "global_step": 5591, + "learning_rate": 0.0004775, + "loss": 1.6934, + "loss_base2": 2.4431, + "loss_pixel": 0.1731, + "loss_text": 1.5203, + "ppl": 5.4379, + "step": 5591 + }, + { + "epoch": 0.03, + "global_step": 5592, + "learning_rate": 0.0004774958263772955, + "loss": 1.6833, + "loss_base2": 2.4285, + "loss_pixel": 0.1737, + "loss_text": 1.5096, + "ppl": 5.3833, + "step": 5592 + }, + { + "epoch": 0.03, + "global_step": 5593, + "learning_rate": 0.000477491652754591, + "loss": 1.6721, + "loss_base2": 2.4123, + "loss_pixel": 0.174, + "loss_text": 1.4981, + "ppl": 5.3233, + "step": 5593 + }, + { + "epoch": 0.03, + "global_step": 5594, + "learning_rate": 0.00047748747913188653, + "loss": 1.6949, + "loss_base2": 2.4452, + "loss_pixel": 0.1748, + "loss_text": 1.5201, + "ppl": 5.4461, + "step": 5594 + }, + { + "epoch": 0.03, + "global_step": 5595, + "learning_rate": 0.0004774833055091819, + "loss": 1.6921, + "loss_base2": 2.4412, + "loss_pixel": 0.1725, + "loss_text": 1.5197, + "ppl": 5.4309, + "step": 5595 + }, + { + "epoch": 0.03, + "global_step": 5596, + "learning_rate": 0.00047747913188647743, + "loss": 1.7078, + "loss_base2": 2.4638, + "loss_pixel": 0.1723, + "loss_text": 1.5355, + "ppl": 5.5168, + "step": 5596 + }, + { + "epoch": 0.03, + "global_step": 5597, + "learning_rate": 0.00047747495826377294, + "loss": 1.6855, + "loss_base2": 2.4317, + "loss_pixel": 0.1733, + "loss_text": 1.5123, + "ppl": 5.3951, + "step": 5597 + }, + { + "epoch": 0.03, + "global_step": 5598, + "learning_rate": 0.00047747078464106845, + "loss": 1.7, + "loss_base2": 2.4526, + "loss_pixel": 0.1721, + "loss_text": 1.5279, + "ppl": 5.4739, + "step": 5598 + }, + { + "epoch": 0.03, + "global_step": 5599, + "learning_rate": 0.00047746661101836396, + "loss": 1.7142, + "loss_base2": 2.4731, + "loss_pixel": 0.1748, + "loss_text": 1.5394, + "ppl": 5.5522, + "step": 5599 + }, + { + "epoch": 0.03, + "global_step": 5600, + "learning_rate": 0.0004774624373956594, + "loss": 1.6697, + "loss_base2": 2.4089, + "loss_pixel": 0.1718, + "loss_text": 1.4979, + "ppl": 5.3106, + "step": 5600 + }, + { + "epoch": 0.03, + "global_step": 5601, + "learning_rate": 0.0004774582637729549, + "loss": 1.697, + "loss_base2": 2.4483, + "loss_pixel": 0.1726, + "loss_text": 1.5244, + "ppl": 5.4576, + "step": 5601 + }, + { + "epoch": 0.03, + "global_step": 5602, + "learning_rate": 0.0004774540901502504, + "loss": 1.6888, + "loss_base2": 2.4364, + "loss_pixel": 0.1711, + "loss_text": 1.5177, + "ppl": 5.413, + "step": 5602 + }, + { + "epoch": 0.03, + "global_step": 5603, + "learning_rate": 0.00047744991652754593, + "loss": 1.6969, + "loss_base2": 2.4481, + "loss_pixel": 0.1715, + "loss_text": 1.5254, + "ppl": 5.457, + "step": 5603 + }, + { + "epoch": 0.03, + "global_step": 5604, + "learning_rate": 0.0004774457429048414, + "loss": 1.7098, + "loss_base2": 2.4667, + "loss_pixel": 0.1698, + "loss_text": 1.54, + "ppl": 5.5279, + "step": 5604 + }, + { + "epoch": 0.03, + "global_step": 5605, + "learning_rate": 0.0004774415692821369, + "loss": 1.6974, + "loss_base2": 2.4488, + "loss_pixel": 0.1715, + "loss_text": 1.526, + "ppl": 5.4597, + "step": 5605 + }, + { + "epoch": 0.03, + "global_step": 5606, + "learning_rate": 0.0004774373956594324, + "loss": 1.6893, + "loss_base2": 2.4371, + "loss_pixel": 0.1702, + "loss_text": 1.5191, + "ppl": 5.4157, + "step": 5606 + }, + { + "epoch": 0.03, + "global_step": 5607, + "learning_rate": 0.0004774332220367279, + "loss": 1.68, + "loss_base2": 2.4237, + "loss_pixel": 0.1736, + "loss_text": 1.5064, + "ppl": 5.3656, + "step": 5607 + }, + { + "epoch": 0.03, + "global_step": 5608, + "learning_rate": 0.0004774290484140234, + "loss": 1.7008, + "loss_base2": 2.4537, + "loss_pixel": 0.1708, + "loss_text": 1.5299, + "ppl": 5.4783, + "step": 5608 + }, + { + "epoch": 0.03, + "global_step": 5609, + "learning_rate": 0.00047742487479131887, + "loss": 1.6796, + "loss_base2": 2.4232, + "loss_pixel": 0.1688, + "loss_text": 1.5107, + "ppl": 5.3634, + "step": 5609 + }, + { + "epoch": 0.03, + "global_step": 5610, + "learning_rate": 0.0004774207011686144, + "loss": 1.6824, + "loss_base2": 2.4272, + "loss_pixel": 0.1693, + "loss_text": 1.5131, + "ppl": 5.3784, + "step": 5610 + }, + { + "epoch": 0.03, + "global_step": 5611, + "learning_rate": 0.0004774165275459099, + "loss": 1.6894, + "loss_base2": 2.4373, + "loss_pixel": 0.1708, + "loss_text": 1.5186, + "ppl": 5.4162, + "step": 5611 + }, + { + "epoch": 0.03, + "global_step": 5612, + "learning_rate": 0.0004774123539232054, + "loss": 1.6914, + "loss_base2": 2.4402, + "loss_pixel": 0.1711, + "loss_text": 1.5203, + "ppl": 5.4271, + "step": 5612 + }, + { + "epoch": 0.03, + "global_step": 5613, + "learning_rate": 0.0004774081803005009, + "loss": 1.6904, + "loss_base2": 2.4387, + "loss_pixel": 0.1703, + "loss_text": 1.52, + "ppl": 5.4216, + "step": 5613 + }, + { + "epoch": 0.03, + "global_step": 5614, + "learning_rate": 0.0004774040066777963, + "loss": 1.6906, + "loss_base2": 2.439, + "loss_pixel": 0.1706, + "loss_text": 1.52, + "ppl": 5.4227, + "step": 5614 + }, + { + "epoch": 0.03, + "global_step": 5615, + "learning_rate": 0.0004773998330550918, + "loss": 1.6977, + "loss_base2": 2.4493, + "loss_pixel": 0.1689, + "loss_text": 1.5288, + "ppl": 5.4614, + "step": 5615 + }, + { + "epoch": 0.03, + "global_step": 5616, + "learning_rate": 0.0004773956594323873, + "loss": 1.6961, + "loss_base2": 2.447, + "loss_pixel": 0.1703, + "loss_text": 1.5258, + "ppl": 5.4526, + "step": 5616 + }, + { + "epoch": 0.03, + "global_step": 5617, + "learning_rate": 0.0004773914858096828, + "loss": 1.6887, + "loss_base2": 2.4363, + "loss_pixel": 0.169, + "loss_text": 1.5197, + "ppl": 5.4124, + "step": 5617 + }, + { + "epoch": 0.03, + "global_step": 5618, + "learning_rate": 0.00047738731218697827, + "loss": 1.7083, + "loss_base2": 2.4646, + "loss_pixel": 0.1706, + "loss_text": 1.5377, + "ppl": 5.5196, + "step": 5618 + }, + { + "epoch": 0.03, + "global_step": 5619, + "learning_rate": 0.0004773831385642738, + "loss": 1.6922, + "loss_base2": 2.4413, + "loss_pixel": 0.1698, + "loss_text": 1.5224, + "ppl": 5.4314, + "step": 5619 + }, + { + "epoch": 0.03, + "global_step": 5620, + "learning_rate": 0.0004773789649415693, + "loss": 1.6807, + "loss_base2": 2.4247, + "loss_pixel": 0.1715, + "loss_text": 1.5092, + "ppl": 5.3693, + "step": 5620 + }, + { + "epoch": 0.03, + "global_step": 5621, + "learning_rate": 0.0004773747913188648, + "loss": 1.6828, + "loss_base2": 2.4278, + "loss_pixel": 0.1707, + "loss_text": 1.5122, + "ppl": 5.3806, + "step": 5621 + }, + { + "epoch": 0.03, + "global_step": 5622, + "learning_rate": 0.0004773706176961603, + "loss": 1.6891, + "loss_base2": 2.4369, + "loss_pixel": 0.171, + "loss_text": 1.518, + "ppl": 5.4146, + "step": 5622 + }, + { + "epoch": 0.03, + "global_step": 5623, + "learning_rate": 0.00047736644407345575, + "loss": 1.6884, + "loss_base2": 2.4358, + "loss_pixel": 0.1687, + "loss_text": 1.5197, + "ppl": 5.4108, + "step": 5623 + }, + { + "epoch": 0.03, + "global_step": 5624, + "learning_rate": 0.00047736227045075126, + "loss": 1.6742, + "loss_base2": 2.4154, + "loss_pixel": 0.1699, + "loss_text": 1.5043, + "ppl": 5.3345, + "step": 5624 + }, + { + "epoch": 0.03, + "global_step": 5625, + "learning_rate": 0.00047735809682804677, + "loss": 1.6902, + "loss_base2": 2.4384, + "loss_pixel": 0.1684, + "loss_text": 1.5218, + "ppl": 5.4206, + "step": 5625 + }, + { + "epoch": 0.03, + "global_step": 5626, + "learning_rate": 0.0004773539232053423, + "loss": 1.6803, + "loss_base2": 2.4242, + "loss_pixel": 0.1692, + "loss_text": 1.5111, + "ppl": 5.3672, + "step": 5626 + }, + { + "epoch": 0.03, + "global_step": 5627, + "learning_rate": 0.0004773497495826377, + "loss": 1.6791, + "loss_base2": 2.4224, + "loss_pixel": 0.1688, + "loss_text": 1.5103, + "ppl": 5.3607, + "step": 5627 + }, + { + "epoch": 0.03, + "global_step": 5628, + "learning_rate": 0.00047734557595993323, + "loss": 1.6791, + "loss_base2": 2.4224, + "loss_pixel": 0.1715, + "loss_text": 1.5076, + "ppl": 5.3607, + "step": 5628 + }, + { + "epoch": 0.03, + "global_step": 5629, + "learning_rate": 0.00047734140233722874, + "loss": 1.6685, + "loss_base2": 2.4071, + "loss_pixel": 0.17, + "loss_text": 1.4985, + "ppl": 5.3042, + "step": 5629 + }, + { + "epoch": 0.03, + "global_step": 5630, + "learning_rate": 0.00047733722871452425, + "loss": 1.6931, + "loss_base2": 2.4426, + "loss_pixel": 0.1687, + "loss_text": 1.5243, + "ppl": 5.4363, + "step": 5630 + }, + { + "epoch": 0.03, + "global_step": 5631, + "learning_rate": 0.00047733305509181976, + "loss": 1.7031, + "loss_base2": 2.4571, + "loss_pixel": 0.1679, + "loss_text": 1.5352, + "ppl": 5.4909, + "step": 5631 + }, + { + "epoch": 0.03, + "global_step": 5632, + "learning_rate": 0.0004773288814691152, + "loss": 1.6874, + "loss_base2": 2.4344, + "loss_pixel": 0.171, + "loss_text": 1.5164, + "ppl": 5.4054, + "step": 5632 + }, + { + "epoch": 0.03, + "global_step": 5633, + "learning_rate": 0.00047732470784641066, + "loss": 1.7015, + "loss_base2": 2.4547, + "loss_pixel": 0.1695, + "loss_text": 1.532, + "ppl": 5.4822, + "step": 5633 + }, + { + "epoch": 0.03, + "global_step": 5634, + "learning_rate": 0.00047732053422370617, + "loss": 1.6718, + "loss_base2": 2.4119, + "loss_pixel": 0.1686, + "loss_text": 1.5032, + "ppl": 5.3217, + "step": 5634 + }, + { + "epoch": 0.03, + "global_step": 5635, + "learning_rate": 0.0004773163606010017, + "loss": 1.6597, + "loss_base2": 2.3944, + "loss_pixel": 0.1707, + "loss_text": 1.489, + "ppl": 5.2577, + "step": 5635 + }, + { + "epoch": 0.03, + "global_step": 5636, + "learning_rate": 0.00047731218697829713, + "loss": 1.6945, + "loss_base2": 2.4446, + "loss_pixel": 0.1723, + "loss_text": 1.5222, + "ppl": 5.4439, + "step": 5636 + }, + { + "epoch": 0.03, + "global_step": 5637, + "learning_rate": 0.00047730801335559264, + "loss": 1.6907, + "loss_base2": 2.4392, + "loss_pixel": 0.184, + "loss_text": 1.5067, + "ppl": 5.4233, + "step": 5637 + }, + { + "epoch": 0.03, + "global_step": 5638, + "learning_rate": 0.00047730383973288814, + "loss": 1.7031, + "loss_base2": 2.4571, + "loss_pixel": 0.1837, + "loss_text": 1.5194, + "ppl": 5.4909, + "step": 5638 + }, + { + "epoch": 0.03, + "global_step": 5639, + "learning_rate": 0.00047729966611018365, + "loss": 1.6804, + "loss_base2": 2.4243, + "loss_pixel": 0.1835, + "loss_text": 1.4969, + "ppl": 5.3677, + "step": 5639 + }, + { + "epoch": 0.03, + "global_step": 5640, + "learning_rate": 0.00047729549248747916, + "loss": 1.697, + "loss_base2": 2.4483, + "loss_pixel": 0.182, + "loss_text": 1.5149, + "ppl": 5.4576, + "step": 5640 + }, + { + "epoch": 0.03, + "global_step": 5641, + "learning_rate": 0.0004772913188647746, + "loss": 1.6975, + "loss_base2": 2.449, + "loss_pixel": 0.1819, + "loss_text": 1.5156, + "ppl": 5.4603, + "step": 5641 + }, + { + "epoch": 0.03, + "global_step": 5642, + "learning_rate": 0.0004772871452420701, + "loss": 1.6987, + "loss_base2": 2.4507, + "loss_pixel": 0.1817, + "loss_text": 1.5171, + "ppl": 5.4668, + "step": 5642 + }, + { + "epoch": 0.03, + "global_step": 5643, + "learning_rate": 0.00047728297161936563, + "loss": 1.6997, + "loss_base2": 2.4521, + "loss_pixel": 0.1829, + "loss_text": 1.5168, + "ppl": 5.4723, + "step": 5643 + }, + { + "epoch": 0.03, + "global_step": 5644, + "learning_rate": 0.00047727879799666113, + "loss": 1.703, + "loss_base2": 2.4569, + "loss_pixel": 0.184, + "loss_text": 1.519, + "ppl": 5.4904, + "step": 5644 + }, + { + "epoch": 0.03, + "global_step": 5645, + "learning_rate": 0.0004772746243739566, + "loss": 1.6966, + "loss_base2": 2.4477, + "loss_pixel": 0.1823, + "loss_text": 1.5142, + "ppl": 5.4554, + "step": 5645 + }, + { + "epoch": 0.03, + "global_step": 5646, + "learning_rate": 0.0004772704507512521, + "loss": 1.7074, + "loss_base2": 2.4633, + "loss_pixel": 0.1842, + "loss_text": 1.5232, + "ppl": 5.5146, + "step": 5646 + }, + { + "epoch": 0.03, + "global_step": 5647, + "learning_rate": 0.0004772662771285476, + "loss": 1.7342, + "loss_base2": 2.5019, + "loss_pixel": 0.1945, + "loss_text": 1.5397, + "ppl": 5.6644, + "step": 5647 + }, + { + "epoch": 0.03, + "global_step": 5648, + "learning_rate": 0.0004772621035058431, + "loss": 1.719, + "loss_base2": 2.48, + "loss_pixel": 0.2, + "loss_text": 1.519, + "ppl": 5.5789, + "step": 5648 + }, + { + "epoch": 0.03, + "global_step": 5649, + "learning_rate": 0.0004772579298831386, + "loss": 1.7233, + "loss_base2": 2.4862, + "loss_pixel": 0.1996, + "loss_text": 1.5237, + "ppl": 5.603, + "step": 5649 + }, + { + "epoch": 0.04, + "global_step": 5650, + "learning_rate": 0.00047725375626043407, + "loss": 1.7202, + "loss_base2": 2.4817, + "loss_pixel": 0.1979, + "loss_text": 1.5223, + "ppl": 5.5856, + "step": 5650 + }, + { + "epoch": 0.04, + "global_step": 5651, + "learning_rate": 0.0004772495826377296, + "loss": 1.7177, + "loss_base2": 2.4781, + "loss_pixel": 0.1985, + "loss_text": 1.5192, + "ppl": 5.5717, + "step": 5651 + }, + { + "epoch": 0.04, + "global_step": 5652, + "learning_rate": 0.00047724540901502503, + "loss": 1.7343, + "loss_base2": 2.5021, + "loss_pixel": 0.2015, + "loss_text": 1.5328, + "ppl": 5.665, + "step": 5652 + }, + { + "epoch": 0.04, + "global_step": 5653, + "learning_rate": 0.00047724123539232054, + "loss": 1.7156, + "loss_base2": 2.4751, + "loss_pixel": 0.1959, + "loss_text": 1.5197, + "ppl": 5.56, + "step": 5653 + }, + { + "epoch": 0.04, + "global_step": 5654, + "learning_rate": 0.000477237061769616, + "loss": 1.7051, + "loss_base2": 2.4599, + "loss_pixel": 0.1955, + "loss_text": 1.5096, + "ppl": 5.5019, + "step": 5654 + }, + { + "epoch": 0.04, + "global_step": 5655, + "learning_rate": 0.0004772328881469115, + "loss": 1.7157, + "loss_base2": 2.4752, + "loss_pixel": 0.1928, + "loss_text": 1.5229, + "ppl": 5.5606, + "step": 5655 + }, + { + "epoch": 0.04, + "global_step": 5656, + "learning_rate": 0.000477228714524207, + "loss": 1.7066, + "loss_base2": 2.4621, + "loss_pixel": 0.19, + "loss_text": 1.5166, + "ppl": 5.5102, + "step": 5656 + }, + { + "epoch": 0.04, + "global_step": 5657, + "learning_rate": 0.0004772245409015025, + "loss": 1.7111, + "loss_base2": 2.4686, + "loss_pixel": 0.1897, + "loss_text": 1.5214, + "ppl": 5.535, + "step": 5657 + }, + { + "epoch": 0.04, + "global_step": 5658, + "learning_rate": 0.000477220367278798, + "loss": 1.7032, + "loss_base2": 2.4572, + "loss_pixel": 0.1894, + "loss_text": 1.5138, + "ppl": 5.4915, + "step": 5658 + }, + { + "epoch": 0.04, + "global_step": 5659, + "learning_rate": 0.0004772161936560935, + "loss": 1.7097, + "loss_base2": 2.4666, + "loss_pixel": 0.1885, + "loss_text": 1.5212, + "ppl": 5.5273, + "step": 5659 + }, + { + "epoch": 0.04, + "global_step": 5660, + "learning_rate": 0.000477212020033389, + "loss": 1.7209, + "loss_base2": 2.4827, + "loss_pixel": 0.1878, + "loss_text": 1.5331, + "ppl": 5.5896, + "step": 5660 + }, + { + "epoch": 0.04, + "global_step": 5661, + "learning_rate": 0.0004772078464106845, + "loss": 1.7026, + "loss_base2": 2.4563, + "loss_pixel": 0.1893, + "loss_text": 1.5133, + "ppl": 5.4882, + "step": 5661 + }, + { + "epoch": 0.04, + "global_step": 5662, + "learning_rate": 0.00047720367278798, + "loss": 1.5605, + "loss_base2": 2.2513, + "loss_pixel": 0.1879, + "loss_text": 1.3726, + "ppl": 4.7612, + "step": 5662 + }, + { + "epoch": 0.04, + "global_step": 5663, + "learning_rate": 0.00047719949916527545, + "loss": 1.4976, + "loss_base2": 2.1606, + "loss_pixel": 0.1872, + "loss_text": 1.3104, + "ppl": 4.4709, + "step": 5663 + }, + { + "epoch": 0.04, + "global_step": 5664, + "learning_rate": 0.00047719532554257096, + "loss": 1.4931, + "loss_base2": 2.1541, + "loss_pixel": 0.1869, + "loss_text": 1.3062, + "ppl": 4.4509, + "step": 5664 + }, + { + "epoch": 0.04, + "global_step": 5665, + "learning_rate": 0.00047719115191986646, + "loss": 1.4598, + "loss_base2": 2.106, + "loss_pixel": 0.1854, + "loss_text": 1.2743, + "ppl": 4.3051, + "step": 5665 + }, + { + "epoch": 0.04, + "global_step": 5666, + "learning_rate": 0.00047718697829716197, + "loss": 1.493, + "loss_base2": 2.1539, + "loss_pixel": 0.1841, + "loss_text": 1.3089, + "ppl": 4.4504, + "step": 5666 + }, + { + "epoch": 0.04, + "global_step": 5667, + "learning_rate": 0.0004771828046744575, + "loss": 1.5091, + "loss_base2": 2.1772, + "loss_pixel": 0.1847, + "loss_text": 1.3244, + "ppl": 4.5227, + "step": 5667 + }, + { + "epoch": 0.04, + "global_step": 5668, + "learning_rate": 0.00047717863105175293, + "loss": 1.4932, + "loss_base2": 2.1542, + "loss_pixel": 0.1849, + "loss_text": 1.3083, + "ppl": 4.4513, + "step": 5668 + }, + { + "epoch": 0.04, + "global_step": 5669, + "learning_rate": 0.00047717445742904844, + "loss": 1.4721, + "loss_base2": 2.1238, + "loss_pixel": 0.1833, + "loss_text": 1.2888, + "ppl": 4.3584, + "step": 5669 + }, + { + "epoch": 0.04, + "global_step": 5670, + "learning_rate": 0.00047717028380634395, + "loss": 1.6026, + "loss_base2": 2.3121, + "loss_pixel": 0.1839, + "loss_text": 1.4187, + "ppl": 4.9659, + "step": 5670 + }, + { + "epoch": 0.04, + "global_step": 5671, + "learning_rate": 0.0004771661101836394, + "loss": 1.7377, + "loss_base2": 2.507, + "loss_pixel": 0.1834, + "loss_text": 1.5542, + "ppl": 5.6843, + "step": 5671 + }, + { + "epoch": 0.04, + "global_step": 5672, + "learning_rate": 0.0004771619365609349, + "loss": 1.7151, + "loss_base2": 2.4744, + "loss_pixel": 0.1834, + "loss_text": 1.5316, + "ppl": 5.5572, + "step": 5672 + }, + { + "epoch": 0.04, + "global_step": 5673, + "learning_rate": 0.00047715776293823036, + "loss": 1.7035, + "loss_base2": 2.4576, + "loss_pixel": 0.1842, + "loss_text": 1.5193, + "ppl": 5.4931, + "step": 5673 + }, + { + "epoch": 0.04, + "global_step": 5674, + "learning_rate": 0.00047715358931552587, + "loss": 1.7058, + "loss_base2": 2.4609, + "loss_pixel": 0.1814, + "loss_text": 1.5244, + "ppl": 5.5058, + "step": 5674 + }, + { + "epoch": 0.04, + "global_step": 5675, + "learning_rate": 0.0004771494156928214, + "loss": 1.7148, + "loss_base2": 2.4739, + "loss_pixel": 0.1833, + "loss_text": 1.5314, + "ppl": 5.5556, + "step": 5675 + }, + { + "epoch": 0.04, + "global_step": 5676, + "learning_rate": 0.0004771452420701169, + "loss": 1.7093, + "loss_base2": 2.466, + "loss_pixel": 0.1817, + "loss_text": 1.5276, + "ppl": 5.5251, + "step": 5676 + }, + { + "epoch": 0.04, + "global_step": 5677, + "learning_rate": 0.00047714106844741233, + "loss": 1.7063, + "loss_base2": 2.4617, + "loss_pixel": 0.1815, + "loss_text": 1.5248, + "ppl": 5.5085, + "step": 5677 + }, + { + "epoch": 0.04, + "global_step": 5678, + "learning_rate": 0.00047713689482470784, + "loss": 1.7098, + "loss_base2": 2.4667, + "loss_pixel": 0.1819, + "loss_text": 1.5279, + "ppl": 5.5279, + "step": 5678 + }, + { + "epoch": 0.04, + "global_step": 5679, + "learning_rate": 0.00047713272120200335, + "loss": 1.7198, + "loss_base2": 2.4811, + "loss_pixel": 0.1823, + "loss_text": 1.5374, + "ppl": 5.5834, + "step": 5679 + }, + { + "epoch": 0.04, + "global_step": 5680, + "learning_rate": 0.00047712854757929886, + "loss": 1.6998, + "loss_base2": 2.4523, + "loss_pixel": 0.1813, + "loss_text": 1.5185, + "ppl": 5.4729, + "step": 5680 + }, + { + "epoch": 0.04, + "global_step": 5681, + "learning_rate": 0.00047712437395659436, + "loss": 1.7137, + "loss_base2": 2.4723, + "loss_pixel": 0.1805, + "loss_text": 1.5332, + "ppl": 5.5495, + "step": 5681 + }, + { + "epoch": 0.04, + "global_step": 5682, + "learning_rate": 0.0004771202003338898, + "loss": 1.7182, + "loss_base2": 2.4788, + "loss_pixel": 0.1821, + "loss_text": 1.5361, + "ppl": 5.5745, + "step": 5682 + }, + { + "epoch": 0.04, + "global_step": 5683, + "learning_rate": 0.0004771160267111853, + "loss": 1.7063, + "loss_base2": 2.4617, + "loss_pixel": 0.1825, + "loss_text": 1.5238, + "ppl": 5.5085, + "step": 5683 + }, + { + "epoch": 0.04, + "global_step": 5684, + "learning_rate": 0.00047711185308848083, + "loss": 1.6949, + "loss_base2": 2.4452, + "loss_pixel": 0.1822, + "loss_text": 1.5128, + "ppl": 5.4461, + "step": 5684 + }, + { + "epoch": 0.04, + "global_step": 5685, + "learning_rate": 0.00047710767946577634, + "loss": 1.7183, + "loss_base2": 2.479, + "loss_pixel": 0.1855, + "loss_text": 1.5329, + "ppl": 5.575, + "step": 5685 + }, + { + "epoch": 0.04, + "global_step": 5686, + "learning_rate": 0.0004771035058430718, + "loss": 1.7011, + "loss_base2": 2.4542, + "loss_pixel": 0.1813, + "loss_text": 1.5198, + "ppl": 5.48, + "step": 5686 + }, + { + "epoch": 0.04, + "global_step": 5687, + "learning_rate": 0.0004770993322203673, + "loss": 1.692, + "loss_base2": 2.441, + "loss_pixel": 0.1819, + "loss_text": 1.5101, + "ppl": 5.4303, + "step": 5687 + }, + { + "epoch": 0.04, + "global_step": 5688, + "learning_rate": 0.0004770951585976628, + "loss": 1.686, + "loss_base2": 2.4324, + "loss_pixel": 0.1801, + "loss_text": 1.5059, + "ppl": 5.3978, + "step": 5688 + }, + { + "epoch": 0.04, + "global_step": 5689, + "learning_rate": 0.0004770909849749583, + "loss": 1.7075, + "loss_base2": 2.4634, + "loss_pixel": 0.1809, + "loss_text": 1.5266, + "ppl": 5.5152, + "step": 5689 + }, + { + "epoch": 0.04, + "global_step": 5690, + "learning_rate": 0.00047708681135225377, + "loss": 1.7067, + "loss_base2": 2.4622, + "loss_pixel": 0.1832, + "loss_text": 1.5236, + "ppl": 5.5107, + "step": 5690 + }, + { + "epoch": 0.04, + "global_step": 5691, + "learning_rate": 0.0004770826377295492, + "loss": 1.7171, + "loss_base2": 2.4773, + "loss_pixel": 0.1806, + "loss_text": 1.5365, + "ppl": 5.5684, + "step": 5691 + }, + { + "epoch": 0.04, + "global_step": 5692, + "learning_rate": 0.0004770784641068447, + "loss": 1.7055, + "loss_base2": 2.4605, + "loss_pixel": 0.1797, + "loss_text": 1.5258, + "ppl": 5.5041, + "step": 5692 + }, + { + "epoch": 0.04, + "global_step": 5693, + "learning_rate": 0.00047707429048414023, + "loss": 1.7053, + "loss_base2": 2.4602, + "loss_pixel": 0.1797, + "loss_text": 1.5257, + "ppl": 5.503, + "step": 5693 + }, + { + "epoch": 0.04, + "global_step": 5694, + "learning_rate": 0.00047707011686143574, + "loss": 1.7071, + "loss_base2": 2.4628, + "loss_pixel": 0.1805, + "loss_text": 1.5267, + "ppl": 5.513, + "step": 5694 + }, + { + "epoch": 0.04, + "global_step": 5695, + "learning_rate": 0.0004770659432387312, + "loss": 1.6936, + "loss_base2": 2.4433, + "loss_pixel": 0.1797, + "loss_text": 1.514, + "ppl": 5.439, + "step": 5695 + }, + { + "epoch": 0.04, + "global_step": 5696, + "learning_rate": 0.0004770617696160267, + "loss": 1.7014, + "loss_base2": 2.4546, + "loss_pixel": 0.1807, + "loss_text": 1.5207, + "ppl": 5.4816, + "step": 5696 + }, + { + "epoch": 0.04, + "global_step": 5697, + "learning_rate": 0.0004770575959933222, + "loss": 1.6898, + "loss_base2": 2.4379, + "loss_pixel": 0.1801, + "loss_text": 1.5097, + "ppl": 5.4184, + "step": 5697 + }, + { + "epoch": 0.04, + "global_step": 5698, + "learning_rate": 0.0004770534223706177, + "loss": 1.6861, + "loss_base2": 2.4325, + "loss_pixel": 0.1803, + "loss_text": 1.5059, + "ppl": 5.3984, + "step": 5698 + }, + { + "epoch": 0.04, + "global_step": 5699, + "learning_rate": 0.0004770492487479132, + "loss": 1.7047, + "loss_base2": 2.4594, + "loss_pixel": 0.1812, + "loss_text": 1.5236, + "ppl": 5.4997, + "step": 5699 + }, + { + "epoch": 0.04, + "global_step": 5700, + "learning_rate": 0.0004770450751252087, + "loss": 1.7102, + "loss_base2": 2.4673, + "loss_pixel": 0.1795, + "loss_text": 1.5308, + "ppl": 5.5301, + "step": 5700 + }, + { + "epoch": 0.04, + "global_step": 5701, + "learning_rate": 0.0004770409015025042, + "loss": 1.6932, + "loss_base2": 2.4428, + "loss_pixel": 0.1812, + "loss_text": 1.512, + "ppl": 5.4369, + "step": 5701 + }, + { + "epoch": 0.04, + "global_step": 5702, + "learning_rate": 0.0004770367278797997, + "loss": 1.6886, + "loss_base2": 2.4361, + "loss_pixel": 0.1811, + "loss_text": 1.5075, + "ppl": 5.4119, + "step": 5702 + }, + { + "epoch": 0.04, + "global_step": 5703, + "learning_rate": 0.0004770325542570952, + "loss": 1.6745, + "loss_base2": 2.4158, + "loss_pixel": 0.1805, + "loss_text": 1.494, + "ppl": 5.3361, + "step": 5703 + }, + { + "epoch": 0.04, + "global_step": 5704, + "learning_rate": 0.00047702838063439065, + "loss": 1.6865, + "loss_base2": 2.4331, + "loss_pixel": 0.1802, + "loss_text": 1.5063, + "ppl": 5.4005, + "step": 5704 + }, + { + "epoch": 0.04, + "global_step": 5705, + "learning_rate": 0.00047702420701168616, + "loss": 1.709, + "loss_base2": 2.4656, + "loss_pixel": 0.1778, + "loss_text": 1.5312, + "ppl": 5.5234, + "step": 5705 + }, + { + "epoch": 0.04, + "global_step": 5706, + "learning_rate": 0.00047702003338898167, + "loss": 1.6836, + "loss_base2": 2.4289, + "loss_pixel": 0.1758, + "loss_text": 1.5078, + "ppl": 5.3849, + "step": 5706 + }, + { + "epoch": 0.04, + "global_step": 5707, + "learning_rate": 0.0004770158597662772, + "loss": 1.6856, + "loss_base2": 2.4318, + "loss_pixel": 0.1754, + "loss_text": 1.5102, + "ppl": 5.3957, + "step": 5707 + }, + { + "epoch": 0.04, + "global_step": 5708, + "learning_rate": 0.00047701168614357263, + "loss": 1.6767, + "loss_base2": 2.419, + "loss_pixel": 0.1733, + "loss_text": 1.5035, + "ppl": 5.3479, + "step": 5708 + }, + { + "epoch": 0.04, + "global_step": 5709, + "learning_rate": 0.0004770075125208681, + "loss": 1.6849, + "loss_base2": 2.4308, + "loss_pixel": 0.1737, + "loss_text": 1.5112, + "ppl": 5.3919, + "step": 5709 + }, + { + "epoch": 0.04, + "global_step": 5710, + "learning_rate": 0.0004770033388981636, + "loss": 1.6714, + "loss_base2": 2.4113, + "loss_pixel": 0.1738, + "loss_text": 1.4976, + "ppl": 5.3196, + "step": 5710 + }, + { + "epoch": 0.04, + "global_step": 5711, + "learning_rate": 0.0004769991652754591, + "loss": 1.6822, + "loss_base2": 2.4269, + "loss_pixel": 0.1735, + "loss_text": 1.5088, + "ppl": 5.3774, + "step": 5711 + }, + { + "epoch": 0.04, + "global_step": 5712, + "learning_rate": 0.0004769949916527546, + "loss": 1.6809, + "loss_base2": 2.425, + "loss_pixel": 0.1731, + "loss_text": 1.5079, + "ppl": 5.3704, + "step": 5712 + }, + { + "epoch": 0.04, + "global_step": 5713, + "learning_rate": 0.00047699081803005006, + "loss": 1.6888, + "loss_base2": 2.4364, + "loss_pixel": 0.1724, + "loss_text": 1.5163, + "ppl": 5.413, + "step": 5713 + }, + { + "epoch": 0.04, + "global_step": 5714, + "learning_rate": 0.00047698664440734556, + "loss": 1.7009, + "loss_base2": 2.4539, + "loss_pixel": 0.1721, + "loss_text": 1.5288, + "ppl": 5.4789, + "step": 5714 + }, + { + "epoch": 0.04, + "global_step": 5715, + "learning_rate": 0.00047698247078464107, + "loss": 1.6997, + "loss_base2": 2.4521, + "loss_pixel": 0.1732, + "loss_text": 1.5265, + "ppl": 5.4723, + "step": 5715 + }, + { + "epoch": 0.04, + "global_step": 5716, + "learning_rate": 0.0004769782971619366, + "loss": 1.6818, + "loss_base2": 2.4263, + "loss_pixel": 0.1697, + "loss_text": 1.5121, + "ppl": 5.3752, + "step": 5716 + }, + { + "epoch": 0.04, + "global_step": 5717, + "learning_rate": 0.0004769741235392321, + "loss": 1.6844, + "loss_base2": 2.4301, + "loss_pixel": 0.171, + "loss_text": 1.5134, + "ppl": 5.3892, + "step": 5717 + }, + { + "epoch": 0.04, + "global_step": 5718, + "learning_rate": 0.00047696994991652754, + "loss": 1.5465, + "loss_base2": 2.2311, + "loss_pixel": 0.1707, + "loss_text": 1.3758, + "ppl": 4.695, + "step": 5718 + }, + { + "epoch": 0.04, + "global_step": 5719, + "learning_rate": 0.00047696577629382305, + "loss": 1.4737, + "loss_base2": 2.1261, + "loss_pixel": 0.1698, + "loss_text": 1.3039, + "ppl": 4.3654, + "step": 5719 + }, + { + "epoch": 0.04, + "global_step": 5720, + "learning_rate": 0.00047696160267111855, + "loss": 1.4803, + "loss_base2": 2.1356, + "loss_pixel": 0.1703, + "loss_text": 1.3101, + "ppl": 4.3943, + "step": 5720 + }, + { + "epoch": 0.04, + "global_step": 5721, + "learning_rate": 0.00047695742904841406, + "loss": 1.4816, + "loss_base2": 2.1375, + "loss_pixel": 0.176, + "loss_text": 1.3055, + "ppl": 4.4, + "step": 5721 + }, + { + "epoch": 0.04, + "global_step": 5722, + "learning_rate": 0.00047695325542570957, + "loss": 1.4923, + "loss_base2": 2.1529, + "loss_pixel": 0.1911, + "loss_text": 1.3012, + "ppl": 4.4473, + "step": 5722 + }, + { + "epoch": 0.04, + "global_step": 5723, + "learning_rate": 0.000476949081803005, + "loss": 1.4951, + "loss_base2": 2.157, + "loss_pixel": 0.1895, + "loss_text": 1.3056, + "ppl": 4.4598, + "step": 5723 + }, + { + "epoch": 0.04, + "global_step": 5724, + "learning_rate": 0.00047694490818030053, + "loss": 1.5039, + "loss_base2": 2.1697, + "loss_pixel": 0.189, + "loss_text": 1.3149, + "ppl": 4.4992, + "step": 5724 + }, + { + "epoch": 0.04, + "global_step": 5725, + "learning_rate": 0.00047694073455759603, + "loss": 1.4995, + "loss_base2": 2.1633, + "loss_pixel": 0.1889, + "loss_text": 1.3106, + "ppl": 4.4794, + "step": 5725 + }, + { + "epoch": 0.04, + "global_step": 5726, + "learning_rate": 0.00047693656093489154, + "loss": 1.5267, + "loss_base2": 2.2026, + "loss_pixel": 0.1869, + "loss_text": 1.3398, + "ppl": 4.603, + "step": 5726 + }, + { + "epoch": 0.04, + "global_step": 5727, + "learning_rate": 0.00047693238731218694, + "loss": 1.7391, + "loss_base2": 2.509, + "loss_pixel": 0.1836, + "loss_text": 1.5555, + "ppl": 5.6922, + "step": 5727 + }, + { + "epoch": 0.04, + "global_step": 5728, + "learning_rate": 0.00047692821368948245, + "loss": 1.7216, + "loss_base2": 2.4837, + "loss_pixel": 0.1814, + "loss_text": 1.5402, + "ppl": 5.5935, + "step": 5728 + }, + { + "epoch": 0.04, + "global_step": 5729, + "learning_rate": 0.00047692404006677796, + "loss": 1.7267, + "loss_base2": 2.4911, + "loss_pixel": 0.182, + "loss_text": 1.5447, + "ppl": 5.6221, + "step": 5729 + }, + { + "epoch": 0.04, + "global_step": 5730, + "learning_rate": 0.00047691986644407346, + "loss": 1.7147, + "loss_base2": 2.4738, + "loss_pixel": 0.18, + "loss_text": 1.5347, + "ppl": 5.555, + "step": 5730 + }, + { + "epoch": 0.04, + "global_step": 5731, + "learning_rate": 0.00047691569282136897, + "loss": 1.7258, + "loss_base2": 2.4898, + "loss_pixel": 0.1815, + "loss_text": 1.5443, + "ppl": 5.617, + "step": 5731 + }, + { + "epoch": 0.04, + "global_step": 5732, + "learning_rate": 0.0004769115191986644, + "loss": 1.7179, + "loss_base2": 2.4784, + "loss_pixel": 0.1833, + "loss_text": 1.5346, + "ppl": 5.5728, + "step": 5732 + }, + { + "epoch": 0.04, + "global_step": 5733, + "learning_rate": 0.00047690734557595993, + "loss": 1.7158, + "loss_base2": 2.4754, + "loss_pixel": 0.1802, + "loss_text": 1.5356, + "ppl": 5.5611, + "step": 5733 + }, + { + "epoch": 0.04, + "global_step": 5734, + "learning_rate": 0.00047690317195325544, + "loss": 1.6942, + "loss_base2": 2.4442, + "loss_pixel": 0.183, + "loss_text": 1.5112, + "ppl": 5.4423, + "step": 5734 + }, + { + "epoch": 0.04, + "global_step": 5735, + "learning_rate": 0.00047689899833055095, + "loss": 1.719, + "loss_base2": 2.48, + "loss_pixel": 0.1797, + "loss_text": 1.5393, + "ppl": 5.5789, + "step": 5735 + }, + { + "epoch": 0.04, + "global_step": 5736, + "learning_rate": 0.0004768948247078464, + "loss": 1.7036, + "loss_base2": 2.4578, + "loss_pixel": 0.1797, + "loss_text": 1.5239, + "ppl": 5.4937, + "step": 5736 + }, + { + "epoch": 0.04, + "global_step": 5737, + "learning_rate": 0.0004768906510851419, + "loss": 1.6913, + "loss_base2": 2.44, + "loss_pixel": 0.1807, + "loss_text": 1.5106, + "ppl": 5.4265, + "step": 5737 + }, + { + "epoch": 0.04, + "global_step": 5738, + "learning_rate": 0.0004768864774624374, + "loss": 1.7095, + "loss_base2": 2.4663, + "loss_pixel": 0.18, + "loss_text": 1.5295, + "ppl": 5.5262, + "step": 5738 + }, + { + "epoch": 0.04, + "global_step": 5739, + "learning_rate": 0.0004768823038397329, + "loss": 1.7037, + "loss_base2": 2.4579, + "loss_pixel": 0.182, + "loss_text": 1.5217, + "ppl": 5.4942, + "step": 5739 + }, + { + "epoch": 0.04, + "global_step": 5740, + "learning_rate": 0.00047687813021702843, + "loss": 1.703, + "loss_base2": 2.4569, + "loss_pixel": 0.1791, + "loss_text": 1.5239, + "ppl": 5.4904, + "step": 5740 + }, + { + "epoch": 0.04, + "global_step": 5741, + "learning_rate": 0.0004768739565943239, + "loss": 1.7174, + "loss_base2": 2.4777, + "loss_pixel": 0.1801, + "loss_text": 1.5374, + "ppl": 5.57, + "step": 5741 + }, + { + "epoch": 0.04, + "global_step": 5742, + "learning_rate": 0.0004768697829716194, + "loss": 1.7199, + "loss_base2": 2.4813, + "loss_pixel": 0.1806, + "loss_text": 1.5393, + "ppl": 5.584, + "step": 5742 + }, + { + "epoch": 0.04, + "global_step": 5743, + "learning_rate": 0.0004768656093489149, + "loss": 1.6946, + "loss_base2": 2.4448, + "loss_pixel": 0.1824, + "loss_text": 1.5122, + "ppl": 5.4445, + "step": 5743 + }, + { + "epoch": 0.04, + "global_step": 5744, + "learning_rate": 0.0004768614357262104, + "loss": 1.7218, + "loss_base2": 2.484, + "loss_pixel": 0.1792, + "loss_text": 1.5425, + "ppl": 5.5946, + "step": 5744 + }, + { + "epoch": 0.04, + "global_step": 5745, + "learning_rate": 0.00047685726210350586, + "loss": 1.7067, + "loss_base2": 2.4622, + "loss_pixel": 0.1795, + "loss_text": 1.5271, + "ppl": 5.5107, + "step": 5745 + }, + { + "epoch": 0.04, + "global_step": 5746, + "learning_rate": 0.0004768530884808013, + "loss": 1.7007, + "loss_base2": 2.4536, + "loss_pixel": 0.1805, + "loss_text": 1.5202, + "ppl": 5.4778, + "step": 5746 + }, + { + "epoch": 0.04, + "global_step": 5747, + "learning_rate": 0.0004768489148580968, + "loss": 1.7111, + "loss_base2": 2.4686, + "loss_pixel": 0.1806, + "loss_text": 1.5305, + "ppl": 5.535, + "step": 5747 + }, + { + "epoch": 0.04, + "global_step": 5748, + "learning_rate": 0.0004768447412353923, + "loss": 1.5246, + "loss_base2": 2.1995, + "loss_pixel": 0.1795, + "loss_text": 1.3451, + "ppl": 4.5933, + "step": 5748 + }, + { + "epoch": 0.04, + "global_step": 5749, + "learning_rate": 0.00047684056761268783, + "loss": 1.4868, + "loss_base2": 2.145, + "loss_pixel": 0.1804, + "loss_text": 1.3064, + "ppl": 4.4229, + "step": 5749 + }, + { + "epoch": 0.04, + "global_step": 5750, + "learning_rate": 0.0004768363939899833, + "loss": 1.492, + "loss_base2": 2.1525, + "loss_pixel": 0.1797, + "loss_text": 1.3123, + "ppl": 4.446, + "step": 5750 + }, + { + "epoch": 0.04, + "global_step": 5751, + "learning_rate": 0.0004768322203672788, + "loss": 1.4961, + "loss_base2": 2.1584, + "loss_pixel": 0.1807, + "loss_text": 1.3154, + "ppl": 4.4642, + "step": 5751 + }, + { + "epoch": 0.04, + "global_step": 5752, + "learning_rate": 0.0004768280467445743, + "loss": 1.4952, + "loss_base2": 2.1571, + "loss_pixel": 0.1791, + "loss_text": 1.3161, + "ppl": 4.4602, + "step": 5752 + }, + { + "epoch": 0.04, + "global_step": 5753, + "learning_rate": 0.0004768238731218698, + "loss": 1.4831, + "loss_base2": 2.1397, + "loss_pixel": 0.179, + "loss_text": 1.3041, + "ppl": 4.4066, + "step": 5753 + }, + { + "epoch": 0.04, + "global_step": 5754, + "learning_rate": 0.00047681969949916526, + "loss": 1.4859, + "loss_base2": 2.1437, + "loss_pixel": 0.18, + "loss_text": 1.3059, + "ppl": 4.4189, + "step": 5754 + }, + { + "epoch": 0.04, + "global_step": 5755, + "learning_rate": 0.00047681552587646077, + "loss": 1.4653, + "loss_base2": 2.114, + "loss_pixel": 0.179, + "loss_text": 1.2862, + "ppl": 4.3288, + "step": 5755 + }, + { + "epoch": 0.04, + "global_step": 5756, + "learning_rate": 0.0004768113522537563, + "loss": 1.4875, + "loss_base2": 2.146, + "loss_pixel": 0.1794, + "loss_text": 1.3082, + "ppl": 4.426, + "step": 5756 + }, + { + "epoch": 0.04, + "global_step": 5757, + "learning_rate": 0.0004768071786310518, + "loss": 1.7041, + "loss_base2": 2.4585, + "loss_pixel": 0.1785, + "loss_text": 1.5256, + "ppl": 5.4964, + "step": 5757 + }, + { + "epoch": 0.04, + "global_step": 5758, + "learning_rate": 0.0004768030050083473, + "loss": 1.7107, + "loss_base2": 2.468, + "loss_pixel": 0.1797, + "loss_text": 1.531, + "ppl": 5.5328, + "step": 5758 + }, + { + "epoch": 0.04, + "global_step": 5759, + "learning_rate": 0.00047679883138564274, + "loss": 1.7144, + "loss_base2": 2.4734, + "loss_pixel": 0.1786, + "loss_text": 1.5359, + "ppl": 5.5533, + "step": 5759 + }, + { + "epoch": 0.04, + "global_step": 5760, + "learning_rate": 0.00047679465776293825, + "loss": 1.7154, + "loss_base2": 2.4748, + "loss_pixel": 0.1795, + "loss_text": 1.536, + "ppl": 5.5589, + "step": 5760 + }, + { + "epoch": 0.04, + "global_step": 5761, + "learning_rate": 0.00047679048414023376, + "loss": 1.7139, + "loss_base2": 2.4726, + "loss_pixel": 0.1785, + "loss_text": 1.5354, + "ppl": 5.5506, + "step": 5761 + }, + { + "epoch": 0.04, + "global_step": 5762, + "learning_rate": 0.00047678631051752926, + "loss": 1.7126, + "loss_base2": 2.4708, + "loss_pixel": 0.1782, + "loss_text": 1.5343, + "ppl": 5.5434, + "step": 5762 + }, + { + "epoch": 0.04, + "global_step": 5763, + "learning_rate": 0.0004767821368948247, + "loss": 1.7134, + "loss_base2": 2.4719, + "loss_pixel": 0.1794, + "loss_text": 1.534, + "ppl": 5.5478, + "step": 5763 + }, + { + "epoch": 0.04, + "global_step": 5764, + "learning_rate": 0.00047677796327212017, + "loss": 1.7084, + "loss_base2": 2.4647, + "loss_pixel": 0.1789, + "loss_text": 1.5295, + "ppl": 5.5201, + "step": 5764 + }, + { + "epoch": 0.04, + "global_step": 5765, + "learning_rate": 0.0004767737896494157, + "loss": 1.6871, + "loss_base2": 2.434, + "loss_pixel": 0.1794, + "loss_text": 1.5077, + "ppl": 5.4038, + "step": 5765 + }, + { + "epoch": 0.04, + "global_step": 5766, + "learning_rate": 0.0004767696160267112, + "loss": 1.6967, + "loss_base2": 2.4478, + "loss_pixel": 0.1796, + "loss_text": 1.5171, + "ppl": 5.4559, + "step": 5766 + }, + { + "epoch": 0.04, + "global_step": 5767, + "learning_rate": 0.0004767654424040067, + "loss": 1.701, + "loss_base2": 2.454, + "loss_pixel": 0.1782, + "loss_text": 1.5228, + "ppl": 5.4794, + "step": 5767 + }, + { + "epoch": 0.04, + "global_step": 5768, + "learning_rate": 0.00047676126878130214, + "loss": 1.7009, + "loss_base2": 2.4539, + "loss_pixel": 0.1775, + "loss_text": 1.5234, + "ppl": 5.4789, + "step": 5768 + }, + { + "epoch": 0.04, + "global_step": 5769, + "learning_rate": 0.00047675709515859765, + "loss": 1.709, + "loss_base2": 2.4656, + "loss_pixel": 0.1799, + "loss_text": 1.5291, + "ppl": 5.5234, + "step": 5769 + }, + { + "epoch": 0.04, + "global_step": 5770, + "learning_rate": 0.00047675292153589316, + "loss": 1.7126, + "loss_base2": 2.4708, + "loss_pixel": 0.1786, + "loss_text": 1.534, + "ppl": 5.5434, + "step": 5770 + }, + { + "epoch": 0.04, + "global_step": 5771, + "learning_rate": 0.00047674874791318867, + "loss": 1.6833, + "loss_base2": 2.4285, + "loss_pixel": 0.179, + "loss_text": 1.5043, + "ppl": 5.3833, + "step": 5771 + }, + { + "epoch": 0.04, + "global_step": 5772, + "learning_rate": 0.0004767445742904841, + "loss": 1.7103, + "loss_base2": 2.4674, + "loss_pixel": 0.1797, + "loss_text": 1.5306, + "ppl": 5.5306, + "step": 5772 + }, + { + "epoch": 0.04, + "global_step": 5773, + "learning_rate": 0.0004767404006677796, + "loss": 1.7053, + "loss_base2": 2.4602, + "loss_pixel": 0.1799, + "loss_text": 1.5254, + "ppl": 5.503, + "step": 5773 + }, + { + "epoch": 0.04, + "global_step": 5774, + "learning_rate": 0.00047673622704507513, + "loss": 1.7117, + "loss_base2": 2.4695, + "loss_pixel": 0.1801, + "loss_text": 1.5317, + "ppl": 5.5384, + "step": 5774 + }, + { + "epoch": 0.04, + "global_step": 5775, + "learning_rate": 0.00047673205342237064, + "loss": 1.7149, + "loss_base2": 2.4741, + "loss_pixel": 0.1794, + "loss_text": 1.5355, + "ppl": 5.5561, + "step": 5775 + }, + { + "epoch": 0.04, + "global_step": 5776, + "learning_rate": 0.00047672787979966615, + "loss": 1.6788, + "loss_base2": 2.422, + "loss_pixel": 0.1793, + "loss_text": 1.4995, + "ppl": 5.3591, + "step": 5776 + }, + { + "epoch": 0.04, + "global_step": 5777, + "learning_rate": 0.0004767237061769616, + "loss": 1.6953, + "loss_base2": 2.4458, + "loss_pixel": 0.1798, + "loss_text": 1.5156, + "ppl": 5.4483, + "step": 5777 + }, + { + "epoch": 0.04, + "global_step": 5778, + "learning_rate": 0.0004767195325542571, + "loss": 1.7031, + "loss_base2": 2.4571, + "loss_pixel": 0.1801, + "loss_text": 1.5229, + "ppl": 5.4909, + "step": 5778 + }, + { + "epoch": 0.04, + "global_step": 5779, + "learning_rate": 0.0004767153589315526, + "loss": 1.6994, + "loss_base2": 2.4517, + "loss_pixel": 0.1783, + "loss_text": 1.5211, + "ppl": 5.4707, + "step": 5779 + }, + { + "epoch": 0.04, + "global_step": 5780, + "learning_rate": 0.0004767111853088481, + "loss": 1.685, + "loss_base2": 2.4309, + "loss_pixel": 0.1794, + "loss_text": 1.5056, + "ppl": 5.3925, + "step": 5780 + }, + { + "epoch": 0.04, + "global_step": 5781, + "learning_rate": 0.00047670701168614363, + "loss": 1.7022, + "loss_base2": 2.4558, + "loss_pixel": 0.1808, + "loss_text": 1.5214, + "ppl": 5.486, + "step": 5781 + }, + { + "epoch": 0.04, + "global_step": 5782, + "learning_rate": 0.0004767028380634391, + "loss": 1.6916, + "loss_base2": 2.4405, + "loss_pixel": 0.179, + "loss_text": 1.5125, + "ppl": 5.4282, + "step": 5782 + }, + { + "epoch": 0.04, + "global_step": 5783, + "learning_rate": 0.00047669866444073454, + "loss": 1.6878, + "loss_base2": 2.435, + "loss_pixel": 0.1793, + "loss_text": 1.5085, + "ppl": 5.4076, + "step": 5783 + }, + { + "epoch": 0.04, + "global_step": 5784, + "learning_rate": 0.00047669449081803004, + "loss": 1.6915, + "loss_base2": 2.4403, + "loss_pixel": 0.1784, + "loss_text": 1.5131, + "ppl": 5.4276, + "step": 5784 + }, + { + "epoch": 0.04, + "global_step": 5785, + "learning_rate": 0.00047669031719532555, + "loss": 1.6867, + "loss_base2": 2.4334, + "loss_pixel": 0.1784, + "loss_text": 1.5083, + "ppl": 5.4016, + "step": 5785 + }, + { + "epoch": 0.04, + "global_step": 5786, + "learning_rate": 0.000476686143572621, + "loss": 1.6992, + "loss_base2": 2.4514, + "loss_pixel": 0.177, + "loss_text": 1.5222, + "ppl": 5.4696, + "step": 5786 + }, + { + "epoch": 0.04, + "global_step": 5787, + "learning_rate": 0.0004766819699499165, + "loss": 1.7004, + "loss_base2": 2.4532, + "loss_pixel": 0.1786, + "loss_text": 1.5218, + "ppl": 5.4761, + "step": 5787 + }, + { + "epoch": 0.04, + "global_step": 5788, + "learning_rate": 0.000476677796327212, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.1801, + "loss_text": 1.488, + "ppl": 5.3021, + "step": 5788 + }, + { + "epoch": 0.04, + "global_step": 5789, + "learning_rate": 0.00047667362270450753, + "loss": 1.7047, + "loss_base2": 2.4594, + "loss_pixel": 0.1793, + "loss_text": 1.5254, + "ppl": 5.4997, + "step": 5789 + }, + { + "epoch": 0.04, + "global_step": 5790, + "learning_rate": 0.00047666944908180303, + "loss": 1.6852, + "loss_base2": 2.4312, + "loss_pixel": 0.1785, + "loss_text": 1.5067, + "ppl": 5.3935, + "step": 5790 + }, + { + "epoch": 0.04, + "global_step": 5791, + "learning_rate": 0.0004766652754590985, + "loss": 1.7105, + "loss_base2": 2.4677, + "loss_pixel": 0.1784, + "loss_text": 1.5321, + "ppl": 5.5317, + "step": 5791 + }, + { + "epoch": 0.04, + "global_step": 5792, + "learning_rate": 0.000476661101836394, + "loss": 1.6989, + "loss_base2": 2.451, + "loss_pixel": 0.1787, + "loss_text": 1.5202, + "ppl": 5.4679, + "step": 5792 + }, + { + "epoch": 0.04, + "global_step": 5793, + "learning_rate": 0.0004766569282136895, + "loss": 1.6868, + "loss_base2": 2.4335, + "loss_pixel": 0.18, + "loss_text": 1.5068, + "ppl": 5.4022, + "step": 5793 + }, + { + "epoch": 0.04, + "global_step": 5794, + "learning_rate": 0.000476652754590985, + "loss": 1.663, + "loss_base2": 2.3992, + "loss_pixel": 0.1792, + "loss_text": 1.4838, + "ppl": 5.2751, + "step": 5794 + }, + { + "epoch": 0.04, + "global_step": 5795, + "learning_rate": 0.00047664858096828046, + "loss": 1.6763, + "loss_base2": 2.4184, + "loss_pixel": 0.177, + "loss_text": 1.4993, + "ppl": 5.3457, + "step": 5795 + }, + { + "epoch": 0.04, + "global_step": 5796, + "learning_rate": 0.00047664440734557597, + "loss": 1.6934, + "loss_base2": 2.4431, + "loss_pixel": 0.179, + "loss_text": 1.5143, + "ppl": 5.4379, + "step": 5796 + }, + { + "epoch": 0.04, + "global_step": 5797, + "learning_rate": 0.0004766402337228715, + "loss": 1.6896, + "loss_base2": 2.4376, + "loss_pixel": 0.1789, + "loss_text": 1.5107, + "ppl": 5.4173, + "step": 5797 + }, + { + "epoch": 0.04, + "global_step": 5798, + "learning_rate": 0.000476636060100167, + "loss": 1.687, + "loss_base2": 2.4338, + "loss_pixel": 0.1785, + "loss_text": 1.5085, + "ppl": 5.4032, + "step": 5798 + }, + { + "epoch": 0.04, + "global_step": 5799, + "learning_rate": 0.0004766318864774625, + "loss": 1.666, + "loss_base2": 2.4035, + "loss_pixel": 0.1782, + "loss_text": 1.4878, + "ppl": 5.291, + "step": 5799 + }, + { + "epoch": 0.04, + "global_step": 5800, + "learning_rate": 0.00047662771285475795, + "loss": 1.6665, + "loss_base2": 2.4043, + "loss_pixel": 0.1781, + "loss_text": 1.4885, + "ppl": 5.2936, + "step": 5800 + }, + { + "epoch": 0.04, + "global_step": 5801, + "learning_rate": 0.00047662353923205345, + "loss": 1.689, + "loss_base2": 2.4367, + "loss_pixel": 0.1786, + "loss_text": 1.5104, + "ppl": 5.4141, + "step": 5801 + }, + { + "epoch": 0.04, + "global_step": 5802, + "learning_rate": 0.0004766193656093489, + "loss": 1.6737, + "loss_base2": 2.4146, + "loss_pixel": 0.179, + "loss_text": 1.4947, + "ppl": 5.3319, + "step": 5802 + }, + { + "epoch": 0.04, + "global_step": 5803, + "learning_rate": 0.0004766151919866444, + "loss": 1.6965, + "loss_base2": 2.4475, + "loss_pixel": 0.1779, + "loss_text": 1.5185, + "ppl": 5.4548, + "step": 5803 + }, + { + "epoch": 0.04, + "global_step": 5804, + "learning_rate": 0.00047661101836393987, + "loss": 1.687, + "loss_base2": 2.4338, + "loss_pixel": 0.1794, + "loss_text": 1.5075, + "ppl": 5.4032, + "step": 5804 + }, + { + "epoch": 0.04, + "global_step": 5805, + "learning_rate": 0.0004766068447412354, + "loss": 1.5261, + "loss_base2": 2.2017, + "loss_pixel": 0.1797, + "loss_text": 1.3464, + "ppl": 4.6002, + "step": 5805 + }, + { + "epoch": 0.04, + "global_step": 5806, + "learning_rate": 0.0004766026711185309, + "loss": 1.5063, + "loss_base2": 2.1731, + "loss_pixel": 0.1805, + "loss_text": 1.3258, + "ppl": 4.51, + "step": 5806 + }, + { + "epoch": 0.04, + "global_step": 5807, + "learning_rate": 0.0004765984974958264, + "loss": 1.4919, + "loss_base2": 2.1524, + "loss_pixel": 0.1774, + "loss_text": 1.3145, + "ppl": 4.4455, + "step": 5807 + }, + { + "epoch": 0.04, + "global_step": 5808, + "learning_rate": 0.0004765943238731219, + "loss": 1.4868, + "loss_base2": 2.145, + "loss_pixel": 0.1782, + "loss_text": 1.3087, + "ppl": 4.4229, + "step": 5808 + }, + { + "epoch": 0.04, + "global_step": 5809, + "learning_rate": 0.00047659015025041735, + "loss": 1.4721, + "loss_base2": 2.1238, + "loss_pixel": 0.1778, + "loss_text": 1.2942, + "ppl": 4.3584, + "step": 5809 + }, + { + "epoch": 0.04, + "global_step": 5810, + "learning_rate": 0.00047658597662771286, + "loss": 1.489, + "loss_base2": 2.1482, + "loss_pixel": 0.179, + "loss_text": 1.31, + "ppl": 4.4327, + "step": 5810 + }, + { + "epoch": 0.04, + "global_step": 5811, + "learning_rate": 0.00047658180300500836, + "loss": 1.4461, + "loss_base2": 2.0863, + "loss_pixel": 0.1786, + "loss_text": 1.2675, + "ppl": 4.2465, + "step": 5811 + }, + { + "epoch": 0.04, + "global_step": 5812, + "learning_rate": 0.00047657762938230387, + "loss": 1.4825, + "loss_base2": 2.1388, + "loss_pixel": 0.1825, + "loss_text": 1.3, + "ppl": 4.4039, + "step": 5812 + }, + { + "epoch": 0.04, + "global_step": 5813, + "learning_rate": 0.0004765734557595993, + "loss": 1.5004, + "loss_base2": 2.1646, + "loss_pixel": 0.1784, + "loss_text": 1.322, + "ppl": 4.4835, + "step": 5813 + }, + { + "epoch": 0.04, + "global_step": 5814, + "learning_rate": 0.00047656928213689483, + "loss": 1.6983, + "loss_base2": 2.4501, + "loss_pixel": 0.1761, + "loss_text": 1.5222, + "ppl": 5.4646, + "step": 5814 + }, + { + "epoch": 0.04, + "global_step": 5815, + "learning_rate": 0.00047656510851419034, + "loss": 1.7091, + "loss_base2": 2.4657, + "loss_pixel": 0.1785, + "loss_text": 1.5306, + "ppl": 5.524, + "step": 5815 + }, + { + "epoch": 0.04, + "global_step": 5816, + "learning_rate": 0.00047656093489148585, + "loss": 1.726, + "loss_base2": 2.4901, + "loss_pixel": 0.1784, + "loss_text": 1.5475, + "ppl": 5.6181, + "step": 5816 + }, + { + "epoch": 0.04, + "global_step": 5817, + "learning_rate": 0.00047655676126878135, + "loss": 1.7162, + "loss_base2": 2.476, + "loss_pixel": 0.1772, + "loss_text": 1.539, + "ppl": 5.5633, + "step": 5817 + }, + { + "epoch": 0.04, + "global_step": 5818, + "learning_rate": 0.0004765525876460768, + "loss": 1.6968, + "loss_base2": 2.448, + "loss_pixel": 0.1773, + "loss_text": 1.5195, + "ppl": 5.4565, + "step": 5818 + }, + { + "epoch": 0.04, + "global_step": 5819, + "learning_rate": 0.0004765484140233723, + "loss": 1.7084, + "loss_base2": 2.4647, + "loss_pixel": 0.1794, + "loss_text": 1.5289, + "ppl": 5.5201, + "step": 5819 + }, + { + "epoch": 0.04, + "global_step": 5820, + "learning_rate": 0.0004765442404006678, + "loss": 1.7063, + "loss_base2": 2.4617, + "loss_pixel": 0.18, + "loss_text": 1.5262, + "ppl": 5.5085, + "step": 5820 + }, + { + "epoch": 0.04, + "global_step": 5821, + "learning_rate": 0.0004765400667779633, + "loss": 1.6804, + "loss_base2": 2.4243, + "loss_pixel": 0.1777, + "loss_text": 1.5027, + "ppl": 5.3677, + "step": 5821 + }, + { + "epoch": 0.04, + "global_step": 5822, + "learning_rate": 0.0004765358931552587, + "loss": 1.6845, + "loss_base2": 2.4302, + "loss_pixel": 0.1778, + "loss_text": 1.5067, + "ppl": 5.3898, + "step": 5822 + }, + { + "epoch": 0.04, + "global_step": 5823, + "learning_rate": 0.00047653171953255423, + "loss": 1.7047, + "loss_base2": 2.4594, + "loss_pixel": 0.1786, + "loss_text": 1.5261, + "ppl": 5.4997, + "step": 5823 + }, + { + "epoch": 0.04, + "global_step": 5824, + "learning_rate": 0.00047652754590984974, + "loss": 1.6795, + "loss_base2": 2.423, + "loss_pixel": 0.1792, + "loss_text": 1.5003, + "ppl": 5.3629, + "step": 5824 + }, + { + "epoch": 0.04, + "global_step": 5825, + "learning_rate": 0.00047652337228714525, + "loss": 1.7065, + "loss_base2": 2.462, + "loss_pixel": 0.1787, + "loss_text": 1.5278, + "ppl": 5.5096, + "step": 5825 + }, + { + "epoch": 0.04, + "global_step": 5826, + "learning_rate": 0.00047651919866444076, + "loss": 1.6934, + "loss_base2": 2.4431, + "loss_pixel": 0.1785, + "loss_text": 1.5149, + "ppl": 5.4379, + "step": 5826 + }, + { + "epoch": 0.04, + "global_step": 5827, + "learning_rate": 0.0004765150250417362, + "loss": 1.7167, + "loss_base2": 2.4767, + "loss_pixel": 0.1801, + "loss_text": 1.5366, + "ppl": 5.5661, + "step": 5827 + }, + { + "epoch": 0.04, + "global_step": 5828, + "learning_rate": 0.0004765108514190317, + "loss": 1.6891, + "loss_base2": 2.4369, + "loss_pixel": 0.1775, + "loss_text": 1.5116, + "ppl": 5.4146, + "step": 5828 + }, + { + "epoch": 0.04, + "global_step": 5829, + "learning_rate": 0.0004765066777963272, + "loss": 1.6941, + "loss_base2": 2.4441, + "loss_pixel": 0.1784, + "loss_text": 1.5158, + "ppl": 5.4417, + "step": 5829 + }, + { + "epoch": 0.04, + "global_step": 5830, + "learning_rate": 0.00047650250417362273, + "loss": 1.7037, + "loss_base2": 2.4579, + "loss_pixel": 0.1785, + "loss_text": 1.5252, + "ppl": 5.4942, + "step": 5830 + }, + { + "epoch": 0.04, + "global_step": 5831, + "learning_rate": 0.0004764983305509182, + "loss": 1.693, + "loss_base2": 2.4425, + "loss_pixel": 0.1779, + "loss_text": 1.5151, + "ppl": 5.4358, + "step": 5831 + }, + { + "epoch": 0.04, + "global_step": 5832, + "learning_rate": 0.0004764941569282137, + "loss": 1.6964, + "loss_base2": 2.4474, + "loss_pixel": 0.1783, + "loss_text": 1.5181, + "ppl": 5.4543, + "step": 5832 + }, + { + "epoch": 0.04, + "global_step": 5833, + "learning_rate": 0.0004764899833055092, + "loss": 1.6983, + "loss_base2": 2.4501, + "loss_pixel": 0.1779, + "loss_text": 1.5204, + "ppl": 5.4646, + "step": 5833 + }, + { + "epoch": 0.04, + "global_step": 5834, + "learning_rate": 0.0004764858096828047, + "loss": 1.6918, + "loss_base2": 2.4408, + "loss_pixel": 0.1787, + "loss_text": 1.5132, + "ppl": 5.4292, + "step": 5834 + }, + { + "epoch": 0.04, + "global_step": 5835, + "learning_rate": 0.0004764816360601002, + "loss": 1.709, + "loss_base2": 2.4656, + "loss_pixel": 0.1787, + "loss_text": 1.5303, + "ppl": 5.5234, + "step": 5835 + }, + { + "epoch": 0.04, + "global_step": 5836, + "learning_rate": 0.00047647746243739567, + "loss": 1.6891, + "loss_base2": 2.4369, + "loss_pixel": 0.1784, + "loss_text": 1.5106, + "ppl": 5.4146, + "step": 5836 + }, + { + "epoch": 0.04, + "global_step": 5837, + "learning_rate": 0.0004764732888146912, + "loss": 1.6915, + "loss_base2": 2.4403, + "loss_pixel": 0.1793, + "loss_text": 1.5122, + "ppl": 5.4276, + "step": 5837 + }, + { + "epoch": 0.04, + "global_step": 5838, + "learning_rate": 0.0004764691151919867, + "loss": 1.7038, + "loss_base2": 2.4581, + "loss_pixel": 0.1779, + "loss_text": 1.5258, + "ppl": 5.4948, + "step": 5838 + }, + { + "epoch": 0.04, + "global_step": 5839, + "learning_rate": 0.0004764649415692822, + "loss": 1.647, + "loss_base2": 2.3761, + "loss_pixel": 0.1783, + "loss_text": 1.4688, + "ppl": 5.1914, + "step": 5839 + }, + { + "epoch": 0.04, + "global_step": 5840, + "learning_rate": 0.00047646076794657764, + "loss": 1.4982, + "loss_base2": 2.1614, + "loss_pixel": 0.1781, + "loss_text": 1.3202, + "ppl": 4.4736, + "step": 5840 + }, + { + "epoch": 0.04, + "global_step": 5841, + "learning_rate": 0.0004764565943238731, + "loss": 1.4954, + "loss_base2": 2.1574, + "loss_pixel": 0.1787, + "loss_text": 1.3166, + "ppl": 4.4611, + "step": 5841 + }, + { + "epoch": 0.04, + "global_step": 5842, + "learning_rate": 0.0004764524207011686, + "loss": 1.4856, + "loss_base2": 2.1433, + "loss_pixel": 0.1785, + "loss_text": 1.307, + "ppl": 4.4176, + "step": 5842 + }, + { + "epoch": 0.04, + "global_step": 5843, + "learning_rate": 0.0004764482470784641, + "loss": 1.4845, + "loss_base2": 2.1417, + "loss_pixel": 0.1779, + "loss_text": 1.3065, + "ppl": 4.4128, + "step": 5843 + }, + { + "epoch": 0.04, + "global_step": 5844, + "learning_rate": 0.0004764440734557596, + "loss": 1.4775, + "loss_base2": 2.1316, + "loss_pixel": 0.1777, + "loss_text": 1.2998, + "ppl": 4.382, + "step": 5844 + }, + { + "epoch": 0.04, + "global_step": 5845, + "learning_rate": 0.00047643989983305507, + "loss": 1.4802, + "loss_base2": 2.1355, + "loss_pixel": 0.1794, + "loss_text": 1.3008, + "ppl": 4.3938, + "step": 5845 + }, + { + "epoch": 0.04, + "global_step": 5846, + "learning_rate": 0.0004764357262103506, + "loss": 1.4742, + "loss_base2": 2.1268, + "loss_pixel": 0.1788, + "loss_text": 1.2954, + "ppl": 4.3675, + "step": 5846 + }, + { + "epoch": 0.04, + "global_step": 5847, + "learning_rate": 0.0004764315525876461, + "loss": 1.4761, + "loss_base2": 2.1296, + "loss_pixel": 0.1791, + "loss_text": 1.297, + "ppl": 4.3758, + "step": 5847 + }, + { + "epoch": 0.04, + "global_step": 5848, + "learning_rate": 0.0004764273789649416, + "loss": 1.4617, + "loss_base2": 2.1088, + "loss_pixel": 0.1807, + "loss_text": 1.2809, + "ppl": 4.3133, + "step": 5848 + }, + { + "epoch": 0.04, + "global_step": 5849, + "learning_rate": 0.0004764232053422371, + "loss": 1.4621, + "loss_base2": 2.1094, + "loss_pixel": 0.1775, + "loss_text": 1.2846, + "ppl": 4.315, + "step": 5849 + }, + { + "epoch": 0.04, + "global_step": 5850, + "learning_rate": 0.00047641903171953255, + "loss": 1.4636, + "loss_base2": 2.1115, + "loss_pixel": 0.1788, + "loss_text": 1.2848, + "ppl": 4.3215, + "step": 5850 + }, + { + "epoch": 0.04, + "global_step": 5851, + "learning_rate": 0.00047641485809682806, + "loss": 1.4696, + "loss_base2": 2.1202, + "loss_pixel": 0.1809, + "loss_text": 1.2887, + "ppl": 4.3475, + "step": 5851 + }, + { + "epoch": 0.04, + "global_step": 5852, + "learning_rate": 0.00047641068447412357, + "loss": 1.477, + "loss_base2": 2.1309, + "loss_pixel": 0.1795, + "loss_text": 1.2975, + "ppl": 4.3798, + "step": 5852 + }, + { + "epoch": 0.04, + "global_step": 5853, + "learning_rate": 0.0004764065108514191, + "loss": 1.4801, + "loss_base2": 2.1353, + "loss_pixel": 0.1797, + "loss_text": 1.3004, + "ppl": 4.3934, + "step": 5853 + }, + { + "epoch": 0.04, + "global_step": 5854, + "learning_rate": 0.00047640233722871453, + "loss": 1.4835, + "loss_base2": 2.1402, + "loss_pixel": 0.1781, + "loss_text": 1.3054, + "ppl": 4.4083, + "step": 5854 + }, + { + "epoch": 0.04, + "global_step": 5855, + "learning_rate": 0.00047639816360601003, + "loss": 1.4492, + "loss_base2": 2.0908, + "loss_pixel": 0.1794, + "loss_text": 1.2699, + "ppl": 4.2597, + "step": 5855 + }, + { + "epoch": 0.04, + "global_step": 5856, + "learning_rate": 0.00047639398998330554, + "loss": 1.4856, + "loss_base2": 2.1433, + "loss_pixel": 0.1777, + "loss_text": 1.3079, + "ppl": 4.4176, + "step": 5856 + }, + { + "epoch": 0.04, + "global_step": 5857, + "learning_rate": 0.00047638981636060105, + "loss": 1.4753, + "loss_base2": 2.1284, + "loss_pixel": 0.1784, + "loss_text": 1.2969, + "ppl": 4.3723, + "step": 5857 + }, + { + "epoch": 0.04, + "global_step": 5858, + "learning_rate": 0.00047638564273789656, + "loss": 1.4698, + "loss_base2": 2.1205, + "loss_pixel": 0.1777, + "loss_text": 1.2921, + "ppl": 4.3484, + "step": 5858 + }, + { + "epoch": 0.04, + "global_step": 5859, + "learning_rate": 0.00047638146911519196, + "loss": 1.4742, + "loss_base2": 2.1268, + "loss_pixel": 0.1795, + "loss_text": 1.2948, + "ppl": 4.3675, + "step": 5859 + }, + { + "epoch": 0.04, + "global_step": 5860, + "learning_rate": 0.00047637729549248746, + "loss": 1.4822, + "loss_base2": 2.1384, + "loss_pixel": 0.1777, + "loss_text": 1.3045, + "ppl": 4.4026, + "step": 5860 + }, + { + "epoch": 0.04, + "global_step": 5861, + "learning_rate": 0.00047637312186978297, + "loss": 1.4736, + "loss_base2": 2.126, + "loss_pixel": 0.1798, + "loss_text": 1.2939, + "ppl": 4.3649, + "step": 5861 + }, + { + "epoch": 0.04, + "global_step": 5862, + "learning_rate": 0.0004763689482470785, + "loss": 1.4741, + "loss_base2": 2.1267, + "loss_pixel": 0.1808, + "loss_text": 1.2933, + "ppl": 4.3671, + "step": 5862 + }, + { + "epoch": 0.04, + "global_step": 5863, + "learning_rate": 0.00047636477462437393, + "loss": 1.467, + "loss_base2": 2.1164, + "loss_pixel": 0.1798, + "loss_text": 1.2872, + "ppl": 4.3362, + "step": 5863 + }, + { + "epoch": 0.04, + "global_step": 5864, + "learning_rate": 0.00047636060100166944, + "loss": 1.6665, + "loss_base2": 2.4043, + "loss_pixel": 0.178, + "loss_text": 1.4885, + "ppl": 5.2936, + "step": 5864 + }, + { + "epoch": 0.04, + "global_step": 5865, + "learning_rate": 0.00047635642737896495, + "loss": 1.7384, + "loss_base2": 2.508, + "loss_pixel": 0.1791, + "loss_text": 1.5594, + "ppl": 5.6882, + "step": 5865 + }, + { + "epoch": 0.04, + "global_step": 5866, + "learning_rate": 0.00047635225375626045, + "loss": 1.7165, + "loss_base2": 2.4764, + "loss_pixel": 0.1782, + "loss_text": 1.5384, + "ppl": 5.565, + "step": 5866 + }, + { + "epoch": 0.04, + "global_step": 5867, + "learning_rate": 0.00047634808013355596, + "loss": 1.7259, + "loss_base2": 2.4899, + "loss_pixel": 0.1776, + "loss_text": 1.5483, + "ppl": 5.6176, + "step": 5867 + }, + { + "epoch": 0.04, + "global_step": 5868, + "learning_rate": 0.0004763439065108514, + "loss": 1.7321, + "loss_base2": 2.4989, + "loss_pixel": 0.1792, + "loss_text": 1.553, + "ppl": 5.6525, + "step": 5868 + }, + { + "epoch": 0.04, + "global_step": 5869, + "learning_rate": 0.0004763397328881469, + "loss": 1.7107, + "loss_base2": 2.468, + "loss_pixel": 0.1797, + "loss_text": 1.531, + "ppl": 5.5328, + "step": 5869 + }, + { + "epoch": 0.04, + "global_step": 5870, + "learning_rate": 0.00047633555926544243, + "loss": 1.692, + "loss_base2": 2.441, + "loss_pixel": 0.1787, + "loss_text": 1.5133, + "ppl": 5.4303, + "step": 5870 + }, + { + "epoch": 0.04, + "global_step": 5871, + "learning_rate": 0.00047633138564273793, + "loss": 1.708, + "loss_base2": 2.4641, + "loss_pixel": 0.1762, + "loss_text": 1.5318, + "ppl": 5.5179, + "step": 5871 + }, + { + "epoch": 0.04, + "global_step": 5872, + "learning_rate": 0.0004763272120200334, + "loss": 1.7004, + "loss_base2": 2.4532, + "loss_pixel": 0.178, + "loss_text": 1.5224, + "ppl": 5.4761, + "step": 5872 + }, + { + "epoch": 0.04, + "global_step": 5873, + "learning_rate": 0.0004763230383973289, + "loss": 1.6974, + "loss_base2": 2.4488, + "loss_pixel": 0.1773, + "loss_text": 1.5202, + "ppl": 5.4597, + "step": 5873 + }, + { + "epoch": 0.04, + "global_step": 5874, + "learning_rate": 0.0004763188647746244, + "loss": 1.7114, + "loss_base2": 2.469, + "loss_pixel": 0.1776, + "loss_text": 1.5338, + "ppl": 5.5367, + "step": 5874 + }, + { + "epoch": 0.04, + "global_step": 5875, + "learning_rate": 0.0004763146911519199, + "loss": 1.6965, + "loss_base2": 2.4475, + "loss_pixel": 0.1781, + "loss_text": 1.5184, + "ppl": 5.4548, + "step": 5875 + }, + { + "epoch": 0.04, + "global_step": 5876, + "learning_rate": 0.0004763105175292154, + "loss": 1.7096, + "loss_base2": 2.4664, + "loss_pixel": 0.1781, + "loss_text": 1.5315, + "ppl": 5.5268, + "step": 5876 + }, + { + "epoch": 0.04, + "global_step": 5877, + "learning_rate": 0.0004763063439065108, + "loss": 1.6998, + "loss_base2": 2.4523, + "loss_pixel": 0.1784, + "loss_text": 1.5215, + "ppl": 5.4729, + "step": 5877 + }, + { + "epoch": 0.04, + "global_step": 5878, + "learning_rate": 0.0004763021702838063, + "loss": 1.6979, + "loss_base2": 2.4496, + "loss_pixel": 0.1775, + "loss_text": 1.5204, + "ppl": 5.4625, + "step": 5878 + }, + { + "epoch": 0.04, + "global_step": 5879, + "learning_rate": 0.00047629799666110183, + "loss": 1.6963, + "loss_base2": 2.4472, + "loss_pixel": 0.1785, + "loss_text": 1.5178, + "ppl": 5.4537, + "step": 5879 + }, + { + "epoch": 0.04, + "global_step": 5880, + "learning_rate": 0.00047629382303839734, + "loss": 1.6826, + "loss_base2": 2.4275, + "loss_pixel": 0.1767, + "loss_text": 1.506, + "ppl": 5.3795, + "step": 5880 + }, + { + "epoch": 0.04, + "global_step": 5881, + "learning_rate": 0.0004762896494156928, + "loss": 1.6992, + "loss_base2": 2.4514, + "loss_pixel": 0.1784, + "loss_text": 1.5208, + "ppl": 5.4696, + "step": 5881 + }, + { + "epoch": 0.04, + "global_step": 5882, + "learning_rate": 0.0004762854757929883, + "loss": 1.6903, + "loss_base2": 2.4386, + "loss_pixel": 0.1766, + "loss_text": 1.5137, + "ppl": 5.4211, + "step": 5882 + }, + { + "epoch": 0.04, + "global_step": 5883, + "learning_rate": 0.0004762813021702838, + "loss": 1.7015, + "loss_base2": 2.4547, + "loss_pixel": 0.1769, + "loss_text": 1.5247, + "ppl": 5.4822, + "step": 5883 + }, + { + "epoch": 0.04, + "global_step": 5884, + "learning_rate": 0.0004762771285475793, + "loss": 1.7079, + "loss_base2": 2.464, + "loss_pixel": 0.1776, + "loss_text": 1.5304, + "ppl": 5.5174, + "step": 5884 + }, + { + "epoch": 0.04, + "global_step": 5885, + "learning_rate": 0.0004762729549248748, + "loss": 1.6961, + "loss_base2": 2.447, + "loss_pixel": 0.1784, + "loss_text": 1.5177, + "ppl": 5.4526, + "step": 5885 + }, + { + "epoch": 0.04, + "global_step": 5886, + "learning_rate": 0.0004762687813021703, + "loss": 1.6653, + "loss_base2": 2.4025, + "loss_pixel": 0.1776, + "loss_text": 1.4877, + "ppl": 5.2873, + "step": 5886 + }, + { + "epoch": 0.04, + "global_step": 5887, + "learning_rate": 0.0004762646076794658, + "loss": 1.6995, + "loss_base2": 2.4519, + "loss_pixel": 0.1787, + "loss_text": 1.5208, + "ppl": 5.4712, + "step": 5887 + }, + { + "epoch": 0.04, + "global_step": 5888, + "learning_rate": 0.0004762604340567613, + "loss": 1.7241, + "loss_base2": 2.4874, + "loss_pixel": 0.1788, + "loss_text": 1.5453, + "ppl": 5.6075, + "step": 5888 + }, + { + "epoch": 0.04, + "global_step": 5889, + "learning_rate": 0.0004762562604340568, + "loss": 1.6781, + "loss_base2": 2.421, + "loss_pixel": 0.1773, + "loss_text": 1.5007, + "ppl": 5.3554, + "step": 5889 + }, + { + "epoch": 0.04, + "global_step": 5890, + "learning_rate": 0.00047625208681135225, + "loss": 1.6933, + "loss_base2": 2.4429, + "loss_pixel": 0.1787, + "loss_text": 1.5146, + "ppl": 5.4374, + "step": 5890 + }, + { + "epoch": 0.04, + "global_step": 5891, + "learning_rate": 0.00047624791318864776, + "loss": 1.6942, + "loss_base2": 2.4442, + "loss_pixel": 0.1787, + "loss_text": 1.5155, + "ppl": 5.4423, + "step": 5891 + }, + { + "epoch": 0.04, + "global_step": 5892, + "learning_rate": 0.00047624373956594326, + "loss": 1.6947, + "loss_base2": 2.4449, + "loss_pixel": 0.1784, + "loss_text": 1.5164, + "ppl": 5.445, + "step": 5892 + }, + { + "epoch": 0.04, + "global_step": 5893, + "learning_rate": 0.00047623956594323877, + "loss": 1.6997, + "loss_base2": 2.4521, + "loss_pixel": 0.1778, + "loss_text": 1.5219, + "ppl": 5.4723, + "step": 5893 + }, + { + "epoch": 0.04, + "global_step": 5894, + "learning_rate": 0.0004762353923205343, + "loss": 1.6708, + "loss_base2": 2.4105, + "loss_pixel": 0.1783, + "loss_text": 1.4925, + "ppl": 5.3164, + "step": 5894 + }, + { + "epoch": 0.04, + "global_step": 5895, + "learning_rate": 0.00047623121869782973, + "loss": 1.7023, + "loss_base2": 2.4559, + "loss_pixel": 0.1773, + "loss_text": 1.525, + "ppl": 5.4866, + "step": 5895 + }, + { + "epoch": 0.04, + "global_step": 5896, + "learning_rate": 0.0004762270450751252, + "loss": 1.6779, + "loss_base2": 2.4207, + "loss_pixel": 0.1776, + "loss_text": 1.5003, + "ppl": 5.3543, + "step": 5896 + }, + { + "epoch": 0.04, + "global_step": 5897, + "learning_rate": 0.0004762228714524207, + "loss": 1.6974, + "loss_base2": 2.4488, + "loss_pixel": 0.1767, + "loss_text": 1.5207, + "ppl": 5.4597, + "step": 5897 + }, + { + "epoch": 0.04, + "global_step": 5898, + "learning_rate": 0.0004762186978297162, + "loss": 1.7123, + "loss_base2": 2.4703, + "loss_pixel": 0.1778, + "loss_text": 1.5344, + "ppl": 5.5417, + "step": 5898 + }, + { + "epoch": 0.04, + "global_step": 5899, + "learning_rate": 0.0004762145242070117, + "loss": 1.6932, + "loss_base2": 2.4428, + "loss_pixel": 0.1778, + "loss_text": 1.5154, + "ppl": 5.4369, + "step": 5899 + }, + { + "epoch": 0.04, + "global_step": 5900, + "learning_rate": 0.00047621035058430716, + "loss": 1.7033, + "loss_base2": 2.4573, + "loss_pixel": 0.179, + "loss_text": 1.5243, + "ppl": 5.492, + "step": 5900 + }, + { + "epoch": 0.04, + "global_step": 5901, + "learning_rate": 0.00047620617696160267, + "loss": 1.697, + "loss_base2": 2.4483, + "loss_pixel": 0.1786, + "loss_text": 1.5185, + "ppl": 5.4576, + "step": 5901 + }, + { + "epoch": 0.04, + "global_step": 5902, + "learning_rate": 0.0004762020033388982, + "loss": 1.696, + "loss_base2": 2.4468, + "loss_pixel": 0.1781, + "loss_text": 1.5179, + "ppl": 5.4521, + "step": 5902 + }, + { + "epoch": 0.04, + "global_step": 5903, + "learning_rate": 0.0004761978297161937, + "loss": 1.6839, + "loss_base2": 2.4294, + "loss_pixel": 0.1783, + "loss_text": 1.5056, + "ppl": 5.3865, + "step": 5903 + }, + { + "epoch": 0.04, + "global_step": 5904, + "learning_rate": 0.00047619365609348913, + "loss": 1.6919, + "loss_base2": 2.4409, + "loss_pixel": 0.1783, + "loss_text": 1.5136, + "ppl": 5.4298, + "step": 5904 + }, + { + "epoch": 0.04, + "global_step": 5905, + "learning_rate": 0.00047618948247078464, + "loss": 1.6809, + "loss_base2": 2.425, + "loss_pixel": 0.1768, + "loss_text": 1.5041, + "ppl": 5.3704, + "step": 5905 + }, + { + "epoch": 0.04, + "global_step": 5906, + "learning_rate": 0.00047618530884808015, + "loss": 1.6897, + "loss_base2": 2.4377, + "loss_pixel": 0.1772, + "loss_text": 1.5125, + "ppl": 5.4179, + "step": 5906 + }, + { + "epoch": 0.04, + "global_step": 5907, + "learning_rate": 0.00047618113522537566, + "loss": 1.687, + "loss_base2": 2.4338, + "loss_pixel": 0.1761, + "loss_text": 1.5109, + "ppl": 5.4032, + "step": 5907 + }, + { + "epoch": 0.04, + "global_step": 5908, + "learning_rate": 0.00047617696160267116, + "loss": 1.7013, + "loss_base2": 2.4545, + "loss_pixel": 0.1785, + "loss_text": 1.5228, + "ppl": 5.4811, + "step": 5908 + }, + { + "epoch": 0.04, + "global_step": 5909, + "learning_rate": 0.0004761727879799666, + "loss": 1.6917, + "loss_base2": 2.4406, + "loss_pixel": 0.1774, + "loss_text": 1.5144, + "ppl": 5.4287, + "step": 5909 + }, + { + "epoch": 0.04, + "global_step": 5910, + "learning_rate": 0.0004761686143572621, + "loss": 1.686, + "loss_base2": 2.4324, + "loss_pixel": 0.1775, + "loss_text": 1.5085, + "ppl": 5.3978, + "step": 5910 + }, + { + "epoch": 0.04, + "global_step": 5911, + "learning_rate": 0.00047616444073455763, + "loss": 1.6878, + "loss_base2": 2.435, + "loss_pixel": 0.1766, + "loss_text": 1.5112, + "ppl": 5.4076, + "step": 5911 + }, + { + "epoch": 0.04, + "global_step": 5912, + "learning_rate": 0.00047616026711185314, + "loss": 1.6688, + "loss_base2": 2.4076, + "loss_pixel": 0.1769, + "loss_text": 1.4919, + "ppl": 5.3058, + "step": 5912 + }, + { + "epoch": 0.04, + "global_step": 5913, + "learning_rate": 0.0004761560934891486, + "loss": 1.6769, + "loss_base2": 2.4193, + "loss_pixel": 0.1791, + "loss_text": 1.4978, + "ppl": 5.3489, + "step": 5913 + }, + { + "epoch": 0.04, + "global_step": 5914, + "learning_rate": 0.0004761519198664441, + "loss": 1.6695, + "loss_base2": 2.4086, + "loss_pixel": 0.1794, + "loss_text": 1.4902, + "ppl": 5.3095, + "step": 5914 + }, + { + "epoch": 0.04, + "global_step": 5915, + "learning_rate": 0.00047614774624373955, + "loss": 1.6989, + "loss_base2": 2.451, + "loss_pixel": 0.1773, + "loss_text": 1.5217, + "ppl": 5.4679, + "step": 5915 + }, + { + "epoch": 0.04, + "global_step": 5916, + "learning_rate": 0.00047614357262103506, + "loss": 1.6749, + "loss_base2": 2.4164, + "loss_pixel": 0.1761, + "loss_text": 1.4988, + "ppl": 5.3383, + "step": 5916 + }, + { + "epoch": 0.04, + "global_step": 5917, + "learning_rate": 0.00047613939899833057, + "loss": 1.6916, + "loss_base2": 2.4405, + "loss_pixel": 0.1773, + "loss_text": 1.5144, + "ppl": 5.4282, + "step": 5917 + }, + { + "epoch": 0.04, + "global_step": 5918, + "learning_rate": 0.000476135225375626, + "loss": 1.667, + "loss_base2": 2.405, + "loss_pixel": 0.1769, + "loss_text": 1.4901, + "ppl": 5.2963, + "step": 5918 + }, + { + "epoch": 0.04, + "global_step": 5919, + "learning_rate": 0.00047613105175292153, + "loss": 1.6808, + "loss_base2": 2.4249, + "loss_pixel": 0.1746, + "loss_text": 1.5062, + "ppl": 5.3699, + "step": 5919 + }, + { + "epoch": 0.04, + "global_step": 5920, + "learning_rate": 0.00047612687813021703, + "loss": 1.6991, + "loss_base2": 2.4513, + "loss_pixel": 0.173, + "loss_text": 1.5261, + "ppl": 5.469, + "step": 5920 + }, + { + "epoch": 0.04, + "global_step": 5921, + "learning_rate": 0.00047612270450751254, + "loss": 1.6799, + "loss_base2": 2.4236, + "loss_pixel": 0.1754, + "loss_text": 1.5045, + "ppl": 5.365, + "step": 5921 + }, + { + "epoch": 0.04, + "global_step": 5922, + "learning_rate": 0.000476118530884808, + "loss": 1.6782, + "loss_base2": 2.4211, + "loss_pixel": 0.1748, + "loss_text": 1.5035, + "ppl": 5.3559, + "step": 5922 + }, + { + "epoch": 0.04, + "global_step": 5923, + "learning_rate": 0.0004761143572621035, + "loss": 1.676, + "loss_base2": 2.418, + "loss_pixel": 0.1737, + "loss_text": 1.5023, + "ppl": 5.3441, + "step": 5923 + }, + { + "epoch": 0.04, + "global_step": 5924, + "learning_rate": 0.000476110183639399, + "loss": 1.6807, + "loss_base2": 2.4247, + "loss_pixel": 0.1827, + "loss_text": 1.498, + "ppl": 5.3693, + "step": 5924 + }, + { + "epoch": 0.04, + "global_step": 5925, + "learning_rate": 0.0004761060100166945, + "loss": 1.7304, + "loss_base2": 2.4964, + "loss_pixel": 0.2069, + "loss_text": 1.5235, + "ppl": 5.6429, + "step": 5925 + }, + { + "epoch": 0.04, + "global_step": 5926, + "learning_rate": 0.00047610183639399, + "loss": 1.7627, + "loss_base2": 2.543, + "loss_pixel": 0.2501, + "loss_text": 1.5126, + "ppl": 5.8282, + "step": 5926 + }, + { + "epoch": 0.04, + "global_step": 5927, + "learning_rate": 0.0004760976627712855, + "loss": 1.8273, + "loss_base2": 2.6362, + "loss_pixel": 0.3135, + "loss_text": 1.5138, + "ppl": 6.2171, + "step": 5927 + }, + { + "epoch": 0.04, + "global_step": 5928, + "learning_rate": 0.000476093489148581, + "loss": 1.8491, + "loss_base2": 2.6677, + "loss_pixel": 0.3409, + "loss_text": 1.5082, + "ppl": 6.3541, + "step": 5928 + }, + { + "epoch": 0.04, + "global_step": 5929, + "learning_rate": 0.0004760893155258765, + "loss": 1.8663, + "loss_base2": 2.6925, + "loss_pixel": 0.3444, + "loss_text": 1.5218, + "ppl": 6.4643, + "step": 5929 + }, + { + "epoch": 0.04, + "global_step": 5930, + "learning_rate": 0.000476085141903172, + "loss": 1.8606, + "loss_base2": 2.6843, + "loss_pixel": 0.3471, + "loss_text": 1.5135, + "ppl": 6.4276, + "step": 5930 + }, + { + "epoch": 0.04, + "global_step": 5931, + "learning_rate": 0.00047608096828046745, + "loss": 1.8883, + "loss_base2": 2.7242, + "loss_pixel": 0.3751, + "loss_text": 1.5133, + "ppl": 6.6081, + "step": 5931 + }, + { + "epoch": 0.04, + "global_step": 5932, + "learning_rate": 0.00047607679465776296, + "loss": 1.8913, + "loss_base2": 2.7286, + "loss_pixel": 0.3552, + "loss_text": 1.5361, + "ppl": 6.628, + "step": 5932 + }, + { + "epoch": 0.04, + "global_step": 5933, + "learning_rate": 0.0004760726210350584, + "loss": 1.9302, + "loss_base2": 2.7847, + "loss_pixel": 0.4147, + "loss_text": 1.5154, + "ppl": 6.8909, + "step": 5933 + }, + { + "epoch": 0.04, + "global_step": 5934, + "learning_rate": 0.0004760684474123539, + "loss": 1.918, + "loss_base2": 2.7671, + "loss_pixel": 0.3933, + "loss_text": 1.5247, + "ppl": 6.8073, + "step": 5934 + }, + { + "epoch": 0.04, + "global_step": 5935, + "learning_rate": 0.00047606427378964943, + "loss": 1.9909, + "loss_base2": 2.8723, + "loss_pixel": 0.3932, + "loss_text": 1.5977, + "ppl": 7.3221, + "step": 5935 + }, + { + "epoch": 0.04, + "global_step": 5936, + "learning_rate": 0.0004760601001669449, + "loss": 2.0653, + "loss_base2": 2.9796, + "loss_pixel": 0.3893, + "loss_text": 1.676, + "ppl": 7.8877, + "step": 5936 + }, + { + "epoch": 0.04, + "global_step": 5937, + "learning_rate": 0.0004760559265442404, + "loss": 2.0862, + "loss_base2": 3.0098, + "loss_pixel": 0.3822, + "loss_text": 1.704, + "ppl": 8.0543, + "step": 5937 + }, + { + "epoch": 0.04, + "global_step": 5938, + "learning_rate": 0.0004760517529215359, + "loss": 2.4472, + "loss_base2": 3.5306, + "loss_pixel": 0.3842, + "loss_text": 2.063, + "ppl": 11.5559, + "step": 5938 + }, + { + "epoch": 0.04, + "global_step": 5939, + "learning_rate": 0.0004760475792988314, + "loss": 2.3686, + "loss_base2": 3.4172, + "loss_pixel": 0.3846, + "loss_text": 1.9839, + "ppl": 10.6824, + "step": 5939 + }, + { + "epoch": 0.04, + "global_step": 5940, + "learning_rate": 0.00047604340567612686, + "loss": 2.4801, + "loss_base2": 3.578, + "loss_pixel": 0.3843, + "loss_text": 2.0958, + "ppl": 11.9425, + "step": 5940 + }, + { + "epoch": 0.04, + "global_step": 5941, + "learning_rate": 0.00047603923205342236, + "loss": 2.6902, + "loss_base2": 3.8811, + "loss_pixel": 0.381, + "loss_text": 2.3093, + "ppl": 14.7346, + "step": 5941 + }, + { + "epoch": 0.04, + "global_step": 5942, + "learning_rate": 0.00047603505843071787, + "loss": 2.7172, + "loss_base2": 3.9201, + "loss_pixel": 0.3825, + "loss_text": 2.3348, + "ppl": 15.1379, + "step": 5942 + }, + { + "epoch": 0.04, + "global_step": 5943, + "learning_rate": 0.0004760308848080134, + "loss": 2.61, + "loss_base2": 3.7654, + "loss_pixel": 0.3799, + "loss_text": 2.23, + "ppl": 13.5991, + "step": 5943 + }, + { + "epoch": 0.04, + "global_step": 5944, + "learning_rate": 0.0004760267111853089, + "loss": 2.8456, + "loss_base2": 4.1053, + "loss_pixel": 0.3847, + "loss_text": 2.461, + "ppl": 17.2119, + "step": 5944 + }, + { + "epoch": 0.04, + "global_step": 5945, + "learning_rate": 0.00047602253756260434, + "loss": 2.9179, + "loss_base2": 4.2096, + "loss_pixel": 0.388, + "loss_text": 2.5298, + "ppl": 18.5024, + "step": 5945 + }, + { + "epoch": 0.04, + "global_step": 5946, + "learning_rate": 0.00047601836393989985, + "loss": 2.82, + "loss_base2": 4.0684, + "loss_pixel": 0.3828, + "loss_text": 2.4372, + "ppl": 16.7769, + "step": 5946 + }, + { + "epoch": 0.04, + "global_step": 5947, + "learning_rate": 0.00047601419031719535, + "loss": 3.1139, + "loss_base2": 4.4924, + "loss_pixel": 0.3814, + "loss_text": 2.7325, + "ppl": 22.5087, + "step": 5947 + }, + { + "epoch": 0.04, + "global_step": 5948, + "learning_rate": 0.00047601001669449086, + "loss": 3.0296, + "loss_base2": 4.3708, + "loss_pixel": 0.3832, + "loss_text": 2.6464, + "ppl": 20.689, + "step": 5948 + }, + { + "epoch": 0.04, + "global_step": 5949, + "learning_rate": 0.0004760058430717863, + "loss": 2.9253, + "loss_base2": 4.2203, + "loss_pixel": 0.383, + "loss_text": 2.5422, + "ppl": 18.6398, + "step": 5949 + }, + { + "epoch": 0.04, + "global_step": 5950, + "learning_rate": 0.0004760016694490818, + "loss": 2.9895, + "loss_base2": 4.3129, + "loss_pixel": 0.3816, + "loss_text": 2.6079, + "ppl": 19.8757, + "step": 5950 + }, + { + "epoch": 0.04, + "global_step": 5951, + "learning_rate": 0.00047599749582637733, + "loss": 3.3078, + "loss_base2": 4.7721, + "loss_pixel": 0.3788, + "loss_text": 2.929, + "ppl": 27.3249, + "step": 5951 + }, + { + "epoch": 0.04, + "global_step": 5952, + "learning_rate": 0.0004759933222036728, + "loss": 3.1468, + "loss_base2": 4.5399, + "loss_pixel": 0.3823, + "loss_text": 2.7645, + "ppl": 23.2615, + "step": 5952 + }, + { + "epoch": 0.04, + "global_step": 5953, + "learning_rate": 0.0004759891485809683, + "loss": 2.9391, + "loss_base2": 4.2402, + "loss_pixel": 0.3755, + "loss_text": 2.5636, + "ppl": 18.8988, + "step": 5953 + }, + { + "epoch": 0.04, + "global_step": 5954, + "learning_rate": 0.00047598497495826374, + "loss": 2.8605, + "loss_base2": 4.1268, + "loss_pixel": 0.3717, + "loss_text": 2.4888, + "ppl": 17.4703, + "step": 5954 + }, + { + "epoch": 0.04, + "global_step": 5955, + "learning_rate": 0.00047598080133555925, + "loss": 2.835, + "loss_base2": 4.09, + "loss_pixel": 0.3741, + "loss_text": 2.4609, + "ppl": 17.0304, + "step": 5955 + }, + { + "epoch": 0.04, + "global_step": 5956, + "learning_rate": 0.00047597662771285476, + "loss": 3.0605, + "loss_base2": 4.4154, + "loss_pixel": 0.432, + "loss_text": 2.6285, + "ppl": 21.3382, + "step": 5956 + }, + { + "epoch": 0.04, + "global_step": 5957, + "learning_rate": 0.00047597245409015026, + "loss": 2.7677, + "loss_base2": 3.9929, + "loss_pixel": 0.3886, + "loss_text": 2.3791, + "ppl": 15.922, + "step": 5957 + }, + { + "epoch": 0.04, + "global_step": 5958, + "learning_rate": 0.00047596828046744577, + "loss": 2.766, + "loss_base2": 3.9905, + "loss_pixel": 0.3854, + "loss_text": 2.3806, + "ppl": 15.8949, + "step": 5958 + }, + { + "epoch": 0.04, + "global_step": 5959, + "learning_rate": 0.0004759641068447412, + "loss": 2.7877, + "loss_base2": 4.0218, + "loss_pixel": 0.3785, + "loss_text": 2.4092, + "ppl": 16.2436, + "step": 5959 + }, + { + "epoch": 0.04, + "global_step": 5960, + "learning_rate": 0.00047595993322203673, + "loss": 2.781, + "loss_base2": 4.0121, + "loss_pixel": 0.3791, + "loss_text": 2.4019, + "ppl": 16.1351, + "step": 5960 + }, + { + "epoch": 0.04, + "global_step": 5961, + "learning_rate": 0.00047595575959933224, + "loss": 2.7403, + "loss_base2": 3.9534, + "loss_pixel": 0.3764, + "loss_text": 2.3639, + "ppl": 15.4916, + "step": 5961 + }, + { + "epoch": 0.04, + "global_step": 5962, + "learning_rate": 0.00047595158597662775, + "loss": 2.7019, + "loss_base2": 3.898, + "loss_pixel": 0.3767, + "loss_text": 2.3251, + "ppl": 14.908, + "step": 5962 + }, + { + "epoch": 0.04, + "global_step": 5963, + "learning_rate": 0.0004759474123539232, + "loss": 2.6744, + "loss_base2": 3.8583, + "loss_pixel": 0.3826, + "loss_text": 2.2917, + "ppl": 14.5036, + "step": 5963 + }, + { + "epoch": 0.04, + "global_step": 5964, + "learning_rate": 0.0004759432387312187, + "loss": 2.6554, + "loss_base2": 3.8309, + "loss_pixel": 0.3769, + "loss_text": 2.2784, + "ppl": 14.2307, + "step": 5964 + }, + { + "epoch": 0.04, + "global_step": 5965, + "learning_rate": 0.0004759390651085142, + "loss": 2.621, + "loss_base2": 3.7813, + "loss_pixel": 0.3782, + "loss_text": 2.2428, + "ppl": 13.7495, + "step": 5965 + }, + { + "epoch": 0.04, + "global_step": 5966, + "learning_rate": 0.0004759348914858097, + "loss": 2.5864, + "loss_base2": 3.7314, + "loss_pixel": 0.3763, + "loss_text": 2.2102, + "ppl": 13.2819, + "step": 5966 + }, + { + "epoch": 0.04, + "global_step": 5967, + "learning_rate": 0.00047593071786310523, + "loss": 2.5788, + "loss_base2": 3.7204, + "loss_pixel": 0.3766, + "loss_text": 2.2022, + "ppl": 13.1813, + "step": 5967 + }, + { + "epoch": 0.04, + "global_step": 5968, + "learning_rate": 0.0004759265442404007, + "loss": 2.5707, + "loss_base2": 3.7087, + "loss_pixel": 0.3757, + "loss_text": 2.1951, + "ppl": 13.075, + "step": 5968 + }, + { + "epoch": 0.04, + "global_step": 5969, + "learning_rate": 0.0004759223706176962, + "loss": 2.5524, + "loss_base2": 3.6823, + "loss_pixel": 0.3746, + "loss_text": 2.1778, + "ppl": 12.8379, + "step": 5969 + }, + { + "epoch": 0.04, + "global_step": 5970, + "learning_rate": 0.0004759181969949917, + "loss": 2.5167, + "loss_base2": 3.6308, + "loss_pixel": 0.3743, + "loss_text": 2.1424, + "ppl": 12.3876, + "step": 5970 + }, + { + "epoch": 0.04, + "global_step": 5971, + "learning_rate": 0.00047591402337228715, + "loss": 2.4914, + "loss_base2": 3.5943, + "loss_pixel": 0.3736, + "loss_text": 2.1178, + "ppl": 12.0782, + "step": 5971 + }, + { + "epoch": 0.04, + "global_step": 5972, + "learning_rate": 0.0004759098497495826, + "loss": 2.468, + "loss_base2": 3.5606, + "loss_pixel": 0.3707, + "loss_text": 2.0974, + "ppl": 11.7988, + "step": 5972 + }, + { + "epoch": 0.04, + "global_step": 5973, + "learning_rate": 0.0004759056761268781, + "loss": 2.4649, + "loss_base2": 3.5561, + "loss_pixel": 0.3724, + "loss_text": 2.0925, + "ppl": 11.7623, + "step": 5973 + }, + { + "epoch": 0.04, + "global_step": 5974, + "learning_rate": 0.0004759015025041736, + "loss": 2.4617, + "loss_base2": 3.5515, + "loss_pixel": 0.3706, + "loss_text": 2.0912, + "ppl": 11.7247, + "step": 5974 + }, + { + "epoch": 0.04, + "global_step": 5975, + "learning_rate": 0.0004758973288814691, + "loss": 2.4132, + "loss_base2": 3.4815, + "loss_pixel": 0.3703, + "loss_text": 2.0429, + "ppl": 11.1696, + "step": 5975 + }, + { + "epoch": 0.04, + "global_step": 5976, + "learning_rate": 0.00047589315525876463, + "loss": 2.4036, + "loss_base2": 3.4677, + "loss_pixel": 0.3718, + "loss_text": 2.0318, + "ppl": 11.0629, + "step": 5976 + }, + { + "epoch": 0.04, + "global_step": 5977, + "learning_rate": 0.0004758889816360601, + "loss": 2.3965, + "loss_base2": 3.4574, + "loss_pixel": 0.3675, + "loss_text": 2.029, + "ppl": 10.9847, + "step": 5977 + }, + { + "epoch": 0.04, + "global_step": 5978, + "learning_rate": 0.0004758848080133556, + "loss": 2.3882, + "loss_base2": 3.4454, + "loss_pixel": 0.368, + "loss_text": 2.0202, + "ppl": 10.8939, + "step": 5978 + }, + { + "epoch": 0.04, + "global_step": 5979, + "learning_rate": 0.0004758806343906511, + "loss": 2.3778, + "loss_base2": 3.4304, + "loss_pixel": 0.3653, + "loss_text": 2.0125, + "ppl": 10.7812, + "step": 5979 + }, + { + "epoch": 0.04, + "global_step": 5980, + "learning_rate": 0.0004758764607679466, + "loss": 2.3547, + "loss_base2": 3.3971, + "loss_pixel": 0.3638, + "loss_text": 1.9909, + "ppl": 10.535, + "step": 5980 + }, + { + "epoch": 0.04, + "global_step": 5981, + "learning_rate": 0.00047587228714524206, + "loss": 2.3325, + "loss_base2": 3.3651, + "loss_pixel": 0.3613, + "loss_text": 1.9712, + "ppl": 10.3037, + "step": 5981 + }, + { + "epoch": 0.04, + "global_step": 5982, + "learning_rate": 0.00047586811352253757, + "loss": 2.3214, + "loss_base2": 3.3491, + "loss_pixel": 0.3643, + "loss_text": 1.9571, + "ppl": 10.1899, + "step": 5982 + }, + { + "epoch": 0.04, + "global_step": 5983, + "learning_rate": 0.0004758639398998331, + "loss": 2.3484, + "loss_base2": 3.388, + "loss_pixel": 0.3938, + "loss_text": 1.9545, + "ppl": 10.4688, + "step": 5983 + }, + { + "epoch": 0.04, + "global_step": 5984, + "learning_rate": 0.0004758597662771286, + "loss": 2.3096, + "loss_base2": 3.332, + "loss_pixel": 0.374, + "loss_text": 1.9356, + "ppl": 10.0704, + "step": 5984 + }, + { + "epoch": 0.04, + "global_step": 5985, + "learning_rate": 0.0004758555926544241, + "loss": 2.3028, + "loss_base2": 3.3222, + "loss_pixel": 0.3791, + "loss_text": 1.9236, + "ppl": 10.0021, + "step": 5985 + }, + { + "epoch": 0.04, + "global_step": 5986, + "learning_rate": 0.00047585141903171954, + "loss": 2.3238, + "loss_base2": 3.3525, + "loss_pixel": 0.3773, + "loss_text": 1.9465, + "ppl": 10.2144, + "step": 5986 + }, + { + "epoch": 0.04, + "global_step": 5987, + "learning_rate": 0.00047584724540901505, + "loss": 2.3096, + "loss_base2": 3.332, + "loss_pixel": 0.3771, + "loss_text": 1.9325, + "ppl": 10.0704, + "step": 5987 + }, + { + "epoch": 0.04, + "global_step": 5988, + "learning_rate": 0.00047584307178631056, + "loss": 2.3104, + "loss_base2": 3.3332, + "loss_pixel": 0.375, + "loss_text": 1.9355, + "ppl": 10.0785, + "step": 5988 + }, + { + "epoch": 0.04, + "global_step": 5989, + "learning_rate": 0.00047583889816360606, + "loss": 2.289, + "loss_base2": 3.3023, + "loss_pixel": 0.3735, + "loss_text": 1.9155, + "ppl": 9.8651, + "step": 5989 + }, + { + "epoch": 0.04, + "global_step": 5990, + "learning_rate": 0.00047583472454090146, + "loss": 2.2849, + "loss_base2": 3.2964, + "loss_pixel": 0.374, + "loss_text": 1.9109, + "ppl": 9.8247, + "step": 5990 + }, + { + "epoch": 0.04, + "global_step": 5991, + "learning_rate": 0.00047583055091819697, + "loss": 2.263, + "loss_base2": 3.2648, + "loss_pixel": 0.3719, + "loss_text": 1.8911, + "ppl": 9.6119, + "step": 5991 + }, + { + "epoch": 0.04, + "global_step": 5992, + "learning_rate": 0.0004758263772954925, + "loss": 2.252, + "loss_base2": 3.2489, + "loss_pixel": 0.3715, + "loss_text": 1.8805, + "ppl": 9.5067, + "step": 5992 + }, + { + "epoch": 0.04, + "global_step": 5993, + "learning_rate": 0.000475822203672788, + "loss": 2.2411, + "loss_base2": 3.2332, + "loss_pixel": 0.3698, + "loss_text": 1.8712, + "ppl": 9.4037, + "step": 5993 + }, + { + "epoch": 0.04, + "global_step": 5994, + "learning_rate": 0.0004758180300500835, + "loss": 2.2328, + "loss_base2": 3.2212, + "loss_pixel": 0.368, + "loss_text": 1.8648, + "ppl": 9.3259, + "step": 5994 + }, + { + "epoch": 0.04, + "global_step": 5995, + "learning_rate": 0.00047581385642737895, + "loss": 2.2385, + "loss_base2": 3.2295, + "loss_pixel": 0.3676, + "loss_text": 1.8709, + "ppl": 9.3793, + "step": 5995 + }, + { + "epoch": 0.04, + "global_step": 5996, + "learning_rate": 0.00047580968280467445, + "loss": 2.225, + "loss_base2": 3.21, + "loss_pixel": 0.3651, + "loss_text": 1.8599, + "ppl": 9.2535, + "step": 5996 + }, + { + "epoch": 0.04, + "global_step": 5997, + "learning_rate": 0.00047580550918196996, + "loss": 2.1966, + "loss_base2": 3.169, + "loss_pixel": 0.3633, + "loss_text": 1.8333, + "ppl": 8.9944, + "step": 5997 + }, + { + "epoch": 0.04, + "global_step": 5998, + "learning_rate": 0.00047580133555926547, + "loss": 2.2033, + "loss_base2": 3.1787, + "loss_pixel": 0.3614, + "loss_text": 1.8418, + "ppl": 9.0548, + "step": 5998 + }, + { + "epoch": 0.04, + "global_step": 5999, + "learning_rate": 0.0004757971619365609, + "loss": 2.2056, + "loss_base2": 3.182, + "loss_pixel": 0.3605, + "loss_text": 1.8451, + "ppl": 9.0757, + "step": 5999 + }, + { + "epoch": 0.04, + "global_step": 6000, + "learning_rate": 0.00047579298831385643, + "loss": 2.1754, + "loss_base2": 3.1384, + "loss_pixel": 0.3583, + "loss_text": 1.8171, + "ppl": 8.8057, + "step": 6000 + }, + { + "epoch": 0.04, + "global_step": 6001, + "learning_rate": 0.00047578881469115193, + "loss": 2.21, + "loss_base2": 3.1884, + "loss_pixel": 0.3585, + "loss_text": 1.8515, + "ppl": 9.1157, + "step": 6001 + }, + { + "epoch": 0.04, + "global_step": 6002, + "learning_rate": 0.00047578464106844744, + "loss": 2.0365, + "loss_base2": 2.938, + "loss_pixel": 0.3575, + "loss_text": 1.679, + "ppl": 7.6637, + "step": 6002 + }, + { + "epoch": 0.04, + "global_step": 6003, + "learning_rate": 0.00047578046744574295, + "loss": 2.0075, + "loss_base2": 2.8962, + "loss_pixel": 0.3591, + "loss_text": 1.6484, + "ppl": 7.4447, + "step": 6003 + }, + { + "epoch": 0.04, + "global_step": 6004, + "learning_rate": 0.0004757762938230384, + "loss": 1.9836, + "loss_base2": 2.8617, + "loss_pixel": 0.3553, + "loss_text": 1.6283, + "ppl": 7.2689, + "step": 6004 + }, + { + "epoch": 0.04, + "global_step": 6005, + "learning_rate": 0.0004757721202003339, + "loss": 1.9659, + "loss_base2": 2.8362, + "loss_pixel": 0.355, + "loss_text": 1.6109, + "ppl": 7.1413, + "step": 6005 + }, + { + "epoch": 0.04, + "global_step": 6006, + "learning_rate": 0.0004757679465776294, + "loss": 1.9309, + "loss_base2": 2.7857, + "loss_pixel": 0.3557, + "loss_text": 1.5752, + "ppl": 6.8957, + "step": 6006 + }, + { + "epoch": 0.04, + "global_step": 6007, + "learning_rate": 0.0004757637729549249, + "loss": 1.9351, + "loss_base2": 2.7918, + "loss_pixel": 0.3534, + "loss_text": 1.5817, + "ppl": 6.9247, + "step": 6007 + }, + { + "epoch": 0.04, + "global_step": 6008, + "learning_rate": 0.0004757595993322203, + "loss": 1.9395, + "loss_base2": 2.7981, + "loss_pixel": 0.3534, + "loss_text": 1.586, + "ppl": 6.9553, + "step": 6008 + }, + { + "epoch": 0.04, + "global_step": 6009, + "learning_rate": 0.00047575542570951583, + "loss": 1.9265, + "loss_base2": 2.7794, + "loss_pixel": 0.354, + "loss_text": 1.5726, + "ppl": 6.8654, + "step": 6009 + }, + { + "epoch": 0.04, + "global_step": 6010, + "learning_rate": 0.00047575125208681134, + "loss": 1.9207, + "loss_base2": 2.771, + "loss_pixel": 0.352, + "loss_text": 1.5687, + "ppl": 6.8257, + "step": 6010 + }, + { + "epoch": 0.04, + "global_step": 6011, + "learning_rate": 0.00047574707846410685, + "loss": 1.9362, + "loss_base2": 2.7933, + "loss_pixel": 0.3494, + "loss_text": 1.5869, + "ppl": 6.9324, + "step": 6011 + }, + { + "epoch": 0.04, + "global_step": 6012, + "learning_rate": 0.00047574290484140235, + "loss": 1.9098, + "loss_base2": 2.7553, + "loss_pixel": 0.3507, + "loss_text": 1.5591, + "ppl": 6.7517, + "step": 6012 + }, + { + "epoch": 0.04, + "global_step": 6013, + "learning_rate": 0.0004757387312186978, + "loss": 1.8777, + "loss_base2": 2.7089, + "loss_pixel": 0.3481, + "loss_text": 1.5296, + "ppl": 6.5384, + "step": 6013 + }, + { + "epoch": 0.04, + "global_step": 6014, + "learning_rate": 0.0004757345575959933, + "loss": 1.8685, + "loss_base2": 2.6957, + "loss_pixel": 0.3469, + "loss_text": 1.5216, + "ppl": 6.4786, + "step": 6014 + }, + { + "epoch": 0.04, + "global_step": 6015, + "learning_rate": 0.0004757303839732888, + "loss": 1.8597, + "loss_base2": 2.683, + "loss_pixel": 0.3444, + "loss_text": 1.5153, + "ppl": 6.4218, + "step": 6015 + }, + { + "epoch": 0.04, + "global_step": 6016, + "learning_rate": 0.00047572621035058433, + "loss": 1.8692, + "loss_base2": 2.6967, + "loss_pixel": 0.3442, + "loss_text": 1.525, + "ppl": 6.4831, + "step": 6016 + }, + { + "epoch": 0.04, + "global_step": 6017, + "learning_rate": 0.00047572203672787983, + "loss": 1.9181, + "loss_base2": 2.7672, + "loss_pixel": 0.3475, + "loss_text": 1.5706, + "ppl": 6.808, + "step": 6017 + }, + { + "epoch": 0.04, + "global_step": 6018, + "learning_rate": 0.0004757178631051753, + "loss": 1.905, + "loss_base2": 2.7483, + "loss_pixel": 0.3504, + "loss_text": 1.5546, + "ppl": 6.7194, + "step": 6018 + }, + { + "epoch": 0.04, + "global_step": 6019, + "learning_rate": 0.0004757136894824708, + "loss": 1.8911, + "loss_base2": 2.7283, + "loss_pixel": 0.3455, + "loss_text": 1.5456, + "ppl": 6.6267, + "step": 6019 + }, + { + "epoch": 0.04, + "global_step": 6020, + "learning_rate": 0.0004757095158597663, + "loss": 1.8919, + "loss_base2": 2.7294, + "loss_pixel": 0.3455, + "loss_text": 1.5465, + "ppl": 6.632, + "step": 6020 + }, + { + "epoch": 0.04, + "global_step": 6021, + "learning_rate": 0.0004757053422370618, + "loss": 1.8588, + "loss_base2": 2.6817, + "loss_pixel": 0.3408, + "loss_text": 1.518, + "ppl": 6.416, + "step": 6021 + }, + { + "epoch": 0.04, + "global_step": 6022, + "learning_rate": 0.00047570116861435726, + "loss": 1.8667, + "loss_base2": 2.6931, + "loss_pixel": 0.3415, + "loss_text": 1.5253, + "ppl": 6.4669, + "step": 6022 + }, + { + "epoch": 0.04, + "global_step": 6023, + "learning_rate": 0.00047569699499165277, + "loss": 1.8419, + "loss_base2": 2.6573, + "loss_pixel": 0.3393, + "loss_text": 1.5025, + "ppl": 6.3085, + "step": 6023 + }, + { + "epoch": 0.04, + "global_step": 6024, + "learning_rate": 0.0004756928213689483, + "loss": 1.835, + "loss_base2": 2.6473, + "loss_pixel": 0.3372, + "loss_text": 1.4978, + "ppl": 6.2651, + "step": 6024 + }, + { + "epoch": 0.04, + "global_step": 6025, + "learning_rate": 0.0004756886477462438, + "loss": 1.8375, + "loss_base2": 2.651, + "loss_pixel": 0.3373, + "loss_text": 1.5001, + "ppl": 6.2808, + "step": 6025 + }, + { + "epoch": 0.04, + "global_step": 6026, + "learning_rate": 0.0004756844741235393, + "loss": 1.8267, + "loss_base2": 2.6354, + "loss_pixel": 0.3419, + "loss_text": 1.4848, + "ppl": 6.2133, + "step": 6026 + }, + { + "epoch": 0.04, + "global_step": 6027, + "learning_rate": 0.0004756803005008347, + "loss": 1.82, + "loss_base2": 2.6257, + "loss_pixel": 0.3379, + "loss_text": 1.4821, + "ppl": 6.1719, + "step": 6027 + }, + { + "epoch": 0.04, + "global_step": 6028, + "learning_rate": 0.0004756761268781302, + "loss": 1.8126, + "loss_base2": 2.615, + "loss_pixel": 0.3347, + "loss_text": 1.4778, + "ppl": 6.1264, + "step": 6028 + }, + { + "epoch": 0.04, + "global_step": 6029, + "learning_rate": 0.0004756719532554257, + "loss": 1.793, + "loss_base2": 2.5868, + "loss_pixel": 0.3324, + "loss_text": 1.4606, + "ppl": 6.0074, + "step": 6029 + }, + { + "epoch": 0.04, + "global_step": 6030, + "learning_rate": 0.0004756677796327212, + "loss": 1.7972, + "loss_base2": 2.5928, + "loss_pixel": 0.3327, + "loss_text": 1.4644, + "ppl": 6.0327, + "step": 6030 + }, + { + "epoch": 0.04, + "global_step": 6031, + "learning_rate": 0.00047566360601001667, + "loss": 1.823, + "loss_base2": 2.63, + "loss_pixel": 0.3325, + "loss_text": 1.4905, + "ppl": 6.1904, + "step": 6031 + }, + { + "epoch": 0.04, + "global_step": 6032, + "learning_rate": 0.0004756594323873122, + "loss": 1.8018, + "loss_base2": 2.5994, + "loss_pixel": 0.3315, + "loss_text": 1.4703, + "ppl": 6.0605, + "step": 6032 + }, + { + "epoch": 0.04, + "global_step": 6033, + "learning_rate": 0.0004756552587646077, + "loss": 1.7962, + "loss_base2": 2.5914, + "loss_pixel": 0.3301, + "loss_text": 1.466, + "ppl": 6.0267, + "step": 6033 + }, + { + "epoch": 0.04, + "global_step": 6034, + "learning_rate": 0.0004756510851419032, + "loss": 1.7739, + "loss_base2": 2.5592, + "loss_pixel": 0.3322, + "loss_text": 1.4416, + "ppl": 5.8938, + "step": 6034 + }, + { + "epoch": 0.04, + "global_step": 6035, + "learning_rate": 0.0004756469115191987, + "loss": 1.7755, + "loss_base2": 2.5615, + "loss_pixel": 0.3263, + "loss_text": 1.4493, + "ppl": 5.9032, + "step": 6035 + }, + { + "epoch": 0.04, + "global_step": 6036, + "learning_rate": 0.00047564273789649415, + "loss": 1.7773, + "loss_base2": 2.5641, + "loss_pixel": 0.3315, + "loss_text": 1.4458, + "ppl": 5.9139, + "step": 6036 + }, + { + "epoch": 0.04, + "global_step": 6037, + "learning_rate": 0.00047563856427378966, + "loss": 1.762, + "loss_base2": 2.542, + "loss_pixel": 0.338, + "loss_text": 1.4239, + "ppl": 5.8241, + "step": 6037 + }, + { + "epoch": 0.04, + "global_step": 6038, + "learning_rate": 0.00047563439065108516, + "loss": 1.7616, + "loss_base2": 2.5415, + "loss_pixel": 0.3319, + "loss_text": 1.4297, + "ppl": 5.8217, + "step": 6038 + }, + { + "epoch": 0.04, + "global_step": 6039, + "learning_rate": 0.00047563021702838067, + "loss": 1.7656, + "loss_base2": 2.5472, + "loss_pixel": 0.3298, + "loss_text": 1.4359, + "ppl": 5.8451, + "step": 6039 + }, + { + "epoch": 0.04, + "global_step": 6040, + "learning_rate": 0.0004756260434056761, + "loss": 1.7729, + "loss_base2": 2.5578, + "loss_pixel": 0.3315, + "loss_text": 1.4415, + "ppl": 5.8879, + "step": 6040 + }, + { + "epoch": 0.04, + "global_step": 6041, + "learning_rate": 0.00047562186978297163, + "loss": 1.7434, + "loss_base2": 2.5152, + "loss_pixel": 0.331, + "loss_text": 1.4125, + "ppl": 5.7167, + "step": 6041 + }, + { + "epoch": 0.04, + "global_step": 6042, + "learning_rate": 0.00047561769616026714, + "loss": 1.7335, + "loss_base2": 2.5009, + "loss_pixel": 0.3246, + "loss_text": 1.409, + "ppl": 5.6604, + "step": 6042 + }, + { + "epoch": 0.04, + "global_step": 6043, + "learning_rate": 0.00047561352253756265, + "loss": 1.7285, + "loss_base2": 2.4937, + "loss_pixel": 0.3233, + "loss_text": 1.4052, + "ppl": 5.6322, + "step": 6043 + }, + { + "epoch": 0.04, + "global_step": 6044, + "learning_rate": 0.00047560934891485815, + "loss": 1.7588, + "loss_base2": 2.5374, + "loss_pixel": 0.3204, + "loss_text": 1.4383, + "ppl": 5.8055, + "step": 6044 + }, + { + "epoch": 0.04, + "global_step": 6045, + "learning_rate": 0.0004756051752921536, + "loss": 1.7449, + "loss_base2": 2.5174, + "loss_pixel": 0.3201, + "loss_text": 1.4248, + "ppl": 5.7253, + "step": 6045 + }, + { + "epoch": 0.04, + "global_step": 6046, + "learning_rate": 0.00047560100166944906, + "loss": 1.7211, + "loss_base2": 2.483, + "loss_pixel": 0.3171, + "loss_text": 1.404, + "ppl": 5.5907, + "step": 6046 + }, + { + "epoch": 0.04, + "global_step": 6047, + "learning_rate": 0.00047559682804674457, + "loss": 1.7213, + "loss_base2": 2.4833, + "loss_pixel": 0.3147, + "loss_text": 1.4066, + "ppl": 5.5918, + "step": 6047 + }, + { + "epoch": 0.04, + "global_step": 6048, + "learning_rate": 0.0004755926544240401, + "loss": 1.7288, + "loss_base2": 2.4941, + "loss_pixel": 0.315, + "loss_text": 1.4138, + "ppl": 5.6339, + "step": 6048 + }, + { + "epoch": 0.04, + "global_step": 6049, + "learning_rate": 0.0004755884808013355, + "loss": 1.7352, + "loss_base2": 2.5034, + "loss_pixel": 0.3127, + "loss_text": 1.4225, + "ppl": 5.6701, + "step": 6049 + }, + { + "epoch": 0.04, + "global_step": 6050, + "learning_rate": 0.00047558430717863103, + "loss": 1.7183, + "loss_base2": 2.479, + "loss_pixel": 0.3113, + "loss_text": 1.407, + "ppl": 5.575, + "step": 6050 + }, + { + "epoch": 0.04, + "global_step": 6051, + "learning_rate": 0.00047558013355592654, + "loss": 1.7034, + "loss_base2": 2.4575, + "loss_pixel": 0.3078, + "loss_text": 1.3956, + "ppl": 5.4926, + "step": 6051 + }, + { + "epoch": 0.04, + "global_step": 6052, + "learning_rate": 0.00047557595993322205, + "loss": 1.9004, + "loss_base2": 2.7417, + "loss_pixel": 0.3085, + "loss_text": 1.5919, + "ppl": 6.6886, + "step": 6052 + }, + { + "epoch": 0.04, + "global_step": 6053, + "learning_rate": 0.00047557178631051756, + "loss": 2.0699, + "loss_base2": 2.9862, + "loss_pixel": 0.3055, + "loss_text": 1.7644, + "ppl": 7.924, + "step": 6053 + }, + { + "epoch": 0.04, + "global_step": 6054, + "learning_rate": 0.000475567612687813, + "loss": 2.053, + "loss_base2": 2.9619, + "loss_pixel": 0.3027, + "loss_text": 1.7503, + "ppl": 7.7912, + "step": 6054 + }, + { + "epoch": 0.04, + "global_step": 6055, + "learning_rate": 0.0004755634390651085, + "loss": 2.0571, + "loss_base2": 2.9678, + "loss_pixel": 0.3017, + "loss_text": 1.7553, + "ppl": 7.8232, + "step": 6055 + }, + { + "epoch": 0.04, + "global_step": 6056, + "learning_rate": 0.000475559265442404, + "loss": 2.0363, + "loss_base2": 2.9378, + "loss_pixel": 0.3032, + "loss_text": 1.7331, + "ppl": 7.6622, + "step": 6056 + }, + { + "epoch": 0.04, + "global_step": 6057, + "learning_rate": 0.00047555509181969953, + "loss": 2.0422, + "loss_base2": 2.9463, + "loss_pixel": 0.3081, + "loss_text": 1.7341, + "ppl": 7.7075, + "step": 6057 + }, + { + "epoch": 0.04, + "global_step": 6058, + "learning_rate": 0.000475550918196995, + "loss": 2.0361, + "loss_base2": 2.9375, + "loss_pixel": 0.3022, + "loss_text": 1.7339, + "ppl": 7.6607, + "step": 6058 + }, + { + "epoch": 0.04, + "global_step": 6059, + "learning_rate": 0.0004755467445742905, + "loss": 2.0275, + "loss_base2": 2.9251, + "loss_pixel": 0.3017, + "loss_text": 1.7258, + "ppl": 7.5951, + "step": 6059 + }, + { + "epoch": 0.04, + "global_step": 6060, + "learning_rate": 0.000475542570951586, + "loss": 2.0242, + "loss_base2": 2.9203, + "loss_pixel": 0.2999, + "loss_text": 1.7242, + "ppl": 7.5701, + "step": 6060 + }, + { + "epoch": 0.04, + "global_step": 6061, + "learning_rate": 0.0004755383973288815, + "loss": 1.9978, + "loss_base2": 2.8822, + "loss_pixel": 0.2986, + "loss_text": 1.6992, + "ppl": 7.3728, + "step": 6061 + }, + { + "epoch": 0.04, + "global_step": 6062, + "learning_rate": 0.000475534223706177, + "loss": 2.0114, + "loss_base2": 2.9018, + "loss_pixel": 0.2973, + "loss_text": 1.714, + "ppl": 7.4738, + "step": 6062 + }, + { + "epoch": 0.04, + "global_step": 6063, + "learning_rate": 0.00047553005008347247, + "loss": 2.0007, + "loss_base2": 2.8864, + "loss_pixel": 0.2962, + "loss_text": 1.7045, + "ppl": 7.3942, + "step": 6063 + }, + { + "epoch": 0.04, + "global_step": 6064, + "learning_rate": 0.000475525876460768, + "loss": 2.0066, + "loss_base2": 2.8949, + "loss_pixel": 0.2965, + "loss_text": 1.7102, + "ppl": 7.438, + "step": 6064 + }, + { + "epoch": 0.04, + "global_step": 6065, + "learning_rate": 0.00047552170283806343, + "loss": 1.9851, + "loss_base2": 2.8639, + "loss_pixel": 0.2942, + "loss_text": 1.6908, + "ppl": 7.2798, + "step": 6065 + }, + { + "epoch": 0.04, + "global_step": 6066, + "learning_rate": 0.00047551752921535893, + "loss": 1.9866, + "loss_base2": 2.8661, + "loss_pixel": 0.2925, + "loss_text": 1.6941, + "ppl": 7.2907, + "step": 6066 + }, + { + "epoch": 0.04, + "global_step": 6067, + "learning_rate": 0.0004755133555926544, + "loss": 1.9809, + "loss_base2": 2.8578, + "loss_pixel": 0.2906, + "loss_text": 1.6903, + "ppl": 7.2493, + "step": 6067 + }, + { + "epoch": 0.04, + "global_step": 6068, + "learning_rate": 0.0004755091819699499, + "loss": 1.9845, + "loss_base2": 2.863, + "loss_pixel": 0.2945, + "loss_text": 1.6901, + "ppl": 7.2754, + "step": 6068 + }, + { + "epoch": 0.04, + "global_step": 6069, + "learning_rate": 0.0004755050083472454, + "loss": 1.9734, + "loss_base2": 2.847, + "loss_pixel": 0.2956, + "loss_text": 1.6778, + "ppl": 7.1951, + "step": 6069 + }, + { + "epoch": 0.04, + "global_step": 6070, + "learning_rate": 0.0004755008347245409, + "loss": 1.9659, + "loss_base2": 2.8362, + "loss_pixel": 0.3041, + "loss_text": 1.6618, + "ppl": 7.1413, + "step": 6070 + }, + { + "epoch": 0.04, + "global_step": 6071, + "learning_rate": 0.0004754966611018364, + "loss": 1.9654, + "loss_base2": 2.8355, + "loss_pixel": 0.2966, + "loss_text": 1.6688, + "ppl": 7.1378, + "step": 6071 + }, + { + "epoch": 0.04, + "global_step": 6072, + "learning_rate": 0.00047549248747913187, + "loss": 1.9624, + "loss_base2": 2.8311, + "loss_pixel": 0.2946, + "loss_text": 1.6678, + "ppl": 7.1164, + "step": 6072 + }, + { + "epoch": 0.04, + "global_step": 6073, + "learning_rate": 0.0004754883138564274, + "loss": 1.9659, + "loss_base2": 2.8362, + "loss_pixel": 0.2937, + "loss_text": 1.6722, + "ppl": 7.1413, + "step": 6073 + }, + { + "epoch": 0.04, + "global_step": 6074, + "learning_rate": 0.0004754841402337229, + "loss": 1.9681, + "loss_base2": 2.8394, + "loss_pixel": 0.297, + "loss_text": 1.6711, + "ppl": 7.1571, + "step": 6074 + }, + { + "epoch": 0.04, + "global_step": 6075, + "learning_rate": 0.0004754799666110184, + "loss": 1.9486, + "loss_base2": 2.8112, + "loss_pixel": 0.2935, + "loss_text": 1.6552, + "ppl": 7.0189, + "step": 6075 + }, + { + "epoch": 0.04, + "global_step": 6076, + "learning_rate": 0.0004754757929883139, + "loss": 1.9641, + "loss_base2": 2.8336, + "loss_pixel": 0.291, + "loss_text": 1.673, + "ppl": 7.1285, + "step": 6076 + }, + { + "epoch": 0.04, + "global_step": 6077, + "learning_rate": 0.00047547161936560935, + "loss": 1.949, + "loss_base2": 2.8118, + "loss_pixel": 0.2923, + "loss_text": 1.6567, + "ppl": 7.0217, + "step": 6077 + }, + { + "epoch": 0.04, + "global_step": 6078, + "learning_rate": 0.00047546744574290486, + "loss": 1.9403, + "loss_base2": 2.7993, + "loss_pixel": 0.2872, + "loss_text": 1.6531, + "ppl": 6.9608, + "step": 6078 + }, + { + "epoch": 0.04, + "global_step": 6079, + "learning_rate": 0.00047546327212020037, + "loss": 1.9397, + "loss_base2": 2.7984, + "loss_pixel": 0.2874, + "loss_text": 1.6523, + "ppl": 6.9567, + "step": 6079 + }, + { + "epoch": 0.04, + "global_step": 6080, + "learning_rate": 0.0004754590984974959, + "loss": 1.9537, + "loss_base2": 2.8186, + "loss_pixel": 0.2851, + "loss_text": 1.6687, + "ppl": 7.0547, + "step": 6080 + }, + { + "epoch": 0.04, + "global_step": 6081, + "learning_rate": 0.00047545492487479133, + "loss": 1.9281, + "loss_base2": 2.7817, + "loss_pixel": 0.2835, + "loss_text": 1.6446, + "ppl": 6.8764, + "step": 6081 + }, + { + "epoch": 0.04, + "global_step": 6082, + "learning_rate": 0.00047545075125208683, + "loss": 1.9312, + "loss_base2": 2.7861, + "loss_pixel": 0.2826, + "loss_text": 1.6485, + "ppl": 6.8978, + "step": 6082 + }, + { + "epoch": 0.04, + "global_step": 6083, + "learning_rate": 0.00047544657762938234, + "loss": 1.9325, + "loss_base2": 2.788, + "loss_pixel": 0.2836, + "loss_text": 1.649, + "ppl": 6.9068, + "step": 6083 + }, + { + "epoch": 0.04, + "global_step": 6084, + "learning_rate": 0.0004754424040066778, + "loss": 1.9363, + "loss_base2": 2.7935, + "loss_pixel": 0.2807, + "loss_text": 1.6556, + "ppl": 6.9331, + "step": 6084 + }, + { + "epoch": 0.04, + "global_step": 6085, + "learning_rate": 0.0004754382303839733, + "loss": 1.9317, + "loss_base2": 2.7869, + "loss_pixel": 0.2792, + "loss_text": 1.6524, + "ppl": 6.9012, + "step": 6085 + }, + { + "epoch": 0.04, + "global_step": 6086, + "learning_rate": 0.00047543405676126876, + "loss": 1.917, + "loss_base2": 2.7656, + "loss_pixel": 0.2776, + "loss_text": 1.6395, + "ppl": 6.8005, + "step": 6086 + }, + { + "epoch": 0.04, + "global_step": 6087, + "learning_rate": 0.00047542988313856426, + "loss": 1.9137, + "loss_base2": 2.7609, + "loss_pixel": 0.2768, + "loss_text": 1.6369, + "ppl": 6.7781, + "step": 6087 + }, + { + "epoch": 0.04, + "global_step": 6088, + "learning_rate": 0.00047542570951585977, + "loss": 1.9291, + "loss_base2": 2.7831, + "loss_pixel": 0.2755, + "loss_text": 1.6536, + "ppl": 6.8833, + "step": 6088 + }, + { + "epoch": 0.04, + "global_step": 6089, + "learning_rate": 0.0004754215358931553, + "loss": 1.9061, + "loss_base2": 2.7499, + "loss_pixel": 0.2758, + "loss_text": 1.6303, + "ppl": 6.7268, + "step": 6089 + }, + { + "epoch": 0.04, + "global_step": 6090, + "learning_rate": 0.00047541736227045073, + "loss": 1.9229, + "loss_base2": 2.7742, + "loss_pixel": 0.2738, + "loss_text": 1.6491, + "ppl": 6.8408, + "step": 6090 + }, + { + "epoch": 0.04, + "global_step": 6091, + "learning_rate": 0.00047541318864774624, + "loss": 1.9231, + "loss_base2": 2.7744, + "loss_pixel": 0.2756, + "loss_text": 1.6475, + "ppl": 6.8421, + "step": 6091 + }, + { + "epoch": 0.04, + "global_step": 6092, + "learning_rate": 0.00047540901502504175, + "loss": 1.9067, + "loss_base2": 2.7508, + "loss_pixel": 0.2764, + "loss_text": 1.6302, + "ppl": 6.7308, + "step": 6092 + }, + { + "epoch": 0.04, + "global_step": 6093, + "learning_rate": 0.00047540484140233725, + "loss": 1.9088, + "loss_base2": 2.7538, + "loss_pixel": 0.2752, + "loss_text": 1.6336, + "ppl": 6.745, + "step": 6093 + }, + { + "epoch": 0.04, + "global_step": 6094, + "learning_rate": 0.00047540066777963276, + "loss": 1.9073, + "loss_base2": 2.7517, + "loss_pixel": 0.2732, + "loss_text": 1.634, + "ppl": 6.7349, + "step": 6094 + }, + { + "epoch": 0.04, + "global_step": 6095, + "learning_rate": 0.0004753964941569282, + "loss": 1.8919, + "loss_base2": 2.7294, + "loss_pixel": 0.2756, + "loss_text": 1.6162, + "ppl": 6.632, + "step": 6095 + }, + { + "epoch": 0.04, + "global_step": 6096, + "learning_rate": 0.0004753923205342237, + "loss": 1.8982, + "loss_base2": 2.7385, + "loss_pixel": 0.2722, + "loss_text": 1.626, + "ppl": 6.6739, + "step": 6096 + }, + { + "epoch": 0.04, + "global_step": 6097, + "learning_rate": 0.00047538814691151923, + "loss": 1.9001, + "loss_base2": 2.7413, + "loss_pixel": 0.2718, + "loss_text": 1.6283, + "ppl": 6.6866, + "step": 6097 + }, + { + "epoch": 0.04, + "global_step": 6098, + "learning_rate": 0.00047538397328881474, + "loss": 1.893, + "loss_base2": 2.731, + "loss_pixel": 0.2732, + "loss_text": 1.6198, + "ppl": 6.6393, + "step": 6098 + }, + { + "epoch": 0.04, + "global_step": 6099, + "learning_rate": 0.0004753797996661102, + "loss": 1.7638, + "loss_base2": 2.5446, + "loss_pixel": 0.2742, + "loss_text": 1.4897, + "ppl": 5.8346, + "step": 6099 + }, + { + "epoch": 0.04, + "global_step": 6100, + "learning_rate": 0.0004753756260434057, + "loss": 1.672, + "loss_base2": 2.4122, + "loss_pixel": 0.2704, + "loss_text": 1.4015, + "ppl": 5.3228, + "step": 6100 + }, + { + "epoch": 0.04, + "global_step": 6101, + "learning_rate": 0.0004753714524207012, + "loss": 1.6651, + "loss_base2": 2.4022, + "loss_pixel": 0.2705, + "loss_text": 1.3946, + "ppl": 5.2862, + "step": 6101 + }, + { + "epoch": 0.04, + "global_step": 6102, + "learning_rate": 0.00047536727879799666, + "loss": 1.631, + "loss_base2": 2.353, + "loss_pixel": 0.2678, + "loss_text": 1.3632, + "ppl": 5.109, + "step": 6102 + }, + { + "epoch": 0.04, + "global_step": 6103, + "learning_rate": 0.00047536310517529216, + "loss": 1.6386, + "loss_base2": 2.364, + "loss_pixel": 0.2675, + "loss_text": 1.3711, + "ppl": 5.148, + "step": 6103 + }, + { + "epoch": 0.04, + "global_step": 6104, + "learning_rate": 0.0004753589315525876, + "loss": 1.6444, + "loss_base2": 2.3724, + "loss_pixel": 0.2657, + "loss_text": 1.3787, + "ppl": 5.1779, + "step": 6104 + }, + { + "epoch": 0.04, + "global_step": 6105, + "learning_rate": 0.0004753547579298831, + "loss": 1.6348, + "loss_base2": 2.3585, + "loss_pixel": 0.2653, + "loss_text": 1.3696, + "ppl": 5.1284, + "step": 6105 + }, + { + "epoch": 0.04, + "global_step": 6106, + "learning_rate": 0.00047535058430717863, + "loss": 1.6239, + "loss_base2": 2.3428, + "loss_pixel": 0.2646, + "loss_text": 1.3593, + "ppl": 5.0728, + "step": 6106 + }, + { + "epoch": 0.04, + "global_step": 6107, + "learning_rate": 0.00047534641068447414, + "loss": 1.6278, + "loss_base2": 2.3484, + "loss_pixel": 0.2626, + "loss_text": 1.3652, + "ppl": 5.0927, + "step": 6107 + }, + { + "epoch": 0.04, + "global_step": 6108, + "learning_rate": 0.0004753422370617696, + "loss": 1.6284, + "loss_base2": 2.3493, + "loss_pixel": 0.2629, + "loss_text": 1.3655, + "ppl": 5.0957, + "step": 6108 + }, + { + "epoch": 0.04, + "global_step": 6109, + "learning_rate": 0.0004753380634390651, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.2616, + "loss_text": 1.3536, + "ppl": 5.0284, + "step": 6109 + }, + { + "epoch": 0.04, + "global_step": 6110, + "learning_rate": 0.0004753338898163606, + "loss": 1.6286, + "loss_base2": 2.3496, + "loss_pixel": 0.2601, + "loss_text": 1.3684, + "ppl": 5.0967, + "step": 6110 + }, + { + "epoch": 0.04, + "global_step": 6111, + "learning_rate": 0.0004753297161936561, + "loss": 1.6107, + "loss_base2": 2.3237, + "loss_pixel": 0.2594, + "loss_text": 1.3513, + "ppl": 5.0063, + "step": 6111 + }, + { + "epoch": 0.04, + "global_step": 6112, + "learning_rate": 0.0004753255425709516, + "loss": 1.6172, + "loss_base2": 2.3331, + "loss_pixel": 0.2594, + "loss_text": 1.3578, + "ppl": 5.039, + "step": 6112 + }, + { + "epoch": 0.04, + "global_step": 6113, + "learning_rate": 0.0004753213689482471, + "loss": 1.6281, + "loss_base2": 2.3489, + "loss_pixel": 0.2619, + "loss_text": 1.3662, + "ppl": 5.0942, + "step": 6113 + }, + { + "epoch": 0.04, + "global_step": 6114, + "learning_rate": 0.0004753171953255426, + "loss": 1.61, + "loss_base2": 2.3227, + "loss_pixel": 0.2613, + "loss_text": 1.3487, + "ppl": 5.0028, + "step": 6114 + }, + { + "epoch": 0.04, + "global_step": 6115, + "learning_rate": 0.0004753130217028381, + "loss": 1.6404, + "loss_base2": 2.3666, + "loss_pixel": 0.2603, + "loss_text": 1.3801, + "ppl": 5.1572, + "step": 6115 + }, + { + "epoch": 0.04, + "global_step": 6116, + "learning_rate": 0.0004753088480801336, + "loss": 1.8278, + "loss_base2": 2.637, + "loss_pixel": 0.2637, + "loss_text": 1.5641, + "ppl": 6.2202, + "step": 6116 + }, + { + "epoch": 0.04, + "global_step": 6117, + "learning_rate": 0.00047530467445742905, + "loss": 1.9352, + "loss_base2": 2.7919, + "loss_pixel": 0.2627, + "loss_text": 1.6724, + "ppl": 6.9254, + "step": 6117 + }, + { + "epoch": 0.04, + "global_step": 6118, + "learning_rate": 0.00047530050083472456, + "loss": 1.8898, + "loss_base2": 2.7264, + "loss_pixel": 0.2577, + "loss_text": 1.6321, + "ppl": 6.618, + "step": 6118 + }, + { + "epoch": 0.04, + "global_step": 6119, + "learning_rate": 0.00047529632721202006, + "loss": 1.8913, + "loss_base2": 2.7286, + "loss_pixel": 0.2604, + "loss_text": 1.6309, + "ppl": 6.628, + "step": 6119 + }, + { + "epoch": 0.04, + "global_step": 6120, + "learning_rate": 0.00047529215358931557, + "loss": 1.902, + "loss_base2": 2.744, + "loss_pixel": 0.2615, + "loss_text": 1.6405, + "ppl": 6.6993, + "step": 6120 + }, + { + "epoch": 0.04, + "global_step": 6121, + "learning_rate": 0.000475287979966611, + "loss": 1.9043, + "loss_base2": 2.7473, + "loss_pixel": 0.2621, + "loss_text": 1.6422, + "ppl": 6.7147, + "step": 6121 + }, + { + "epoch": 0.04, + "global_step": 6122, + "learning_rate": 0.0004752838063439065, + "loss": 1.9081, + "loss_base2": 2.7528, + "loss_pixel": 0.2629, + "loss_text": 1.6452, + "ppl": 6.7403, + "step": 6122 + }, + { + "epoch": 0.04, + "global_step": 6123, + "learning_rate": 0.000475279632721202, + "loss": 1.884, + "loss_base2": 2.718, + "loss_pixel": 0.2616, + "loss_text": 1.6225, + "ppl": 6.5798, + "step": 6123 + }, + { + "epoch": 0.04, + "global_step": 6124, + "learning_rate": 0.0004752754590984975, + "loss": 1.89, + "loss_base2": 2.7267, + "loss_pixel": 0.2618, + "loss_text": 1.6283, + "ppl": 6.6194, + "step": 6124 + }, + { + "epoch": 0.04, + "global_step": 6125, + "learning_rate": 0.000475271285475793, + "loss": 1.8921, + "loss_base2": 2.7297, + "loss_pixel": 0.258, + "loss_text": 1.6341, + "ppl": 6.6333, + "step": 6125 + }, + { + "epoch": 0.04, + "global_step": 6126, + "learning_rate": 0.00047526711185308845, + "loss": 1.8775, + "loss_base2": 2.7087, + "loss_pixel": 0.256, + "loss_text": 1.6215, + "ppl": 6.5371, + "step": 6126 + }, + { + "epoch": 0.04, + "global_step": 6127, + "learning_rate": 0.00047526293823038396, + "loss": 1.8655, + "loss_base2": 2.6913, + "loss_pixel": 0.2554, + "loss_text": 1.6101, + "ppl": 6.4592, + "step": 6127 + }, + { + "epoch": 0.04, + "global_step": 6128, + "learning_rate": 0.00047525876460767947, + "loss": 1.8741, + "loss_base2": 2.7038, + "loss_pixel": 0.2542, + "loss_text": 1.62, + "ppl": 6.515, + "step": 6128 + }, + { + "epoch": 0.04, + "global_step": 6129, + "learning_rate": 0.000475254590984975, + "loss": 1.8666, + "loss_base2": 2.6929, + "loss_pixel": 0.2528, + "loss_text": 1.6137, + "ppl": 6.4663, + "step": 6129 + }, + { + "epoch": 0.04, + "global_step": 6130, + "learning_rate": 0.0004752504173622705, + "loss": 1.8758, + "loss_base2": 2.7062, + "loss_pixel": 0.2525, + "loss_text": 1.6233, + "ppl": 6.526, + "step": 6130 + }, + { + "epoch": 0.04, + "global_step": 6131, + "learning_rate": 0.00047524624373956593, + "loss": 1.8611, + "loss_base2": 2.685, + "loss_pixel": 0.2521, + "loss_text": 1.609, + "ppl": 6.4308, + "step": 6131 + }, + { + "epoch": 0.04, + "global_step": 6132, + "learning_rate": 0.00047524207011686144, + "loss": 1.8629, + "loss_base2": 2.6876, + "loss_pixel": 0.2504, + "loss_text": 1.6125, + "ppl": 6.4424, + "step": 6132 + }, + { + "epoch": 0.04, + "global_step": 6133, + "learning_rate": 0.00047523789649415695, + "loss": 1.8567, + "loss_base2": 2.6787, + "loss_pixel": 0.2497, + "loss_text": 1.607, + "ppl": 6.4026, + "step": 6133 + }, + { + "epoch": 0.04, + "global_step": 6134, + "learning_rate": 0.00047523372287145246, + "loss": 1.8509, + "loss_base2": 2.6703, + "loss_pixel": 0.2483, + "loss_text": 1.6026, + "ppl": 6.3655, + "step": 6134 + }, + { + "epoch": 0.04, + "global_step": 6135, + "learning_rate": 0.00047522954924874796, + "loss": 1.845, + "loss_base2": 2.6618, + "loss_pixel": 0.2484, + "loss_text": 1.5966, + "ppl": 6.3281, + "step": 6135 + }, + { + "epoch": 0.04, + "global_step": 6136, + "learning_rate": 0.0004752253756260434, + "loss": 1.8503, + "loss_base2": 2.6694, + "loss_pixel": 0.2462, + "loss_text": 1.6041, + "ppl": 6.3617, + "step": 6136 + }, + { + "epoch": 0.04, + "global_step": 6137, + "learning_rate": 0.0004752212020033389, + "loss": 1.835, + "loss_base2": 2.6473, + "loss_pixel": 0.2483, + "loss_text": 1.5868, + "ppl": 6.2651, + "step": 6137 + }, + { + "epoch": 0.04, + "global_step": 6138, + "learning_rate": 0.00047521702838063443, + "loss": 1.8373, + "loss_base2": 2.6507, + "loss_pixel": 0.2511, + "loss_text": 1.5862, + "ppl": 6.2796, + "step": 6138 + }, + { + "epoch": 0.04, + "global_step": 6139, + "learning_rate": 0.00047521285475792994, + "loss": 1.8412, + "loss_base2": 2.6563, + "loss_pixel": 0.2501, + "loss_text": 1.5912, + "ppl": 6.3041, + "step": 6139 + }, + { + "epoch": 0.04, + "global_step": 6140, + "learning_rate": 0.00047520868113522534, + "loss": 1.8185, + "loss_base2": 2.6235, + "loss_pixel": 0.2493, + "loss_text": 1.5692, + "ppl": 6.1626, + "step": 6140 + }, + { + "epoch": 0.04, + "global_step": 6141, + "learning_rate": 0.00047520450751252085, + "loss": 1.5895, + "loss_base2": 2.2932, + "loss_pixel": 0.2491, + "loss_text": 1.3405, + "ppl": 4.9013, + "step": 6141 + }, + { + "epoch": 0.04, + "global_step": 6142, + "learning_rate": 0.00047520033388981635, + "loss": 1.5823, + "loss_base2": 2.2828, + "loss_pixel": 0.2469, + "loss_text": 1.3354, + "ppl": 4.8661, + "step": 6142 + }, + { + "epoch": 0.04, + "global_step": 6143, + "learning_rate": 0.00047519616026711186, + "loss": 1.6142, + "loss_base2": 2.3288, + "loss_pixel": 0.2478, + "loss_text": 1.3664, + "ppl": 5.0239, + "step": 6143 + }, + { + "epoch": 0.04, + "global_step": 6144, + "learning_rate": 0.00047519198664440737, + "loss": 1.5792, + "loss_base2": 2.2783, + "loss_pixel": 0.2459, + "loss_text": 1.3333, + "ppl": 4.8511, + "step": 6144 + }, + { + "epoch": 0.04, + "global_step": 6145, + "learning_rate": 0.0004751878130217028, + "loss": 1.5837, + "loss_base2": 2.2848, + "loss_pixel": 0.2431, + "loss_text": 1.3406, + "ppl": 4.873, + "step": 6145 + }, + { + "epoch": 0.04, + "global_step": 6146, + "learning_rate": 0.00047518363939899833, + "loss": 1.6001, + "loss_base2": 2.3085, + "loss_pixel": 0.2443, + "loss_text": 1.3558, + "ppl": 4.9535, + "step": 6146 + }, + { + "epoch": 0.04, + "global_step": 6147, + "learning_rate": 0.00047517946577629383, + "loss": 1.5681, + "loss_base2": 2.2623, + "loss_pixel": 0.243, + "loss_text": 1.3251, + "ppl": 4.7975, + "step": 6147 + }, + { + "epoch": 0.04, + "global_step": 6148, + "learning_rate": 0.00047517529215358934, + "loss": 1.5765, + "loss_base2": 2.2744, + "loss_pixel": 0.2463, + "loss_text": 1.3301, + "ppl": 4.838, + "step": 6148 + }, + { + "epoch": 0.04, + "global_step": 6149, + "learning_rate": 0.0004751711185308848, + "loss": 1.596, + "loss_base2": 2.3025, + "loss_pixel": 0.2546, + "loss_text": 1.3414, + "ppl": 4.9333, + "step": 6149 + }, + { + "epoch": 0.04, + "global_step": 6150, + "learning_rate": 0.0004751669449081803, + "loss": 1.5898, + "loss_base2": 2.2936, + "loss_pixel": 0.2589, + "loss_text": 1.3309, + "ppl": 4.9028, + "step": 6150 + }, + { + "epoch": 0.04, + "global_step": 6151, + "learning_rate": 0.0004751627712854758, + "loss": 1.5771, + "loss_base2": 2.2753, + "loss_pixel": 0.2571, + "loss_text": 1.32, + "ppl": 4.8409, + "step": 6151 + }, + { + "epoch": 0.04, + "global_step": 6152, + "learning_rate": 0.0004751585976627713, + "loss": 1.5677, + "loss_base2": 2.2617, + "loss_pixel": 0.2512, + "loss_text": 1.3165, + "ppl": 4.7956, + "step": 6152 + }, + { + "epoch": 0.04, + "global_step": 6153, + "learning_rate": 0.0004751544240400668, + "loss": 1.5782, + "loss_base2": 2.2769, + "loss_pixel": 0.2502, + "loss_text": 1.3279, + "ppl": 4.8462, + "step": 6153 + }, + { + "epoch": 0.04, + "global_step": 6154, + "learning_rate": 0.0004751502504173623, + "loss": 1.5804, + "loss_base2": 2.28, + "loss_pixel": 0.2468, + "loss_text": 1.3335, + "ppl": 4.8569, + "step": 6154 + }, + { + "epoch": 0.04, + "global_step": 6155, + "learning_rate": 0.0004751460767946578, + "loss": 1.584, + "loss_base2": 2.2852, + "loss_pixel": 0.2471, + "loss_text": 1.3369, + "ppl": 4.8744, + "step": 6155 + }, + { + "epoch": 0.04, + "global_step": 6156, + "learning_rate": 0.0004751419031719533, + "loss": 1.5826, + "loss_base2": 2.2832, + "loss_pixel": 0.2459, + "loss_text": 1.3368, + "ppl": 4.8676, + "step": 6156 + }, + { + "epoch": 0.04, + "global_step": 6157, + "learning_rate": 0.0004751377295492488, + "loss": 1.6529, + "loss_base2": 2.3846, + "loss_pixel": 0.2417, + "loss_text": 1.4112, + "ppl": 5.2221, + "step": 6157 + }, + { + "epoch": 0.04, + "global_step": 6158, + "learning_rate": 0.0004751335559265442, + "loss": 1.8492, + "loss_base2": 2.6678, + "loss_pixel": 0.2401, + "loss_text": 1.6091, + "ppl": 6.3547, + "step": 6158 + }, + { + "epoch": 0.04, + "global_step": 6159, + "learning_rate": 0.0004751293823038397, + "loss": 1.8474, + "loss_base2": 2.6652, + "loss_pixel": 0.2401, + "loss_text": 1.6073, + "ppl": 6.3433, + "step": 6159 + }, + { + "epoch": 0.04, + "global_step": 6160, + "learning_rate": 0.0004751252086811352, + "loss": 1.8525, + "loss_base2": 2.6726, + "loss_pixel": 0.239, + "loss_text": 1.6134, + "ppl": 6.3757, + "step": 6160 + }, + { + "epoch": 0.04, + "global_step": 6161, + "learning_rate": 0.0004751210350584307, + "loss": 1.8621, + "loss_base2": 2.6864, + "loss_pixel": 0.2403, + "loss_text": 1.6218, + "ppl": 6.4372, + "step": 6161 + }, + { + "epoch": 0.04, + "global_step": 6162, + "learning_rate": 0.00047511686143572623, + "loss": 1.8412, + "loss_base2": 2.6563, + "loss_pixel": 0.236, + "loss_text": 1.6053, + "ppl": 6.3041, + "step": 6162 + }, + { + "epoch": 0.04, + "global_step": 6163, + "learning_rate": 0.0004751126878130217, + "loss": 1.8319, + "loss_base2": 2.6429, + "loss_pixel": 0.2376, + "loss_text": 1.5943, + "ppl": 6.2457, + "step": 6163 + }, + { + "epoch": 0.04, + "global_step": 6164, + "learning_rate": 0.0004751085141903172, + "loss": 1.8065, + "loss_base2": 2.6062, + "loss_pixel": 0.2341, + "loss_text": 1.5724, + "ppl": 6.0891, + "step": 6164 + }, + { + "epoch": 0.04, + "global_step": 6165, + "learning_rate": 0.0004751043405676127, + "loss": 1.8284, + "loss_base2": 2.6378, + "loss_pixel": 0.2355, + "loss_text": 1.5929, + "ppl": 6.2239, + "step": 6165 + }, + { + "epoch": 0.04, + "global_step": 6166, + "learning_rate": 0.0004751001669449082, + "loss": 1.8371, + "loss_base2": 2.6504, + "loss_pixel": 0.2434, + "loss_text": 1.5937, + "ppl": 6.2783, + "step": 6166 + }, + { + "epoch": 0.04, + "global_step": 6167, + "learning_rate": 0.00047509599332220366, + "loss": 1.8401, + "loss_base2": 2.6547, + "loss_pixel": 0.2485, + "loss_text": 1.5917, + "ppl": 6.2972, + "step": 6167 + }, + { + "epoch": 0.04, + "global_step": 6168, + "learning_rate": 0.00047509181969949916, + "loss": 1.8228, + "loss_base2": 2.6297, + "loss_pixel": 0.246, + "loss_text": 1.5768, + "ppl": 6.1892, + "step": 6168 + }, + { + "epoch": 0.04, + "global_step": 6169, + "learning_rate": 0.00047508764607679467, + "loss": 1.8485, + "loss_base2": 2.6668, + "loss_pixel": 0.2441, + "loss_text": 1.6043, + "ppl": 6.3503, + "step": 6169 + }, + { + "epoch": 0.04, + "global_step": 6170, + "learning_rate": 0.0004750834724540902, + "loss": 1.8331, + "loss_base2": 2.6446, + "loss_pixel": 0.2449, + "loss_text": 1.5882, + "ppl": 6.2532, + "step": 6170 + }, + { + "epoch": 0.04, + "global_step": 6171, + "learning_rate": 0.0004750792988313857, + "loss": 1.8359, + "loss_base2": 2.6486, + "loss_pixel": 0.2426, + "loss_text": 1.5934, + "ppl": 6.2708, + "step": 6171 + }, + { + "epoch": 0.04, + "global_step": 6172, + "learning_rate": 0.00047507512520868114, + "loss": 1.8275, + "loss_base2": 2.6365, + "loss_pixel": 0.2441, + "loss_text": 1.5834, + "ppl": 6.2183, + "step": 6172 + }, + { + "epoch": 0.04, + "global_step": 6173, + "learning_rate": 0.00047507095158597665, + "loss": 1.8358, + "loss_base2": 2.6485, + "loss_pixel": 0.2472, + "loss_text": 1.5886, + "ppl": 6.2701, + "step": 6173 + }, + { + "epoch": 0.04, + "global_step": 6174, + "learning_rate": 0.00047506677796327215, + "loss": 1.83, + "loss_base2": 2.6401, + "loss_pixel": 0.2403, + "loss_text": 1.5898, + "ppl": 6.2339, + "step": 6174 + }, + { + "epoch": 0.04, + "global_step": 6175, + "learning_rate": 0.00047506260434056766, + "loss": 1.8324, + "loss_base2": 2.6436, + "loss_pixel": 0.2373, + "loss_text": 1.595, + "ppl": 6.2489, + "step": 6175 + }, + { + "epoch": 0.04, + "global_step": 6176, + "learning_rate": 0.0004750584307178631, + "loss": 1.818, + "loss_base2": 2.6228, + "loss_pixel": 0.2359, + "loss_text": 1.5821, + "ppl": 6.1595, + "step": 6176 + }, + { + "epoch": 0.04, + "global_step": 6177, + "learning_rate": 0.00047505425709515857, + "loss": 1.8341, + "loss_base2": 2.646, + "loss_pixel": 0.2361, + "loss_text": 1.598, + "ppl": 6.2595, + "step": 6177 + }, + { + "epoch": 0.04, + "global_step": 6178, + "learning_rate": 0.0004750500834724541, + "loss": 1.8278, + "loss_base2": 2.637, + "loss_pixel": 0.2326, + "loss_text": 1.5952, + "ppl": 6.2202, + "step": 6178 + }, + { + "epoch": 0.04, + "global_step": 6179, + "learning_rate": 0.0004750459098497496, + "loss": 1.7976, + "loss_base2": 2.5934, + "loss_pixel": 0.2338, + "loss_text": 1.5638, + "ppl": 6.0351, + "step": 6179 + }, + { + "epoch": 0.04, + "global_step": 6180, + "learning_rate": 0.0004750417362270451, + "loss": 1.766, + "loss_base2": 2.5478, + "loss_pixel": 0.2303, + "loss_text": 1.5357, + "ppl": 5.8474, + "step": 6180 + }, + { + "epoch": 0.04, + "global_step": 6181, + "learning_rate": 0.00047503756260434054, + "loss": 1.798, + "loss_base2": 2.594, + "loss_pixel": 0.2298, + "loss_text": 1.5682, + "ppl": 6.0376, + "step": 6181 + }, + { + "epoch": 0.04, + "global_step": 6182, + "learning_rate": 0.00047503338898163605, + "loss": 1.8197, + "loss_base2": 2.6253, + "loss_pixel": 0.2263, + "loss_text": 1.5934, + "ppl": 6.17, + "step": 6182 + }, + { + "epoch": 0.04, + "global_step": 6183, + "learning_rate": 0.00047502921535893156, + "loss": 1.8267, + "loss_base2": 2.6354, + "loss_pixel": 0.2316, + "loss_text": 1.595, + "ppl": 6.2133, + "step": 6183 + }, + { + "epoch": 0.04, + "global_step": 6184, + "learning_rate": 0.00047502504173622706, + "loss": 1.8119, + "loss_base2": 2.614, + "loss_pixel": 0.2393, + "loss_text": 1.5726, + "ppl": 6.1221, + "step": 6184 + }, + { + "epoch": 0.04, + "global_step": 6185, + "learning_rate": 0.00047502086811352257, + "loss": 1.8288, + "loss_base2": 2.6384, + "loss_pixel": 0.2377, + "loss_text": 1.5911, + "ppl": 6.2264, + "step": 6185 + }, + { + "epoch": 0.04, + "global_step": 6186, + "learning_rate": 0.000475016694490818, + "loss": 1.8217, + "loss_base2": 2.6282, + "loss_pixel": 0.2358, + "loss_text": 1.5859, + "ppl": 6.1824, + "step": 6186 + }, + { + "epoch": 0.04, + "global_step": 6187, + "learning_rate": 0.00047501252086811353, + "loss": 1.814, + "loss_base2": 2.617, + "loss_pixel": 0.2319, + "loss_text": 1.5821, + "ppl": 6.1349, + "step": 6187 + }, + { + "epoch": 0.04, + "global_step": 6188, + "learning_rate": 0.00047500834724540904, + "loss": 1.8317, + "loss_base2": 2.6426, + "loss_pixel": 0.2321, + "loss_text": 1.5996, + "ppl": 6.2445, + "step": 6188 + }, + { + "epoch": 0.04, + "global_step": 6189, + "learning_rate": 0.00047500417362270455, + "loss": 1.8049, + "loss_base2": 2.6039, + "loss_pixel": 0.2287, + "loss_text": 1.5762, + "ppl": 6.0794, + "step": 6189 + }, + { + "epoch": 0.04, + "global_step": 6190, + "learning_rate": 0.000475, + "loss": 1.8234, + "loss_base2": 2.6306, + "loss_pixel": 0.2269, + "loss_text": 1.5965, + "ppl": 6.1929, + "step": 6190 + }, + { + "epoch": 0.04, + "global_step": 6191, + "learning_rate": 0.0004749958263772955, + "loss": 1.8085, + "loss_base2": 2.6091, + "loss_pixel": 0.2263, + "loss_text": 1.5823, + "ppl": 6.1013, + "step": 6191 + }, + { + "epoch": 0.04, + "global_step": 6192, + "learning_rate": 0.000474991652754591, + "loss": 1.8053, + "loss_base2": 2.6045, + "loss_pixel": 0.2271, + "loss_text": 1.5782, + "ppl": 6.0818, + "step": 6192 + }, + { + "epoch": 0.04, + "global_step": 6193, + "learning_rate": 0.0004749874791318865, + "loss": 1.7954, + "loss_base2": 2.5902, + "loss_pixel": 0.2257, + "loss_text": 1.5697, + "ppl": 6.0219, + "step": 6193 + }, + { + "epoch": 0.04, + "global_step": 6194, + "learning_rate": 0.00047498330550918203, + "loss": 1.816, + "loss_base2": 2.6199, + "loss_pixel": 0.2255, + "loss_text": 1.5905, + "ppl": 6.1472, + "step": 6194 + }, + { + "epoch": 0.04, + "global_step": 6195, + "learning_rate": 0.0004749791318864775, + "loss": 1.8132, + "loss_base2": 2.6159, + "loss_pixel": 0.2237, + "loss_text": 1.5895, + "ppl": 6.13, + "step": 6195 + }, + { + "epoch": 0.04, + "global_step": 6196, + "learning_rate": 0.00047497495826377293, + "loss": 1.8068, + "loss_base2": 2.6067, + "loss_pixel": 0.2193, + "loss_text": 1.5874, + "ppl": 6.0909, + "step": 6196 + }, + { + "epoch": 0.04, + "global_step": 6197, + "learning_rate": 0.00047497078464106844, + "loss": 1.7993, + "loss_base2": 2.5958, + "loss_pixel": 0.2196, + "loss_text": 1.5797, + "ppl": 6.0454, + "step": 6197 + }, + { + "epoch": 0.04, + "global_step": 6198, + "learning_rate": 0.00047496661101836395, + "loss": 1.7947, + "loss_base2": 2.5892, + "loss_pixel": 0.2198, + "loss_text": 1.5749, + "ppl": 6.0177, + "step": 6198 + }, + { + "epoch": 0.04, + "global_step": 6199, + "learning_rate": 0.0004749624373956594, + "loss": 1.8035, + "loss_base2": 2.6019, + "loss_pixel": 0.2202, + "loss_text": 1.5833, + "ppl": 6.0709, + "step": 6199 + }, + { + "epoch": 0.04, + "global_step": 6200, + "learning_rate": 0.0004749582637729549, + "loss": 1.786, + "loss_base2": 2.5767, + "loss_pixel": 0.2181, + "loss_text": 1.5679, + "ppl": 5.9655, + "step": 6200 + }, + { + "epoch": 0.04, + "global_step": 6201, + "learning_rate": 0.0004749540901502504, + "loss": 1.7782, + "loss_base2": 2.5654, + "loss_pixel": 0.2189, + "loss_text": 1.5593, + "ppl": 5.9192, + "step": 6201 + }, + { + "epoch": 0.04, + "global_step": 6202, + "learning_rate": 0.0004749499165275459, + "loss": 1.5508, + "loss_base2": 2.2373, + "loss_pixel": 0.2168, + "loss_text": 1.3339, + "ppl": 4.7152, + "step": 6202 + }, + { + "epoch": 0.04, + "global_step": 6203, + "learning_rate": 0.00047494574290484143, + "loss": 1.5592, + "loss_base2": 2.2495, + "loss_pixel": 0.2179, + "loss_text": 1.3414, + "ppl": 4.755, + "step": 6203 + }, + { + "epoch": 0.04, + "global_step": 6204, + "learning_rate": 0.0004749415692821369, + "loss": 1.5672, + "loss_base2": 2.261, + "loss_pixel": 0.2249, + "loss_text": 1.3423, + "ppl": 4.7932, + "step": 6204 + }, + { + "epoch": 0.04, + "global_step": 6205, + "learning_rate": 0.0004749373956594324, + "loss": 1.5727, + "loss_base2": 2.2689, + "loss_pixel": 0.23, + "loss_text": 1.3427, + "ppl": 4.8196, + "step": 6205 + }, + { + "epoch": 0.04, + "global_step": 6206, + "learning_rate": 0.0004749332220367279, + "loss": 1.5543, + "loss_base2": 2.2424, + "loss_pixel": 0.2271, + "loss_text": 1.3272, + "ppl": 4.7318, + "step": 6206 + }, + { + "epoch": 0.04, + "global_step": 6207, + "learning_rate": 0.0004749290484140234, + "loss": 1.5523, + "loss_base2": 2.2395, + "loss_pixel": 0.2275, + "loss_text": 1.3248, + "ppl": 4.7223, + "step": 6207 + }, + { + "epoch": 0.04, + "global_step": 6208, + "learning_rate": 0.00047492487479131886, + "loss": 1.5539, + "loss_base2": 2.2418, + "loss_pixel": 0.2257, + "loss_text": 1.3281, + "ppl": 4.7299, + "step": 6208 + }, + { + "epoch": 0.04, + "global_step": 6209, + "learning_rate": 0.00047492070116861437, + "loss": 1.5572, + "loss_base2": 2.2466, + "loss_pixel": 0.2257, + "loss_text": 1.3316, + "ppl": 4.7455, + "step": 6209 + }, + { + "epoch": 0.04, + "global_step": 6210, + "learning_rate": 0.0004749165275459099, + "loss": 1.6153, + "loss_base2": 2.3304, + "loss_pixel": 0.2252, + "loss_text": 1.3901, + "ppl": 5.0294, + "step": 6210 + }, + { + "epoch": 0.04, + "global_step": 6211, + "learning_rate": 0.0004749123539232054, + "loss": 1.811, + "loss_base2": 2.6127, + "loss_pixel": 0.2233, + "loss_text": 1.5878, + "ppl": 6.1166, + "step": 6211 + }, + { + "epoch": 0.04, + "global_step": 6212, + "learning_rate": 0.0004749081803005009, + "loss": 1.8147, + "loss_base2": 2.6181, + "loss_pixel": 0.2225, + "loss_text": 1.5922, + "ppl": 6.1392, + "step": 6212 + }, + { + "epoch": 0.04, + "global_step": 6213, + "learning_rate": 0.00047490400667779634, + "loss": 1.8079, + "loss_base2": 2.6082, + "loss_pixel": 0.2225, + "loss_text": 1.5854, + "ppl": 6.0976, + "step": 6213 + }, + { + "epoch": 0.04, + "global_step": 6214, + "learning_rate": 0.00047489983305509185, + "loss": 1.8027, + "loss_base2": 2.6007, + "loss_pixel": 0.2227, + "loss_text": 1.58, + "ppl": 6.066, + "step": 6214 + }, + { + "epoch": 0.04, + "global_step": 6215, + "learning_rate": 0.0004748956594323873, + "loss": 1.8011, + "loss_base2": 2.5984, + "loss_pixel": 0.22, + "loss_text": 1.5812, + "ppl": 6.0563, + "step": 6215 + }, + { + "epoch": 0.04, + "global_step": 6216, + "learning_rate": 0.0004748914858096828, + "loss": 1.7949, + "loss_base2": 2.5895, + "loss_pixel": 0.2195, + "loss_text": 1.5755, + "ppl": 6.0189, + "step": 6216 + }, + { + "epoch": 0.04, + "global_step": 6217, + "learning_rate": 0.00047488731218697826, + "loss": 1.7889, + "loss_base2": 2.5808, + "loss_pixel": 0.2193, + "loss_text": 1.5696, + "ppl": 5.9829, + "step": 6217 + }, + { + "epoch": 0.04, + "global_step": 6218, + "learning_rate": 0.00047488313856427377, + "loss": 1.8153, + "loss_base2": 2.6189, + "loss_pixel": 0.2201, + "loss_text": 1.5952, + "ppl": 6.1429, + "step": 6218 + }, + { + "epoch": 0.04, + "global_step": 6219, + "learning_rate": 0.0004748789649415693, + "loss": 1.7849, + "loss_base2": 2.5751, + "loss_pixel": 0.2172, + "loss_text": 1.5677, + "ppl": 5.959, + "step": 6219 + }, + { + "epoch": 0.04, + "global_step": 6220, + "learning_rate": 0.0004748747913188648, + "loss": 1.8036, + "loss_base2": 2.602, + "loss_pixel": 0.2179, + "loss_text": 1.5856, + "ppl": 6.0715, + "step": 6220 + }, + { + "epoch": 0.04, + "global_step": 6221, + "learning_rate": 0.0004748706176961603, + "loss": 1.8022, + "loss_base2": 2.6, + "loss_pixel": 0.2165, + "loss_text": 1.5858, + "ppl": 6.063, + "step": 6221 + }, + { + "epoch": 0.04, + "global_step": 6222, + "learning_rate": 0.00047486644407345575, + "loss": 1.7982, + "loss_base2": 2.5943, + "loss_pixel": 0.2166, + "loss_text": 1.5816, + "ppl": 6.0388, + "step": 6222 + }, + { + "epoch": 0.04, + "global_step": 6223, + "learning_rate": 0.00047486227045075125, + "loss": 1.7916, + "loss_base2": 2.5847, + "loss_pixel": 0.2164, + "loss_text": 1.5752, + "ppl": 5.999, + "step": 6223 + }, + { + "epoch": 0.04, + "global_step": 6224, + "learning_rate": 0.00047485809682804676, + "loss": 1.7729, + "loss_base2": 2.5578, + "loss_pixel": 0.2143, + "loss_text": 1.5585, + "ppl": 5.8879, + "step": 6224 + }, + { + "epoch": 0.04, + "global_step": 6225, + "learning_rate": 0.00047485392320534227, + "loss": 1.7903, + "loss_base2": 2.5829, + "loss_pixel": 0.2165, + "loss_text": 1.5738, + "ppl": 5.9912, + "step": 6225 + }, + { + "epoch": 0.04, + "global_step": 6226, + "learning_rate": 0.0004748497495826377, + "loss": 1.8013, + "loss_base2": 2.5987, + "loss_pixel": 0.2223, + "loss_text": 1.5789, + "ppl": 6.0575, + "step": 6226 + }, + { + "epoch": 0.04, + "global_step": 6227, + "learning_rate": 0.00047484557595993323, + "loss": 1.7818, + "loss_base2": 2.5706, + "loss_pixel": 0.226, + "loss_text": 1.5558, + "ppl": 5.9405, + "step": 6227 + }, + { + "epoch": 0.04, + "global_step": 6228, + "learning_rate": 0.00047484140233722874, + "loss": 1.7895, + "loss_base2": 2.5817, + "loss_pixel": 0.2189, + "loss_text": 1.5706, + "ppl": 5.9865, + "step": 6228 + }, + { + "epoch": 0.04, + "global_step": 6229, + "learning_rate": 0.00047483722871452424, + "loss": 1.8046, + "loss_base2": 2.6035, + "loss_pixel": 0.2237, + "loss_text": 1.5809, + "ppl": 6.0775, + "step": 6229 + }, + { + "epoch": 0.04, + "global_step": 6230, + "learning_rate": 0.00047483305509181975, + "loss": 1.7888, + "loss_base2": 2.5807, + "loss_pixel": 0.2218, + "loss_text": 1.567, + "ppl": 5.9823, + "step": 6230 + }, + { + "epoch": 0.04, + "global_step": 6231, + "learning_rate": 0.0004748288814691152, + "loss": 1.7945, + "loss_base2": 2.5889, + "loss_pixel": 0.2181, + "loss_text": 1.5764, + "ppl": 6.0165, + "step": 6231 + }, + { + "epoch": 0.04, + "global_step": 6232, + "learning_rate": 0.0004748247078464107, + "loss": 1.6708, + "loss_base2": 2.4105, + "loss_pixel": 0.217, + "loss_text": 1.4538, + "ppl": 5.3164, + "step": 6232 + }, + { + "epoch": 0.04, + "global_step": 6233, + "learning_rate": 0.0004748205342237062, + "loss": 1.5809, + "loss_base2": 2.2808, + "loss_pixel": 0.2186, + "loss_text": 1.3623, + "ppl": 4.8593, + "step": 6233 + }, + { + "epoch": 0.04, + "global_step": 6234, + "learning_rate": 0.00047481636060100167, + "loss": 1.5499, + "loss_base2": 2.236, + "loss_pixel": 0.2175, + "loss_text": 1.3324, + "ppl": 4.711, + "step": 6234 + }, + { + "epoch": 0.04, + "global_step": 6235, + "learning_rate": 0.0004748121869782971, + "loss": 1.5424, + "loss_base2": 2.2252, + "loss_pixel": 0.2153, + "loss_text": 1.327, + "ppl": 4.6758, + "step": 6235 + }, + { + "epoch": 0.04, + "global_step": 6236, + "learning_rate": 0.00047480801335559263, + "loss": 1.5349, + "loss_base2": 2.2144, + "loss_pixel": 0.215, + "loss_text": 1.3198, + "ppl": 4.6409, + "step": 6236 + }, + { + "epoch": 0.04, + "global_step": 6237, + "learning_rate": 0.00047480383973288814, + "loss": 1.5442, + "loss_base2": 2.2278, + "loss_pixel": 0.2144, + "loss_text": 1.3298, + "ppl": 4.6842, + "step": 6237 + }, + { + "epoch": 0.04, + "global_step": 6238, + "learning_rate": 0.00047479966611018365, + "loss": 1.5345, + "loss_base2": 2.2138, + "loss_pixel": 0.2148, + "loss_text": 1.3197, + "ppl": 4.639, + "step": 6238 + }, + { + "epoch": 0.04, + "global_step": 6239, + "learning_rate": 0.00047479549248747915, + "loss": 1.5295, + "loss_base2": 2.2066, + "loss_pixel": 0.2129, + "loss_text": 1.3166, + "ppl": 4.6159, + "step": 6239 + }, + { + "epoch": 0.04, + "global_step": 6240, + "learning_rate": 0.0004747913188647746, + "loss": 1.5505, + "loss_base2": 2.2369, + "loss_pixel": 0.2129, + "loss_text": 1.3375, + "ppl": 4.7138, + "step": 6240 + }, + { + "epoch": 0.04, + "global_step": 6241, + "learning_rate": 0.0004747871452420701, + "loss": 1.6721, + "loss_base2": 2.4123, + "loss_pixel": 0.2118, + "loss_text": 1.4602, + "ppl": 5.3233, + "step": 6241 + }, + { + "epoch": 0.04, + "global_step": 6242, + "learning_rate": 0.0004747829716193656, + "loss": 1.7959, + "loss_base2": 2.5909, + "loss_pixel": 0.213, + "loss_text": 1.5829, + "ppl": 6.0249, + "step": 6242 + }, + { + "epoch": 0.04, + "global_step": 6243, + "learning_rate": 0.00047477879799666113, + "loss": 1.7978, + "loss_base2": 2.5937, + "loss_pixel": 0.2118, + "loss_text": 1.586, + "ppl": 6.0364, + "step": 6243 + }, + { + "epoch": 0.04, + "global_step": 6244, + "learning_rate": 0.00047477462437395664, + "loss": 1.7955, + "loss_base2": 2.5904, + "loss_pixel": 0.2112, + "loss_text": 1.5843, + "ppl": 6.0225, + "step": 6244 + }, + { + "epoch": 0.04, + "global_step": 6245, + "learning_rate": 0.0004747704507512521, + "loss": 1.7825, + "loss_base2": 2.5716, + "loss_pixel": 0.2095, + "loss_text": 1.573, + "ppl": 5.9447, + "step": 6245 + }, + { + "epoch": 0.04, + "global_step": 6246, + "learning_rate": 0.0004747662771285476, + "loss": 1.7769, + "loss_base2": 2.5635, + "loss_pixel": 0.2129, + "loss_text": 1.5641, + "ppl": 5.9115, + "step": 6246 + }, + { + "epoch": 0.04, + "global_step": 6247, + "learning_rate": 0.0004747621035058431, + "loss": 1.7865, + "loss_base2": 2.5774, + "loss_pixel": 0.2095, + "loss_text": 1.577, + "ppl": 5.9685, + "step": 6247 + }, + { + "epoch": 0.04, + "global_step": 6248, + "learning_rate": 0.0004747579298831386, + "loss": 1.7706, + "loss_base2": 2.5544, + "loss_pixel": 0.2098, + "loss_text": 1.5608, + "ppl": 5.8744, + "step": 6248 + }, + { + "epoch": 0.04, + "global_step": 6249, + "learning_rate": 0.00047475375626043406, + "loss": 1.7764, + "loss_base2": 2.5628, + "loss_pixel": 0.2096, + "loss_text": 1.5668, + "ppl": 5.9085, + "step": 6249 + }, + { + "epoch": 0.04, + "global_step": 6250, + "learning_rate": 0.00047474958263772957, + "loss": 1.7817, + "loss_base2": 2.5704, + "loss_pixel": 0.2077, + "loss_text": 1.574, + "ppl": 5.9399, + "step": 6250 + }, + { + "epoch": 0.04, + "global_step": 6251, + "learning_rate": 0.0004747454090150251, + "loss": 1.7888, + "loss_base2": 2.5807, + "loss_pixel": 0.2083, + "loss_text": 1.5805, + "ppl": 5.9823, + "step": 6251 + }, + { + "epoch": 0.04, + "global_step": 6252, + "learning_rate": 0.0004747412353923206, + "loss": 1.7788, + "loss_base2": 2.5663, + "loss_pixel": 0.207, + "loss_text": 1.5717, + "ppl": 5.9227, + "step": 6252 + }, + { + "epoch": 0.04, + "global_step": 6253, + "learning_rate": 0.00047473706176961604, + "loss": 1.7762, + "loss_base2": 2.5625, + "loss_pixel": 0.2078, + "loss_text": 1.5684, + "ppl": 5.9074, + "step": 6253 + }, + { + "epoch": 0.04, + "global_step": 6254, + "learning_rate": 0.0004747328881469115, + "loss": 1.7764, + "loss_base2": 2.5628, + "loss_pixel": 0.2076, + "loss_text": 1.5688, + "ppl": 5.9085, + "step": 6254 + }, + { + "epoch": 0.04, + "global_step": 6255, + "learning_rate": 0.000474728714524207, + "loss": 1.7857, + "loss_base2": 2.5762, + "loss_pixel": 0.2064, + "loss_text": 1.5793, + "ppl": 5.9638, + "step": 6255 + }, + { + "epoch": 0.04, + "global_step": 6256, + "learning_rate": 0.0004747245409015025, + "loss": 1.7571, + "loss_base2": 2.535, + "loss_pixel": 0.205, + "loss_text": 1.5521, + "ppl": 5.7956, + "step": 6256 + }, + { + "epoch": 0.04, + "global_step": 6257, + "learning_rate": 0.000474720367278798, + "loss": 1.7705, + "loss_base2": 2.5543, + "loss_pixel": 0.2059, + "loss_text": 1.5645, + "ppl": 5.8738, + "step": 6257 + }, + { + "epoch": 0.04, + "global_step": 6258, + "learning_rate": 0.00047471619365609347, + "loss": 1.7711, + "loss_base2": 2.5552, + "loss_pixel": 0.2051, + "loss_text": 1.566, + "ppl": 5.8773, + "step": 6258 + }, + { + "epoch": 0.04, + "global_step": 6259, + "learning_rate": 0.000474712020033389, + "loss": 1.7476, + "loss_base2": 2.5213, + "loss_pixel": 0.206, + "loss_text": 1.5416, + "ppl": 5.7408, + "step": 6259 + }, + { + "epoch": 0.04, + "global_step": 6260, + "learning_rate": 0.0004747078464106845, + "loss": 1.772, + "loss_base2": 2.5565, + "loss_pixel": 0.2035, + "loss_text": 1.5685, + "ppl": 5.8826, + "step": 6260 + }, + { + "epoch": 0.04, + "global_step": 6261, + "learning_rate": 0.00047470367278798, + "loss": 1.744, + "loss_base2": 2.5161, + "loss_pixel": 0.2045, + "loss_text": 1.5396, + "ppl": 5.7202, + "step": 6261 + }, + { + "epoch": 0.04, + "global_step": 6262, + "learning_rate": 0.0004746994991652755, + "loss": 1.7698, + "loss_base2": 2.5533, + "loss_pixel": 0.2044, + "loss_text": 1.5653, + "ppl": 5.8697, + "step": 6262 + }, + { + "epoch": 0.04, + "global_step": 6263, + "learning_rate": 0.00047469532554257095, + "loss": 1.7642, + "loss_base2": 2.5452, + "loss_pixel": 0.2047, + "loss_text": 1.5595, + "ppl": 5.8369, + "step": 6263 + }, + { + "epoch": 0.04, + "global_step": 6264, + "learning_rate": 0.00047469115191986646, + "loss": 1.7585, + "loss_base2": 2.537, + "loss_pixel": 0.2033, + "loss_text": 1.5553, + "ppl": 5.8037, + "step": 6264 + }, + { + "epoch": 0.04, + "global_step": 6265, + "learning_rate": 0.00047468697829716196, + "loss": 1.7256, + "loss_base2": 2.4895, + "loss_pixel": 0.2028, + "loss_text": 1.5228, + "ppl": 5.6159, + "step": 6265 + }, + { + "epoch": 0.04, + "global_step": 6266, + "learning_rate": 0.00047468280467445747, + "loss": 1.5327, + "loss_base2": 2.2112, + "loss_pixel": 0.2022, + "loss_text": 1.3305, + "ppl": 4.6307, + "step": 6266 + }, + { + "epoch": 0.04, + "global_step": 6267, + "learning_rate": 0.0004746786310517529, + "loss": 1.5172, + "loss_base2": 2.1889, + "loss_pixel": 0.2029, + "loss_text": 1.3143, + "ppl": 4.5594, + "step": 6267 + }, + { + "epoch": 0.04, + "global_step": 6268, + "learning_rate": 0.00047467445742904843, + "loss": 1.548, + "loss_base2": 2.2333, + "loss_pixel": 0.2028, + "loss_text": 1.3451, + "ppl": 4.7021, + "step": 6268 + }, + { + "epoch": 0.04, + "global_step": 6269, + "learning_rate": 0.00047467028380634394, + "loss": 1.5163, + "loss_base2": 2.1876, + "loss_pixel": 0.2019, + "loss_text": 1.3144, + "ppl": 4.5553, + "step": 6269 + }, + { + "epoch": 0.04, + "global_step": 6270, + "learning_rate": 0.00047466611018363945, + "loss": 1.5251, + "loss_base2": 2.2003, + "loss_pixel": 0.2019, + "loss_text": 1.3232, + "ppl": 4.5956, + "step": 6270 + }, + { + "epoch": 0.04, + "global_step": 6271, + "learning_rate": 0.0004746619365609349, + "loss": 1.5293, + "loss_base2": 2.2063, + "loss_pixel": 0.2021, + "loss_text": 1.3272, + "ppl": 4.6149, + "step": 6271 + }, + { + "epoch": 0.04, + "global_step": 6272, + "learning_rate": 0.00047465776293823035, + "loss": 1.5143, + "loss_base2": 2.1847, + "loss_pixel": 0.2013, + "loss_text": 1.313, + "ppl": 4.5462, + "step": 6272 + }, + { + "epoch": 0.04, + "global_step": 6273, + "learning_rate": 0.00047465358931552586, + "loss": 1.5105, + "loss_base2": 2.1792, + "loss_pixel": 0.2019, + "loss_text": 1.3086, + "ppl": 4.529, + "step": 6273 + }, + { + "epoch": 0.04, + "global_step": 6274, + "learning_rate": 0.00047464941569282137, + "loss": 1.6293, + "loss_base2": 2.3506, + "loss_pixel": 0.201, + "loss_text": 1.4282, + "ppl": 5.1003, + "step": 6274 + }, + { + "epoch": 0.04, + "global_step": 6275, + "learning_rate": 0.0004746452420701169, + "loss": 1.5911, + "loss_base2": 2.2955, + "loss_pixel": 0.2016, + "loss_text": 1.3895, + "ppl": 4.9091, + "step": 6275 + }, + { + "epoch": 0.04, + "global_step": 6276, + "learning_rate": 0.00047464106844741233, + "loss": 1.5466, + "loss_base2": 2.2313, + "loss_pixel": 0.2005, + "loss_text": 1.3462, + "ppl": 4.6955, + "step": 6276 + }, + { + "epoch": 0.04, + "global_step": 6277, + "learning_rate": 0.00047463689482470783, + "loss": 1.526, + "loss_base2": 2.2016, + "loss_pixel": 0.2003, + "loss_text": 1.3257, + "ppl": 4.5997, + "step": 6277 + }, + { + "epoch": 0.04, + "global_step": 6278, + "learning_rate": 0.00047463272120200334, + "loss": 1.5402, + "loss_base2": 2.222, + "loss_pixel": 0.2001, + "loss_text": 1.3401, + "ppl": 4.6655, + "step": 6278 + }, + { + "epoch": 0.04, + "global_step": 6279, + "learning_rate": 0.00047462854757929885, + "loss": 1.5114, + "loss_base2": 2.1805, + "loss_pixel": 0.2005, + "loss_text": 1.3109, + "ppl": 4.5331, + "step": 6279 + }, + { + "epoch": 0.04, + "global_step": 6280, + "learning_rate": 0.00047462437395659436, + "loss": 1.5402, + "loss_base2": 2.222, + "loss_pixel": 0.2005, + "loss_text": 1.3397, + "ppl": 4.6655, + "step": 6280 + }, + { + "epoch": 0.04, + "global_step": 6281, + "learning_rate": 0.0004746202003338898, + "loss": 1.51, + "loss_base2": 2.1785, + "loss_pixel": 0.2001, + "loss_text": 1.3099, + "ppl": 4.5267, + "step": 6281 + }, + { + "epoch": 0.04, + "global_step": 6282, + "learning_rate": 0.0004746160267111853, + "loss": 1.5047, + "loss_base2": 2.1708, + "loss_pixel": 0.1992, + "loss_text": 1.3055, + "ppl": 4.5028, + "step": 6282 + }, + { + "epoch": 0.04, + "global_step": 6283, + "learning_rate": 0.0004746118530884808, + "loss": 1.4875, + "loss_base2": 2.146, + "loss_pixel": 0.2004, + "loss_text": 1.2871, + "ppl": 4.426, + "step": 6283 + }, + { + "epoch": 0.04, + "global_step": 6284, + "learning_rate": 0.00047460767946577633, + "loss": 1.5064, + "loss_base2": 2.1733, + "loss_pixel": 0.1995, + "loss_text": 1.3068, + "ppl": 4.5105, + "step": 6284 + }, + { + "epoch": 0.04, + "global_step": 6285, + "learning_rate": 0.0004746035058430718, + "loss": 1.5203, + "loss_base2": 2.1933, + "loss_pixel": 0.1992, + "loss_text": 1.3211, + "ppl": 4.5736, + "step": 6285 + }, + { + "epoch": 0.04, + "global_step": 6286, + "learning_rate": 0.0004745993322203673, + "loss": 1.5029, + "loss_base2": 2.1682, + "loss_pixel": 0.2003, + "loss_text": 1.3026, + "ppl": 4.4947, + "step": 6286 + }, + { + "epoch": 0.04, + "global_step": 6287, + "learning_rate": 0.0004745951585976628, + "loss": 1.5283, + "loss_base2": 2.2049, + "loss_pixel": 0.1994, + "loss_text": 1.3289, + "ppl": 4.6103, + "step": 6287 + }, + { + "epoch": 0.04, + "global_step": 6288, + "learning_rate": 0.0004745909849749583, + "loss": 1.4976, + "loss_base2": 2.1606, + "loss_pixel": 0.1986, + "loss_text": 1.299, + "ppl": 4.4709, + "step": 6288 + }, + { + "epoch": 0.04, + "global_step": 6289, + "learning_rate": 0.0004745868113522538, + "loss": 1.5153, + "loss_base2": 2.1861, + "loss_pixel": 0.1978, + "loss_text": 1.3174, + "ppl": 4.5508, + "step": 6289 + }, + { + "epoch": 0.04, + "global_step": 6290, + "learning_rate": 0.0004745826377295492, + "loss": 1.5117, + "loss_base2": 2.1809, + "loss_pixel": 0.1988, + "loss_text": 1.3129, + "ppl": 4.5344, + "step": 6290 + }, + { + "epoch": 0.04, + "global_step": 6291, + "learning_rate": 0.0004745784641068447, + "loss": 1.5185, + "loss_base2": 2.1907, + "loss_pixel": 0.1978, + "loss_text": 1.3207, + "ppl": 4.5654, + "step": 6291 + }, + { + "epoch": 0.04, + "global_step": 6292, + "learning_rate": 0.00047457429048414023, + "loss": 1.5111, + "loss_base2": 2.1801, + "loss_pixel": 0.1987, + "loss_text": 1.3125, + "ppl": 4.5317, + "step": 6292 + }, + { + "epoch": 0.04, + "global_step": 6293, + "learning_rate": 0.00047457011686143573, + "loss": 1.7665, + "loss_base2": 2.5485, + "loss_pixel": 0.1985, + "loss_text": 1.568, + "ppl": 5.8503, + "step": 6293 + }, + { + "epoch": 0.04, + "global_step": 6294, + "learning_rate": 0.0004745659432387312, + "loss": 1.7761, + "loss_base2": 2.5624, + "loss_pixel": 0.1974, + "loss_text": 1.5787, + "ppl": 5.9068, + "step": 6294 + }, + { + "epoch": 0.04, + "global_step": 6295, + "learning_rate": 0.0004745617696160267, + "loss": 1.782, + "loss_base2": 2.5709, + "loss_pixel": 0.1982, + "loss_text": 1.5838, + "ppl": 5.9417, + "step": 6295 + }, + { + "epoch": 0.04, + "global_step": 6296, + "learning_rate": 0.0004745575959933222, + "loss": 1.7631, + "loss_base2": 2.5436, + "loss_pixel": 0.1982, + "loss_text": 1.565, + "ppl": 5.8305, + "step": 6296 + }, + { + "epoch": 0.04, + "global_step": 6297, + "learning_rate": 0.0004745534223706177, + "loss": 1.769, + "loss_base2": 2.5521, + "loss_pixel": 0.197, + "loss_text": 1.572, + "ppl": 5.865, + "step": 6297 + }, + { + "epoch": 0.04, + "global_step": 6298, + "learning_rate": 0.0004745492487479132, + "loss": 1.7572, + "loss_base2": 2.5351, + "loss_pixel": 0.1986, + "loss_text": 1.5586, + "ppl": 5.7962, + "step": 6298 + }, + { + "epoch": 0.04, + "global_step": 6299, + "learning_rate": 0.00047454507512520867, + "loss": 1.7652, + "loss_base2": 2.5466, + "loss_pixel": 0.1959, + "loss_text": 1.5692, + "ppl": 5.8427, + "step": 6299 + }, + { + "epoch": 0.04, + "global_step": 6300, + "learning_rate": 0.0004745409015025042, + "loss": 1.7645, + "loss_base2": 2.5456, + "loss_pixel": 0.1972, + "loss_text": 1.5673, + "ppl": 5.8387, + "step": 6300 + }, + { + "epoch": 0.04, + "global_step": 6301, + "learning_rate": 0.0004745367278797997, + "loss": 1.7698, + "loss_base2": 2.5533, + "loss_pixel": 0.196, + "loss_text": 1.5737, + "ppl": 5.8697, + "step": 6301 + }, + { + "epoch": 0.04, + "global_step": 6302, + "learning_rate": 0.0004745325542570952, + "loss": 1.7529, + "loss_base2": 2.5289, + "loss_pixel": 0.1965, + "loss_text": 1.5564, + "ppl": 5.7713, + "step": 6302 + }, + { + "epoch": 0.04, + "global_step": 6303, + "learning_rate": 0.0004745283806343907, + "loss": 1.7353, + "loss_base2": 2.5035, + "loss_pixel": 0.1978, + "loss_text": 1.5375, + "ppl": 5.6706, + "step": 6303 + }, + { + "epoch": 0.04, + "global_step": 6304, + "learning_rate": 0.00047452420701168615, + "loss": 1.7545, + "loss_base2": 2.5312, + "loss_pixel": 0.1953, + "loss_text": 1.5592, + "ppl": 5.7806, + "step": 6304 + }, + { + "epoch": 0.04, + "global_step": 6305, + "learning_rate": 0.00047452003338898166, + "loss": 1.7628, + "loss_base2": 2.5432, + "loss_pixel": 0.1966, + "loss_text": 1.5663, + "ppl": 5.8287, + "step": 6305 + }, + { + "epoch": 0.04, + "global_step": 6306, + "learning_rate": 0.00047451585976627717, + "loss": 1.7456, + "loss_base2": 2.5184, + "loss_pixel": 0.1965, + "loss_text": 1.5491, + "ppl": 5.7293, + "step": 6306 + }, + { + "epoch": 0.04, + "global_step": 6307, + "learning_rate": 0.0004745116861435727, + "loss": 1.7617, + "loss_base2": 2.5416, + "loss_pixel": 0.1985, + "loss_text": 1.5632, + "ppl": 5.8223, + "step": 6307 + }, + { + "epoch": 0.04, + "global_step": 6308, + "learning_rate": 0.00047450751252086813, + "loss": 1.7587, + "loss_base2": 2.5373, + "loss_pixel": 0.1952, + "loss_text": 1.5636, + "ppl": 5.8049, + "step": 6308 + }, + { + "epoch": 0.04, + "global_step": 6309, + "learning_rate": 0.0004745033388981636, + "loss": 1.7271, + "loss_base2": 2.4917, + "loss_pixel": 0.1968, + "loss_text": 1.5303, + "ppl": 5.6243, + "step": 6309 + }, + { + "epoch": 0.04, + "global_step": 6310, + "learning_rate": 0.0004744991652754591, + "loss": 1.7524, + "loss_base2": 2.5282, + "loss_pixel": 0.1965, + "loss_text": 1.5559, + "ppl": 5.7684, + "step": 6310 + }, + { + "epoch": 0.04, + "global_step": 6311, + "learning_rate": 0.0004744949916527546, + "loss": 1.7388, + "loss_base2": 2.5086, + "loss_pixel": 0.1941, + "loss_text": 1.5447, + "ppl": 5.6905, + "step": 6311 + }, + { + "epoch": 0.04, + "global_step": 6312, + "learning_rate": 0.0004744908180300501, + "loss": 1.7574, + "loss_base2": 2.5354, + "loss_pixel": 0.1964, + "loss_text": 1.561, + "ppl": 5.7973, + "step": 6312 + }, + { + "epoch": 0.04, + "global_step": 6313, + "learning_rate": 0.00047448664440734556, + "loss": 1.7509, + "loss_base2": 2.526, + "loss_pixel": 0.1951, + "loss_text": 1.5558, + "ppl": 5.7598, + "step": 6313 + }, + { + "epoch": 0.04, + "global_step": 6314, + "learning_rate": 0.00047448247078464106, + "loss": 1.7514, + "loss_base2": 2.5267, + "loss_pixel": 0.1954, + "loss_text": 1.556, + "ppl": 5.7627, + "step": 6314 + }, + { + "epoch": 0.04, + "global_step": 6315, + "learning_rate": 0.00047447829716193657, + "loss": 1.751, + "loss_base2": 2.5262, + "loss_pixel": 0.1933, + "loss_text": 1.5577, + "ppl": 5.7604, + "step": 6315 + }, + { + "epoch": 0.04, + "global_step": 6316, + "learning_rate": 0.0004744741235392321, + "loss": 1.7354, + "loss_base2": 2.5037, + "loss_pixel": 0.1932, + "loss_text": 1.5423, + "ppl": 5.6712, + "step": 6316 + }, + { + "epoch": 0.04, + "global_step": 6317, + "learning_rate": 0.00047446994991652753, + "loss": 1.7284, + "loss_base2": 2.4936, + "loss_pixel": 0.1928, + "loss_text": 1.5356, + "ppl": 5.6316, + "step": 6317 + }, + { + "epoch": 0.04, + "global_step": 6318, + "learning_rate": 0.00047446577629382304, + "loss": 1.5125, + "loss_base2": 2.1821, + "loss_pixel": 0.1944, + "loss_text": 1.3181, + "ppl": 4.5381, + "step": 6318 + }, + { + "epoch": 0.04, + "global_step": 6319, + "learning_rate": 0.00047446160267111855, + "loss": 1.5149, + "loss_base2": 2.1855, + "loss_pixel": 0.1958, + "loss_text": 1.3191, + "ppl": 4.549, + "step": 6319 + }, + { + "epoch": 0.04, + "global_step": 6320, + "learning_rate": 0.00047445742904841405, + "loss": 1.5223, + "loss_base2": 2.1962, + "loss_pixel": 0.1951, + "loss_text": 1.3272, + "ppl": 4.5828, + "step": 6320 + }, + { + "epoch": 0.04, + "global_step": 6321, + "learning_rate": 0.00047445325542570956, + "loss": 1.5164, + "loss_base2": 2.1877, + "loss_pixel": 0.1951, + "loss_text": 1.3213, + "ppl": 4.5558, + "step": 6321 + }, + { + "epoch": 0.04, + "global_step": 6322, + "learning_rate": 0.000474449081803005, + "loss": 1.5186, + "loss_base2": 2.1909, + "loss_pixel": 0.1941, + "loss_text": 1.3245, + "ppl": 4.5658, + "step": 6322 + }, + { + "epoch": 0.04, + "global_step": 6323, + "learning_rate": 0.0004744449081803005, + "loss": 1.5148, + "loss_base2": 2.1854, + "loss_pixel": 0.1943, + "loss_text": 1.3205, + "ppl": 4.5485, + "step": 6323 + }, + { + "epoch": 0.04, + "global_step": 6324, + "learning_rate": 0.00047444073455759603, + "loss": 1.492, + "loss_base2": 2.1525, + "loss_pixel": 0.1961, + "loss_text": 1.2958, + "ppl": 4.446, + "step": 6324 + }, + { + "epoch": 0.04, + "global_step": 6325, + "learning_rate": 0.00047443656093489154, + "loss": 1.517, + "loss_base2": 2.1886, + "loss_pixel": 0.1944, + "loss_text": 1.3226, + "ppl": 4.5585, + "step": 6325 + }, + { + "epoch": 0.04, + "global_step": 6326, + "learning_rate": 0.000474432387312187, + "loss": 1.4775, + "loss_base2": 2.1316, + "loss_pixel": 0.1941, + "loss_text": 1.2835, + "ppl": 4.382, + "step": 6326 + }, + { + "epoch": 0.04, + "global_step": 6327, + "learning_rate": 0.00047442821368948244, + "loss": 1.5151, + "loss_base2": 2.1858, + "loss_pixel": 0.1956, + "loss_text": 1.3194, + "ppl": 4.5499, + "step": 6327 + }, + { + "epoch": 0.04, + "global_step": 6328, + "learning_rate": 0.00047442404006677795, + "loss": 1.4847, + "loss_base2": 2.142, + "loss_pixel": 0.1941, + "loss_text": 1.2906, + "ppl": 4.4136, + "step": 6328 + }, + { + "epoch": 0.04, + "global_step": 6329, + "learning_rate": 0.00047441986644407346, + "loss": 1.4789, + "loss_base2": 2.1336, + "loss_pixel": 0.1947, + "loss_text": 1.2842, + "ppl": 4.3881, + "step": 6329 + }, + { + "epoch": 0.04, + "global_step": 6330, + "learning_rate": 0.00047441569282136896, + "loss": 1.5, + "loss_base2": 2.164, + "loss_pixel": 0.1966, + "loss_text": 1.3034, + "ppl": 4.4817, + "step": 6330 + }, + { + "epoch": 0.04, + "global_step": 6331, + "learning_rate": 0.0004744115191986644, + "loss": 1.524, + "loss_base2": 2.1987, + "loss_pixel": 0.1941, + "loss_text": 1.3299, + "ppl": 4.5906, + "step": 6331 + }, + { + "epoch": 0.04, + "global_step": 6332, + "learning_rate": 0.0004744073455759599, + "loss": 1.4831, + "loss_base2": 2.1397, + "loss_pixel": 0.1954, + "loss_text": 1.2877, + "ppl": 4.4066, + "step": 6332 + }, + { + "epoch": 0.04, + "global_step": 6333, + "learning_rate": 0.00047440317195325543, + "loss": 1.4948, + "loss_base2": 2.1565, + "loss_pixel": 0.1942, + "loss_text": 1.3006, + "ppl": 4.4584, + "step": 6333 + }, + { + "epoch": 0.04, + "global_step": 6334, + "learning_rate": 0.00047439899833055094, + "loss": 1.4942, + "loss_base2": 2.1557, + "loss_pixel": 0.1937, + "loss_text": 1.3005, + "ppl": 4.4558, + "step": 6334 + }, + { + "epoch": 0.04, + "global_step": 6335, + "learning_rate": 0.0004743948247078464, + "loss": 1.6288, + "loss_base2": 2.3499, + "loss_pixel": 0.1942, + "loss_text": 1.4345, + "ppl": 5.0978, + "step": 6335 + }, + { + "epoch": 0.04, + "global_step": 6336, + "learning_rate": 0.0004743906510851419, + "loss": 1.7676, + "loss_base2": 2.5501, + "loss_pixel": 0.1942, + "loss_text": 1.5734, + "ppl": 5.8568, + "step": 6336 + }, + { + "epoch": 0.04, + "global_step": 6337, + "learning_rate": 0.0004743864774624374, + "loss": 1.7484, + "loss_base2": 2.5224, + "loss_pixel": 0.1936, + "loss_text": 1.5547, + "ppl": 5.7454, + "step": 6337 + }, + { + "epoch": 0.04, + "global_step": 6338, + "learning_rate": 0.0004743823038397329, + "loss": 1.7386, + "loss_base2": 2.5083, + "loss_pixel": 0.1924, + "loss_text": 1.5463, + "ppl": 5.6894, + "step": 6338 + }, + { + "epoch": 0.04, + "global_step": 6339, + "learning_rate": 0.0004743781302170284, + "loss": 1.7526, + "loss_base2": 2.5285, + "loss_pixel": 0.1938, + "loss_text": 1.5589, + "ppl": 5.7696, + "step": 6339 + }, + { + "epoch": 0.04, + "global_step": 6340, + "learning_rate": 0.0004743739565943239, + "loss": 1.7522, + "loss_base2": 2.5279, + "loss_pixel": 0.194, + "loss_text": 1.5582, + "ppl": 5.7673, + "step": 6340 + }, + { + "epoch": 0.04, + "global_step": 6341, + "learning_rate": 0.0004743697829716194, + "loss": 1.753, + "loss_base2": 2.529, + "loss_pixel": 0.194, + "loss_text": 1.5591, + "ppl": 5.7719, + "step": 6341 + }, + { + "epoch": 0.04, + "global_step": 6342, + "learning_rate": 0.0004743656093489149, + "loss": 1.749, + "loss_base2": 2.5233, + "loss_pixel": 0.1915, + "loss_text": 1.5575, + "ppl": 5.7489, + "step": 6342 + }, + { + "epoch": 0.04, + "global_step": 6343, + "learning_rate": 0.0004743614357262104, + "loss": 1.7525, + "loss_base2": 2.5283, + "loss_pixel": 0.1913, + "loss_text": 1.5612, + "ppl": 5.769, + "step": 6343 + }, + { + "epoch": 0.04, + "global_step": 6344, + "learning_rate": 0.00047435726210350585, + "loss": 1.7497, + "loss_base2": 2.5243, + "loss_pixel": 0.1932, + "loss_text": 1.5565, + "ppl": 5.7529, + "step": 6344 + }, + { + "epoch": 0.04, + "global_step": 6345, + "learning_rate": 0.00047435308848080136, + "loss": 1.7609, + "loss_base2": 2.5404, + "loss_pixel": 0.1933, + "loss_text": 1.5676, + "ppl": 5.8177, + "step": 6345 + }, + { + "epoch": 0.04, + "global_step": 6346, + "learning_rate": 0.0004743489148580968, + "loss": 1.7431, + "loss_base2": 2.5148, + "loss_pixel": 0.193, + "loss_text": 1.5502, + "ppl": 5.715, + "step": 6346 + }, + { + "epoch": 0.04, + "global_step": 6347, + "learning_rate": 0.0004743447412353923, + "loss": 1.7408, + "loss_base2": 2.5114, + "loss_pixel": 0.1933, + "loss_text": 1.5475, + "ppl": 5.7019, + "step": 6347 + }, + { + "epoch": 0.04, + "global_step": 6348, + "learning_rate": 0.0004743405676126878, + "loss": 1.743, + "loss_base2": 2.5146, + "loss_pixel": 0.1924, + "loss_text": 1.5507, + "ppl": 5.7145, + "step": 6348 + }, + { + "epoch": 0.04, + "global_step": 6349, + "learning_rate": 0.0004743363939899833, + "loss": 1.7476, + "loss_base2": 2.5213, + "loss_pixel": 0.192, + "loss_text": 1.5556, + "ppl": 5.7408, + "step": 6349 + }, + { + "epoch": 0.04, + "global_step": 6350, + "learning_rate": 0.0004743322203672788, + "loss": 1.7478, + "loss_base2": 2.5215, + "loss_pixel": 0.1916, + "loss_text": 1.5561, + "ppl": 5.742, + "step": 6350 + }, + { + "epoch": 0.04, + "global_step": 6351, + "learning_rate": 0.0004743280467445743, + "loss": 1.7708, + "loss_base2": 2.5547, + "loss_pixel": 0.1931, + "loss_text": 1.5777, + "ppl": 5.8756, + "step": 6351 + }, + { + "epoch": 0.04, + "global_step": 6352, + "learning_rate": 0.0004743238731218698, + "loss": 1.7513, + "loss_base2": 2.5266, + "loss_pixel": 0.1958, + "loss_text": 1.5555, + "ppl": 5.7621, + "step": 6352 + }, + { + "epoch": 0.04, + "global_step": 6353, + "learning_rate": 0.00047431969949916525, + "loss": 1.7441, + "loss_base2": 2.5162, + "loss_pixel": 0.1956, + "loss_text": 1.5485, + "ppl": 5.7208, + "step": 6353 + }, + { + "epoch": 0.04, + "global_step": 6354, + "learning_rate": 0.00047431552587646076, + "loss": 1.7404, + "loss_base2": 2.5109, + "loss_pixel": 0.1965, + "loss_text": 1.544, + "ppl": 5.6996, + "step": 6354 + }, + { + "epoch": 0.04, + "global_step": 6355, + "learning_rate": 0.00047431135225375627, + "loss": 1.7599, + "loss_base2": 2.539, + "loss_pixel": 0.1933, + "loss_text": 1.5666, + "ppl": 5.8119, + "step": 6355 + }, + { + "epoch": 0.04, + "global_step": 6356, + "learning_rate": 0.0004743071786310518, + "loss": 1.7472, + "loss_base2": 2.5207, + "loss_pixel": 0.194, + "loss_text": 1.5532, + "ppl": 5.7385, + "step": 6356 + }, + { + "epoch": 0.04, + "global_step": 6357, + "learning_rate": 0.0004743030050083473, + "loss": 1.7487, + "loss_base2": 2.5228, + "loss_pixel": 0.1935, + "loss_text": 1.5552, + "ppl": 5.7471, + "step": 6357 + }, + { + "epoch": 0.04, + "global_step": 6358, + "learning_rate": 0.00047429883138564273, + "loss": 1.7194, + "loss_base2": 2.4806, + "loss_pixel": 0.1928, + "loss_text": 1.5266, + "ppl": 5.5812, + "step": 6358 + }, + { + "epoch": 0.04, + "global_step": 6359, + "learning_rate": 0.00047429465776293824, + "loss": 1.7225, + "loss_base2": 2.485, + "loss_pixel": 0.192, + "loss_text": 1.5305, + "ppl": 5.5985, + "step": 6359 + }, + { + "epoch": 0.04, + "global_step": 6360, + "learning_rate": 0.00047429048414023375, + "loss": 1.4963, + "loss_base2": 2.1587, + "loss_pixel": 0.1912, + "loss_text": 1.3051, + "ppl": 4.4651, + "step": 6360 + }, + { + "epoch": 0.04, + "global_step": 6361, + "learning_rate": 0.00047428631051752926, + "loss": 1.4899, + "loss_base2": 2.1495, + "loss_pixel": 0.1924, + "loss_text": 1.2974, + "ppl": 4.4367, + "step": 6361 + }, + { + "epoch": 0.04, + "global_step": 6362, + "learning_rate": 0.00047428213689482476, + "loss": 1.4891, + "loss_base2": 2.1483, + "loss_pixel": 0.1922, + "loss_text": 1.2969, + "ppl": 4.4331, + "step": 6362 + }, + { + "epoch": 0.04, + "global_step": 6363, + "learning_rate": 0.0004742779632721202, + "loss": 1.4935, + "loss_base2": 2.1547, + "loss_pixel": 0.1927, + "loss_text": 1.3007, + "ppl": 4.4527, + "step": 6363 + }, + { + "epoch": 0.04, + "global_step": 6364, + "learning_rate": 0.0004742737896494157, + "loss": 1.5033, + "loss_base2": 2.1688, + "loss_pixel": 0.1913, + "loss_text": 1.3121, + "ppl": 4.4965, + "step": 6364 + }, + { + "epoch": 0.04, + "global_step": 6365, + "learning_rate": 0.0004742696160267112, + "loss": 1.5115, + "loss_base2": 2.1806, + "loss_pixel": 0.1908, + "loss_text": 1.3207, + "ppl": 4.5335, + "step": 6365 + }, + { + "epoch": 0.04, + "global_step": 6366, + "learning_rate": 0.0004742654424040067, + "loss": 1.5178, + "loss_base2": 2.1897, + "loss_pixel": 0.1917, + "loss_text": 1.3261, + "ppl": 4.5622, + "step": 6366 + }, + { + "epoch": 0.04, + "global_step": 6367, + "learning_rate": 0.00047426126878130214, + "loss": 1.6196, + "loss_base2": 2.3366, + "loss_pixel": 0.1914, + "loss_text": 1.4282, + "ppl": 5.0511, + "step": 6367 + }, + { + "epoch": 0.04, + "global_step": 6368, + "learning_rate": 0.00047425709515859765, + "loss": 1.7446, + "loss_base2": 2.5169, + "loss_pixel": 0.1906, + "loss_text": 1.554, + "ppl": 5.7236, + "step": 6368 + }, + { + "epoch": 0.04, + "global_step": 6369, + "learning_rate": 0.00047425292153589315, + "loss": 1.7494, + "loss_base2": 2.5239, + "loss_pixel": 0.1916, + "loss_text": 1.5579, + "ppl": 5.7512, + "step": 6369 + }, + { + "epoch": 0.04, + "global_step": 6370, + "learning_rate": 0.00047424874791318866, + "loss": 1.7482, + "loss_base2": 2.5221, + "loss_pixel": 0.1906, + "loss_text": 1.5576, + "ppl": 5.7443, + "step": 6370 + }, + { + "epoch": 0.04, + "global_step": 6371, + "learning_rate": 0.00047424457429048417, + "loss": 1.7436, + "loss_base2": 2.5155, + "loss_pixel": 0.1906, + "loss_text": 1.553, + "ppl": 5.7179, + "step": 6371 + }, + { + "epoch": 0.04, + "global_step": 6372, + "learning_rate": 0.0004742404006677796, + "loss": 1.7422, + "loss_base2": 2.5135, + "loss_pixel": 0.1898, + "loss_text": 1.5524, + "ppl": 5.7099, + "step": 6372 + }, + { + "epoch": 0.04, + "global_step": 6373, + "learning_rate": 0.00047423622704507513, + "loss": 1.7416, + "loss_base2": 2.5126, + "loss_pixel": 0.1903, + "loss_text": 1.5513, + "ppl": 5.7065, + "step": 6373 + }, + { + "epoch": 0.04, + "global_step": 6374, + "learning_rate": 0.00047423205342237064, + "loss": 1.7533, + "loss_base2": 2.5295, + "loss_pixel": 0.1916, + "loss_text": 1.5617, + "ppl": 5.7736, + "step": 6374 + }, + { + "epoch": 0.04, + "global_step": 6375, + "learning_rate": 0.00047422787979966614, + "loss": 1.7502, + "loss_base2": 2.525, + "loss_pixel": 0.19, + "loss_text": 1.5602, + "ppl": 5.7558, + "step": 6375 + }, + { + "epoch": 0.04, + "global_step": 6376, + "learning_rate": 0.0004742237061769616, + "loss": 1.7296, + "loss_base2": 2.4953, + "loss_pixel": 0.1912, + "loss_text": 1.5384, + "ppl": 5.6384, + "step": 6376 + }, + { + "epoch": 0.04, + "global_step": 6377, + "learning_rate": 0.0004742195325542571, + "loss": 1.738, + "loss_base2": 2.5074, + "loss_pixel": 0.1899, + "loss_text": 1.548, + "ppl": 5.686, + "step": 6377 + }, + { + "epoch": 0.04, + "global_step": 6378, + "learning_rate": 0.0004742153589315526, + "loss": 1.7579, + "loss_base2": 2.5361, + "loss_pixel": 0.1896, + "loss_text": 1.5683, + "ppl": 5.8002, + "step": 6378 + }, + { + "epoch": 0.04, + "global_step": 6379, + "learning_rate": 0.0004742111853088481, + "loss": 1.7058, + "loss_base2": 2.4609, + "loss_pixel": 0.1887, + "loss_text": 1.5171, + "ppl": 5.5058, + "step": 6379 + }, + { + "epoch": 0.04, + "global_step": 6380, + "learning_rate": 0.0004742070116861436, + "loss": 1.7398, + "loss_base2": 2.51, + "loss_pixel": 0.1918, + "loss_text": 1.548, + "ppl": 5.6962, + "step": 6380 + }, + { + "epoch": 0.04, + "global_step": 6381, + "learning_rate": 0.0004742028380634391, + "loss": 1.7324, + "loss_base2": 2.4993, + "loss_pixel": 0.1883, + "loss_text": 1.544, + "ppl": 5.6542, + "step": 6381 + }, + { + "epoch": 0.04, + "global_step": 6382, + "learning_rate": 0.0004741986644407346, + "loss": 1.7412, + "loss_base2": 2.512, + "loss_pixel": 0.1901, + "loss_text": 1.5511, + "ppl": 5.7042, + "step": 6382 + }, + { + "epoch": 0.04, + "global_step": 6383, + "learning_rate": 0.0004741944908180301, + "loss": 1.7544, + "loss_base2": 2.5311, + "loss_pixel": 0.191, + "loss_text": 1.5634, + "ppl": 5.78, + "step": 6383 + }, + { + "epoch": 0.04, + "global_step": 6384, + "learning_rate": 0.00047419031719532555, + "loss": 1.7317, + "loss_base2": 2.4983, + "loss_pixel": 0.1899, + "loss_text": 1.5418, + "ppl": 5.6503, + "step": 6384 + }, + { + "epoch": 0.04, + "global_step": 6385, + "learning_rate": 0.000474186143572621, + "loss": 1.7339, + "loss_base2": 2.5015, + "loss_pixel": 0.1897, + "loss_text": 1.5443, + "ppl": 5.6627, + "step": 6385 + }, + { + "epoch": 0.04, + "global_step": 6386, + "learning_rate": 0.0004741819699499165, + "loss": 1.7244, + "loss_base2": 2.4878, + "loss_pixel": 0.1915, + "loss_text": 1.5329, + "ppl": 5.6092, + "step": 6386 + }, + { + "epoch": 0.04, + "global_step": 6387, + "learning_rate": 0.000474177796327212, + "loss": 1.7264, + "loss_base2": 2.4907, + "loss_pixel": 0.1888, + "loss_text": 1.5375, + "ppl": 5.6204, + "step": 6387 + }, + { + "epoch": 0.04, + "global_step": 6388, + "learning_rate": 0.0004741736227045075, + "loss": 1.746, + "loss_base2": 2.5189, + "loss_pixel": 0.1898, + "loss_text": 1.5562, + "ppl": 5.7316, + "step": 6388 + }, + { + "epoch": 0.04, + "global_step": 6389, + "learning_rate": 0.00047416944908180303, + "loss": 1.6044, + "loss_base2": 2.3147, + "loss_pixel": 0.1902, + "loss_text": 1.4142, + "ppl": 4.9749, + "step": 6389 + }, + { + "epoch": 0.04, + "global_step": 6390, + "learning_rate": 0.0004741652754590985, + "loss": 1.5017, + "loss_base2": 2.1665, + "loss_pixel": 0.1902, + "loss_text": 1.3115, + "ppl": 4.4893, + "step": 6390 + }, + { + "epoch": 0.04, + "global_step": 6391, + "learning_rate": 0.000474161101836394, + "loss": 1.5018, + "loss_base2": 2.1666, + "loss_pixel": 0.1885, + "loss_text": 1.3133, + "ppl": 4.4898, + "step": 6391 + }, + { + "epoch": 0.04, + "global_step": 6392, + "learning_rate": 0.0004741569282136895, + "loss": 1.4978, + "loss_base2": 2.1609, + "loss_pixel": 0.1892, + "loss_text": 1.3086, + "ppl": 4.4718, + "step": 6392 + }, + { + "epoch": 0.04, + "global_step": 6393, + "learning_rate": 0.000474152754590985, + "loss": 1.4799, + "loss_base2": 2.135, + "loss_pixel": 0.1884, + "loss_text": 1.2916, + "ppl": 4.3925, + "step": 6393 + }, + { + "epoch": 0.04, + "global_step": 6394, + "learning_rate": 0.00047414858096828046, + "loss": 1.4816, + "loss_base2": 2.1375, + "loss_pixel": 0.188, + "loss_text": 1.2936, + "ppl": 4.4, + "step": 6394 + }, + { + "epoch": 0.04, + "global_step": 6395, + "learning_rate": 0.00047414440734557596, + "loss": 1.4921, + "loss_base2": 2.1526, + "loss_pixel": 0.1903, + "loss_text": 1.3018, + "ppl": 4.4464, + "step": 6395 + }, + { + "epoch": 0.04, + "global_step": 6396, + "learning_rate": 0.00047414023372287147, + "loss": 1.4772, + "loss_base2": 2.1311, + "loss_pixel": 0.1878, + "loss_text": 1.2894, + "ppl": 4.3807, + "step": 6396 + }, + { + "epoch": 0.04, + "global_step": 6397, + "learning_rate": 0.000474136060100167, + "loss": 1.5938, + "loss_base2": 2.2994, + "loss_pixel": 0.1907, + "loss_text": 1.403, + "ppl": 4.9224, + "step": 6397 + }, + { + "epoch": 0.04, + "global_step": 6398, + "learning_rate": 0.0004741318864774625, + "loss": 1.7384, + "loss_base2": 2.508, + "loss_pixel": 0.1892, + "loss_text": 1.5492, + "ppl": 5.6882, + "step": 6398 + }, + { + "epoch": 0.04, + "global_step": 6399, + "learning_rate": 0.00047412771285475794, + "loss": 1.7509, + "loss_base2": 2.526, + "loss_pixel": 0.1893, + "loss_text": 1.5616, + "ppl": 5.7598, + "step": 6399 + }, + { + "epoch": 0.04, + "global_step": 6400, + "learning_rate": 0.00047412353923205345, + "loss": 1.7475, + "loss_base2": 2.5211, + "loss_pixel": 0.1891, + "loss_text": 1.5584, + "ppl": 5.7402, + "step": 6400 + }, + { + "epoch": 0.04, + "global_step": 6401, + "learning_rate": 0.00047411936560934895, + "loss": 1.7387, + "loss_base2": 2.5084, + "loss_pixel": 0.1887, + "loss_text": 1.55, + "ppl": 5.6899, + "step": 6401 + }, + { + "epoch": 0.04, + "global_step": 6402, + "learning_rate": 0.00047411519198664446, + "loss": 1.7581, + "loss_base2": 2.5364, + "loss_pixel": 0.1916, + "loss_text": 1.5666, + "ppl": 5.8014, + "step": 6402 + }, + { + "epoch": 0.04, + "global_step": 6403, + "learning_rate": 0.00047411101836393986, + "loss": 1.7333, + "loss_base2": 2.5006, + "loss_pixel": 0.1913, + "loss_text": 1.5419, + "ppl": 5.6593, + "step": 6403 + }, + { + "epoch": 0.04, + "global_step": 6404, + "learning_rate": 0.00047410684474123537, + "loss": 1.7403, + "loss_base2": 2.5107, + "loss_pixel": 0.1895, + "loss_text": 1.5509, + "ppl": 5.6991, + "step": 6404 + }, + { + "epoch": 0.04, + "global_step": 6405, + "learning_rate": 0.0004741026711185309, + "loss": 1.7455, + "loss_base2": 2.5182, + "loss_pixel": 0.1915, + "loss_text": 1.554, + "ppl": 5.7288, + "step": 6405 + }, + { + "epoch": 0.04, + "global_step": 6406, + "learning_rate": 0.0004740984974958264, + "loss": 1.7415, + "loss_base2": 2.5125, + "loss_pixel": 0.1888, + "loss_text": 1.5527, + "ppl": 5.7059, + "step": 6406 + }, + { + "epoch": 0.04, + "global_step": 6407, + "learning_rate": 0.0004740943238731219, + "loss": 1.7325, + "loss_base2": 2.4995, + "loss_pixel": 0.1899, + "loss_text": 1.5426, + "ppl": 5.6548, + "step": 6407 + }, + { + "epoch": 0.04, + "global_step": 6408, + "learning_rate": 0.00047409015025041734, + "loss": 1.7373, + "loss_base2": 2.5064, + "loss_pixel": 0.1891, + "loss_text": 1.5482, + "ppl": 5.682, + "step": 6408 + }, + { + "epoch": 0.04, + "global_step": 6409, + "learning_rate": 0.00047408597662771285, + "loss": 1.7367, + "loss_base2": 2.5055, + "loss_pixel": 0.1881, + "loss_text": 1.5486, + "ppl": 5.6786, + "step": 6409 + }, + { + "epoch": 0.04, + "global_step": 6410, + "learning_rate": 0.00047408180300500836, + "loss": 1.7354, + "loss_base2": 2.5037, + "loss_pixel": 0.1845, + "loss_text": 1.5509, + "ppl": 5.6712, + "step": 6410 + }, + { + "epoch": 0.04, + "global_step": 6411, + "learning_rate": 0.00047407762938230386, + "loss": 1.7388, + "loss_base2": 2.5086, + "loss_pixel": 0.1883, + "loss_text": 1.5505, + "ppl": 5.6905, + "step": 6411 + }, + { + "epoch": 0.04, + "global_step": 6412, + "learning_rate": 0.0004740734557595993, + "loss": 1.7279, + "loss_base2": 2.4928, + "loss_pixel": 0.1862, + "loss_text": 1.5417, + "ppl": 5.6288, + "step": 6412 + }, + { + "epoch": 0.04, + "global_step": 6413, + "learning_rate": 0.0004740692821368948, + "loss": 1.7317, + "loss_base2": 2.4983, + "loss_pixel": 0.1847, + "loss_text": 1.547, + "ppl": 5.6503, + "step": 6413 + }, + { + "epoch": 0.04, + "global_step": 6414, + "learning_rate": 0.00047406510851419033, + "loss": 1.7353, + "loss_base2": 2.5035, + "loss_pixel": 0.1867, + "loss_text": 1.5485, + "ppl": 5.6706, + "step": 6414 + }, + { + "epoch": 0.04, + "global_step": 6415, + "learning_rate": 0.00047406093489148584, + "loss": 1.7365, + "loss_base2": 2.5052, + "loss_pixel": 0.1854, + "loss_text": 1.5511, + "ppl": 5.6774, + "step": 6415 + }, + { + "epoch": 0.04, + "global_step": 6416, + "learning_rate": 0.00047405676126878135, + "loss": 1.7343, + "loss_base2": 2.5021, + "loss_pixel": 0.1838, + "loss_text": 1.5505, + "ppl": 5.665, + "step": 6416 + }, + { + "epoch": 0.04, + "global_step": 6417, + "learning_rate": 0.0004740525876460768, + "loss": 1.7368, + "loss_base2": 2.5057, + "loss_pixel": 0.1858, + "loss_text": 1.551, + "ppl": 5.6791, + "step": 6417 + }, + { + "epoch": 0.04, + "global_step": 6418, + "learning_rate": 0.0004740484140233723, + "loss": 1.727, + "loss_base2": 2.4915, + "loss_pixel": 0.1863, + "loss_text": 1.5407, + "ppl": 5.6238, + "step": 6418 + }, + { + "epoch": 0.04, + "global_step": 6419, + "learning_rate": 0.0004740442404006678, + "loss": 1.7371, + "loss_base2": 2.5061, + "loss_pixel": 0.1942, + "loss_text": 1.5428, + "ppl": 5.6808, + "step": 6419 + }, + { + "epoch": 0.04, + "global_step": 6420, + "learning_rate": 0.0004740400667779633, + "loss": 1.7409, + "loss_base2": 2.5116, + "loss_pixel": 0.1942, + "loss_text": 1.5468, + "ppl": 5.7025, + "step": 6420 + }, + { + "epoch": 0.04, + "global_step": 6421, + "learning_rate": 0.00047403589315525883, + "loss": 1.7416, + "loss_base2": 2.5126, + "loss_pixel": 0.1907, + "loss_text": 1.5509, + "ppl": 5.7065, + "step": 6421 + }, + { + "epoch": 0.04, + "global_step": 6422, + "learning_rate": 0.00047403171953255423, + "loss": 1.7468, + "loss_base2": 2.5201, + "loss_pixel": 0.1921, + "loss_text": 1.5547, + "ppl": 5.7362, + "step": 6422 + }, + { + "epoch": 0.04, + "global_step": 6423, + "learning_rate": 0.00047402754590984973, + "loss": 1.7378, + "loss_base2": 2.5071, + "loss_pixel": 0.1896, + "loss_text": 1.5483, + "ppl": 5.6848, + "step": 6423 + }, + { + "epoch": 0.04, + "global_step": 6424, + "learning_rate": 0.00047402337228714524, + "loss": 1.7006, + "loss_base2": 2.4534, + "loss_pixel": 0.1908, + "loss_text": 1.5098, + "ppl": 5.4772, + "step": 6424 + }, + { + "epoch": 0.04, + "global_step": 6425, + "learning_rate": 0.00047401919866444075, + "loss": 1.7222, + "loss_base2": 2.4846, + "loss_pixel": 0.1916, + "loss_text": 1.5306, + "ppl": 5.5968, + "step": 6425 + }, + { + "epoch": 0.04, + "global_step": 6426, + "learning_rate": 0.0004740150250417362, + "loss": 1.7173, + "loss_base2": 2.4775, + "loss_pixel": 0.1894, + "loss_text": 1.528, + "ppl": 5.5695, + "step": 6426 + }, + { + "epoch": 0.04, + "global_step": 6427, + "learning_rate": 0.0004740108514190317, + "loss": 1.7323, + "loss_base2": 2.4992, + "loss_pixel": 0.1924, + "loss_text": 1.5398, + "ppl": 5.6536, + "step": 6427 + }, + { + "epoch": 0.04, + "global_step": 6428, + "learning_rate": 0.0004740066777963272, + "loss": 1.7254, + "loss_base2": 2.4892, + "loss_pixel": 0.1929, + "loss_text": 1.5325, + "ppl": 5.6148, + "step": 6428 + }, + { + "epoch": 0.04, + "global_step": 6429, + "learning_rate": 0.0004740025041736227, + "loss": 1.7435, + "loss_base2": 2.5153, + "loss_pixel": 0.1912, + "loss_text": 1.5523, + "ppl": 5.7173, + "step": 6429 + }, + { + "epoch": 0.04, + "global_step": 6430, + "learning_rate": 0.00047399833055091823, + "loss": 1.7198, + "loss_base2": 2.4811, + "loss_pixel": 0.1903, + "loss_text": 1.5295, + "ppl": 5.5834, + "step": 6430 + }, + { + "epoch": 0.04, + "global_step": 6431, + "learning_rate": 0.0004739941569282137, + "loss": 1.7077, + "loss_base2": 2.4637, + "loss_pixel": 0.1894, + "loss_text": 1.5182, + "ppl": 5.5163, + "step": 6431 + }, + { + "epoch": 0.04, + "global_step": 6432, + "learning_rate": 0.0004739899833055092, + "loss": 1.7357, + "loss_base2": 2.5041, + "loss_pixel": 0.1909, + "loss_text": 1.5448, + "ppl": 5.6729, + "step": 6432 + }, + { + "epoch": 0.04, + "global_step": 6433, + "learning_rate": 0.0004739858096828047, + "loss": 1.7284, + "loss_base2": 2.4936, + "loss_pixel": 0.189, + "loss_text": 1.5394, + "ppl": 5.6316, + "step": 6433 + }, + { + "epoch": 0.04, + "global_step": 6434, + "learning_rate": 0.0004739816360601002, + "loss": 1.7323, + "loss_base2": 2.4992, + "loss_pixel": 0.1901, + "loss_text": 1.5422, + "ppl": 5.6536, + "step": 6434 + }, + { + "epoch": 0.04, + "global_step": 6435, + "learning_rate": 0.00047397746243739566, + "loss": 1.7196, + "loss_base2": 2.4809, + "loss_pixel": 0.1897, + "loss_text": 1.5299, + "ppl": 5.5823, + "step": 6435 + }, + { + "epoch": 0.04, + "global_step": 6436, + "learning_rate": 0.00047397328881469117, + "loss": 1.7199, + "loss_base2": 2.4813, + "loss_pixel": 0.1894, + "loss_text": 1.5306, + "ppl": 5.584, + "step": 6436 + }, + { + "epoch": 0.04, + "global_step": 6437, + "learning_rate": 0.0004739691151919867, + "loss": 1.7216, + "loss_base2": 2.4837, + "loss_pixel": 0.1889, + "loss_text": 1.5327, + "ppl": 5.5935, + "step": 6437 + }, + { + "epoch": 0.04, + "global_step": 6438, + "learning_rate": 0.0004739649415692822, + "loss": 1.7289, + "loss_base2": 2.4943, + "loss_pixel": 0.1892, + "loss_text": 1.5396, + "ppl": 5.6345, + "step": 6438 + }, + { + "epoch": 0.04, + "global_step": 6439, + "learning_rate": 0.0004739607679465777, + "loss": 1.7491, + "loss_base2": 2.5234, + "loss_pixel": 0.1892, + "loss_text": 1.5599, + "ppl": 5.7494, + "step": 6439 + }, + { + "epoch": 0.04, + "global_step": 6440, + "learning_rate": 0.0004739565943238731, + "loss": 1.7245, + "loss_base2": 2.4879, + "loss_pixel": 0.188, + "loss_text": 1.5365, + "ppl": 5.6097, + "step": 6440 + }, + { + "epoch": 0.04, + "global_step": 6441, + "learning_rate": 0.0004739524207011686, + "loss": 1.7289, + "loss_base2": 2.4943, + "loss_pixel": 0.1888, + "loss_text": 1.5401, + "ppl": 5.6345, + "step": 6441 + }, + { + "epoch": 0.04, + "global_step": 6442, + "learning_rate": 0.0004739482470784641, + "loss": 1.7198, + "loss_base2": 2.4811, + "loss_pixel": 0.1893, + "loss_text": 1.5305, + "ppl": 5.5834, + "step": 6442 + }, + { + "epoch": 0.04, + "global_step": 6443, + "learning_rate": 0.0004739440734557596, + "loss": 1.7226, + "loss_base2": 2.4852, + "loss_pixel": 0.1879, + "loss_text": 1.5347, + "ppl": 5.5991, + "step": 6443 + }, + { + "epoch": 0.04, + "global_step": 6444, + "learning_rate": 0.00047393989983305506, + "loss": 1.7248, + "loss_base2": 2.4884, + "loss_pixel": 0.1892, + "loss_text": 1.5356, + "ppl": 5.6114, + "step": 6444 + }, + { + "epoch": 0.04, + "global_step": 6445, + "learning_rate": 0.00047393572621035057, + "loss": 1.7351, + "loss_base2": 2.5032, + "loss_pixel": 0.1868, + "loss_text": 1.5483, + "ppl": 5.6695, + "step": 6445 + }, + { + "epoch": 0.04, + "global_step": 6446, + "learning_rate": 0.0004739315525876461, + "loss": 1.7098, + "loss_base2": 2.4667, + "loss_pixel": 0.1878, + "loss_text": 1.522, + "ppl": 5.5279, + "step": 6446 + }, + { + "epoch": 0.04, + "global_step": 6447, + "learning_rate": 0.0004739273789649416, + "loss": 1.7362, + "loss_base2": 2.5048, + "loss_pixel": 0.1888, + "loss_text": 1.5474, + "ppl": 5.6757, + "step": 6447 + }, + { + "epoch": 0.04, + "global_step": 6448, + "learning_rate": 0.0004739232053422371, + "loss": 1.7211, + "loss_base2": 2.483, + "loss_pixel": 0.1872, + "loss_text": 1.5339, + "ppl": 5.5907, + "step": 6448 + }, + { + "epoch": 0.04, + "global_step": 6449, + "learning_rate": 0.00047391903171953255, + "loss": 1.7232, + "loss_base2": 2.4861, + "loss_pixel": 0.1867, + "loss_text": 1.5365, + "ppl": 5.6024, + "step": 6449 + }, + { + "epoch": 0.04, + "global_step": 6450, + "learning_rate": 0.00047391485809682805, + "loss": 1.7264, + "loss_base2": 2.4907, + "loss_pixel": 0.1872, + "loss_text": 1.5391, + "ppl": 5.6204, + "step": 6450 + }, + { + "epoch": 0.04, + "global_step": 6451, + "learning_rate": 0.00047391068447412356, + "loss": 1.7377, + "loss_base2": 2.507, + "loss_pixel": 0.1878, + "loss_text": 1.55, + "ppl": 5.6843, + "step": 6451 + }, + { + "epoch": 0.04, + "global_step": 6452, + "learning_rate": 0.00047390651085141907, + "loss": 1.7051, + "loss_base2": 2.4599, + "loss_pixel": 0.1885, + "loss_text": 1.5166, + "ppl": 5.5019, + "step": 6452 + }, + { + "epoch": 0.04, + "global_step": 6453, + "learning_rate": 0.0004739023372287145, + "loss": 1.728, + "loss_base2": 2.493, + "loss_pixel": 0.1867, + "loss_text": 1.5414, + "ppl": 5.6294, + "step": 6453 + }, + { + "epoch": 0.04, + "global_step": 6454, + "learning_rate": 0.00047389816360601003, + "loss": 1.7239, + "loss_base2": 2.4871, + "loss_pixel": 0.1873, + "loss_text": 1.5365, + "ppl": 5.6064, + "step": 6454 + }, + { + "epoch": 0.04, + "global_step": 6455, + "learning_rate": 0.00047389398998330554, + "loss": 1.7091, + "loss_base2": 2.4657, + "loss_pixel": 0.1882, + "loss_text": 1.521, + "ppl": 5.524, + "step": 6455 + }, + { + "epoch": 0.04, + "global_step": 6456, + "learning_rate": 0.00047388981636060104, + "loss": 1.7321, + "loss_base2": 2.4989, + "loss_pixel": 0.1885, + "loss_text": 1.5436, + "ppl": 5.6525, + "step": 6456 + }, + { + "epoch": 0.04, + "global_step": 6457, + "learning_rate": 0.00047388564273789655, + "loss": 1.729, + "loss_base2": 2.4944, + "loss_pixel": 0.1869, + "loss_text": 1.5421, + "ppl": 5.635, + "step": 6457 + }, + { + "epoch": 0.04, + "global_step": 6458, + "learning_rate": 0.000473881469115192, + "loss": 1.7059, + "loss_base2": 2.4611, + "loss_pixel": 0.1859, + "loss_text": 1.52, + "ppl": 5.5063, + "step": 6458 + }, + { + "epoch": 0.04, + "global_step": 6459, + "learning_rate": 0.00047387729549248746, + "loss": 1.7392, + "loss_base2": 2.5091, + "loss_pixel": 0.1866, + "loss_text": 1.5526, + "ppl": 5.6928, + "step": 6459 + }, + { + "epoch": 0.04, + "global_step": 6460, + "learning_rate": 0.00047387312186978296, + "loss": 1.7435, + "loss_base2": 2.5153, + "loss_pixel": 0.1878, + "loss_text": 1.5557, + "ppl": 5.7173, + "step": 6460 + }, + { + "epoch": 0.04, + "global_step": 6461, + "learning_rate": 0.00047386894824707847, + "loss": 1.7119, + "loss_base2": 2.4697, + "loss_pixel": 0.1875, + "loss_text": 1.5244, + "ppl": 5.5395, + "step": 6461 + }, + { + "epoch": 0.04, + "global_step": 6462, + "learning_rate": 0.0004738647746243739, + "loss": 1.7258, + "loss_base2": 2.4898, + "loss_pixel": 0.1877, + "loss_text": 1.5381, + "ppl": 5.617, + "step": 6462 + }, + { + "epoch": 0.04, + "global_step": 6463, + "learning_rate": 0.00047386060100166943, + "loss": 1.7246, + "loss_base2": 2.4881, + "loss_pixel": 0.1856, + "loss_text": 1.5389, + "ppl": 5.6103, + "step": 6463 + }, + { + "epoch": 0.04, + "global_step": 6464, + "learning_rate": 0.00047385642737896494, + "loss": 1.7287, + "loss_base2": 2.494, + "loss_pixel": 0.1862, + "loss_text": 1.5425, + "ppl": 5.6333, + "step": 6464 + }, + { + "epoch": 0.04, + "global_step": 6465, + "learning_rate": 0.00047385225375626045, + "loss": 1.7087, + "loss_base2": 2.4651, + "loss_pixel": 0.1861, + "loss_text": 1.5225, + "ppl": 5.5218, + "step": 6465 + }, + { + "epoch": 0.04, + "global_step": 6466, + "learning_rate": 0.00047384808013355595, + "loss": 1.7125, + "loss_base2": 2.4706, + "loss_pixel": 0.188, + "loss_text": 1.5245, + "ppl": 5.5428, + "step": 6466 + }, + { + "epoch": 0.04, + "global_step": 6467, + "learning_rate": 0.0004738439065108514, + "loss": 1.7054, + "loss_base2": 2.4604, + "loss_pixel": 0.1879, + "loss_text": 1.5174, + "ppl": 5.5036, + "step": 6467 + }, + { + "epoch": 0.04, + "global_step": 6468, + "learning_rate": 0.0004738397328881469, + "loss": 1.7258, + "loss_base2": 2.4898, + "loss_pixel": 0.187, + "loss_text": 1.5389, + "ppl": 5.617, + "step": 6468 + }, + { + "epoch": 0.04, + "global_step": 6469, + "learning_rate": 0.0004738355592654424, + "loss": 1.6814, + "loss_base2": 2.4257, + "loss_pixel": 0.1863, + "loss_text": 1.4951, + "ppl": 5.3731, + "step": 6469 + }, + { + "epoch": 0.04, + "global_step": 6470, + "learning_rate": 0.00047383138564273793, + "loss": 1.7186, + "loss_base2": 2.4794, + "loss_pixel": 0.1867, + "loss_text": 1.5319, + "ppl": 5.5767, + "step": 6470 + }, + { + "epoch": 0.04, + "global_step": 6471, + "learning_rate": 0.0004738272120200334, + "loss": 1.7337, + "loss_base2": 2.5012, + "loss_pixel": 0.1857, + "loss_text": 1.548, + "ppl": 5.6616, + "step": 6471 + }, + { + "epoch": 0.04, + "global_step": 6472, + "learning_rate": 0.0004738230383973289, + "loss": 1.7287, + "loss_base2": 2.494, + "loss_pixel": 0.1864, + "loss_text": 1.5424, + "ppl": 5.6333, + "step": 6472 + }, + { + "epoch": 0.04, + "global_step": 6473, + "learning_rate": 0.0004738188647746244, + "loss": 1.7081, + "loss_base2": 2.4643, + "loss_pixel": 0.1846, + "loss_text": 1.5236, + "ppl": 5.5185, + "step": 6473 + }, + { + "epoch": 0.04, + "global_step": 6474, + "learning_rate": 0.0004738146911519199, + "loss": 1.7211, + "loss_base2": 2.483, + "loss_pixel": 0.1852, + "loss_text": 1.5359, + "ppl": 5.5907, + "step": 6474 + }, + { + "epoch": 0.04, + "global_step": 6475, + "learning_rate": 0.0004738105175292154, + "loss": 1.7079, + "loss_base2": 2.464, + "loss_pixel": 0.1862, + "loss_text": 1.5216, + "ppl": 5.5174, + "step": 6475 + }, + { + "epoch": 0.04, + "global_step": 6476, + "learning_rate": 0.00047380634390651086, + "loss": 1.7187, + "loss_base2": 2.4796, + "loss_pixel": 0.186, + "loss_text": 1.5327, + "ppl": 5.5773, + "step": 6476 + }, + { + "epoch": 0.04, + "global_step": 6477, + "learning_rate": 0.00047380217028380637, + "loss": 1.7173, + "loss_base2": 2.4775, + "loss_pixel": 0.187, + "loss_text": 1.5303, + "ppl": 5.5695, + "step": 6477 + }, + { + "epoch": 0.04, + "global_step": 6478, + "learning_rate": 0.0004737979966611018, + "loss": 1.715, + "loss_base2": 2.4742, + "loss_pixel": 0.1868, + "loss_text": 1.5282, + "ppl": 5.5567, + "step": 6478 + }, + { + "epoch": 0.04, + "global_step": 6479, + "learning_rate": 0.00047379382303839733, + "loss": 1.7132, + "loss_base2": 2.4716, + "loss_pixel": 0.1851, + "loss_text": 1.5281, + "ppl": 5.5467, + "step": 6479 + }, + { + "epoch": 0.04, + "global_step": 6480, + "learning_rate": 0.00047378964941569284, + "loss": 1.7091, + "loss_base2": 2.4657, + "loss_pixel": 0.1855, + "loss_text": 1.5236, + "ppl": 5.524, + "step": 6480 + }, + { + "epoch": 0.04, + "global_step": 6481, + "learning_rate": 0.0004737854757929883, + "loss": 1.7307, + "loss_base2": 2.4969, + "loss_pixel": 0.1847, + "loss_text": 1.546, + "ppl": 5.6446, + "step": 6481 + }, + { + "epoch": 0.04, + "global_step": 6482, + "learning_rate": 0.0004737813021702838, + "loss": 1.7278, + "loss_base2": 2.4927, + "loss_pixel": 0.1864, + "loss_text": 1.5414, + "ppl": 5.6283, + "step": 6482 + }, + { + "epoch": 0.04, + "global_step": 6483, + "learning_rate": 0.0004737771285475793, + "loss": 1.7086, + "loss_base2": 2.465, + "loss_pixel": 0.1865, + "loss_text": 1.5222, + "ppl": 5.5212, + "step": 6483 + }, + { + "epoch": 0.04, + "global_step": 6484, + "learning_rate": 0.0004737729549248748, + "loss": 1.7243, + "loss_base2": 2.4876, + "loss_pixel": 0.1867, + "loss_text": 1.5375, + "ppl": 5.6086, + "step": 6484 + }, + { + "epoch": 0.04, + "global_step": 6485, + "learning_rate": 0.00047376878130217027, + "loss": 1.7253, + "loss_base2": 2.4891, + "loss_pixel": 0.1933, + "loss_text": 1.532, + "ppl": 5.6142, + "step": 6485 + }, + { + "epoch": 0.04, + "global_step": 6486, + "learning_rate": 0.0004737646076794658, + "loss": 1.7476, + "loss_base2": 2.5213, + "loss_pixel": 0.1956, + "loss_text": 1.552, + "ppl": 5.7408, + "step": 6486 + }, + { + "epoch": 0.04, + "global_step": 6487, + "learning_rate": 0.0004737604340567613, + "loss": 1.7149, + "loss_base2": 2.4741, + "loss_pixel": 0.1973, + "loss_text": 1.5176, + "ppl": 5.5561, + "step": 6487 + }, + { + "epoch": 0.04, + "global_step": 6488, + "learning_rate": 0.0004737562604340568, + "loss": 1.7184, + "loss_base2": 2.4791, + "loss_pixel": 0.1866, + "loss_text": 1.5318, + "ppl": 5.5756, + "step": 6488 + }, + { + "epoch": 0.04, + "global_step": 6489, + "learning_rate": 0.0004737520868113523, + "loss": 1.7137, + "loss_base2": 2.4723, + "loss_pixel": 0.1842, + "loss_text": 1.5296, + "ppl": 5.5495, + "step": 6489 + }, + { + "epoch": 0.04, + "global_step": 6490, + "learning_rate": 0.00047374791318864775, + "loss": 1.4913, + "loss_base2": 2.1515, + "loss_pixel": 0.1864, + "loss_text": 1.3049, + "ppl": 4.4429, + "step": 6490 + }, + { + "epoch": 0.04, + "global_step": 6491, + "learning_rate": 0.00047374373956594326, + "loss": 1.5219, + "loss_base2": 2.1956, + "loss_pixel": 0.1853, + "loss_text": 1.3366, + "ppl": 4.5809, + "step": 6491 + }, + { + "epoch": 0.04, + "global_step": 6492, + "learning_rate": 0.00047373956594323876, + "loss": 1.4933, + "loss_base2": 2.1544, + "loss_pixel": 0.1844, + "loss_text": 1.309, + "ppl": 4.4518, + "step": 6492 + }, + { + "epoch": 0.04, + "global_step": 6493, + "learning_rate": 0.00047373539232053427, + "loss": 1.5006, + "loss_base2": 2.1649, + "loss_pixel": 0.1859, + "loss_text": 1.3147, + "ppl": 4.4844, + "step": 6493 + }, + { + "epoch": 0.04, + "global_step": 6494, + "learning_rate": 0.0004737312186978297, + "loss": 1.4928, + "loss_base2": 2.1537, + "loss_pixel": 0.1842, + "loss_text": 1.3086, + "ppl": 4.4495, + "step": 6494 + }, + { + "epoch": 0.04, + "global_step": 6495, + "learning_rate": 0.00047372704507512523, + "loss": 1.4957, + "loss_base2": 2.1578, + "loss_pixel": 0.1831, + "loss_text": 1.3125, + "ppl": 4.4625, + "step": 6495 + }, + { + "epoch": 0.04, + "global_step": 6496, + "learning_rate": 0.0004737228714524207, + "loss": 1.473, + "loss_base2": 2.1251, + "loss_pixel": 0.1849, + "loss_text": 1.2881, + "ppl": 4.3623, + "step": 6496 + }, + { + "epoch": 0.04, + "global_step": 6497, + "learning_rate": 0.0004737186978297162, + "loss": 1.4557, + "loss_base2": 2.1001, + "loss_pixel": 0.1844, + "loss_text": 1.2713, + "ppl": 4.2875, + "step": 6497 + }, + { + "epoch": 0.04, + "global_step": 6498, + "learning_rate": 0.0004737145242070117, + "loss": 1.5705, + "loss_base2": 2.2658, + "loss_pixel": 0.1837, + "loss_text": 1.3869, + "ppl": 4.8091, + "step": 6498 + }, + { + "epoch": 0.04, + "global_step": 6499, + "learning_rate": 0.00047371035058430715, + "loss": 1.734, + "loss_base2": 2.5016, + "loss_pixel": 0.1831, + "loss_text": 1.5509, + "ppl": 5.6633, + "step": 6499 + }, + { + "epoch": 0.04, + "global_step": 6500, + "learning_rate": 0.00047370617696160266, + "loss": 1.7377, + "loss_base2": 2.507, + "loss_pixel": 0.1828, + "loss_text": 1.5549, + "ppl": 5.6843, + "step": 6500 + }, + { + "epoch": 0.04, + "global_step": 6501, + "learning_rate": 0.00047370200333889817, + "loss": 1.7171, + "loss_base2": 2.4773, + "loss_pixel": 0.1831, + "loss_text": 1.534, + "ppl": 5.5684, + "step": 6501 + }, + { + "epoch": 0.04, + "global_step": 6502, + "learning_rate": 0.0004736978297161937, + "loss": 1.7272, + "loss_base2": 2.4918, + "loss_pixel": 0.1838, + "loss_text": 1.5435, + "ppl": 5.6249, + "step": 6502 + }, + { + "epoch": 0.04, + "global_step": 6503, + "learning_rate": 0.00047369365609348913, + "loss": 1.709, + "loss_base2": 2.4656, + "loss_pixel": 0.1812, + "loss_text": 1.5279, + "ppl": 5.5234, + "step": 6503 + }, + { + "epoch": 0.04, + "global_step": 6504, + "learning_rate": 0.00047368948247078464, + "loss": 1.7229, + "loss_base2": 2.4856, + "loss_pixel": 0.1822, + "loss_text": 1.5406, + "ppl": 5.6007, + "step": 6504 + }, + { + "epoch": 0.04, + "global_step": 6505, + "learning_rate": 0.00047368530884808014, + "loss": 1.7209, + "loss_base2": 2.4827, + "loss_pixel": 0.1829, + "loss_text": 1.538, + "ppl": 5.5896, + "step": 6505 + }, + { + "epoch": 0.04, + "global_step": 6506, + "learning_rate": 0.00047368113522537565, + "loss": 1.7208, + "loss_base2": 2.4826, + "loss_pixel": 0.1838, + "loss_text": 1.537, + "ppl": 5.589, + "step": 6506 + }, + { + "epoch": 0.04, + "global_step": 6507, + "learning_rate": 0.00047367696160267116, + "loss": 1.7001, + "loss_base2": 2.4527, + "loss_pixel": 0.1802, + "loss_text": 1.5199, + "ppl": 5.4745, + "step": 6507 + }, + { + "epoch": 0.04, + "global_step": 6508, + "learning_rate": 0.0004736727879799666, + "loss": 1.7179, + "loss_base2": 2.4784, + "loss_pixel": 0.1807, + "loss_text": 1.5372, + "ppl": 5.5728, + "step": 6508 + }, + { + "epoch": 0.04, + "global_step": 6509, + "learning_rate": 0.0004736686143572621, + "loss": 1.7241, + "loss_base2": 2.4874, + "loss_pixel": 0.1804, + "loss_text": 1.5437, + "ppl": 5.6075, + "step": 6509 + }, + { + "epoch": 0.04, + "global_step": 6510, + "learning_rate": 0.0004736644407345576, + "loss": 1.722, + "loss_base2": 2.4843, + "loss_pixel": 0.182, + "loss_text": 1.54, + "ppl": 5.5957, + "step": 6510 + }, + { + "epoch": 0.04, + "global_step": 6511, + "learning_rate": 0.00047366026711185313, + "loss": 1.7179, + "loss_base2": 2.4784, + "loss_pixel": 0.1788, + "loss_text": 1.5391, + "ppl": 5.5728, + "step": 6511 + }, + { + "epoch": 0.04, + "global_step": 6512, + "learning_rate": 0.0004736560934891486, + "loss": 1.7096, + "loss_base2": 2.4664, + "loss_pixel": 0.1785, + "loss_text": 1.5311, + "ppl": 5.5268, + "step": 6512 + }, + { + "epoch": 0.04, + "global_step": 6513, + "learning_rate": 0.0004736519198664441, + "loss": 1.7168, + "loss_base2": 2.4768, + "loss_pixel": 0.1794, + "loss_text": 1.5374, + "ppl": 5.5667, + "step": 6513 + }, + { + "epoch": 0.04, + "global_step": 6514, + "learning_rate": 0.0004736477462437396, + "loss": 1.7123, + "loss_base2": 2.4703, + "loss_pixel": 0.1787, + "loss_text": 1.5336, + "ppl": 5.5417, + "step": 6514 + }, + { + "epoch": 0.04, + "global_step": 6515, + "learning_rate": 0.00047364357262103505, + "loss": 1.721, + "loss_base2": 2.4829, + "loss_pixel": 0.1812, + "loss_text": 1.5398, + "ppl": 5.5901, + "step": 6515 + }, + { + "epoch": 0.04, + "global_step": 6516, + "learning_rate": 0.00047363939899833056, + "loss": 1.7115, + "loss_base2": 2.4692, + "loss_pixel": 0.1783, + "loss_text": 1.5332, + "ppl": 5.5373, + "step": 6516 + }, + { + "epoch": 0.04, + "global_step": 6517, + "learning_rate": 0.000473635225375626, + "loss": 1.699, + "loss_base2": 2.4511, + "loss_pixel": 0.1793, + "loss_text": 1.5197, + "ppl": 5.4685, + "step": 6517 + }, + { + "epoch": 0.04, + "global_step": 6518, + "learning_rate": 0.0004736310517529215, + "loss": 1.7076, + "loss_base2": 2.4635, + "loss_pixel": 0.1769, + "loss_text": 1.5307, + "ppl": 5.5157, + "step": 6518 + }, + { + "epoch": 0.04, + "global_step": 6519, + "learning_rate": 0.00047362687813021703, + "loss": 1.7106, + "loss_base2": 2.4679, + "loss_pixel": 0.1799, + "loss_text": 1.5307, + "ppl": 5.5323, + "step": 6519 + }, + { + "epoch": 0.04, + "global_step": 6520, + "learning_rate": 0.00047362270450751254, + "loss": 1.6975, + "loss_base2": 2.449, + "loss_pixel": 0.1783, + "loss_text": 1.5191, + "ppl": 5.4603, + "step": 6520 + }, + { + "epoch": 0.04, + "global_step": 6521, + "learning_rate": 0.000473618530884808, + "loss": 1.7126, + "loss_base2": 2.4708, + "loss_pixel": 0.1792, + "loss_text": 1.5334, + "ppl": 5.5434, + "step": 6521 + }, + { + "epoch": 0.04, + "global_step": 6522, + "learning_rate": 0.0004736143572621035, + "loss": 1.7001, + "loss_base2": 2.4527, + "loss_pixel": 0.1797, + "loss_text": 1.5204, + "ppl": 5.4745, + "step": 6522 + }, + { + "epoch": 0.04, + "global_step": 6523, + "learning_rate": 0.000473610183639399, + "loss": 1.6106, + "loss_base2": 2.3236, + "loss_pixel": 0.1907, + "loss_text": 1.4198, + "ppl": 5.0058, + "step": 6523 + }, + { + "epoch": 0.04, + "global_step": 6524, + "learning_rate": 0.0004736060100166945, + "loss": 1.4998, + "loss_base2": 2.1638, + "loss_pixel": 0.1894, + "loss_text": 1.3104, + "ppl": 4.4808, + "step": 6524 + }, + { + "epoch": 0.04, + "global_step": 6525, + "learning_rate": 0.00047360183639399, + "loss": 1.4846, + "loss_base2": 2.1418, + "loss_pixel": 0.1909, + "loss_text": 1.2938, + "ppl": 4.4132, + "step": 6525 + }, + { + "epoch": 0.04, + "global_step": 6526, + "learning_rate": 0.00047359766277128547, + "loss": 1.4918, + "loss_base2": 2.1522, + "loss_pixel": 0.1881, + "loss_text": 1.3036, + "ppl": 4.4451, + "step": 6526 + }, + { + "epoch": 0.04, + "global_step": 6527, + "learning_rate": 0.000473593489148581, + "loss": 1.4867, + "loss_base2": 2.1449, + "loss_pixel": 0.1877, + "loss_text": 1.299, + "ppl": 4.4225, + "step": 6527 + }, + { + "epoch": 0.04, + "global_step": 6528, + "learning_rate": 0.0004735893155258765, + "loss": 1.4866, + "loss_base2": 2.1447, + "loss_pixel": 0.1888, + "loss_text": 1.2978, + "ppl": 4.422, + "step": 6528 + }, + { + "epoch": 0.04, + "global_step": 6529, + "learning_rate": 0.000473585141903172, + "loss": 1.4733, + "loss_base2": 2.1255, + "loss_pixel": 0.1858, + "loss_text": 1.2875, + "ppl": 4.3636, + "step": 6529 + }, + { + "epoch": 0.04, + "global_step": 6530, + "learning_rate": 0.00047358096828046745, + "loss": 1.4807, + "loss_base2": 2.1362, + "loss_pixel": 0.1867, + "loss_text": 1.294, + "ppl": 4.396, + "step": 6530 + }, + { + "epoch": 0.04, + "global_step": 6531, + "learning_rate": 0.00047357679465776295, + "loss": 1.6398, + "loss_base2": 2.3657, + "loss_pixel": 0.1854, + "loss_text": 1.4545, + "ppl": 5.1541, + "step": 6531 + }, + { + "epoch": 0.04, + "global_step": 6532, + "learning_rate": 0.00047357262103505846, + "loss": 1.7197, + "loss_base2": 2.481, + "loss_pixel": 0.1858, + "loss_text": 1.5339, + "ppl": 5.5829, + "step": 6532 + }, + { + "epoch": 0.04, + "global_step": 6533, + "learning_rate": 0.00047356844741235397, + "loss": 1.7192, + "loss_base2": 2.4803, + "loss_pixel": 0.1869, + "loss_text": 1.5322, + "ppl": 5.5801, + "step": 6533 + }, + { + "epoch": 0.04, + "global_step": 6534, + "learning_rate": 0.0004735642737896494, + "loss": 1.7295, + "loss_base2": 2.4951, + "loss_pixel": 0.1869, + "loss_text": 1.5426, + "ppl": 5.6378, + "step": 6534 + }, + { + "epoch": 0.04, + "global_step": 6535, + "learning_rate": 0.0004735601001669449, + "loss": 1.7212, + "loss_base2": 2.4832, + "loss_pixel": 0.1877, + "loss_text": 1.5335, + "ppl": 5.5912, + "step": 6535 + }, + { + "epoch": 0.04, + "global_step": 6536, + "learning_rate": 0.0004735559265442404, + "loss": 1.7347, + "loss_base2": 2.5026, + "loss_pixel": 0.1879, + "loss_text": 1.5468, + "ppl": 5.6672, + "step": 6536 + }, + { + "epoch": 0.04, + "global_step": 6537, + "learning_rate": 0.0004735517529215359, + "loss": 1.7072, + "loss_base2": 2.463, + "loss_pixel": 0.1863, + "loss_text": 1.5209, + "ppl": 5.5135, + "step": 6537 + }, + { + "epoch": 0.04, + "global_step": 6538, + "learning_rate": 0.0004735475792988314, + "loss": 1.7198, + "loss_base2": 2.4811, + "loss_pixel": 0.1862, + "loss_text": 1.5335, + "ppl": 5.5834, + "step": 6538 + }, + { + "epoch": 0.04, + "global_step": 6539, + "learning_rate": 0.0004735434056761269, + "loss": 1.7134, + "loss_base2": 2.4719, + "loss_pixel": 0.1859, + "loss_text": 1.5275, + "ppl": 5.5478, + "step": 6539 + }, + { + "epoch": 0.04, + "global_step": 6540, + "learning_rate": 0.00047353923205342236, + "loss": 1.7257, + "loss_base2": 2.4897, + "loss_pixel": 0.1861, + "loss_text": 1.5396, + "ppl": 5.6165, + "step": 6540 + }, + { + "epoch": 0.04, + "global_step": 6541, + "learning_rate": 0.00047353505843071786, + "loss": 1.7235, + "loss_base2": 2.4865, + "loss_pixel": 0.1864, + "loss_text": 1.5371, + "ppl": 5.6041, + "step": 6541 + }, + { + "epoch": 0.04, + "global_step": 6542, + "learning_rate": 0.00047353088480801337, + "loss": 1.7192, + "loss_base2": 2.4803, + "loss_pixel": 0.1854, + "loss_text": 1.5338, + "ppl": 5.5801, + "step": 6542 + }, + { + "epoch": 0.04, + "global_step": 6543, + "learning_rate": 0.0004735267111853089, + "loss": 1.7235, + "loss_base2": 2.4865, + "loss_pixel": 0.1853, + "loss_text": 1.5382, + "ppl": 5.6041, + "step": 6543 + }, + { + "epoch": 0.04, + "global_step": 6544, + "learning_rate": 0.00047352253756260433, + "loss": 1.7059, + "loss_base2": 2.4611, + "loss_pixel": 0.1848, + "loss_text": 1.521, + "ppl": 5.5063, + "step": 6544 + }, + { + "epoch": 0.04, + "global_step": 6545, + "learning_rate": 0.00047351836393989984, + "loss": 1.7263, + "loss_base2": 2.4905, + "loss_pixel": 0.1852, + "loss_text": 1.5411, + "ppl": 5.6198, + "step": 6545 + }, + { + "epoch": 0.04, + "global_step": 6546, + "learning_rate": 0.00047351419031719535, + "loss": 1.7118, + "loss_base2": 2.4696, + "loss_pixel": 0.1851, + "loss_text": 1.5267, + "ppl": 5.5389, + "step": 6546 + }, + { + "epoch": 0.04, + "global_step": 6547, + "learning_rate": 0.00047351001669449085, + "loss": 1.719, + "loss_base2": 2.48, + "loss_pixel": 0.1853, + "loss_text": 1.5337, + "ppl": 5.5789, + "step": 6547 + }, + { + "epoch": 0.04, + "global_step": 6548, + "learning_rate": 0.00047350584307178636, + "loss": 1.7135, + "loss_base2": 2.4721, + "loss_pixel": 0.1855, + "loss_text": 1.528, + "ppl": 5.5483, + "step": 6548 + }, + { + "epoch": 0.04, + "global_step": 6549, + "learning_rate": 0.0004735016694490818, + "loss": 1.7138, + "loss_base2": 2.4725, + "loss_pixel": 0.1877, + "loss_text": 1.5261, + "ppl": 5.55, + "step": 6549 + }, + { + "epoch": 0.04, + "global_step": 6550, + "learning_rate": 0.0004734974958263773, + "loss": 1.7199, + "loss_base2": 2.4813, + "loss_pixel": 0.1868, + "loss_text": 1.5331, + "ppl": 5.584, + "step": 6550 + }, + { + "epoch": 0.04, + "global_step": 6551, + "learning_rate": 0.00047349332220367283, + "loss": 1.717, + "loss_base2": 2.4771, + "loss_pixel": 0.1846, + "loss_text": 1.5324, + "ppl": 5.5678, + "step": 6551 + }, + { + "epoch": 0.04, + "global_step": 6552, + "learning_rate": 0.00047348914858096834, + "loss": 1.7204, + "loss_base2": 2.482, + "loss_pixel": 0.1854, + "loss_text": 1.535, + "ppl": 5.5868, + "step": 6552 + }, + { + "epoch": 0.04, + "global_step": 6553, + "learning_rate": 0.00047348497495826373, + "loss": 1.7361, + "loss_base2": 2.5047, + "loss_pixel": 0.1842, + "loss_text": 1.5519, + "ppl": 5.6752, + "step": 6553 + }, + { + "epoch": 0.04, + "global_step": 6554, + "learning_rate": 0.00047348080133555924, + "loss": 1.712, + "loss_base2": 2.4699, + "loss_pixel": 0.1842, + "loss_text": 1.5279, + "ppl": 5.54, + "step": 6554 + }, + { + "epoch": 0.04, + "global_step": 6555, + "learning_rate": 0.00047347662771285475, + "loss": 1.6898, + "loss_base2": 2.4379, + "loss_pixel": 0.184, + "loss_text": 1.5058, + "ppl": 5.4184, + "step": 6555 + }, + { + "epoch": 0.04, + "global_step": 6556, + "learning_rate": 0.00047347245409015026, + "loss": 1.5005, + "loss_base2": 2.1648, + "loss_pixel": 0.1845, + "loss_text": 1.316, + "ppl": 4.4839, + "step": 6556 + }, + { + "epoch": 0.04, + "global_step": 6557, + "learning_rate": 0.00047346828046744576, + "loss": 1.4764, + "loss_base2": 2.13, + "loss_pixel": 0.1845, + "loss_text": 1.2919, + "ppl": 4.3772, + "step": 6557 + }, + { + "epoch": 0.04, + "global_step": 6558, + "learning_rate": 0.0004734641068447412, + "loss": 1.5013, + "loss_base2": 2.1659, + "loss_pixel": 0.1855, + "loss_text": 1.3159, + "ppl": 4.4875, + "step": 6558 + }, + { + "epoch": 0.04, + "global_step": 6559, + "learning_rate": 0.0004734599332220367, + "loss": 1.5076, + "loss_base2": 2.175, + "loss_pixel": 0.1852, + "loss_text": 1.3224, + "ppl": 4.5159, + "step": 6559 + }, + { + "epoch": 0.04, + "global_step": 6560, + "learning_rate": 0.00047345575959933223, + "loss": 1.4795, + "loss_base2": 2.1345, + "loss_pixel": 0.1846, + "loss_text": 1.2949, + "ppl": 4.3907, + "step": 6560 + }, + { + "epoch": 0.04, + "global_step": 6561, + "learning_rate": 0.00047345158597662774, + "loss": 1.4755, + "loss_base2": 2.1287, + "loss_pixel": 0.1837, + "loss_text": 1.2918, + "ppl": 4.3732, + "step": 6561 + }, + { + "epoch": 0.04, + "global_step": 6562, + "learning_rate": 0.0004734474123539232, + "loss": 1.471, + "loss_base2": 2.1222, + "loss_pixel": 0.1851, + "loss_text": 1.2859, + "ppl": 4.3536, + "step": 6562 + }, + { + "epoch": 0.04, + "global_step": 6563, + "learning_rate": 0.0004734432387312187, + "loss": 1.4813, + "loss_base2": 2.1371, + "loss_pixel": 0.1848, + "loss_text": 1.2965, + "ppl": 4.3987, + "step": 6563 + }, + { + "epoch": 0.04, + "global_step": 6564, + "learning_rate": 0.0004734390651085142, + "loss": 1.4886, + "loss_base2": 2.1476, + "loss_pixel": 0.1848, + "loss_text": 1.3038, + "ppl": 4.4309, + "step": 6564 + }, + { + "epoch": 0.04, + "global_step": 6565, + "learning_rate": 0.0004734348914858097, + "loss": 1.4828, + "loss_base2": 2.1392, + "loss_pixel": 0.1845, + "loss_text": 1.2983, + "ppl": 4.4053, + "step": 6565 + }, + { + "epoch": 0.04, + "global_step": 6566, + "learning_rate": 0.0004734307178631052, + "loss": 1.4832, + "loss_base2": 2.1398, + "loss_pixel": 0.1831, + "loss_text": 1.3001, + "ppl": 4.407, + "step": 6566 + }, + { + "epoch": 0.04, + "global_step": 6567, + "learning_rate": 0.0004734265442404007, + "loss": 1.496, + "loss_base2": 2.1583, + "loss_pixel": 0.183, + "loss_text": 1.313, + "ppl": 4.4638, + "step": 6567 + }, + { + "epoch": 0.04, + "global_step": 6568, + "learning_rate": 0.0004734223706176962, + "loss": 1.4732, + "loss_base2": 2.1254, + "loss_pixel": 0.1831, + "loss_text": 1.2901, + "ppl": 4.3632, + "step": 6568 + }, + { + "epoch": 0.04, + "global_step": 6569, + "learning_rate": 0.0004734181969949917, + "loss": 1.4825, + "loss_base2": 2.1388, + "loss_pixel": 0.1852, + "loss_text": 1.2973, + "ppl": 4.4039, + "step": 6569 + }, + { + "epoch": 0.04, + "global_step": 6570, + "learning_rate": 0.0004734140233722872, + "loss": 1.4693, + "loss_base2": 2.1198, + "loss_pixel": 0.184, + "loss_text": 1.2853, + "ppl": 4.3462, + "step": 6570 + }, + { + "epoch": 0.04, + "global_step": 6571, + "learning_rate": 0.0004734098497495826, + "loss": 1.4795, + "loss_base2": 2.1345, + "loss_pixel": 0.1846, + "loss_text": 1.2949, + "ppl": 4.3907, + "step": 6571 + }, + { + "epoch": 0.04, + "global_step": 6572, + "learning_rate": 0.0004734056761268781, + "loss": 1.4783, + "loss_base2": 2.1327, + "loss_pixel": 0.1841, + "loss_text": 1.2942, + "ppl": 4.3855, + "step": 6572 + }, + { + "epoch": 0.04, + "global_step": 6573, + "learning_rate": 0.0004734015025041736, + "loss": 1.4813, + "loss_base2": 2.1371, + "loss_pixel": 0.1829, + "loss_text": 1.2984, + "ppl": 4.3987, + "step": 6573 + }, + { + "epoch": 0.04, + "global_step": 6574, + "learning_rate": 0.0004733973288814691, + "loss": 1.475, + "loss_base2": 2.128, + "loss_pixel": 0.184, + "loss_text": 1.291, + "ppl": 4.371, + "step": 6574 + }, + { + "epoch": 0.04, + "global_step": 6575, + "learning_rate": 0.0004733931552587646, + "loss": 1.4668, + "loss_base2": 2.1161, + "loss_pixel": 0.183, + "loss_text": 1.2838, + "ppl": 4.3353, + "step": 6575 + }, + { + "epoch": 0.04, + "global_step": 6576, + "learning_rate": 0.0004733889816360601, + "loss": 1.465, + "loss_base2": 2.1135, + "loss_pixel": 0.182, + "loss_text": 1.283, + "ppl": 4.3275, + "step": 6576 + }, + { + "epoch": 0.04, + "global_step": 6577, + "learning_rate": 0.0004733848080133556, + "loss": 1.4664, + "loss_base2": 2.1156, + "loss_pixel": 0.1866, + "loss_text": 1.2798, + "ppl": 4.3336, + "step": 6577 + }, + { + "epoch": 0.04, + "global_step": 6578, + "learning_rate": 0.0004733806343906511, + "loss": 1.4698, + "loss_base2": 2.1205, + "loss_pixel": 0.1828, + "loss_text": 1.2869, + "ppl": 4.3484, + "step": 6578 + }, + { + "epoch": 0.04, + "global_step": 6579, + "learning_rate": 0.0004733764607679466, + "loss": 1.4836, + "loss_base2": 2.1404, + "loss_pixel": 0.1841, + "loss_text": 1.2995, + "ppl": 4.4088, + "step": 6579 + }, + { + "epoch": 0.04, + "global_step": 6580, + "learning_rate": 0.00047337228714524205, + "loss": 1.5611, + "loss_base2": 2.2522, + "loss_pixel": 0.1834, + "loss_text": 1.3777, + "ppl": 4.7641, + "step": 6580 + }, + { + "epoch": 0.04, + "global_step": 6581, + "learning_rate": 0.00047336811352253756, + "loss": 1.7357, + "loss_base2": 2.5041, + "loss_pixel": 0.1849, + "loss_text": 1.5508, + "ppl": 5.6729, + "step": 6581 + }, + { + "epoch": 0.04, + "global_step": 6582, + "learning_rate": 0.00047336393989983307, + "loss": 1.7354, + "loss_base2": 2.5037, + "loss_pixel": 0.1865, + "loss_text": 1.5489, + "ppl": 5.6712, + "step": 6582 + }, + { + "epoch": 0.04, + "global_step": 6583, + "learning_rate": 0.0004733597662771286, + "loss": 1.7279, + "loss_base2": 2.4928, + "loss_pixel": 0.1834, + "loss_text": 1.5445, + "ppl": 5.6288, + "step": 6583 + }, + { + "epoch": 0.04, + "global_step": 6584, + "learning_rate": 0.0004733555926544241, + "loss": 1.727, + "loss_base2": 2.4915, + "loss_pixel": 0.1846, + "loss_text": 1.5424, + "ppl": 5.6238, + "step": 6584 + }, + { + "epoch": 0.04, + "global_step": 6585, + "learning_rate": 0.00047335141903171954, + "loss": 1.7183, + "loss_base2": 2.479, + "loss_pixel": 0.185, + "loss_text": 1.5332, + "ppl": 5.575, + "step": 6585 + }, + { + "epoch": 0.04, + "global_step": 6586, + "learning_rate": 0.00047334724540901504, + "loss": 1.7026, + "loss_base2": 2.4563, + "loss_pixel": 0.1981, + "loss_text": 1.5046, + "ppl": 5.4882, + "step": 6586 + }, + { + "epoch": 0.04, + "global_step": 6587, + "learning_rate": 0.00047334307178631055, + "loss": 1.7439, + "loss_base2": 2.5159, + "loss_pixel": 0.2073, + "loss_text": 1.5366, + "ppl": 5.7196, + "step": 6587 + }, + { + "epoch": 0.04, + "global_step": 6588, + "learning_rate": 0.00047333889816360606, + "loss": 1.7615, + "loss_base2": 2.5413, + "loss_pixel": 0.2287, + "loss_text": 1.5329, + "ppl": 5.8212, + "step": 6588 + }, + { + "epoch": 0.04, + "global_step": 6589, + "learning_rate": 0.00047333472454090156, + "loss": 1.7509, + "loss_base2": 2.526, + "loss_pixel": 0.2077, + "loss_text": 1.5431, + "ppl": 5.7598, + "step": 6589 + }, + { + "epoch": 0.04, + "global_step": 6590, + "learning_rate": 0.00047333055091819696, + "loss": 1.7307, + "loss_base2": 2.4969, + "loss_pixel": 0.2081, + "loss_text": 1.5226, + "ppl": 5.6446, + "step": 6590 + }, + { + "epoch": 0.04, + "global_step": 6591, + "learning_rate": 0.00047332637729549247, + "loss": 1.7401, + "loss_base2": 2.5104, + "loss_pixel": 0.2077, + "loss_text": 1.5323, + "ppl": 5.6979, + "step": 6591 + }, + { + "epoch": 0.04, + "global_step": 6592, + "learning_rate": 0.000473322203672788, + "loss": 1.7301, + "loss_base2": 2.496, + "loss_pixel": 0.2013, + "loss_text": 1.5287, + "ppl": 5.6412, + "step": 6592 + }, + { + "epoch": 0.04, + "global_step": 6593, + "learning_rate": 0.0004733180300500835, + "loss": 1.7144, + "loss_base2": 2.4734, + "loss_pixel": 0.1995, + "loss_text": 1.5149, + "ppl": 5.5533, + "step": 6593 + }, + { + "epoch": 0.04, + "global_step": 6594, + "learning_rate": 0.00047331385642737894, + "loss": 1.7232, + "loss_base2": 2.4861, + "loss_pixel": 0.1981, + "loss_text": 1.5251, + "ppl": 5.6024, + "step": 6594 + }, + { + "epoch": 0.04, + "global_step": 6595, + "learning_rate": 0.00047330968280467445, + "loss": 1.7334, + "loss_base2": 2.5008, + "loss_pixel": 0.2001, + "loss_text": 1.5333, + "ppl": 5.6599, + "step": 6595 + }, + { + "epoch": 0.04, + "global_step": 6596, + "learning_rate": 0.00047330550918196995, + "loss": 1.7281, + "loss_base2": 2.4931, + "loss_pixel": 0.1973, + "loss_text": 1.5307, + "ppl": 5.6299, + "step": 6596 + }, + { + "epoch": 0.04, + "global_step": 6597, + "learning_rate": 0.00047330133555926546, + "loss": 1.7104, + "loss_base2": 2.4676, + "loss_pixel": 0.194, + "loss_text": 1.5164, + "ppl": 5.5312, + "step": 6597 + }, + { + "epoch": 0.04, + "global_step": 6598, + "learning_rate": 0.00047329716193656097, + "loss": 1.7133, + "loss_base2": 2.4718, + "loss_pixel": 0.1951, + "loss_text": 1.5182, + "ppl": 5.5472, + "step": 6598 + }, + { + "epoch": 0.04, + "global_step": 6599, + "learning_rate": 0.0004732929883138564, + "loss": 1.7155, + "loss_base2": 2.4749, + "loss_pixel": 0.191, + "loss_text": 1.5245, + "ppl": 5.5595, + "step": 6599 + }, + { + "epoch": 0.04, + "global_step": 6600, + "learning_rate": 0.00047328881469115193, + "loss": 1.7316, + "loss_base2": 2.4982, + "loss_pixel": 0.1946, + "loss_text": 1.537, + "ppl": 5.6497, + "step": 6600 + }, + { + "epoch": 0.04, + "global_step": 6601, + "learning_rate": 0.00047328464106844744, + "loss": 1.7322, + "loss_base2": 2.499, + "loss_pixel": 0.2016, + "loss_text": 1.5306, + "ppl": 5.6531, + "step": 6601 + }, + { + "epoch": 0.04, + "global_step": 6602, + "learning_rate": 0.00047328046744574294, + "loss": 1.7451, + "loss_base2": 2.5176, + "loss_pixel": 0.2165, + "loss_text": 1.5286, + "ppl": 5.7265, + "step": 6602 + }, + { + "epoch": 0.04, + "global_step": 6603, + "learning_rate": 0.0004732762938230384, + "loss": 1.7642, + "loss_base2": 2.5452, + "loss_pixel": 0.2284, + "loss_text": 1.5358, + "ppl": 5.8369, + "step": 6603 + }, + { + "epoch": 0.04, + "global_step": 6604, + "learning_rate": 0.0004732721202003339, + "loss": 1.7067, + "loss_base2": 2.4622, + "loss_pixel": 0.2308, + "loss_text": 1.4759, + "ppl": 5.5107, + "step": 6604 + }, + { + "epoch": 0.04, + "global_step": 6605, + "learning_rate": 0.0004732679465776294, + "loss": 1.5294, + "loss_base2": 2.2065, + "loss_pixel": 0.2257, + "loss_text": 1.3037, + "ppl": 4.6154, + "step": 6605 + }, + { + "epoch": 0.04, + "global_step": 6606, + "learning_rate": 0.0004732637729549249, + "loss": 1.5183, + "loss_base2": 2.1904, + "loss_pixel": 0.2183, + "loss_text": 1.3001, + "ppl": 4.5645, + "step": 6606 + }, + { + "epoch": 0.04, + "global_step": 6607, + "learning_rate": 0.0004732595993322204, + "loss": 1.489, + "loss_base2": 2.1482, + "loss_pixel": 0.2127, + "loss_text": 1.2762, + "ppl": 4.4327, + "step": 6607 + }, + { + "epoch": 0.04, + "global_step": 6608, + "learning_rate": 0.0004732554257095159, + "loss": 1.523, + "loss_base2": 2.1972, + "loss_pixel": 0.2107, + "loss_text": 1.3124, + "ppl": 4.586, + "step": 6608 + }, + { + "epoch": 0.04, + "global_step": 6609, + "learning_rate": 0.00047325125208681133, + "loss": 1.5263, + "loss_base2": 2.202, + "loss_pixel": 0.2078, + "loss_text": 1.3185, + "ppl": 4.6011, + "step": 6609 + }, + { + "epoch": 0.04, + "global_step": 6610, + "learning_rate": 0.00047324707846410684, + "loss": 1.493, + "loss_base2": 2.1539, + "loss_pixel": 0.2077, + "loss_text": 1.2853, + "ppl": 4.4504, + "step": 6610 + }, + { + "epoch": 0.04, + "global_step": 6611, + "learning_rate": 0.00047324290484140235, + "loss": 1.5188, + "loss_base2": 2.1912, + "loss_pixel": 0.2055, + "loss_text": 1.3132, + "ppl": 4.5667, + "step": 6611 + }, + { + "epoch": 0.04, + "global_step": 6612, + "learning_rate": 0.0004732387312186978, + "loss": 1.6321, + "loss_base2": 2.3546, + "loss_pixel": 0.215, + "loss_text": 1.4171, + "ppl": 5.1146, + "step": 6612 + }, + { + "epoch": 0.04, + "global_step": 6613, + "learning_rate": 0.0004732345575959933, + "loss": 1.7767, + "loss_base2": 2.5632, + "loss_pixel": 0.226, + "loss_text": 1.5506, + "ppl": 5.9103, + "step": 6613 + }, + { + "epoch": 0.04, + "global_step": 6614, + "learning_rate": 0.0004732303839732888, + "loss": 1.7885, + "loss_base2": 2.5803, + "loss_pixel": 0.2332, + "loss_text": 1.5552, + "ppl": 5.9805, + "step": 6614 + }, + { + "epoch": 0.04, + "global_step": 6615, + "learning_rate": 0.0004732262103505843, + "loss": 1.7491, + "loss_base2": 2.5234, + "loss_pixel": 0.2191, + "loss_text": 1.5299, + "ppl": 5.7494, + "step": 6615 + }, + { + "epoch": 0.04, + "global_step": 6616, + "learning_rate": 0.00047322203672787983, + "loss": 1.745, + "loss_base2": 2.5175, + "loss_pixel": 0.2121, + "loss_text": 1.5329, + "ppl": 5.7259, + "step": 6616 + }, + { + "epoch": 0.04, + "global_step": 6617, + "learning_rate": 0.0004732178631051753, + "loss": 1.7438, + "loss_base2": 2.5158, + "loss_pixel": 0.2136, + "loss_text": 1.5302, + "ppl": 5.719, + "step": 6617 + }, + { + "epoch": 0.04, + "global_step": 6618, + "learning_rate": 0.0004732136894824708, + "loss": 1.7501, + "loss_base2": 2.5249, + "loss_pixel": 0.2148, + "loss_text": 1.5353, + "ppl": 5.7552, + "step": 6618 + }, + { + "epoch": 0.04, + "global_step": 6619, + "learning_rate": 0.0004732095158597663, + "loss": 1.7531, + "loss_base2": 2.5292, + "loss_pixel": 0.2127, + "loss_text": 1.5405, + "ppl": 5.7725, + "step": 6619 + }, + { + "epoch": 0.04, + "global_step": 6620, + "learning_rate": 0.0004732053422370618, + "loss": 1.7502, + "loss_base2": 2.525, + "loss_pixel": 0.2149, + "loss_text": 1.5353, + "ppl": 5.7558, + "step": 6620 + }, + { + "epoch": 0.04, + "global_step": 6621, + "learning_rate": 0.00047320116861435726, + "loss": 1.7362, + "loss_base2": 2.5048, + "loss_pixel": 0.2077, + "loss_text": 1.5286, + "ppl": 5.6757, + "step": 6621 + }, + { + "epoch": 0.04, + "global_step": 6622, + "learning_rate": 0.00047319699499165276, + "loss": 1.7387, + "loss_base2": 2.5084, + "loss_pixel": 0.2096, + "loss_text": 1.5291, + "ppl": 5.6899, + "step": 6622 + }, + { + "epoch": 0.04, + "global_step": 6623, + "learning_rate": 0.00047319282136894827, + "loss": 1.7278, + "loss_base2": 2.4927, + "loss_pixel": 0.2043, + "loss_text": 1.5235, + "ppl": 5.6283, + "step": 6623 + }, + { + "epoch": 0.04, + "global_step": 6624, + "learning_rate": 0.0004731886477462438, + "loss": 1.7125, + "loss_base2": 2.4706, + "loss_pixel": 0.2037, + "loss_text": 1.5089, + "ppl": 5.5428, + "step": 6624 + }, + { + "epoch": 0.04, + "global_step": 6625, + "learning_rate": 0.0004731844741235393, + "loss": 1.7384, + "loss_base2": 2.508, + "loss_pixel": 0.2025, + "loss_text": 1.5358, + "ppl": 5.6882, + "step": 6625 + }, + { + "epoch": 0.04, + "global_step": 6626, + "learning_rate": 0.00047318030050083474, + "loss": 1.7346, + "loss_base2": 2.5025, + "loss_pixel": 0.1997, + "loss_text": 1.5349, + "ppl": 5.6667, + "step": 6626 + }, + { + "epoch": 0.04, + "global_step": 6627, + "learning_rate": 0.00047317612687813025, + "loss": 1.7466, + "loss_base2": 2.5198, + "loss_pixel": 0.2006, + "loss_text": 1.546, + "ppl": 5.7351, + "step": 6627 + }, + { + "epoch": 0.04, + "global_step": 6628, + "learning_rate": 0.0004731719532554257, + "loss": 1.702, + "loss_base2": 2.4555, + "loss_pixel": 0.198, + "loss_text": 1.504, + "ppl": 5.4849, + "step": 6628 + }, + { + "epoch": 0.04, + "global_step": 6629, + "learning_rate": 0.0004731677796327212, + "loss": 1.7343, + "loss_base2": 2.5021, + "loss_pixel": 0.198, + "loss_text": 1.5363, + "ppl": 5.665, + "step": 6629 + }, + { + "epoch": 0.04, + "global_step": 6630, + "learning_rate": 0.00047316360601001666, + "loss": 1.7103, + "loss_base2": 2.4674, + "loss_pixel": 0.195, + "loss_text": 1.5153, + "ppl": 5.5306, + "step": 6630 + }, + { + "epoch": 0.04, + "global_step": 6631, + "learning_rate": 0.00047315943238731217, + "loss": 1.7199, + "loss_base2": 2.4813, + "loss_pixel": 0.1955, + "loss_text": 1.5244, + "ppl": 5.584, + "step": 6631 + }, + { + "epoch": 0.04, + "global_step": 6632, + "learning_rate": 0.0004731552587646077, + "loss": 1.7215, + "loss_base2": 2.4836, + "loss_pixel": 0.1946, + "loss_text": 1.5269, + "ppl": 5.5929, + "step": 6632 + }, + { + "epoch": 0.04, + "global_step": 6633, + "learning_rate": 0.0004731510851419032, + "loss": 1.7157, + "loss_base2": 2.4752, + "loss_pixel": 0.1947, + "loss_text": 1.521, + "ppl": 5.5606, + "step": 6633 + }, + { + "epoch": 0.04, + "global_step": 6634, + "learning_rate": 0.0004731469115191987, + "loss": 1.7412, + "loss_base2": 2.512, + "loss_pixel": 0.1981, + "loss_text": 1.5432, + "ppl": 5.7042, + "step": 6634 + }, + { + "epoch": 0.04, + "global_step": 6635, + "learning_rate": 0.00047314273789649414, + "loss": 1.7081, + "loss_base2": 2.4643, + "loss_pixel": 0.1964, + "loss_text": 1.5117, + "ppl": 5.5185, + "step": 6635 + }, + { + "epoch": 0.04, + "global_step": 6636, + "learning_rate": 0.00047313856427378965, + "loss": 1.7267, + "loss_base2": 2.4911, + "loss_pixel": 0.1948, + "loss_text": 1.5319, + "ppl": 5.6221, + "step": 6636 + }, + { + "epoch": 0.04, + "global_step": 6637, + "learning_rate": 0.00047313439065108516, + "loss": 1.7239, + "loss_base2": 2.4871, + "loss_pixel": 0.1935, + "loss_text": 1.5304, + "ppl": 5.6064, + "step": 6637 + }, + { + "epoch": 0.04, + "global_step": 6638, + "learning_rate": 0.00047313021702838066, + "loss": 1.7245, + "loss_base2": 2.4879, + "loss_pixel": 0.1942, + "loss_text": 1.5303, + "ppl": 5.6097, + "step": 6638 + }, + { + "epoch": 0.04, + "global_step": 6639, + "learning_rate": 0.0004731260434056761, + "loss": 1.7007, + "loss_base2": 2.4536, + "loss_pixel": 0.1921, + "loss_text": 1.5085, + "ppl": 5.4778, + "step": 6639 + }, + { + "epoch": 0.04, + "global_step": 6640, + "learning_rate": 0.0004731218697829716, + "loss": 1.7146, + "loss_base2": 2.4736, + "loss_pixel": 0.1925, + "loss_text": 1.5221, + "ppl": 5.5545, + "step": 6640 + }, + { + "epoch": 0.04, + "global_step": 6641, + "learning_rate": 0.00047311769616026713, + "loss": 1.7247, + "loss_base2": 2.4882, + "loss_pixel": 0.1914, + "loss_text": 1.5333, + "ppl": 5.6108, + "step": 6641 + }, + { + "epoch": 0.04, + "global_step": 6642, + "learning_rate": 0.00047311352253756264, + "loss": 1.6894, + "loss_base2": 2.4373, + "loss_pixel": 0.1894, + "loss_text": 1.5, + "ppl": 5.4162, + "step": 6642 + }, + { + "epoch": 0.04, + "global_step": 6643, + "learning_rate": 0.00047310934891485815, + "loss": 1.7316, + "loss_base2": 2.4982, + "loss_pixel": 0.1908, + "loss_text": 1.5408, + "ppl": 5.6497, + "step": 6643 + }, + { + "epoch": 0.04, + "global_step": 6644, + "learning_rate": 0.0004731051752921536, + "loss": 1.7198, + "loss_base2": 2.4811, + "loss_pixel": 0.19, + "loss_text": 1.5298, + "ppl": 5.5834, + "step": 6644 + }, + { + "epoch": 0.04, + "global_step": 6645, + "learning_rate": 0.0004731010016694491, + "loss": 1.7259, + "loss_base2": 2.4899, + "loss_pixel": 0.1907, + "loss_text": 1.5352, + "ppl": 5.6176, + "step": 6645 + }, + { + "epoch": 0.04, + "global_step": 6646, + "learning_rate": 0.0004730968280467446, + "loss": 1.7038, + "loss_base2": 2.4581, + "loss_pixel": 0.1887, + "loss_text": 1.5151, + "ppl": 5.4948, + "step": 6646 + }, + { + "epoch": 0.04, + "global_step": 6647, + "learning_rate": 0.00047309265442404007, + "loss": 1.7243, + "loss_base2": 2.4876, + "loss_pixel": 0.1882, + "loss_text": 1.5362, + "ppl": 5.6086, + "step": 6647 + }, + { + "epoch": 0.04, + "global_step": 6648, + "learning_rate": 0.0004730884808013356, + "loss": 1.7057, + "loss_base2": 2.4608, + "loss_pixel": 0.1879, + "loss_text": 1.5178, + "ppl": 5.5052, + "step": 6648 + }, + { + "epoch": 0.04, + "global_step": 6649, + "learning_rate": 0.00047308430717863103, + "loss": 1.7124, + "loss_base2": 2.4705, + "loss_pixel": 0.1876, + "loss_text": 1.5249, + "ppl": 5.5422, + "step": 6649 + }, + { + "epoch": 0.04, + "global_step": 6650, + "learning_rate": 0.00047308013355592654, + "loss": 1.7027, + "loss_base2": 2.4565, + "loss_pixel": 0.1874, + "loss_text": 1.5153, + "ppl": 5.4887, + "step": 6650 + }, + { + "epoch": 0.04, + "global_step": 6651, + "learning_rate": 0.00047307595993322204, + "loss": 1.7185, + "loss_base2": 2.4793, + "loss_pixel": 0.188, + "loss_text": 1.5304, + "ppl": 5.5762, + "step": 6651 + }, + { + "epoch": 0.04, + "global_step": 6652, + "learning_rate": 0.00047307178631051755, + "loss": 1.6985, + "loss_base2": 2.4504, + "loss_pixel": 0.1882, + "loss_text": 1.5103, + "ppl": 5.4657, + "step": 6652 + }, + { + "epoch": 0.04, + "global_step": 6653, + "learning_rate": 0.000473067612687813, + "loss": 1.6967, + "loss_base2": 2.4478, + "loss_pixel": 0.1877, + "loss_text": 1.509, + "ppl": 5.4559, + "step": 6653 + }, + { + "epoch": 0.04, + "global_step": 6654, + "learning_rate": 0.0004730634390651085, + "loss": 1.7193, + "loss_base2": 2.4804, + "loss_pixel": 0.1865, + "loss_text": 1.5328, + "ppl": 5.5806, + "step": 6654 + }, + { + "epoch": 0.04, + "global_step": 6655, + "learning_rate": 0.000473059265442404, + "loss": 1.7068, + "loss_base2": 2.4624, + "loss_pixel": 0.1875, + "loss_text": 1.5193, + "ppl": 5.5113, + "step": 6655 + }, + { + "epoch": 0.04, + "global_step": 6656, + "learning_rate": 0.0004730550918196995, + "loss": 1.7017, + "loss_base2": 2.455, + "loss_pixel": 0.1867, + "loss_text": 1.515, + "ppl": 5.4833, + "step": 6656 + }, + { + "epoch": 0.04, + "global_step": 6657, + "learning_rate": 0.00047305091819699503, + "loss": 1.7167, + "loss_base2": 2.4767, + "loss_pixel": 0.1858, + "loss_text": 1.531, + "ppl": 5.5661, + "step": 6657 + }, + { + "epoch": 0.04, + "global_step": 6658, + "learning_rate": 0.0004730467445742905, + "loss": 1.7088, + "loss_base2": 2.4653, + "loss_pixel": 0.1862, + "loss_text": 1.5226, + "ppl": 5.5223, + "step": 6658 + }, + { + "epoch": 0.04, + "global_step": 6659, + "learning_rate": 0.000473042570951586, + "loss": 1.7151, + "loss_base2": 2.4744, + "loss_pixel": 0.1862, + "loss_text": 1.5289, + "ppl": 5.5572, + "step": 6659 + }, + { + "epoch": 0.04, + "global_step": 6660, + "learning_rate": 0.0004730383973288815, + "loss": 1.6945, + "loss_base2": 2.4446, + "loss_pixel": 0.1856, + "loss_text": 1.5089, + "ppl": 5.4439, + "step": 6660 + }, + { + "epoch": 0.04, + "global_step": 6661, + "learning_rate": 0.000473034223706177, + "loss": 1.691, + "loss_base2": 2.4396, + "loss_pixel": 0.1861, + "loss_text": 1.505, + "ppl": 5.4249, + "step": 6661 + }, + { + "epoch": 0.04, + "global_step": 6662, + "learning_rate": 0.00047303005008347246, + "loss": 1.6016, + "loss_base2": 2.3106, + "loss_pixel": 0.1848, + "loss_text": 1.4168, + "ppl": 4.961, + "step": 6662 + }, + { + "epoch": 0.04, + "global_step": 6663, + "learning_rate": 0.00047302587646076797, + "loss": 1.4669, + "loss_base2": 2.1163, + "loss_pixel": 0.1853, + "loss_text": 1.2815, + "ppl": 4.3358, + "step": 6663 + }, + { + "epoch": 0.04, + "global_step": 6664, + "learning_rate": 0.0004730217028380635, + "loss": 1.4869, + "loss_base2": 2.1451, + "loss_pixel": 0.1851, + "loss_text": 1.3018, + "ppl": 4.4234, + "step": 6664 + }, + { + "epoch": 0.04, + "global_step": 6665, + "learning_rate": 0.00047301752921535893, + "loss": 1.484, + "loss_base2": 2.141, + "loss_pixel": 0.1857, + "loss_text": 1.2983, + "ppl": 4.4106, + "step": 6665 + }, + { + "epoch": 0.04, + "global_step": 6666, + "learning_rate": 0.00047301335559265444, + "loss": 1.4756, + "loss_base2": 2.1288, + "loss_pixel": 0.1866, + "loss_text": 1.289, + "ppl": 4.3737, + "step": 6666 + }, + { + "epoch": 0.04, + "global_step": 6667, + "learning_rate": 0.0004730091819699499, + "loss": 1.4994, + "loss_base2": 2.1632, + "loss_pixel": 0.1854, + "loss_text": 1.3139, + "ppl": 4.479, + "step": 6667 + }, + { + "epoch": 0.04, + "global_step": 6668, + "learning_rate": 0.0004730050083472454, + "loss": 1.4792, + "loss_base2": 2.134, + "loss_pixel": 0.1839, + "loss_text": 1.2953, + "ppl": 4.3894, + "step": 6668 + }, + { + "epoch": 0.04, + "global_step": 6669, + "learning_rate": 0.0004730008347245409, + "loss": 1.4689, + "loss_base2": 2.1192, + "loss_pixel": 0.1863, + "loss_text": 1.2826, + "ppl": 4.3445, + "step": 6669 + }, + { + "epoch": 0.04, + "global_step": 6670, + "learning_rate": 0.0004729966611018364, + "loss": 1.4635, + "loss_base2": 2.1114, + "loss_pixel": 0.1857, + "loss_text": 1.2777, + "ppl": 4.3211, + "step": 6670 + }, + { + "epoch": 0.04, + "global_step": 6671, + "learning_rate": 0.00047299248747913186, + "loss": 1.4546, + "loss_base2": 2.0985, + "loss_pixel": 0.1843, + "loss_text": 1.2703, + "ppl": 4.2828, + "step": 6671 + }, + { + "epoch": 0.04, + "global_step": 6672, + "learning_rate": 0.00047298831385642737, + "loss": 1.4522, + "loss_base2": 2.0951, + "loss_pixel": 0.1856, + "loss_text": 1.2666, + "ppl": 4.2725, + "step": 6672 + }, + { + "epoch": 0.04, + "global_step": 6673, + "learning_rate": 0.0004729841402337229, + "loss": 1.4665, + "loss_base2": 2.1157, + "loss_pixel": 0.1834, + "loss_text": 1.2831, + "ppl": 4.334, + "step": 6673 + }, + { + "epoch": 0.04, + "global_step": 6674, + "learning_rate": 0.0004729799666110184, + "loss": 1.4873, + "loss_base2": 2.1457, + "loss_pixel": 0.1833, + "loss_text": 1.3039, + "ppl": 4.4251, + "step": 6674 + }, + { + "epoch": 0.04, + "global_step": 6675, + "learning_rate": 0.0004729757929883139, + "loss": 1.4687, + "loss_base2": 2.1189, + "loss_pixel": 0.1869, + "loss_text": 1.2819, + "ppl": 4.3436, + "step": 6675 + }, + { + "epoch": 0.04, + "global_step": 6676, + "learning_rate": 0.00047297161936560935, + "loss": 1.4742, + "loss_base2": 2.1268, + "loss_pixel": 0.1842, + "loss_text": 1.29, + "ppl": 4.3675, + "step": 6676 + }, + { + "epoch": 0.04, + "global_step": 6677, + "learning_rate": 0.00047296744574290485, + "loss": 1.4634, + "loss_base2": 2.1112, + "loss_pixel": 0.1837, + "loss_text": 1.2798, + "ppl": 4.3206, + "step": 6677 + }, + { + "epoch": 0.04, + "global_step": 6678, + "learning_rate": 0.00047296327212020036, + "loss": 1.4716, + "loss_base2": 2.1231, + "loss_pixel": 0.1848, + "loss_text": 1.2868, + "ppl": 4.3562, + "step": 6678 + }, + { + "epoch": 0.04, + "global_step": 6679, + "learning_rate": 0.00047295909849749587, + "loss": 1.4499, + "loss_base2": 2.0918, + "loss_pixel": 0.1842, + "loss_text": 1.2656, + "ppl": 4.2627, + "step": 6679 + }, + { + "epoch": 0.04, + "global_step": 6680, + "learning_rate": 0.0004729549248747913, + "loss": 1.4588, + "loss_base2": 2.1046, + "loss_pixel": 0.1846, + "loss_text": 1.2742, + "ppl": 4.3008, + "step": 6680 + }, + { + "epoch": 0.04, + "global_step": 6681, + "learning_rate": 0.00047295075125208683, + "loss": 1.4799, + "loss_base2": 2.135, + "loss_pixel": 0.1849, + "loss_text": 1.295, + "ppl": 4.3925, + "step": 6681 + }, + { + "epoch": 0.04, + "global_step": 6682, + "learning_rate": 0.00047294657762938234, + "loss": 1.4755, + "loss_base2": 2.1287, + "loss_pixel": 0.184, + "loss_text": 1.2915, + "ppl": 4.3732, + "step": 6682 + }, + { + "epoch": 0.04, + "global_step": 6683, + "learning_rate": 0.00047294240400667784, + "loss": 1.4704, + "loss_base2": 2.1213, + "loss_pixel": 0.1852, + "loss_text": 1.2852, + "ppl": 4.351, + "step": 6683 + }, + { + "epoch": 0.04, + "global_step": 6684, + "learning_rate": 0.0004729382303839733, + "loss": 1.4555, + "loss_base2": 2.0998, + "loss_pixel": 0.1839, + "loss_text": 1.2715, + "ppl": 4.2866, + "step": 6684 + }, + { + "epoch": 0.04, + "global_step": 6685, + "learning_rate": 0.00047293405676126875, + "loss": 1.4675, + "loss_base2": 2.1172, + "loss_pixel": 0.1841, + "loss_text": 1.2834, + "ppl": 4.3384, + "step": 6685 + }, + { + "epoch": 0.04, + "global_step": 6686, + "learning_rate": 0.00047292988313856426, + "loss": 1.4862, + "loss_base2": 2.1441, + "loss_pixel": 0.183, + "loss_text": 1.3032, + "ppl": 4.4203, + "step": 6686 + }, + { + "epoch": 0.04, + "global_step": 6687, + "learning_rate": 0.00047292570951585976, + "loss": 1.4657, + "loss_base2": 2.1146, + "loss_pixel": 0.1831, + "loss_text": 1.2826, + "ppl": 4.3306, + "step": 6687 + }, + { + "epoch": 0.04, + "global_step": 6688, + "learning_rate": 0.00047292153589315527, + "loss": 1.4756, + "loss_base2": 2.1288, + "loss_pixel": 0.1844, + "loss_text": 1.2911, + "ppl": 4.3737, + "step": 6688 + }, + { + "epoch": 0.04, + "global_step": 6689, + "learning_rate": 0.0004729173622704507, + "loss": 1.4666, + "loss_base2": 2.1159, + "loss_pixel": 0.1834, + "loss_text": 1.2831, + "ppl": 4.3345, + "step": 6689 + }, + { + "epoch": 0.04, + "global_step": 6690, + "learning_rate": 0.00047291318864774623, + "loss": 1.4873, + "loss_base2": 2.1457, + "loss_pixel": 0.1839, + "loss_text": 1.3034, + "ppl": 4.4251, + "step": 6690 + }, + { + "epoch": 0.04, + "global_step": 6691, + "learning_rate": 0.00047290901502504174, + "loss": 1.4582, + "loss_base2": 2.1037, + "loss_pixel": 0.1843, + "loss_text": 1.2739, + "ppl": 4.2982, + "step": 6691 + }, + { + "epoch": 0.04, + "global_step": 6692, + "learning_rate": 0.00047290484140233725, + "loss": 1.4539, + "loss_base2": 2.0975, + "loss_pixel": 0.1841, + "loss_text": 1.2698, + "ppl": 4.2798, + "step": 6692 + }, + { + "epoch": 0.04, + "global_step": 6693, + "learning_rate": 0.00047290066777963275, + "loss": 1.4851, + "loss_base2": 2.1425, + "loss_pixel": 0.1837, + "loss_text": 1.3014, + "ppl": 4.4154, + "step": 6693 + }, + { + "epoch": 0.04, + "global_step": 6694, + "learning_rate": 0.0004728964941569282, + "loss": 1.4566, + "loss_base2": 2.1014, + "loss_pixel": 0.1854, + "loss_text": 1.2712, + "ppl": 4.2913, + "step": 6694 + }, + { + "epoch": 0.04, + "global_step": 6695, + "learning_rate": 0.0004728923205342237, + "loss": 1.4824, + "loss_base2": 2.1387, + "loss_pixel": 0.1829, + "loss_text": 1.2994, + "ppl": 4.4035, + "step": 6695 + }, + { + "epoch": 0.04, + "global_step": 6696, + "learning_rate": 0.0004728881469115192, + "loss": 1.6036, + "loss_base2": 2.3135, + "loss_pixel": 0.1838, + "loss_text": 1.4198, + "ppl": 4.9709, + "step": 6696 + }, + { + "epoch": 0.04, + "global_step": 6697, + "learning_rate": 0.00047288397328881473, + "loss": 1.7232, + "loss_base2": 2.4861, + "loss_pixel": 0.1836, + "loss_text": 1.5396, + "ppl": 5.6024, + "step": 6697 + }, + { + "epoch": 0.04, + "global_step": 6698, + "learning_rate": 0.0004728797996661102, + "loss": 1.734, + "loss_base2": 2.5016, + "loss_pixel": 0.1828, + "loss_text": 1.5512, + "ppl": 5.6633, + "step": 6698 + }, + { + "epoch": 0.04, + "global_step": 6699, + "learning_rate": 0.0004728756260434057, + "loss": 1.7322, + "loss_base2": 2.499, + "loss_pixel": 0.1836, + "loss_text": 1.5485, + "ppl": 5.6531, + "step": 6699 + }, + { + "epoch": 0.04, + "global_step": 6700, + "learning_rate": 0.0004728714524207012, + "loss": 1.7228, + "loss_base2": 2.4855, + "loss_pixel": 0.1836, + "loss_text": 1.5392, + "ppl": 5.6002, + "step": 6700 + }, + { + "epoch": 0.04, + "global_step": 6701, + "learning_rate": 0.0004728672787979967, + "loss": 1.7165, + "loss_base2": 2.4764, + "loss_pixel": 0.1823, + "loss_text": 1.5341, + "ppl": 5.565, + "step": 6701 + }, + { + "epoch": 0.04, + "global_step": 6702, + "learning_rate": 0.0004728631051752922, + "loss": 1.7143, + "loss_base2": 2.4732, + "loss_pixel": 0.1837, + "loss_text": 1.5306, + "ppl": 5.5528, + "step": 6702 + }, + { + "epoch": 0.04, + "global_step": 6703, + "learning_rate": 0.0004728589315525876, + "loss": 1.7294, + "loss_base2": 2.495, + "loss_pixel": 0.1843, + "loss_text": 1.5451, + "ppl": 5.6373, + "step": 6703 + }, + { + "epoch": 0.04, + "global_step": 6704, + "learning_rate": 0.0004728547579298831, + "loss": 1.7109, + "loss_base2": 2.4683, + "loss_pixel": 0.184, + "loss_text": 1.527, + "ppl": 5.5339, + "step": 6704 + }, + { + "epoch": 0.04, + "global_step": 6705, + "learning_rate": 0.0004728505843071786, + "loss": 1.7265, + "loss_base2": 2.4908, + "loss_pixel": 0.1832, + "loss_text": 1.5432, + "ppl": 5.6209, + "step": 6705 + }, + { + "epoch": 0.04, + "global_step": 6706, + "learning_rate": 0.00047284641068447413, + "loss": 1.7049, + "loss_base2": 2.4597, + "loss_pixel": 0.1831, + "loss_text": 1.5218, + "ppl": 5.5008, + "step": 6706 + }, + { + "epoch": 0.04, + "global_step": 6707, + "learning_rate": 0.00047284223706176964, + "loss": 1.6863, + "loss_base2": 2.4328, + "loss_pixel": 0.1834, + "loss_text": 1.5029, + "ppl": 5.3995, + "step": 6707 + }, + { + "epoch": 0.04, + "global_step": 6708, + "learning_rate": 0.0004728380634390651, + "loss": 1.71, + "loss_base2": 2.467, + "loss_pixel": 0.1817, + "loss_text": 1.5283, + "ppl": 5.529, + "step": 6708 + }, + { + "epoch": 0.04, + "global_step": 6709, + "learning_rate": 0.0004728338898163606, + "loss": 1.7005, + "loss_base2": 2.4533, + "loss_pixel": 0.1828, + "loss_text": 1.5177, + "ppl": 5.4767, + "step": 6709 + }, + { + "epoch": 0.04, + "global_step": 6710, + "learning_rate": 0.0004728297161936561, + "loss": 1.7078, + "loss_base2": 2.4638, + "loss_pixel": 0.1834, + "loss_text": 1.5244, + "ppl": 5.5168, + "step": 6710 + }, + { + "epoch": 0.04, + "global_step": 6711, + "learning_rate": 0.0004728255425709516, + "loss": 1.7047, + "loss_base2": 2.4594, + "loss_pixel": 0.1825, + "loss_text": 1.5222, + "ppl": 5.4997, + "step": 6711 + }, + { + "epoch": 0.04, + "global_step": 6712, + "learning_rate": 0.00047282136894824707, + "loss": 1.7106, + "loss_base2": 2.4679, + "loss_pixel": 0.1834, + "loss_text": 1.5272, + "ppl": 5.5323, + "step": 6712 + }, + { + "epoch": 0.04, + "global_step": 6713, + "learning_rate": 0.0004728171953255426, + "loss": 1.7142, + "loss_base2": 2.4731, + "loss_pixel": 0.1826, + "loss_text": 1.5316, + "ppl": 5.5522, + "step": 6713 + }, + { + "epoch": 0.04, + "global_step": 6714, + "learning_rate": 0.0004728130217028381, + "loss": 1.7118, + "loss_base2": 2.4696, + "loss_pixel": 0.1839, + "loss_text": 1.5279, + "ppl": 5.5389, + "step": 6714 + }, + { + "epoch": 0.04, + "global_step": 6715, + "learning_rate": 0.0004728088480801336, + "loss": 1.7176, + "loss_base2": 2.478, + "loss_pixel": 0.1819, + "loss_text": 1.5357, + "ppl": 5.5711, + "step": 6715 + }, + { + "epoch": 0.04, + "global_step": 6716, + "learning_rate": 0.0004728046744574291, + "loss": 1.698, + "loss_base2": 2.4497, + "loss_pixel": 0.1828, + "loss_text": 1.5152, + "ppl": 5.463, + "step": 6716 + }, + { + "epoch": 0.04, + "global_step": 6717, + "learning_rate": 0.00047280050083472455, + "loss": 1.6805, + "loss_base2": 2.4244, + "loss_pixel": 0.1817, + "loss_text": 1.4989, + "ppl": 5.3682, + "step": 6717 + }, + { + "epoch": 0.04, + "global_step": 6718, + "learning_rate": 0.00047279632721202006, + "loss": 1.7164, + "loss_base2": 2.4762, + "loss_pixel": 0.1833, + "loss_text": 1.533, + "ppl": 5.5645, + "step": 6718 + }, + { + "epoch": 0.04, + "global_step": 6719, + "learning_rate": 0.00047279215358931556, + "loss": 1.716, + "loss_base2": 2.4757, + "loss_pixel": 0.1829, + "loss_text": 1.5331, + "ppl": 5.5622, + "step": 6719 + }, + { + "epoch": 0.04, + "global_step": 6720, + "learning_rate": 0.00047278797996661107, + "loss": 1.7035, + "loss_base2": 2.4576, + "loss_pixel": 0.1821, + "loss_text": 1.5214, + "ppl": 5.4931, + "step": 6720 + }, + { + "epoch": 0.04, + "global_step": 6721, + "learning_rate": 0.00047278380634390647, + "loss": 1.6632, + "loss_base2": 2.3995, + "loss_pixel": 0.183, + "loss_text": 1.4802, + "ppl": 5.2762, + "step": 6721 + }, + { + "epoch": 0.04, + "global_step": 6722, + "learning_rate": 0.000472779632721202, + "loss": 1.4904, + "loss_base2": 2.1502, + "loss_pixel": 0.1819, + "loss_text": 1.3085, + "ppl": 4.4389, + "step": 6722 + }, + { + "epoch": 0.04, + "global_step": 6723, + "learning_rate": 0.0004727754590984975, + "loss": 1.4874, + "loss_base2": 2.1459, + "loss_pixel": 0.1815, + "loss_text": 1.3058, + "ppl": 4.4256, + "step": 6723 + }, + { + "epoch": 0.04, + "global_step": 6724, + "learning_rate": 0.000472771285475793, + "loss": 1.4845, + "loss_base2": 2.1417, + "loss_pixel": 0.1829, + "loss_text": 1.3016, + "ppl": 4.4128, + "step": 6724 + }, + { + "epoch": 0.04, + "global_step": 6725, + "learning_rate": 0.0004727671118530885, + "loss": 1.4981, + "loss_base2": 2.1613, + "loss_pixel": 0.1812, + "loss_text": 1.3169, + "ppl": 4.4732, + "step": 6725 + }, + { + "epoch": 0.04, + "global_step": 6726, + "learning_rate": 0.00047276293823038395, + "loss": 1.4614, + "loss_base2": 2.1084, + "loss_pixel": 0.1838, + "loss_text": 1.2776, + "ppl": 4.312, + "step": 6726 + }, + { + "epoch": 0.04, + "global_step": 6727, + "learning_rate": 0.00047275876460767946, + "loss": 1.4885, + "loss_base2": 2.1475, + "loss_pixel": 0.1824, + "loss_text": 1.3061, + "ppl": 4.4304, + "step": 6727 + }, + { + "epoch": 0.04, + "global_step": 6728, + "learning_rate": 0.00047275459098497497, + "loss": 1.4527, + "loss_base2": 2.0958, + "loss_pixel": 0.1825, + "loss_text": 1.2702, + "ppl": 4.2746, + "step": 6728 + }, + { + "epoch": 0.04, + "global_step": 6729, + "learning_rate": 0.0004727504173622705, + "loss": 1.6352, + "loss_base2": 2.3591, + "loss_pixel": 0.1817, + "loss_text": 1.4535, + "ppl": 5.1305, + "step": 6729 + }, + { + "epoch": 0.04, + "global_step": 6730, + "learning_rate": 0.00047274624373956593, + "loss": 1.7254, + "loss_base2": 2.4892, + "loss_pixel": 0.1827, + "loss_text": 1.5427, + "ppl": 5.6148, + "step": 6730 + }, + { + "epoch": 0.04, + "global_step": 6731, + "learning_rate": 0.00047274207011686144, + "loss": 1.6859, + "loss_base2": 2.4322, + "loss_pixel": 0.183, + "loss_text": 1.5029, + "ppl": 5.3973, + "step": 6731 + }, + { + "epoch": 0.04, + "global_step": 6732, + "learning_rate": 0.00047273789649415694, + "loss": 1.7165, + "loss_base2": 2.4764, + "loss_pixel": 0.1815, + "loss_text": 1.535, + "ppl": 5.565, + "step": 6732 + }, + { + "epoch": 0.04, + "global_step": 6733, + "learning_rate": 0.00047273372287145245, + "loss": 1.7317, + "loss_base2": 2.4983, + "loss_pixel": 0.183, + "loss_text": 1.5488, + "ppl": 5.6503, + "step": 6733 + }, + { + "epoch": 0.04, + "global_step": 6734, + "learning_rate": 0.00047272954924874796, + "loss": 1.7113, + "loss_base2": 2.4689, + "loss_pixel": 0.1818, + "loss_text": 1.5295, + "ppl": 5.5362, + "step": 6734 + }, + { + "epoch": 0.04, + "global_step": 6735, + "learning_rate": 0.0004727253756260434, + "loss": 1.7197, + "loss_base2": 2.481, + "loss_pixel": 0.1837, + "loss_text": 1.5359, + "ppl": 5.5829, + "step": 6735 + }, + { + "epoch": 0.04, + "global_step": 6736, + "learning_rate": 0.0004727212020033389, + "loss": 1.7207, + "loss_base2": 2.4824, + "loss_pixel": 0.1853, + "loss_text": 1.5354, + "ppl": 5.5884, + "step": 6736 + }, + { + "epoch": 0.04, + "global_step": 6737, + "learning_rate": 0.0004727170283806344, + "loss": 1.7161, + "loss_base2": 2.4758, + "loss_pixel": 0.1826, + "loss_text": 1.5335, + "ppl": 5.5628, + "step": 6737 + }, + { + "epoch": 0.04, + "global_step": 6738, + "learning_rate": 0.00047271285475792993, + "loss": 1.6963, + "loss_base2": 2.4472, + "loss_pixel": 0.182, + "loss_text": 1.5143, + "ppl": 5.4537, + "step": 6738 + }, + { + "epoch": 0.04, + "global_step": 6739, + "learning_rate": 0.0004727086811352254, + "loss": 1.7115, + "loss_base2": 2.4692, + "loss_pixel": 0.187, + "loss_text": 1.5245, + "ppl": 5.5373, + "step": 6739 + }, + { + "epoch": 0.04, + "global_step": 6740, + "learning_rate": 0.00047270450751252084, + "loss": 1.6859, + "loss_base2": 2.4322, + "loss_pixel": 0.1919, + "loss_text": 1.494, + "ppl": 5.3973, + "step": 6740 + }, + { + "epoch": 0.04, + "global_step": 6741, + "learning_rate": 0.00047270033388981635, + "loss": 1.6985, + "loss_base2": 2.4504, + "loss_pixel": 0.1907, + "loss_text": 1.5078, + "ppl": 5.4657, + "step": 6741 + }, + { + "epoch": 0.04, + "global_step": 6742, + "learning_rate": 0.00047269616026711185, + "loss": 1.7175, + "loss_base2": 2.4778, + "loss_pixel": 0.1845, + "loss_text": 1.533, + "ppl": 5.5706, + "step": 6742 + }, + { + "epoch": 0.04, + "global_step": 6743, + "learning_rate": 0.00047269198664440736, + "loss": 1.7354, + "loss_base2": 2.5037, + "loss_pixel": 0.183, + "loss_text": 1.5525, + "ppl": 5.6712, + "step": 6743 + }, + { + "epoch": 0.04, + "global_step": 6744, + "learning_rate": 0.0004726878130217028, + "loss": 1.7209, + "loss_base2": 2.4827, + "loss_pixel": 0.1807, + "loss_text": 1.5403, + "ppl": 5.5896, + "step": 6744 + }, + { + "epoch": 0.04, + "global_step": 6745, + "learning_rate": 0.0004726836393989983, + "loss": 1.7064, + "loss_base2": 2.4618, + "loss_pixel": 0.1798, + "loss_text": 1.5266, + "ppl": 5.5091, + "step": 6745 + }, + { + "epoch": 0.04, + "global_step": 6746, + "learning_rate": 0.00047267946577629383, + "loss": 1.6797, + "loss_base2": 2.4233, + "loss_pixel": 0.1806, + "loss_text": 1.4991, + "ppl": 5.3639, + "step": 6746 + }, + { + "epoch": 0.04, + "global_step": 6747, + "learning_rate": 0.00047267529215358934, + "loss": 1.6995, + "loss_base2": 2.4519, + "loss_pixel": 0.1807, + "loss_text": 1.5188, + "ppl": 5.4712, + "step": 6747 + }, + { + "epoch": 0.04, + "global_step": 6748, + "learning_rate": 0.0004726711185308848, + "loss": 1.6881, + "loss_base2": 2.4354, + "loss_pixel": 0.1789, + "loss_text": 1.5092, + "ppl": 5.4092, + "step": 6748 + }, + { + "epoch": 0.04, + "global_step": 6749, + "learning_rate": 0.0004726669449081803, + "loss": 1.7088, + "loss_base2": 2.4653, + "loss_pixel": 0.1788, + "loss_text": 1.53, + "ppl": 5.5223, + "step": 6749 + }, + { + "epoch": 0.04, + "global_step": 6750, + "learning_rate": 0.0004726627712854758, + "loss": 1.7095, + "loss_base2": 2.4663, + "loss_pixel": 0.1791, + "loss_text": 1.5304, + "ppl": 5.5262, + "step": 6750 + }, + { + "epoch": 0.04, + "global_step": 6751, + "learning_rate": 0.0004726585976627713, + "loss": 1.7056, + "loss_base2": 2.4607, + "loss_pixel": 0.179, + "loss_text": 1.5266, + "ppl": 5.5047, + "step": 6751 + }, + { + "epoch": 0.04, + "global_step": 6752, + "learning_rate": 0.0004726544240400668, + "loss": 1.7089, + "loss_base2": 2.4654, + "loss_pixel": 0.1796, + "loss_text": 1.5293, + "ppl": 5.5229, + "step": 6752 + }, + { + "epoch": 0.04, + "global_step": 6753, + "learning_rate": 0.00047265025041736227, + "loss": 1.7029, + "loss_base2": 2.4568, + "loss_pixel": 0.1766, + "loss_text": 1.5262, + "ppl": 5.4898, + "step": 6753 + }, + { + "epoch": 0.04, + "global_step": 6754, + "learning_rate": 0.0004726460767946578, + "loss": 1.6822, + "loss_base2": 2.4269, + "loss_pixel": 0.1764, + "loss_text": 1.5058, + "ppl": 5.3774, + "step": 6754 + }, + { + "epoch": 0.04, + "global_step": 6755, + "learning_rate": 0.0004726419031719533, + "loss": 1.7113, + "loss_base2": 2.4689, + "loss_pixel": 0.1805, + "loss_text": 1.5308, + "ppl": 5.5362, + "step": 6755 + }, + { + "epoch": 0.04, + "global_step": 6756, + "learning_rate": 0.0004726377295492488, + "loss": 1.6856, + "loss_base2": 2.4318, + "loss_pixel": 0.176, + "loss_text": 1.5096, + "ppl": 5.3957, + "step": 6756 + }, + { + "epoch": 0.04, + "global_step": 6757, + "learning_rate": 0.00047263355592654425, + "loss": 1.7138, + "loss_base2": 2.4725, + "loss_pixel": 0.1771, + "loss_text": 1.5367, + "ppl": 5.55, + "step": 6757 + }, + { + "epoch": 0.04, + "global_step": 6758, + "learning_rate": 0.00047262938230383975, + "loss": 1.7009, + "loss_base2": 2.4539, + "loss_pixel": 0.1752, + "loss_text": 1.5257, + "ppl": 5.4789, + "step": 6758 + }, + { + "epoch": 0.04, + "global_step": 6759, + "learning_rate": 0.0004726252086811352, + "loss": 1.7106, + "loss_base2": 2.4679, + "loss_pixel": 0.1891, + "loss_text": 1.5214, + "ppl": 5.5323, + "step": 6759 + }, + { + "epoch": 0.04, + "global_step": 6760, + "learning_rate": 0.0004726210350584307, + "loss": 1.7181, + "loss_base2": 2.4787, + "loss_pixel": 0.1929, + "loss_text": 1.5252, + "ppl": 5.5739, + "step": 6760 + }, + { + "epoch": 0.04, + "global_step": 6761, + "learning_rate": 0.0004726168614357262, + "loss": 1.7109, + "loss_base2": 2.4683, + "loss_pixel": 0.1918, + "loss_text": 1.5191, + "ppl": 5.5339, + "step": 6761 + }, + { + "epoch": 0.04, + "global_step": 6762, + "learning_rate": 0.0004726126878130217, + "loss": 1.7108, + "loss_base2": 2.4682, + "loss_pixel": 0.1921, + "loss_text": 1.5188, + "ppl": 5.5334, + "step": 6762 + }, + { + "epoch": 0.04, + "global_step": 6763, + "learning_rate": 0.0004726085141903172, + "loss": 1.6896, + "loss_base2": 2.4376, + "loss_pixel": 0.1905, + "loss_text": 1.499, + "ppl": 5.4173, + "step": 6763 + }, + { + "epoch": 0.04, + "global_step": 6764, + "learning_rate": 0.0004726043405676127, + "loss": 1.715, + "loss_base2": 2.4742, + "loss_pixel": 0.1814, + "loss_text": 1.5336, + "ppl": 5.5567, + "step": 6764 + }, + { + "epoch": 0.04, + "global_step": 6765, + "learning_rate": 0.0004726001669449082, + "loss": 1.6858, + "loss_base2": 2.4321, + "loss_pixel": 0.1802, + "loss_text": 1.5056, + "ppl": 5.3968, + "step": 6765 + }, + { + "epoch": 0.04, + "global_step": 6766, + "learning_rate": 0.0004725959933222037, + "loss": 1.7098, + "loss_base2": 2.4667, + "loss_pixel": 0.1782, + "loss_text": 1.5316, + "ppl": 5.5279, + "step": 6766 + }, + { + "epoch": 0.04, + "global_step": 6767, + "learning_rate": 0.00047259181969949916, + "loss": 1.6772, + "loss_base2": 2.4197, + "loss_pixel": 0.1789, + "loss_text": 1.4984, + "ppl": 5.3506, + "step": 6767 + }, + { + "epoch": 0.04, + "global_step": 6768, + "learning_rate": 0.00047258764607679466, + "loss": 1.6869, + "loss_base2": 2.4337, + "loss_pixel": 0.1783, + "loss_text": 1.5085, + "ppl": 5.4027, + "step": 6768 + }, + { + "epoch": 0.04, + "global_step": 6769, + "learning_rate": 0.00047258347245409017, + "loss": 1.7022, + "loss_base2": 2.4558, + "loss_pixel": 0.1802, + "loss_text": 1.522, + "ppl": 5.486, + "step": 6769 + }, + { + "epoch": 0.04, + "global_step": 6770, + "learning_rate": 0.0004725792988313857, + "loss": 1.6856, + "loss_base2": 2.4318, + "loss_pixel": 0.1775, + "loss_text": 1.5082, + "ppl": 5.3957, + "step": 6770 + }, + { + "epoch": 0.04, + "global_step": 6771, + "learning_rate": 0.00047257512520868113, + "loss": 1.692, + "loss_base2": 2.441, + "loss_pixel": 0.1751, + "loss_text": 1.5169, + "ppl": 5.4303, + "step": 6771 + }, + { + "epoch": 0.04, + "global_step": 6772, + "learning_rate": 0.00047257095158597664, + "loss": 1.6943, + "loss_base2": 2.4444, + "loss_pixel": 0.1782, + "loss_text": 1.5161, + "ppl": 5.4428, + "step": 6772 + }, + { + "epoch": 0.04, + "global_step": 6773, + "learning_rate": 0.00047256677796327215, + "loss": 1.4702, + "loss_base2": 2.1211, + "loss_pixel": 0.1754, + "loss_text": 1.2948, + "ppl": 4.3501, + "step": 6773 + }, + { + "epoch": 0.04, + "global_step": 6774, + "learning_rate": 0.00047256260434056765, + "loss": 1.4916, + "loss_base2": 2.1519, + "loss_pixel": 0.1787, + "loss_text": 1.3129, + "ppl": 4.4442, + "step": 6774 + }, + { + "epoch": 0.04, + "global_step": 6775, + "learning_rate": 0.00047255843071786316, + "loss": 1.477, + "loss_base2": 2.1309, + "loss_pixel": 0.1764, + "loss_text": 1.3006, + "ppl": 4.3798, + "step": 6775 + }, + { + "epoch": 0.04, + "global_step": 6776, + "learning_rate": 0.0004725542570951586, + "loss": 1.4576, + "loss_base2": 2.1029, + "loss_pixel": 0.1763, + "loss_text": 1.2813, + "ppl": 4.2956, + "step": 6776 + }, + { + "epoch": 0.04, + "global_step": 6777, + "learning_rate": 0.0004725500834724541, + "loss": 1.4789, + "loss_base2": 2.1336, + "loss_pixel": 0.1758, + "loss_text": 1.3031, + "ppl": 4.3881, + "step": 6777 + }, + { + "epoch": 0.04, + "global_step": 6778, + "learning_rate": 0.0004725459098497496, + "loss": 1.4491, + "loss_base2": 2.0906, + "loss_pixel": 0.1747, + "loss_text": 1.2744, + "ppl": 4.2593, + "step": 6778 + }, + { + "epoch": 0.04, + "global_step": 6779, + "learning_rate": 0.0004725417362270451, + "loss": 1.4677, + "loss_base2": 2.1174, + "loss_pixel": 0.1767, + "loss_text": 1.291, + "ppl": 4.3392, + "step": 6779 + }, + { + "epoch": 0.04, + "global_step": 6780, + "learning_rate": 0.00047253756260434054, + "loss": 1.4953, + "loss_base2": 2.1573, + "loss_pixel": 0.1809, + "loss_text": 1.3145, + "ppl": 4.4607, + "step": 6780 + }, + { + "epoch": 0.04, + "global_step": 6781, + "learning_rate": 0.00047253338898163604, + "loss": 1.6667, + "loss_base2": 2.4045, + "loss_pixel": 0.1952, + "loss_text": 1.4715, + "ppl": 5.2947, + "step": 6781 + }, + { + "epoch": 0.04, + "global_step": 6782, + "learning_rate": 0.00047252921535893155, + "loss": 1.7241, + "loss_base2": 2.4874, + "loss_pixel": 0.1936, + "loss_text": 1.5305, + "ppl": 5.6075, + "step": 6782 + }, + { + "epoch": 0.04, + "global_step": 6783, + "learning_rate": 0.00047252504173622706, + "loss": 1.7166, + "loss_base2": 2.4765, + "loss_pixel": 0.1877, + "loss_text": 1.5289, + "ppl": 5.5656, + "step": 6783 + }, + { + "epoch": 0.04, + "global_step": 6784, + "learning_rate": 0.00047252086811352256, + "loss": 1.7183, + "loss_base2": 2.479, + "loss_pixel": 0.1852, + "loss_text": 1.5332, + "ppl": 5.575, + "step": 6784 + }, + { + "epoch": 0.04, + "global_step": 6785, + "learning_rate": 0.000472516694490818, + "loss": 1.7112, + "loss_base2": 2.4687, + "loss_pixel": 0.1857, + "loss_text": 1.5255, + "ppl": 5.5356, + "step": 6785 + }, + { + "epoch": 0.04, + "global_step": 6786, + "learning_rate": 0.0004725125208681135, + "loss": 1.7027, + "loss_base2": 2.4565, + "loss_pixel": 0.185, + "loss_text": 1.5176, + "ppl": 5.4887, + "step": 6786 + }, + { + "epoch": 0.04, + "global_step": 6787, + "learning_rate": 0.00047250834724540903, + "loss": 1.7244, + "loss_base2": 2.4878, + "loss_pixel": 0.1852, + "loss_text": 1.5392, + "ppl": 5.6092, + "step": 6787 + }, + { + "epoch": 0.04, + "global_step": 6788, + "learning_rate": 0.00047250417362270454, + "loss": 1.7001, + "loss_base2": 2.4527, + "loss_pixel": 0.1844, + "loss_text": 1.5156, + "ppl": 5.4745, + "step": 6788 + }, + { + "epoch": 0.04, + "global_step": 6789, + "learning_rate": 0.0004725, + "loss": 1.7144, + "loss_base2": 2.4734, + "loss_pixel": 0.1846, + "loss_text": 1.5297, + "ppl": 5.5533, + "step": 6789 + }, + { + "epoch": 0.04, + "global_step": 6790, + "learning_rate": 0.0004724958263772955, + "loss": 1.688, + "loss_base2": 2.4353, + "loss_pixel": 0.1834, + "loss_text": 1.5046, + "ppl": 5.4087, + "step": 6790 + }, + { + "epoch": 0.04, + "global_step": 6791, + "learning_rate": 0.000472491652754591, + "loss": 1.7194, + "loss_base2": 2.4806, + "loss_pixel": 0.1837, + "loss_text": 1.5356, + "ppl": 5.5812, + "step": 6791 + }, + { + "epoch": 0.04, + "global_step": 6792, + "learning_rate": 0.0004724874791318865, + "loss": 1.7076, + "loss_base2": 2.4635, + "loss_pixel": 0.184, + "loss_text": 1.5236, + "ppl": 5.5157, + "step": 6792 + }, + { + "epoch": 0.04, + "global_step": 6793, + "learning_rate": 0.000472483305509182, + "loss": 1.6972, + "loss_base2": 2.4485, + "loss_pixel": 0.1838, + "loss_text": 1.5134, + "ppl": 5.4586, + "step": 6793 + }, + { + "epoch": 0.04, + "global_step": 6794, + "learning_rate": 0.0004724791318864775, + "loss": 1.7101, + "loss_base2": 2.4672, + "loss_pixel": 0.1829, + "loss_text": 1.5271, + "ppl": 5.5295, + "step": 6794 + }, + { + "epoch": 0.04, + "global_step": 6795, + "learning_rate": 0.000472474958263773, + "loss": 1.6912, + "loss_base2": 2.4399, + "loss_pixel": 0.1827, + "loss_text": 1.5085, + "ppl": 5.426, + "step": 6795 + }, + { + "epoch": 0.04, + "global_step": 6796, + "learning_rate": 0.0004724707846410685, + "loss": 1.6981, + "loss_base2": 2.4498, + "loss_pixel": 0.1833, + "loss_text": 1.5148, + "ppl": 5.4636, + "step": 6796 + }, + { + "epoch": 0.04, + "global_step": 6797, + "learning_rate": 0.00047246661101836394, + "loss": 1.715, + "loss_base2": 2.4742, + "loss_pixel": 0.1837, + "loss_text": 1.5314, + "ppl": 5.5567, + "step": 6797 + }, + { + "epoch": 0.04, + "global_step": 6798, + "learning_rate": 0.0004724624373956594, + "loss": 1.707, + "loss_base2": 2.4627, + "loss_pixel": 0.1837, + "loss_text": 1.5233, + "ppl": 5.5124, + "step": 6798 + }, + { + "epoch": 0.04, + "global_step": 6799, + "learning_rate": 0.0004724582637729549, + "loss": 1.7044, + "loss_base2": 2.4589, + "loss_pixel": 0.1832, + "loss_text": 1.5212, + "ppl": 5.4981, + "step": 6799 + }, + { + "epoch": 0.04, + "global_step": 6800, + "learning_rate": 0.0004724540901502504, + "loss": 1.7147, + "loss_base2": 2.4738, + "loss_pixel": 0.1835, + "loss_text": 1.5312, + "ppl": 5.555, + "step": 6800 + }, + { + "epoch": 0.04, + "global_step": 6801, + "learning_rate": 0.0004724499165275459, + "loss": 1.7159, + "loss_base2": 2.4755, + "loss_pixel": 0.1847, + "loss_text": 1.5312, + "ppl": 5.5617, + "step": 6801 + }, + { + "epoch": 0.04, + "global_step": 6802, + "learning_rate": 0.0004724457429048414, + "loss": 1.681, + "loss_base2": 2.4252, + "loss_pixel": 0.1835, + "loss_text": 1.4975, + "ppl": 5.3709, + "step": 6802 + }, + { + "epoch": 0.04, + "global_step": 6803, + "learning_rate": 0.0004724415692821369, + "loss": 1.6419, + "loss_base2": 2.3688, + "loss_pixel": 0.1831, + "loss_text": 1.4588, + "ppl": 5.165, + "step": 6803 + }, + { + "epoch": 0.04, + "global_step": 6804, + "learning_rate": 0.0004724373956594324, + "loss": 1.6834, + "loss_base2": 2.4286, + "loss_pixel": 0.1835, + "loss_text": 1.4999, + "ppl": 5.3838, + "step": 6804 + }, + { + "epoch": 0.04, + "global_step": 6805, + "learning_rate": 0.0004724332220367279, + "loss": 1.714, + "loss_base2": 2.4728, + "loss_pixel": 0.1833, + "loss_text": 1.5307, + "ppl": 5.5511, + "step": 6805 + }, + { + "epoch": 0.04, + "global_step": 6806, + "learning_rate": 0.0004724290484140234, + "loss": 1.7056, + "loss_base2": 2.4607, + "loss_pixel": 0.1836, + "loss_text": 1.522, + "ppl": 5.5047, + "step": 6806 + }, + { + "epoch": 0.04, + "global_step": 6807, + "learning_rate": 0.00047242487479131885, + "loss": 1.7002, + "loss_base2": 2.4529, + "loss_pixel": 0.182, + "loss_text": 1.5182, + "ppl": 5.475, + "step": 6807 + }, + { + "epoch": 0.04, + "global_step": 6808, + "learning_rate": 0.00047242070116861436, + "loss": 1.7141, + "loss_base2": 2.4729, + "loss_pixel": 0.1822, + "loss_text": 1.5319, + "ppl": 5.5517, + "step": 6808 + }, + { + "epoch": 0.04, + "global_step": 6809, + "learning_rate": 0.00047241652754590987, + "loss": 1.6927, + "loss_base2": 2.442, + "loss_pixel": 0.1816, + "loss_text": 1.5111, + "ppl": 5.4341, + "step": 6809 + }, + { + "epoch": 0.04, + "global_step": 6810, + "learning_rate": 0.0004724123539232054, + "loss": 1.687, + "loss_base2": 2.4338, + "loss_pixel": 0.1806, + "loss_text": 1.5064, + "ppl": 5.4032, + "step": 6810 + }, + { + "epoch": 0.04, + "global_step": 6811, + "learning_rate": 0.0004724081803005009, + "loss": 1.7077, + "loss_base2": 2.4637, + "loss_pixel": 0.183, + "loss_text": 1.5247, + "ppl": 5.5163, + "step": 6811 + }, + { + "epoch": 0.04, + "global_step": 6812, + "learning_rate": 0.00047240400667779634, + "loss": 1.6871, + "loss_base2": 2.434, + "loss_pixel": 0.1814, + "loss_text": 1.5057, + "ppl": 5.4038, + "step": 6812 + }, + { + "epoch": 0.04, + "global_step": 6813, + "learning_rate": 0.00047239983305509184, + "loss": 1.6866, + "loss_base2": 2.4332, + "loss_pixel": 0.182, + "loss_text": 1.5046, + "ppl": 5.4011, + "step": 6813 + }, + { + "epoch": 0.04, + "global_step": 6814, + "learning_rate": 0.00047239565943238735, + "loss": 1.6926, + "loss_base2": 2.4419, + "loss_pixel": 0.1807, + "loss_text": 1.5119, + "ppl": 5.4336, + "step": 6814 + }, + { + "epoch": 0.04, + "global_step": 6815, + "learning_rate": 0.00047239148580968286, + "loss": 1.6719, + "loss_base2": 2.412, + "loss_pixel": 0.1823, + "loss_text": 1.4895, + "ppl": 5.3223, + "step": 6815 + }, + { + "epoch": 0.04, + "global_step": 6816, + "learning_rate": 0.00047238731218697826, + "loss": 1.7168, + "loss_base2": 2.4768, + "loss_pixel": 0.1804, + "loss_text": 1.5364, + "ppl": 5.5667, + "step": 6816 + }, + { + "epoch": 0.04, + "global_step": 6817, + "learning_rate": 0.00047238313856427376, + "loss": 1.6907, + "loss_base2": 2.4392, + "loss_pixel": 0.1806, + "loss_text": 1.5101, + "ppl": 5.4233, + "step": 6817 + }, + { + "epoch": 0.04, + "global_step": 6818, + "learning_rate": 0.00047237896494156927, + "loss": 1.685, + "loss_base2": 2.4309, + "loss_pixel": 0.1808, + "loss_text": 1.5042, + "ppl": 5.3925, + "step": 6818 + }, + { + "epoch": 0.04, + "global_step": 6819, + "learning_rate": 0.0004723747913188648, + "loss": 1.6907, + "loss_base2": 2.4392, + "loss_pixel": 0.1822, + "loss_text": 1.5086, + "ppl": 5.4233, + "step": 6819 + }, + { + "epoch": 0.04, + "global_step": 6820, + "learning_rate": 0.0004723706176961603, + "loss": 1.6807, + "loss_base2": 2.4247, + "loss_pixel": 0.1804, + "loss_text": 1.5003, + "ppl": 5.3693, + "step": 6820 + }, + { + "epoch": 0.04, + "global_step": 6821, + "learning_rate": 0.00047236644407345574, + "loss": 1.6956, + "loss_base2": 2.4462, + "loss_pixel": 0.1816, + "loss_text": 1.514, + "ppl": 5.4499, + "step": 6821 + }, + { + "epoch": 0.04, + "global_step": 6822, + "learning_rate": 0.00047236227045075125, + "loss": 1.7013, + "loss_base2": 2.4545, + "loss_pixel": 0.1805, + "loss_text": 1.5207, + "ppl": 5.4811, + "step": 6822 + }, + { + "epoch": 0.04, + "global_step": 6823, + "learning_rate": 0.00047235809682804675, + "loss": 1.7023, + "loss_base2": 2.4559, + "loss_pixel": 0.1825, + "loss_text": 1.5198, + "ppl": 5.4866, + "step": 6823 + }, + { + "epoch": 0.04, + "global_step": 6824, + "learning_rate": 0.00047235392320534226, + "loss": 1.696, + "loss_base2": 2.4468, + "loss_pixel": 0.1812, + "loss_text": 1.5148, + "ppl": 5.4521, + "step": 6824 + }, + { + "epoch": 0.04, + "global_step": 6825, + "learning_rate": 0.00047234974958263777, + "loss": 1.6962, + "loss_base2": 2.4471, + "loss_pixel": 0.1805, + "loss_text": 1.5156, + "ppl": 5.4532, + "step": 6825 + }, + { + "epoch": 0.04, + "global_step": 6826, + "learning_rate": 0.0004723455759599332, + "loss": 1.7135, + "loss_base2": 2.4721, + "loss_pixel": 0.181, + "loss_text": 1.5325, + "ppl": 5.5483, + "step": 6826 + }, + { + "epoch": 0.04, + "global_step": 6827, + "learning_rate": 0.00047234140233722873, + "loss": 1.693, + "loss_base2": 2.4425, + "loss_pixel": 0.1827, + "loss_text": 1.5103, + "ppl": 5.4358, + "step": 6827 + }, + { + "epoch": 0.04, + "global_step": 6828, + "learning_rate": 0.00047233722871452424, + "loss": 1.6956, + "loss_base2": 2.4462, + "loss_pixel": 0.1811, + "loss_text": 1.5145, + "ppl": 5.4499, + "step": 6828 + }, + { + "epoch": 0.04, + "global_step": 6829, + "learning_rate": 0.00047233305509181974, + "loss": 1.6756, + "loss_base2": 2.4174, + "loss_pixel": 0.1826, + "loss_text": 1.4931, + "ppl": 5.342, + "step": 6829 + }, + { + "epoch": 0.04, + "global_step": 6830, + "learning_rate": 0.0004723288814691152, + "loss": 1.6936, + "loss_base2": 2.4433, + "loss_pixel": 0.1822, + "loss_text": 1.5114, + "ppl": 5.439, + "step": 6830 + }, + { + "epoch": 0.04, + "global_step": 6831, + "learning_rate": 0.0004723247078464107, + "loss": 1.6883, + "loss_base2": 2.4357, + "loss_pixel": 0.1814, + "loss_text": 1.5069, + "ppl": 5.4103, + "step": 6831 + }, + { + "epoch": 0.04, + "global_step": 6832, + "learning_rate": 0.0004723205342237062, + "loss": 1.6998, + "loss_base2": 2.4523, + "loss_pixel": 0.1805, + "loss_text": 1.5193, + "ppl": 5.4729, + "step": 6832 + }, + { + "epoch": 0.04, + "global_step": 6833, + "learning_rate": 0.0004723163606010017, + "loss": 1.6958, + "loss_base2": 2.4465, + "loss_pixel": 0.1815, + "loss_text": 1.5143, + "ppl": 5.451, + "step": 6833 + }, + { + "epoch": 0.04, + "global_step": 6834, + "learning_rate": 0.00047231218697829717, + "loss": 1.6968, + "loss_base2": 2.448, + "loss_pixel": 0.1812, + "loss_text": 1.5156, + "ppl": 5.4565, + "step": 6834 + }, + { + "epoch": 0.04, + "global_step": 6835, + "learning_rate": 0.0004723080133555926, + "loss": 1.6935, + "loss_base2": 2.4432, + "loss_pixel": 0.1813, + "loss_text": 1.5122, + "ppl": 5.4385, + "step": 6835 + }, + { + "epoch": 0.04, + "global_step": 6836, + "learning_rate": 0.00047230383973288813, + "loss": 1.7107, + "loss_base2": 2.468, + "loss_pixel": 0.1808, + "loss_text": 1.5299, + "ppl": 5.5328, + "step": 6836 + }, + { + "epoch": 0.04, + "global_step": 6837, + "learning_rate": 0.00047229966611018364, + "loss": 1.6884, + "loss_base2": 2.4358, + "loss_pixel": 0.1814, + "loss_text": 1.5069, + "ppl": 5.4108, + "step": 6837 + }, + { + "epoch": 0.04, + "global_step": 6838, + "learning_rate": 0.00047229549248747915, + "loss": 1.6831, + "loss_base2": 2.4282, + "loss_pixel": 0.1805, + "loss_text": 1.5026, + "ppl": 5.3822, + "step": 6838 + }, + { + "epoch": 0.04, + "global_step": 6839, + "learning_rate": 0.0004722913188647746, + "loss": 1.6911, + "loss_base2": 2.4397, + "loss_pixel": 0.1797, + "loss_text": 1.5115, + "ppl": 5.4254, + "step": 6839 + }, + { + "epoch": 0.04, + "global_step": 6840, + "learning_rate": 0.0004722871452420701, + "loss": 1.6959, + "loss_base2": 2.4467, + "loss_pixel": 0.1808, + "loss_text": 1.5151, + "ppl": 5.4516, + "step": 6840 + }, + { + "epoch": 0.04, + "global_step": 6841, + "learning_rate": 0.0004722829716193656, + "loss": 1.6617, + "loss_base2": 2.3973, + "loss_pixel": 0.181, + "loss_text": 1.4808, + "ppl": 5.2683, + "step": 6841 + }, + { + "epoch": 0.04, + "global_step": 6842, + "learning_rate": 0.0004722787979966611, + "loss": 1.6896, + "loss_base2": 2.4376, + "loss_pixel": 0.1815, + "loss_text": 1.508, + "ppl": 5.4173, + "step": 6842 + }, + { + "epoch": 0.04, + "global_step": 6843, + "learning_rate": 0.00047227462437395663, + "loss": 1.6953, + "loss_base2": 2.4458, + "loss_pixel": 0.1802, + "loss_text": 1.5151, + "ppl": 5.4483, + "step": 6843 + }, + { + "epoch": 0.04, + "global_step": 6844, + "learning_rate": 0.0004722704507512521, + "loss": 1.6751, + "loss_base2": 2.4167, + "loss_pixel": 0.1807, + "loss_text": 1.4944, + "ppl": 5.3393, + "step": 6844 + }, + { + "epoch": 0.04, + "global_step": 6845, + "learning_rate": 0.0004722662771285476, + "loss": 1.6836, + "loss_base2": 2.4289, + "loss_pixel": 0.1827, + "loss_text": 1.5008, + "ppl": 5.3849, + "step": 6845 + }, + { + "epoch": 0.04, + "global_step": 6846, + "learning_rate": 0.0004722621035058431, + "loss": 1.4831, + "loss_base2": 2.1397, + "loss_pixel": 0.18, + "loss_text": 1.3031, + "ppl": 4.4066, + "step": 6846 + }, + { + "epoch": 0.04, + "global_step": 6847, + "learning_rate": 0.0004722579298831386, + "loss": 1.4761, + "loss_base2": 2.1296, + "loss_pixel": 0.1805, + "loss_text": 1.2956, + "ppl": 4.3758, + "step": 6847 + }, + { + "epoch": 0.04, + "global_step": 6848, + "learning_rate": 0.00047225375626043406, + "loss": 1.4836, + "loss_base2": 2.1404, + "loss_pixel": 0.1795, + "loss_text": 1.3042, + "ppl": 4.4088, + "step": 6848 + }, + { + "epoch": 0.04, + "global_step": 6849, + "learning_rate": 0.00047224958263772956, + "loss": 1.4619, + "loss_base2": 2.1091, + "loss_pixel": 0.1825, + "loss_text": 1.2794, + "ppl": 4.3141, + "step": 6849 + }, + { + "epoch": 0.04, + "global_step": 6850, + "learning_rate": 0.00047224540901502507, + "loss": 1.4443, + "loss_base2": 2.0837, + "loss_pixel": 0.1802, + "loss_text": 1.2642, + "ppl": 4.2389, + "step": 6850 + }, + { + "epoch": 0.04, + "global_step": 6851, + "learning_rate": 0.0004722412353923206, + "loss": 1.4511, + "loss_base2": 2.0935, + "loss_pixel": 0.1792, + "loss_text": 1.2718, + "ppl": 4.2678, + "step": 6851 + }, + { + "epoch": 0.04, + "global_step": 6852, + "learning_rate": 0.0004722370617696161, + "loss": 1.4633, + "loss_base2": 2.1111, + "loss_pixel": 0.1802, + "loss_text": 1.2832, + "ppl": 4.3202, + "step": 6852 + }, + { + "epoch": 0.04, + "global_step": 6853, + "learning_rate": 0.0004722328881469115, + "loss": 1.4974, + "loss_base2": 2.1603, + "loss_pixel": 0.1803, + "loss_text": 1.3171, + "ppl": 4.4701, + "step": 6853 + }, + { + "epoch": 0.04, + "global_step": 6854, + "learning_rate": 0.000472228714524207, + "loss": 1.4593, + "loss_base2": 2.1053, + "loss_pixel": 0.1808, + "loss_text": 1.2784, + "ppl": 4.3029, + "step": 6854 + }, + { + "epoch": 0.04, + "global_step": 6855, + "learning_rate": 0.0004722245409015025, + "loss": 1.4448, + "loss_base2": 2.0844, + "loss_pixel": 0.1837, + "loss_text": 1.2611, + "ppl": 4.241, + "step": 6855 + }, + { + "epoch": 0.04, + "global_step": 6856, + "learning_rate": 0.000472220367278798, + "loss": 1.4677, + "loss_base2": 2.1174, + "loss_pixel": 0.1811, + "loss_text": 1.2865, + "ppl": 4.3392, + "step": 6856 + }, + { + "epoch": 0.04, + "global_step": 6857, + "learning_rate": 0.00047221619365609346, + "loss": 1.4452, + "loss_base2": 2.085, + "loss_pixel": 0.1806, + "loss_text": 1.2646, + "ppl": 4.2427, + "step": 6857 + }, + { + "epoch": 0.04, + "global_step": 6858, + "learning_rate": 0.00047221202003338897, + "loss": 1.4504, + "loss_base2": 2.0925, + "loss_pixel": 0.1805, + "loss_text": 1.2699, + "ppl": 4.2648, + "step": 6858 + }, + { + "epoch": 0.04, + "global_step": 6859, + "learning_rate": 0.0004722078464106845, + "loss": 1.4399, + "loss_base2": 2.0773, + "loss_pixel": 0.18, + "loss_text": 1.2599, + "ppl": 4.2203, + "step": 6859 + }, + { + "epoch": 0.04, + "global_step": 6860, + "learning_rate": 0.00047220367278798, + "loss": 1.4978, + "loss_base2": 2.1609, + "loss_pixel": 0.1801, + "loss_text": 1.3177, + "ppl": 4.4718, + "step": 6860 + }, + { + "epoch": 0.04, + "global_step": 6861, + "learning_rate": 0.0004721994991652755, + "loss": 1.4479, + "loss_base2": 2.0889, + "loss_pixel": 0.1807, + "loss_text": 1.2672, + "ppl": 4.2542, + "step": 6861 + }, + { + "epoch": 0.04, + "global_step": 6862, + "learning_rate": 0.00047219532554257094, + "loss": 1.6881, + "loss_base2": 2.4354, + "loss_pixel": 0.1817, + "loss_text": 1.5065, + "ppl": 5.4092, + "step": 6862 + }, + { + "epoch": 0.04, + "global_step": 6863, + "learning_rate": 0.00047219115191986645, + "loss": 1.7188, + "loss_base2": 2.4797, + "loss_pixel": 0.1816, + "loss_text": 1.5373, + "ppl": 5.5778, + "step": 6863 + }, + { + "epoch": 0.04, + "global_step": 6864, + "learning_rate": 0.00047218697829716196, + "loss": 1.7211, + "loss_base2": 2.483, + "loss_pixel": 0.1798, + "loss_text": 1.5413, + "ppl": 5.5907, + "step": 6864 + }, + { + "epoch": 0.04, + "global_step": 6865, + "learning_rate": 0.00047218280467445746, + "loss": 1.7187, + "loss_base2": 2.4796, + "loss_pixel": 0.1811, + "loss_text": 1.5377, + "ppl": 5.5773, + "step": 6865 + }, + { + "epoch": 0.04, + "global_step": 6866, + "learning_rate": 0.0004721786310517529, + "loss": 1.7118, + "loss_base2": 2.4696, + "loss_pixel": 0.1811, + "loss_text": 1.5306, + "ppl": 5.5389, + "step": 6866 + }, + { + "epoch": 0.04, + "global_step": 6867, + "learning_rate": 0.0004721744574290484, + "loss": 1.7063, + "loss_base2": 2.4617, + "loss_pixel": 0.1802, + "loss_text": 1.5261, + "ppl": 5.5085, + "step": 6867 + }, + { + "epoch": 0.04, + "global_step": 6868, + "learning_rate": 0.00047217028380634393, + "loss": 1.6912, + "loss_base2": 2.4399, + "loss_pixel": 0.1795, + "loss_text": 1.5117, + "ppl": 5.426, + "step": 6868 + }, + { + "epoch": 0.04, + "global_step": 6869, + "learning_rate": 0.00047216611018363944, + "loss": 1.6918, + "loss_base2": 2.4408, + "loss_pixel": 0.1806, + "loss_text": 1.5112, + "ppl": 5.4292, + "step": 6869 + }, + { + "epoch": 0.04, + "global_step": 6870, + "learning_rate": 0.00047216193656093495, + "loss": 1.7046, + "loss_base2": 2.4592, + "loss_pixel": 0.1813, + "loss_text": 1.5233, + "ppl": 5.4992, + "step": 6870 + }, + { + "epoch": 0.04, + "global_step": 6871, + "learning_rate": 0.0004721577629382304, + "loss": 1.6932, + "loss_base2": 2.4428, + "loss_pixel": 0.1815, + "loss_text": 1.5117, + "ppl": 5.4369, + "step": 6871 + }, + { + "epoch": 0.04, + "global_step": 6872, + "learning_rate": 0.00047215358931552585, + "loss": 1.7083, + "loss_base2": 2.4646, + "loss_pixel": 0.181, + "loss_text": 1.5273, + "ppl": 5.5196, + "step": 6872 + }, + { + "epoch": 0.04, + "global_step": 6873, + "learning_rate": 0.00047214941569282136, + "loss": 1.6902, + "loss_base2": 2.4384, + "loss_pixel": 0.1805, + "loss_text": 1.5097, + "ppl": 5.4206, + "step": 6873 + }, + { + "epoch": 0.04, + "global_step": 6874, + "learning_rate": 0.00047214524207011687, + "loss": 1.706, + "loss_base2": 2.4612, + "loss_pixel": 0.1816, + "loss_text": 1.5243, + "ppl": 5.5069, + "step": 6874 + }, + { + "epoch": 0.04, + "global_step": 6875, + "learning_rate": 0.0004721410684474123, + "loss": 1.6983, + "loss_base2": 2.4501, + "loss_pixel": 0.1801, + "loss_text": 1.5182, + "ppl": 5.4646, + "step": 6875 + }, + { + "epoch": 0.04, + "global_step": 6876, + "learning_rate": 0.00047213689482470783, + "loss": 1.7015, + "loss_base2": 2.4547, + "loss_pixel": 0.1803, + "loss_text": 1.5212, + "ppl": 5.4822, + "step": 6876 + }, + { + "epoch": 0.04, + "global_step": 6877, + "learning_rate": 0.00047213272120200334, + "loss": 1.712, + "loss_base2": 2.4699, + "loss_pixel": 0.1807, + "loss_text": 1.5313, + "ppl": 5.54, + "step": 6877 + }, + { + "epoch": 0.04, + "global_step": 6878, + "learning_rate": 0.00047212854757929884, + "loss": 1.6923, + "loss_base2": 2.4415, + "loss_pixel": 0.1805, + "loss_text": 1.5118, + "ppl": 5.432, + "step": 6878 + }, + { + "epoch": 0.04, + "global_step": 6879, + "learning_rate": 0.00047212437395659435, + "loss": 1.6929, + "loss_base2": 2.4423, + "loss_pixel": 0.1806, + "loss_text": 1.5123, + "ppl": 5.4352, + "step": 6879 + }, + { + "epoch": 0.04, + "global_step": 6880, + "learning_rate": 0.0004721202003338898, + "loss": 1.7097, + "loss_base2": 2.4666, + "loss_pixel": 0.1805, + "loss_text": 1.5292, + "ppl": 5.5273, + "step": 6880 + }, + { + "epoch": 0.04, + "global_step": 6881, + "learning_rate": 0.0004721160267111853, + "loss": 1.7021, + "loss_base2": 2.4556, + "loss_pixel": 0.1813, + "loss_text": 1.5208, + "ppl": 5.4855, + "step": 6881 + }, + { + "epoch": 0.04, + "global_step": 6882, + "learning_rate": 0.0004721118530884808, + "loss": 1.6828, + "loss_base2": 2.4278, + "loss_pixel": 0.1807, + "loss_text": 1.5021, + "ppl": 5.3806, + "step": 6882 + }, + { + "epoch": 0.04, + "global_step": 6883, + "learning_rate": 0.0004721076794657763, + "loss": 1.7071, + "loss_base2": 2.4628, + "loss_pixel": 0.1811, + "loss_text": 1.5259, + "ppl": 5.513, + "step": 6883 + }, + { + "epoch": 0.04, + "global_step": 6884, + "learning_rate": 0.00047210350584307183, + "loss": 1.6963, + "loss_base2": 2.4472, + "loss_pixel": 0.1801, + "loss_text": 1.5162, + "ppl": 5.4537, + "step": 6884 + }, + { + "epoch": 0.04, + "global_step": 6885, + "learning_rate": 0.0004720993322203673, + "loss": 1.6855, + "loss_base2": 2.4317, + "loss_pixel": 0.1801, + "loss_text": 1.5054, + "ppl": 5.3951, + "step": 6885 + }, + { + "epoch": 0.04, + "global_step": 6886, + "learning_rate": 0.0004720951585976628, + "loss": 1.5973, + "loss_base2": 2.3044, + "loss_pixel": 0.1821, + "loss_text": 1.4152, + "ppl": 4.9397, + "step": 6886 + }, + { + "epoch": 0.04, + "global_step": 6887, + "learning_rate": 0.0004720909849749583, + "loss": 1.4934, + "loss_base2": 2.1545, + "loss_pixel": 0.1803, + "loss_text": 1.3131, + "ppl": 4.4522, + "step": 6887 + }, + { + "epoch": 0.04, + "global_step": 6888, + "learning_rate": 0.0004720868113522538, + "loss": 1.4781, + "loss_base2": 2.1324, + "loss_pixel": 0.1811, + "loss_text": 1.297, + "ppl": 4.3846, + "step": 6888 + }, + { + "epoch": 0.04, + "global_step": 6889, + "learning_rate": 0.00047208263772954926, + "loss": 1.4987, + "loss_base2": 2.1622, + "loss_pixel": 0.1807, + "loss_text": 1.318, + "ppl": 4.4759, + "step": 6889 + }, + { + "epoch": 0.04, + "global_step": 6890, + "learning_rate": 0.0004720784641068447, + "loss": 1.448, + "loss_base2": 2.089, + "loss_pixel": 0.1806, + "loss_text": 1.2673, + "ppl": 4.2546, + "step": 6890 + }, + { + "epoch": 0.04, + "global_step": 6891, + "learning_rate": 0.0004720742904841402, + "loss": 1.4756, + "loss_base2": 2.1288, + "loss_pixel": 0.1801, + "loss_text": 1.2954, + "ppl": 4.3737, + "step": 6891 + }, + { + "epoch": 0.04, + "global_step": 6892, + "learning_rate": 0.00047207011686143573, + "loss": 1.4636, + "loss_base2": 2.1115, + "loss_pixel": 0.1798, + "loss_text": 1.2839, + "ppl": 4.3215, + "step": 6892 + }, + { + "epoch": 0.04, + "global_step": 6893, + "learning_rate": 0.00047206594323873124, + "loss": 1.4613, + "loss_base2": 2.1082, + "loss_pixel": 0.1795, + "loss_text": 1.2818, + "ppl": 4.3116, + "step": 6893 + }, + { + "epoch": 0.04, + "global_step": 6894, + "learning_rate": 0.0004720617696160267, + "loss": 1.4482, + "loss_base2": 2.0893, + "loss_pixel": 0.1806, + "loss_text": 1.2677, + "ppl": 4.2554, + "step": 6894 + }, + { + "epoch": 0.04, + "global_step": 6895, + "learning_rate": 0.0004720575959933222, + "loss": 1.6067, + "loss_base2": 2.318, + "loss_pixel": 0.1808, + "loss_text": 1.4259, + "ppl": 4.9863, + "step": 6895 + }, + { + "epoch": 0.04, + "global_step": 6896, + "learning_rate": 0.0004720534223706177, + "loss": 1.6918, + "loss_base2": 2.4408, + "loss_pixel": 0.1791, + "loss_text": 1.5127, + "ppl": 5.4292, + "step": 6896 + }, + { + "epoch": 0.04, + "global_step": 6897, + "learning_rate": 0.0004720492487479132, + "loss": 1.7065, + "loss_base2": 2.462, + "loss_pixel": 0.1818, + "loss_text": 1.5247, + "ppl": 5.5096, + "step": 6897 + }, + { + "epoch": 0.04, + "global_step": 6898, + "learning_rate": 0.00047204507512520866, + "loss": 1.7033, + "loss_base2": 2.4573, + "loss_pixel": 0.1799, + "loss_text": 1.5233, + "ppl": 5.492, + "step": 6898 + }, + { + "epoch": 0.04, + "global_step": 6899, + "learning_rate": 0.00047204090150250417, + "loss": 1.7003, + "loss_base2": 2.453, + "loss_pixel": 0.1792, + "loss_text": 1.5211, + "ppl": 5.4756, + "step": 6899 + }, + { + "epoch": 0.04, + "global_step": 6900, + "learning_rate": 0.0004720367278797997, + "loss": 1.6931, + "loss_base2": 2.4426, + "loss_pixel": 0.1795, + "loss_text": 1.5136, + "ppl": 5.4363, + "step": 6900 + }, + { + "epoch": 0.04, + "global_step": 6901, + "learning_rate": 0.0004720325542570952, + "loss": 1.6872, + "loss_base2": 2.4341, + "loss_pixel": 0.1801, + "loss_text": 1.5071, + "ppl": 5.4043, + "step": 6901 + }, + { + "epoch": 0.04, + "global_step": 6902, + "learning_rate": 0.0004720283806343907, + "loss": 1.6954, + "loss_base2": 2.4459, + "loss_pixel": 0.1793, + "loss_text": 1.516, + "ppl": 5.4488, + "step": 6902 + }, + { + "epoch": 0.04, + "global_step": 6903, + "learning_rate": 0.00047202420701168615, + "loss": 1.7095, + "loss_base2": 2.4663, + "loss_pixel": 0.1806, + "loss_text": 1.5288, + "ppl": 5.5262, + "step": 6903 + }, + { + "epoch": 0.04, + "global_step": 6904, + "learning_rate": 0.00047202003338898165, + "loss": 1.6948, + "loss_base2": 2.4451, + "loss_pixel": 0.1812, + "loss_text": 1.5136, + "ppl": 5.4456, + "step": 6904 + }, + { + "epoch": 0.04, + "global_step": 6905, + "learning_rate": 0.00047201585976627716, + "loss": 1.6846, + "loss_base2": 2.4304, + "loss_pixel": 0.1756, + "loss_text": 1.5089, + "ppl": 5.3903, + "step": 6905 + }, + { + "epoch": 0.04, + "global_step": 6906, + "learning_rate": 0.00047201168614357267, + "loss": 1.6885, + "loss_base2": 2.436, + "loss_pixel": 0.1794, + "loss_text": 1.509, + "ppl": 5.4114, + "step": 6906 + }, + { + "epoch": 0.04, + "global_step": 6907, + "learning_rate": 0.0004720075125208681, + "loss": 1.6944, + "loss_base2": 2.4445, + "loss_pixel": 0.1787, + "loss_text": 1.5157, + "ppl": 5.4434, + "step": 6907 + }, + { + "epoch": 0.04, + "global_step": 6908, + "learning_rate": 0.00047200333889816363, + "loss": 1.6953, + "loss_base2": 2.4458, + "loss_pixel": 0.1755, + "loss_text": 1.5198, + "ppl": 5.4483, + "step": 6908 + }, + { + "epoch": 0.04, + "global_step": 6909, + "learning_rate": 0.0004719991652754591, + "loss": 1.7028, + "loss_base2": 2.4566, + "loss_pixel": 0.1765, + "loss_text": 1.5263, + "ppl": 5.4893, + "step": 6909 + }, + { + "epoch": 0.04, + "global_step": 6910, + "learning_rate": 0.0004719949916527546, + "loss": 1.7011, + "loss_base2": 2.4542, + "loss_pixel": 0.1783, + "loss_text": 1.5228, + "ppl": 5.48, + "step": 6910 + }, + { + "epoch": 0.04, + "global_step": 6911, + "learning_rate": 0.0004719908180300501, + "loss": 1.6877, + "loss_base2": 2.4348, + "loss_pixel": 0.1758, + "loss_text": 1.5119, + "ppl": 5.407, + "step": 6911 + }, + { + "epoch": 0.04, + "global_step": 6912, + "learning_rate": 0.00047198664440734555, + "loss": 1.6852, + "loss_base2": 2.4312, + "loss_pixel": 0.178, + "loss_text": 1.5072, + "ppl": 5.3935, + "step": 6912 + }, + { + "epoch": 0.04, + "global_step": 6913, + "learning_rate": 0.00047198247078464106, + "loss": 1.6947, + "loss_base2": 2.4449, + "loss_pixel": 0.1754, + "loss_text": 1.5194, + "ppl": 5.445, + "step": 6913 + }, + { + "epoch": 0.04, + "global_step": 6914, + "learning_rate": 0.00047197829716193656, + "loss": 1.675, + "loss_base2": 2.4165, + "loss_pixel": 0.1777, + "loss_text": 1.4973, + "ppl": 5.3388, + "step": 6914 + }, + { + "epoch": 0.04, + "global_step": 6915, + "learning_rate": 0.00047197412353923207, + "loss": 1.6866, + "loss_base2": 2.4332, + "loss_pixel": 0.1735, + "loss_text": 1.5131, + "ppl": 5.4011, + "step": 6915 + }, + { + "epoch": 0.04, + "global_step": 6916, + "learning_rate": 0.0004719699499165275, + "loss": 1.6969, + "loss_base2": 2.4481, + "loss_pixel": 0.175, + "loss_text": 1.5219, + "ppl": 5.457, + "step": 6916 + }, + { + "epoch": 0.04, + "global_step": 6917, + "learning_rate": 0.00047196577629382303, + "loss": 1.6784, + "loss_base2": 2.4214, + "loss_pixel": 0.1737, + "loss_text": 1.5047, + "ppl": 5.357, + "step": 6917 + }, + { + "epoch": 0.04, + "global_step": 6918, + "learning_rate": 0.00047196160267111854, + "loss": 1.7036, + "loss_base2": 2.4578, + "loss_pixel": 0.1771, + "loss_text": 1.5265, + "ppl": 5.4937, + "step": 6918 + }, + { + "epoch": 0.04, + "global_step": 6919, + "learning_rate": 0.00047195742904841405, + "loss": 1.6877, + "loss_base2": 2.4348, + "loss_pixel": 0.1738, + "loss_text": 1.5139, + "ppl": 5.407, + "step": 6919 + }, + { + "epoch": 0.04, + "global_step": 6920, + "learning_rate": 0.00047195325542570955, + "loss": 1.6865, + "loss_base2": 2.4331, + "loss_pixel": 0.1814, + "loss_text": 1.505, + "ppl": 5.4005, + "step": 6920 + }, + { + "epoch": 0.04, + "global_step": 6921, + "learning_rate": 0.000471949081803005, + "loss": 1.6988, + "loss_base2": 2.4509, + "loss_pixel": 0.1825, + "loss_text": 1.5163, + "ppl": 5.4674, + "step": 6921 + }, + { + "epoch": 0.04, + "global_step": 6922, + "learning_rate": 0.0004719449081803005, + "loss": 1.6928, + "loss_base2": 2.4422, + "loss_pixel": 0.1825, + "loss_text": 1.5103, + "ppl": 5.4347, + "step": 6922 + }, + { + "epoch": 0.04, + "global_step": 6923, + "learning_rate": 0.000471940734557596, + "loss": 1.7033, + "loss_base2": 2.4573, + "loss_pixel": 0.1831, + "loss_text": 1.5202, + "ppl": 5.492, + "step": 6923 + }, + { + "epoch": 0.04, + "global_step": 6924, + "learning_rate": 0.00047193656093489153, + "loss": 1.6993, + "loss_base2": 2.4516, + "loss_pixel": 0.1834, + "loss_text": 1.5158, + "ppl": 5.4701, + "step": 6924 + }, + { + "epoch": 0.04, + "global_step": 6925, + "learning_rate": 0.000471932387312187, + "loss": 1.7046, + "loss_base2": 2.4592, + "loss_pixel": 0.1824, + "loss_text": 1.5222, + "ppl": 5.4992, + "step": 6925 + }, + { + "epoch": 0.04, + "global_step": 6926, + "learning_rate": 0.0004719282136894825, + "loss": 1.6922, + "loss_base2": 2.4413, + "loss_pixel": 0.1822, + "loss_text": 1.51, + "ppl": 5.4314, + "step": 6926 + }, + { + "epoch": 0.04, + "global_step": 6927, + "learning_rate": 0.000471924040066778, + "loss": 1.6857, + "loss_base2": 2.432, + "loss_pixel": 0.1822, + "loss_text": 1.5035, + "ppl": 5.3962, + "step": 6927 + }, + { + "epoch": 0.04, + "global_step": 6928, + "learning_rate": 0.00047191986644407345, + "loss": 1.6941, + "loss_base2": 2.4441, + "loss_pixel": 0.1816, + "loss_text": 1.5125, + "ppl": 5.4417, + "step": 6928 + }, + { + "epoch": 0.04, + "global_step": 6929, + "learning_rate": 0.00047191569282136896, + "loss": 1.6824, + "loss_base2": 2.4272, + "loss_pixel": 0.1812, + "loss_text": 1.5012, + "ppl": 5.3784, + "step": 6929 + }, + { + "epoch": 0.04, + "global_step": 6930, + "learning_rate": 0.0004719115191986644, + "loss": 1.6876, + "loss_base2": 2.4347, + "loss_pixel": 0.182, + "loss_text": 1.5056, + "ppl": 5.4065, + "step": 6930 + }, + { + "epoch": 0.04, + "global_step": 6931, + "learning_rate": 0.0004719073455759599, + "loss": 1.6996, + "loss_base2": 2.452, + "loss_pixel": 0.1811, + "loss_text": 1.5185, + "ppl": 5.4718, + "step": 6931 + }, + { + "epoch": 0.04, + "global_step": 6932, + "learning_rate": 0.0004719031719532554, + "loss": 1.6736, + "loss_base2": 2.4145, + "loss_pixel": 0.1814, + "loss_text": 1.4922, + "ppl": 5.3313, + "step": 6932 + }, + { + "epoch": 0.04, + "global_step": 6933, + "learning_rate": 0.00047189899833055093, + "loss": 1.6886, + "loss_base2": 2.4361, + "loss_pixel": 0.1806, + "loss_text": 1.508, + "ppl": 5.4119, + "step": 6933 + }, + { + "epoch": 0.04, + "global_step": 6934, + "learning_rate": 0.0004718948247078464, + "loss": 1.6886, + "loss_base2": 2.4361, + "loss_pixel": 0.1808, + "loss_text": 1.5078, + "ppl": 5.4119, + "step": 6934 + }, + { + "epoch": 0.04, + "global_step": 6935, + "learning_rate": 0.0004718906510851419, + "loss": 1.689, + "loss_base2": 2.4367, + "loss_pixel": 0.1805, + "loss_text": 1.5085, + "ppl": 5.4141, + "step": 6935 + }, + { + "epoch": 0.04, + "global_step": 6936, + "learning_rate": 0.0004718864774624374, + "loss": 1.6984, + "loss_base2": 2.4503, + "loss_pixel": 0.1803, + "loss_text": 1.5181, + "ppl": 5.4652, + "step": 6936 + }, + { + "epoch": 0.04, + "global_step": 6937, + "learning_rate": 0.0004718823038397329, + "loss": 1.7001, + "loss_base2": 2.4527, + "loss_pixel": 0.1794, + "loss_text": 1.5207, + "ppl": 5.4745, + "step": 6937 + }, + { + "epoch": 0.04, + "global_step": 6938, + "learning_rate": 0.0004718781302170284, + "loss": 1.7051, + "loss_base2": 2.4599, + "loss_pixel": 0.1812, + "loss_text": 1.524, + "ppl": 5.5019, + "step": 6938 + }, + { + "epoch": 0.04, + "global_step": 6939, + "learning_rate": 0.00047187395659432387, + "loss": 1.6417, + "loss_base2": 2.3685, + "loss_pixel": 0.1802, + "loss_text": 1.4615, + "ppl": 5.1639, + "step": 6939 + }, + { + "epoch": 0.04, + "global_step": 6940, + "learning_rate": 0.0004718697829716194, + "loss": 1.4706, + "loss_base2": 2.1216, + "loss_pixel": 0.1813, + "loss_text": 1.2893, + "ppl": 4.3518, + "step": 6940 + }, + { + "epoch": 0.04, + "global_step": 6941, + "learning_rate": 0.0004718656093489149, + "loss": 1.4725, + "loss_base2": 2.1244, + "loss_pixel": 0.1804, + "loss_text": 1.2921, + "ppl": 4.3601, + "step": 6941 + }, + { + "epoch": 0.04, + "global_step": 6942, + "learning_rate": 0.0004718614357262104, + "loss": 1.4716, + "loss_base2": 2.1231, + "loss_pixel": 0.1804, + "loss_text": 1.2912, + "ppl": 4.3562, + "step": 6942 + }, + { + "epoch": 0.04, + "global_step": 6943, + "learning_rate": 0.0004718572621035059, + "loss": 1.4601, + "loss_base2": 2.1065, + "loss_pixel": 0.1795, + "loss_text": 1.2806, + "ppl": 4.3064, + "step": 6943 + }, + { + "epoch": 0.04, + "global_step": 6944, + "learning_rate": 0.00047185308848080135, + "loss": 1.452, + "loss_base2": 2.0948, + "loss_pixel": 0.1803, + "loss_text": 1.2717, + "ppl": 4.2716, + "step": 6944 + }, + { + "epoch": 0.04, + "global_step": 6945, + "learning_rate": 0.00047184891485809686, + "loss": 1.4831, + "loss_base2": 2.1397, + "loss_pixel": 0.1798, + "loss_text": 1.3033, + "ppl": 4.4066, + "step": 6945 + }, + { + "epoch": 0.04, + "global_step": 6946, + "learning_rate": 0.00047184474123539236, + "loss": 1.4648, + "loss_base2": 2.1133, + "loss_pixel": 0.1795, + "loss_text": 1.2853, + "ppl": 4.3267, + "step": 6946 + }, + { + "epoch": 0.04, + "global_step": 6947, + "learning_rate": 0.0004718405676126878, + "loss": 1.6647, + "loss_base2": 2.4017, + "loss_pixel": 0.1813, + "loss_text": 1.4834, + "ppl": 5.2841, + "step": 6947 + }, + { + "epoch": 0.04, + "global_step": 6948, + "learning_rate": 0.00047183639398998327, + "loss": 1.7098, + "loss_base2": 2.4667, + "loss_pixel": 0.1804, + "loss_text": 1.5293, + "ppl": 5.5279, + "step": 6948 + }, + { + "epoch": 0.04, + "global_step": 6949, + "learning_rate": 0.0004718322203672788, + "loss": 1.7053, + "loss_base2": 2.4602, + "loss_pixel": 0.1798, + "loss_text": 1.5256, + "ppl": 5.503, + "step": 6949 + }, + { + "epoch": 0.04, + "global_step": 6950, + "learning_rate": 0.0004718280467445743, + "loss": 1.7036, + "loss_base2": 2.4578, + "loss_pixel": 0.1802, + "loss_text": 1.5234, + "ppl": 5.4937, + "step": 6950 + }, + { + "epoch": 0.04, + "global_step": 6951, + "learning_rate": 0.0004718238731218698, + "loss": 1.7072, + "loss_base2": 2.463, + "loss_pixel": 0.1804, + "loss_text": 1.5268, + "ppl": 5.5135, + "step": 6951 + }, + { + "epoch": 0.04, + "global_step": 6952, + "learning_rate": 0.0004718196994991653, + "loss": 1.6776, + "loss_base2": 2.4203, + "loss_pixel": 0.1805, + "loss_text": 1.4971, + "ppl": 5.3527, + "step": 6952 + }, + { + "epoch": 0.04, + "global_step": 6953, + "learning_rate": 0.00047181552587646075, + "loss": 1.7103, + "loss_base2": 2.4674, + "loss_pixel": 0.1791, + "loss_text": 1.5312, + "ppl": 5.5306, + "step": 6953 + }, + { + "epoch": 0.04, + "global_step": 6954, + "learning_rate": 0.00047181135225375626, + "loss": 1.6996, + "loss_base2": 2.452, + "loss_pixel": 0.18, + "loss_text": 1.5196, + "ppl": 5.4718, + "step": 6954 + }, + { + "epoch": 0.04, + "global_step": 6955, + "learning_rate": 0.00047180717863105177, + "loss": 1.6913, + "loss_base2": 2.44, + "loss_pixel": 0.1802, + "loss_text": 1.5111, + "ppl": 5.4265, + "step": 6955 + }, + { + "epoch": 0.04, + "global_step": 6956, + "learning_rate": 0.0004718030050083473, + "loss": 1.6891, + "loss_base2": 2.4369, + "loss_pixel": 0.1811, + "loss_text": 1.508, + "ppl": 5.4146, + "step": 6956 + }, + { + "epoch": 0.04, + "global_step": 6957, + "learning_rate": 0.00047179883138564273, + "loss": 1.699, + "loss_base2": 2.4511, + "loss_pixel": 0.1803, + "loss_text": 1.5186, + "ppl": 5.4685, + "step": 6957 + }, + { + "epoch": 0.04, + "global_step": 6958, + "learning_rate": 0.00047179465776293824, + "loss": 1.6901, + "loss_base2": 2.4383, + "loss_pixel": 0.1785, + "loss_text": 1.5115, + "ppl": 5.42, + "step": 6958 + }, + { + "epoch": 0.04, + "global_step": 6959, + "learning_rate": 0.00047179048414023374, + "loss": 1.6881, + "loss_base2": 2.4354, + "loss_pixel": 0.1797, + "loss_text": 1.5085, + "ppl": 5.4092, + "step": 6959 + }, + { + "epoch": 0.04, + "global_step": 6960, + "learning_rate": 0.00047178631051752925, + "loss": 1.6969, + "loss_base2": 2.4481, + "loss_pixel": 0.1818, + "loss_text": 1.5151, + "ppl": 5.457, + "step": 6960 + }, + { + "epoch": 0.04, + "global_step": 6961, + "learning_rate": 0.00047178213689482476, + "loss": 1.6912, + "loss_base2": 2.4399, + "loss_pixel": 0.1791, + "loss_text": 1.5121, + "ppl": 5.426, + "step": 6961 + }, + { + "epoch": 0.04, + "global_step": 6962, + "learning_rate": 0.0004717779632721202, + "loss": 1.7079, + "loss_base2": 2.464, + "loss_pixel": 0.1797, + "loss_text": 1.5282, + "ppl": 5.5174, + "step": 6962 + }, + { + "epoch": 0.04, + "global_step": 6963, + "learning_rate": 0.0004717737896494157, + "loss": 1.6893, + "loss_base2": 2.4371, + "loss_pixel": 0.179, + "loss_text": 1.5104, + "ppl": 5.4157, + "step": 6963 + }, + { + "epoch": 0.04, + "global_step": 6964, + "learning_rate": 0.0004717696160267112, + "loss": 1.6981, + "loss_base2": 2.4498, + "loss_pixel": 0.1821, + "loss_text": 1.516, + "ppl": 5.4636, + "step": 6964 + }, + { + "epoch": 0.04, + "global_step": 6965, + "learning_rate": 0.00047176544240400673, + "loss": 1.6838, + "loss_base2": 2.4292, + "loss_pixel": 0.1787, + "loss_text": 1.5051, + "ppl": 5.386, + "step": 6965 + }, + { + "epoch": 0.04, + "global_step": 6966, + "learning_rate": 0.00047176126878130213, + "loss": 1.6954, + "loss_base2": 2.4459, + "loss_pixel": 0.1801, + "loss_text": 1.5152, + "ppl": 5.4488, + "step": 6966 + }, + { + "epoch": 0.04, + "global_step": 6967, + "learning_rate": 0.00047175709515859764, + "loss": 1.6954, + "loss_base2": 2.4459, + "loss_pixel": 0.1792, + "loss_text": 1.5162, + "ppl": 5.4488, + "step": 6967 + }, + { + "epoch": 0.04, + "global_step": 6968, + "learning_rate": 0.00047175292153589315, + "loss": 1.6785, + "loss_base2": 2.4216, + "loss_pixel": 0.1796, + "loss_text": 1.4989, + "ppl": 5.3575, + "step": 6968 + }, + { + "epoch": 0.04, + "global_step": 6969, + "learning_rate": 0.00047174874791318865, + "loss": 1.697, + "loss_base2": 2.4483, + "loss_pixel": 0.1803, + "loss_text": 1.5167, + "ppl": 5.4576, + "step": 6969 + }, + { + "epoch": 0.04, + "global_step": 6970, + "learning_rate": 0.00047174457429048416, + "loss": 1.6519, + "loss_base2": 2.3832, + "loss_pixel": 0.1791, + "loss_text": 1.4729, + "ppl": 5.2169, + "step": 6970 + }, + { + "epoch": 0.04, + "global_step": 6971, + "learning_rate": 0.0004717404006677796, + "loss": 1.4797, + "loss_base2": 2.1348, + "loss_pixel": 0.1798, + "loss_text": 1.2999, + "ppl": 4.3916, + "step": 6971 + }, + { + "epoch": 0.04, + "global_step": 6972, + "learning_rate": 0.0004717362270450751, + "loss": 1.4743, + "loss_base2": 2.127, + "loss_pixel": 0.1789, + "loss_text": 1.2954, + "ppl": 4.368, + "step": 6972 + }, + { + "epoch": 0.04, + "global_step": 6973, + "learning_rate": 0.00047173205342237063, + "loss": 1.4812, + "loss_base2": 2.1369, + "loss_pixel": 0.179, + "loss_text": 1.3021, + "ppl": 4.3982, + "step": 6973 + }, + { + "epoch": 0.04, + "global_step": 6974, + "learning_rate": 0.00047172787979966614, + "loss": 1.4566, + "loss_base2": 2.1014, + "loss_pixel": 0.1788, + "loss_text": 1.2777, + "ppl": 4.2913, + "step": 6974 + }, + { + "epoch": 0.04, + "global_step": 6975, + "learning_rate": 0.0004717237061769616, + "loss": 1.4568, + "loss_base2": 2.1017, + "loss_pixel": 0.1806, + "loss_text": 1.2762, + "ppl": 4.2922, + "step": 6975 + }, + { + "epoch": 0.04, + "global_step": 6976, + "learning_rate": 0.0004717195325542571, + "loss": 1.4773, + "loss_base2": 2.1313, + "loss_pixel": 0.1793, + "loss_text": 1.298, + "ppl": 4.3811, + "step": 6976 + }, + { + "epoch": 0.04, + "global_step": 6977, + "learning_rate": 0.0004717153589315526, + "loss": 1.465, + "loss_base2": 2.1135, + "loss_pixel": 0.179, + "loss_text": 1.2861, + "ppl": 4.3275, + "step": 6977 + }, + { + "epoch": 0.04, + "global_step": 6978, + "learning_rate": 0.0004717111853088481, + "loss": 1.4595, + "loss_base2": 2.1056, + "loss_pixel": 0.1804, + "loss_text": 1.2791, + "ppl": 4.3038, + "step": 6978 + }, + { + "epoch": 0.04, + "global_step": 6979, + "learning_rate": 0.0004717070116861436, + "loss": 1.536, + "loss_base2": 2.216, + "loss_pixel": 0.1792, + "loss_text": 1.3568, + "ppl": 4.646, + "step": 6979 + }, + { + "epoch": 0.04, + "global_step": 6980, + "learning_rate": 0.00047170283806343907, + "loss": 1.6856, + "loss_base2": 2.4318, + "loss_pixel": 0.1792, + "loss_text": 1.5064, + "ppl": 5.3957, + "step": 6980 + }, + { + "epoch": 0.04, + "global_step": 6981, + "learning_rate": 0.0004716986644407346, + "loss": 1.715, + "loss_base2": 2.4742, + "loss_pixel": 0.1788, + "loss_text": 1.5362, + "ppl": 5.5567, + "step": 6981 + }, + { + "epoch": 0.04, + "global_step": 6982, + "learning_rate": 0.0004716944908180301, + "loss": 1.6923, + "loss_base2": 2.4415, + "loss_pixel": 0.1796, + "loss_text": 1.5127, + "ppl": 5.432, + "step": 6982 + }, + { + "epoch": 0.04, + "global_step": 6983, + "learning_rate": 0.0004716903171953256, + "loss": 1.6987, + "loss_base2": 2.4507, + "loss_pixel": 0.1781, + "loss_text": 1.5207, + "ppl": 5.4668, + "step": 6983 + }, + { + "epoch": 0.04, + "global_step": 6984, + "learning_rate": 0.000471686143572621, + "loss": 1.7053, + "loss_base2": 2.4602, + "loss_pixel": 0.1753, + "loss_text": 1.5301, + "ppl": 5.503, + "step": 6984 + }, + { + "epoch": 0.04, + "global_step": 6985, + "learning_rate": 0.0004716819699499165, + "loss": 1.6818, + "loss_base2": 2.4263, + "loss_pixel": 0.1774, + "loss_text": 1.5044, + "ppl": 5.3752, + "step": 6985 + }, + { + "epoch": 0.04, + "global_step": 6986, + "learning_rate": 0.000471677796327212, + "loss": 1.6884, + "loss_base2": 2.4358, + "loss_pixel": 0.1739, + "loss_text": 1.5145, + "ppl": 5.4108, + "step": 6986 + }, + { + "epoch": 0.04, + "global_step": 6987, + "learning_rate": 0.0004716736227045075, + "loss": 1.7149, + "loss_base2": 2.4741, + "loss_pixel": 0.1752, + "loss_text": 1.5397, + "ppl": 5.5561, + "step": 6987 + }, + { + "epoch": 0.04, + "global_step": 6988, + "learning_rate": 0.000471669449081803, + "loss": 1.6966, + "loss_base2": 2.4477, + "loss_pixel": 0.1749, + "loss_text": 1.5217, + "ppl": 5.4554, + "step": 6988 + }, + { + "epoch": 0.04, + "global_step": 6989, + "learning_rate": 0.0004716652754590985, + "loss": 1.7061, + "loss_base2": 2.4614, + "loss_pixel": 0.176, + "loss_text": 1.5301, + "ppl": 5.5074, + "step": 6989 + }, + { + "epoch": 0.04, + "global_step": 6990, + "learning_rate": 0.000471661101836394, + "loss": 1.6803, + "loss_base2": 2.4242, + "loss_pixel": 0.1758, + "loss_text": 1.5046, + "ppl": 5.3672, + "step": 6990 + }, + { + "epoch": 0.04, + "global_step": 6991, + "learning_rate": 0.0004716569282136895, + "loss": 1.692, + "loss_base2": 2.441, + "loss_pixel": 0.1754, + "loss_text": 1.5166, + "ppl": 5.4303, + "step": 6991 + }, + { + "epoch": 0.04, + "global_step": 6992, + "learning_rate": 0.000471652754590985, + "loss": 1.6756, + "loss_base2": 2.4174, + "loss_pixel": 0.1763, + "loss_text": 1.4993, + "ppl": 5.342, + "step": 6992 + }, + { + "epoch": 0.04, + "global_step": 6993, + "learning_rate": 0.00047164858096828045, + "loss": 1.6725, + "loss_base2": 2.4129, + "loss_pixel": 0.1746, + "loss_text": 1.4979, + "ppl": 5.3255, + "step": 6993 + }, + { + "epoch": 0.04, + "global_step": 6994, + "learning_rate": 0.00047164440734557596, + "loss": 1.6881, + "loss_base2": 2.4354, + "loss_pixel": 0.1751, + "loss_text": 1.513, + "ppl": 5.4092, + "step": 6994 + }, + { + "epoch": 0.04, + "global_step": 6995, + "learning_rate": 0.00047164023372287146, + "loss": 1.684, + "loss_base2": 2.4295, + "loss_pixel": 0.1707, + "loss_text": 1.5132, + "ppl": 5.3871, + "step": 6995 + }, + { + "epoch": 0.04, + "global_step": 6996, + "learning_rate": 0.00047163606010016697, + "loss": 1.6813, + "loss_base2": 2.4256, + "loss_pixel": 0.1726, + "loss_text": 1.5087, + "ppl": 5.3725, + "step": 6996 + }, + { + "epoch": 0.04, + "global_step": 6997, + "learning_rate": 0.0004716318864774625, + "loss": 1.6857, + "loss_base2": 2.432, + "loss_pixel": 0.174, + "loss_text": 1.5117, + "ppl": 5.3962, + "step": 6997 + }, + { + "epoch": 0.04, + "global_step": 6998, + "learning_rate": 0.00047162771285475793, + "loss": 1.6727, + "loss_base2": 2.4132, + "loss_pixel": 0.1744, + "loss_text": 1.4983, + "ppl": 5.3265, + "step": 6998 + }, + { + "epoch": 0.04, + "global_step": 6999, + "learning_rate": 0.00047162353923205344, + "loss": 1.6812, + "loss_base2": 2.4255, + "loss_pixel": 0.1733, + "loss_text": 1.5079, + "ppl": 5.372, + "step": 6999 + }, + { + "epoch": 0.04, + "global_step": 7000, + "learning_rate": 0.00047161936560934895, + "loss": 1.6743, + "loss_base2": 2.4155, + "loss_pixel": 0.1735, + "loss_text": 1.5008, + "ppl": 5.3351, + "step": 7000 + }, + { + "epoch": 0.04, + "global_step": 7001, + "learning_rate": 0.00047161519198664445, + "loss": 1.6813, + "loss_base2": 2.4256, + "loss_pixel": 0.1739, + "loss_text": 1.5074, + "ppl": 5.3725, + "step": 7001 + }, + { + "epoch": 0.04, + "global_step": 7002, + "learning_rate": 0.00047161101836393996, + "loss": 1.6947, + "loss_base2": 2.4449, + "loss_pixel": 0.1736, + "loss_text": 1.521, + "ppl": 5.445, + "step": 7002 + }, + { + "epoch": 0.04, + "global_step": 7003, + "learning_rate": 0.00047160684474123536, + "loss": 1.6847, + "loss_base2": 2.4305, + "loss_pixel": 0.1743, + "loss_text": 1.5104, + "ppl": 5.3908, + "step": 7003 + }, + { + "epoch": 0.04, + "global_step": 7004, + "learning_rate": 0.00047160267111853087, + "loss": 1.6833, + "loss_base2": 2.4285, + "loss_pixel": 0.1725, + "loss_text": 1.5108, + "ppl": 5.3833, + "step": 7004 + }, + { + "epoch": 0.04, + "global_step": 7005, + "learning_rate": 0.0004715984974958264, + "loss": 1.6469, + "loss_base2": 2.376, + "loss_pixel": 0.1716, + "loss_text": 1.4753, + "ppl": 5.1909, + "step": 7005 + }, + { + "epoch": 0.04, + "global_step": 7006, + "learning_rate": 0.0004715943238731219, + "loss": 1.571, + "loss_base2": 2.2665, + "loss_pixel": 0.1745, + "loss_text": 1.3965, + "ppl": 4.8115, + "step": 7006 + }, + { + "epoch": 0.04, + "global_step": 7007, + "learning_rate": 0.00047159015025041734, + "loss": 1.508, + "loss_base2": 2.1756, + "loss_pixel": 0.1745, + "loss_text": 1.3334, + "ppl": 4.5177, + "step": 7007 + }, + { + "epoch": 0.04, + "global_step": 7008, + "learning_rate": 0.00047158597662771284, + "loss": 1.4688, + "loss_base2": 2.119, + "loss_pixel": 0.1727, + "loss_text": 1.2961, + "ppl": 4.344, + "step": 7008 + }, + { + "epoch": 0.04, + "global_step": 7009, + "learning_rate": 0.00047158180300500835, + "loss": 1.4663, + "loss_base2": 2.1154, + "loss_pixel": 0.1726, + "loss_text": 1.2938, + "ppl": 4.3332, + "step": 7009 + }, + { + "epoch": 0.04, + "global_step": 7010, + "learning_rate": 0.00047157762938230386, + "loss": 1.471, + "loss_base2": 2.1222, + "loss_pixel": 0.1732, + "loss_text": 1.2978, + "ppl": 4.3536, + "step": 7010 + }, + { + "epoch": 0.04, + "global_step": 7011, + "learning_rate": 0.00047157345575959936, + "loss": 1.4338, + "loss_base2": 2.0685, + "loss_pixel": 0.1755, + "loss_text": 1.2583, + "ppl": 4.1946, + "step": 7011 + }, + { + "epoch": 0.04, + "global_step": 7012, + "learning_rate": 0.0004715692821368948, + "loss": 1.4566, + "loss_base2": 2.1014, + "loss_pixel": 0.1718, + "loss_text": 1.2849, + "ppl": 4.2913, + "step": 7012 + }, + { + "epoch": 0.04, + "global_step": 7013, + "learning_rate": 0.0004715651085141903, + "loss": 1.4553, + "loss_base2": 2.0996, + "loss_pixel": 0.1738, + "loss_text": 1.2815, + "ppl": 4.2858, + "step": 7013 + }, + { + "epoch": 0.04, + "global_step": 7014, + "learning_rate": 0.00047156093489148583, + "loss": 1.4513, + "loss_base2": 2.0938, + "loss_pixel": 0.1729, + "loss_text": 1.2783, + "ppl": 4.2687, + "step": 7014 + }, + { + "epoch": 0.04, + "global_step": 7015, + "learning_rate": 0.00047155676126878134, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.1745, + "loss_text": 1.4538, + "ppl": 5.0952, + "step": 7015 + }, + { + "epoch": 0.04, + "global_step": 7016, + "learning_rate": 0.0004715525876460768, + "loss": 1.6963, + "loss_base2": 2.4472, + "loss_pixel": 0.1738, + "loss_text": 1.5225, + "ppl": 5.4537, + "step": 7016 + }, + { + "epoch": 0.04, + "global_step": 7017, + "learning_rate": 0.0004715484140233723, + "loss": 1.7142, + "loss_base2": 2.4731, + "loss_pixel": 0.1735, + "loss_text": 1.5407, + "ppl": 5.5522, + "step": 7017 + }, + { + "epoch": 0.04, + "global_step": 7018, + "learning_rate": 0.0004715442404006678, + "loss": 1.6834, + "loss_base2": 2.4286, + "loss_pixel": 0.1735, + "loss_text": 1.5099, + "ppl": 5.3838, + "step": 7018 + }, + { + "epoch": 0.04, + "global_step": 7019, + "learning_rate": 0.0004715400667779633, + "loss": 1.7024, + "loss_base2": 2.456, + "loss_pixel": 0.1728, + "loss_text": 1.5295, + "ppl": 5.4871, + "step": 7019 + }, + { + "epoch": 0.04, + "global_step": 7020, + "learning_rate": 0.0004715358931552588, + "loss": 1.6825, + "loss_base2": 2.4273, + "loss_pixel": 0.174, + "loss_text": 1.5085, + "ppl": 5.379, + "step": 7020 + }, + { + "epoch": 0.04, + "global_step": 7021, + "learning_rate": 0.0004715317195325543, + "loss": 1.7071, + "loss_base2": 2.4628, + "loss_pixel": 0.1741, + "loss_text": 1.533, + "ppl": 5.513, + "step": 7021 + }, + { + "epoch": 0.04, + "global_step": 7022, + "learning_rate": 0.00047152754590984973, + "loss": 1.6983, + "loss_base2": 2.4501, + "loss_pixel": 0.1729, + "loss_text": 1.5254, + "ppl": 5.4646, + "step": 7022 + }, + { + "epoch": 0.04, + "global_step": 7023, + "learning_rate": 0.00047152337228714524, + "loss": 1.6845, + "loss_base2": 2.4302, + "loss_pixel": 0.1737, + "loss_text": 1.5108, + "ppl": 5.3898, + "step": 7023 + }, + { + "epoch": 0.04, + "global_step": 7024, + "learning_rate": 0.00047151919866444074, + "loss": 1.6949, + "loss_base2": 2.4452, + "loss_pixel": 0.1716, + "loss_text": 1.5233, + "ppl": 5.4461, + "step": 7024 + }, + { + "epoch": 0.04, + "global_step": 7025, + "learning_rate": 0.0004715150250417362, + "loss": 1.6992, + "loss_base2": 2.4514, + "loss_pixel": 0.1723, + "loss_text": 1.527, + "ppl": 5.4696, + "step": 7025 + }, + { + "epoch": 0.04, + "global_step": 7026, + "learning_rate": 0.0004715108514190317, + "loss": 1.6911, + "loss_base2": 2.4397, + "loss_pixel": 0.1722, + "loss_text": 1.5189, + "ppl": 5.4254, + "step": 7026 + }, + { + "epoch": 0.04, + "global_step": 7027, + "learning_rate": 0.0004715066777963272, + "loss": 1.683, + "loss_base2": 2.4281, + "loss_pixel": 0.1703, + "loss_text": 1.5127, + "ppl": 5.3817, + "step": 7027 + }, + { + "epoch": 0.04, + "global_step": 7028, + "learning_rate": 0.0004715025041736227, + "loss": 1.6889, + "loss_base2": 2.4366, + "loss_pixel": 0.1744, + "loss_text": 1.5145, + "ppl": 5.4135, + "step": 7028 + }, + { + "epoch": 0.04, + "global_step": 7029, + "learning_rate": 0.0004714983305509182, + "loss": 1.6906, + "loss_base2": 2.439, + "loss_pixel": 0.171, + "loss_text": 1.5196, + "ppl": 5.4227, + "step": 7029 + }, + { + "epoch": 0.04, + "global_step": 7030, + "learning_rate": 0.0004714941569282137, + "loss": 1.678, + "loss_base2": 2.4208, + "loss_pixel": 0.1711, + "loss_text": 1.507, + "ppl": 5.3548, + "step": 7030 + }, + { + "epoch": 0.04, + "global_step": 7031, + "learning_rate": 0.0004714899833055092, + "loss": 1.6648, + "loss_base2": 2.4018, + "loss_pixel": 0.1714, + "loss_text": 1.4933, + "ppl": 5.2846, + "step": 7031 + }, + { + "epoch": 0.04, + "global_step": 7032, + "learning_rate": 0.0004714858096828047, + "loss": 1.6894, + "loss_base2": 2.4373, + "loss_pixel": 0.1693, + "loss_text": 1.52, + "ppl": 5.4162, + "step": 7032 + }, + { + "epoch": 0.04, + "global_step": 7033, + "learning_rate": 0.0004714816360601002, + "loss": 1.6899, + "loss_base2": 2.438, + "loss_pixel": 0.1719, + "loss_text": 1.518, + "ppl": 5.4189, + "step": 7033 + }, + { + "epoch": 0.04, + "global_step": 7034, + "learning_rate": 0.00047147746243739565, + "loss": 1.6807, + "loss_base2": 2.4247, + "loss_pixel": 0.1713, + "loss_text": 1.5094, + "ppl": 5.3693, + "step": 7034 + }, + { + "epoch": 0.04, + "global_step": 7035, + "learning_rate": 0.00047147328881469116, + "loss": 1.693, + "loss_base2": 2.4425, + "loss_pixel": 0.1708, + "loss_text": 1.5222, + "ppl": 5.4358, + "step": 7035 + }, + { + "epoch": 0.04, + "global_step": 7036, + "learning_rate": 0.00047146911519198667, + "loss": 1.6753, + "loss_base2": 2.4169, + "loss_pixel": 0.1698, + "loss_text": 1.5056, + "ppl": 5.3404, + "step": 7036 + }, + { + "epoch": 0.04, + "global_step": 7037, + "learning_rate": 0.0004714649415692822, + "loss": 1.5252, + "loss_base2": 2.2004, + "loss_pixel": 0.1718, + "loss_text": 1.3534, + "ppl": 4.5961, + "step": 7037 + }, + { + "epoch": 0.04, + "global_step": 7038, + "learning_rate": 0.0004714607679465777, + "loss": 1.4573, + "loss_base2": 2.1024, + "loss_pixel": 0.1713, + "loss_text": 1.286, + "ppl": 4.2943, + "step": 7038 + }, + { + "epoch": 0.04, + "global_step": 7039, + "learning_rate": 0.00047145659432387314, + "loss": 1.4643, + "loss_base2": 2.1125, + "loss_pixel": 0.1705, + "loss_text": 1.2938, + "ppl": 4.3245, + "step": 7039 + }, + { + "epoch": 0.04, + "global_step": 7040, + "learning_rate": 0.00047145242070116864, + "loss": 1.4511, + "loss_base2": 2.0935, + "loss_pixel": 0.1709, + "loss_text": 1.2802, + "ppl": 4.2678, + "step": 7040 + }, + { + "epoch": 0.04, + "global_step": 7041, + "learning_rate": 0.0004714482470784641, + "loss": 1.4624, + "loss_base2": 2.1098, + "loss_pixel": 0.1721, + "loss_text": 1.2903, + "ppl": 4.3163, + "step": 7041 + }, + { + "epoch": 0.04, + "global_step": 7042, + "learning_rate": 0.0004714440734557596, + "loss": 1.4592, + "loss_base2": 2.1052, + "loss_pixel": 0.1719, + "loss_text": 1.2874, + "ppl": 4.3025, + "step": 7042 + }, + { + "epoch": 0.04, + "global_step": 7043, + "learning_rate": 0.00047143989983305506, + "loss": 1.4379, + "loss_base2": 2.0745, + "loss_pixel": 0.17, + "loss_text": 1.2679, + "ppl": 4.2118, + "step": 7043 + }, + { + "epoch": 0.04, + "global_step": 7044, + "learning_rate": 0.00047143572621035056, + "loss": 1.4482, + "loss_base2": 2.0893, + "loss_pixel": 0.1703, + "loss_text": 1.2779, + "ppl": 4.2554, + "step": 7044 + }, + { + "epoch": 0.04, + "global_step": 7045, + "learning_rate": 0.00047143155258764607, + "loss": 1.4418, + "loss_base2": 2.0801, + "loss_pixel": 0.1707, + "loss_text": 1.2711, + "ppl": 4.2283, + "step": 7045 + }, + { + "epoch": 0.04, + "global_step": 7046, + "learning_rate": 0.0004714273789649416, + "loss": 1.6314, + "loss_base2": 2.3536, + "loss_pixel": 0.1699, + "loss_text": 1.4615, + "ppl": 5.111, + "step": 7046 + }, + { + "epoch": 0.04, + "global_step": 7047, + "learning_rate": 0.0004714232053422371, + "loss": 1.7003, + "loss_base2": 2.453, + "loss_pixel": 0.1751, + "loss_text": 1.5253, + "ppl": 5.4756, + "step": 7047 + }, + { + "epoch": 0.04, + "global_step": 7048, + "learning_rate": 0.00047141903171953254, + "loss": 1.7036, + "loss_base2": 2.4578, + "loss_pixel": 0.1698, + "loss_text": 1.5338, + "ppl": 5.4937, + "step": 7048 + }, + { + "epoch": 0.04, + "global_step": 7049, + "learning_rate": 0.00047141485809682805, + "loss": 1.6902, + "loss_base2": 2.4384, + "loss_pixel": 0.1704, + "loss_text": 1.5198, + "ppl": 5.4206, + "step": 7049 + }, + { + "epoch": 0.04, + "global_step": 7050, + "learning_rate": 0.00047141068447412355, + "loss": 1.7061, + "loss_base2": 2.4614, + "loss_pixel": 0.1714, + "loss_text": 1.5348, + "ppl": 5.5074, + "step": 7050 + }, + { + "epoch": 0.04, + "global_step": 7051, + "learning_rate": 0.00047140651085141906, + "loss": 1.6967, + "loss_base2": 2.4478, + "loss_pixel": 0.1718, + "loss_text": 1.525, + "ppl": 5.4559, + "step": 7051 + }, + { + "epoch": 0.04, + "global_step": 7052, + "learning_rate": 0.00047140233722871457, + "loss": 1.6895, + "loss_base2": 2.4374, + "loss_pixel": 0.171, + "loss_text": 1.5185, + "ppl": 5.4168, + "step": 7052 + }, + { + "epoch": 0.04, + "global_step": 7053, + "learning_rate": 0.00047139816360601, + "loss": 1.6904, + "loss_base2": 2.4387, + "loss_pixel": 0.1699, + "loss_text": 1.5205, + "ppl": 5.4216, + "step": 7053 + }, + { + "epoch": 0.04, + "global_step": 7054, + "learning_rate": 0.00047139398998330553, + "loss": 1.7176, + "loss_base2": 2.478, + "loss_pixel": 0.1694, + "loss_text": 1.5482, + "ppl": 5.5711, + "step": 7054 + }, + { + "epoch": 0.04, + "global_step": 7055, + "learning_rate": 0.00047138981636060104, + "loss": 1.6718, + "loss_base2": 2.4119, + "loss_pixel": 0.1708, + "loss_text": 1.5011, + "ppl": 5.3217, + "step": 7055 + }, + { + "epoch": 0.04, + "global_step": 7056, + "learning_rate": 0.00047138564273789654, + "loss": 1.6747, + "loss_base2": 2.4161, + "loss_pixel": 0.1709, + "loss_text": 1.5038, + "ppl": 5.3372, + "step": 7056 + }, + { + "epoch": 0.04, + "global_step": 7057, + "learning_rate": 0.000471381469115192, + "loss": 1.6477, + "loss_base2": 2.3771, + "loss_pixel": 0.1699, + "loss_text": 1.4778, + "ppl": 5.195, + "step": 7057 + }, + { + "epoch": 0.04, + "global_step": 7058, + "learning_rate": 0.0004713772954924875, + "loss": 1.6678, + "loss_base2": 2.4061, + "loss_pixel": 0.1726, + "loss_text": 1.4952, + "ppl": 5.3005, + "step": 7058 + }, + { + "epoch": 0.04, + "global_step": 7059, + "learning_rate": 0.00047137312186978296, + "loss": 1.6893, + "loss_base2": 2.4371, + "loss_pixel": 0.1711, + "loss_text": 1.5182, + "ppl": 5.4157, + "step": 7059 + }, + { + "epoch": 0.04, + "global_step": 7060, + "learning_rate": 0.00047136894824707846, + "loss": 1.6866, + "loss_base2": 2.4332, + "loss_pixel": 0.1712, + "loss_text": 1.5154, + "ppl": 5.4011, + "step": 7060 + }, + { + "epoch": 0.04, + "global_step": 7061, + "learning_rate": 0.00047136477462437397, + "loss": 1.6872, + "loss_base2": 2.4341, + "loss_pixel": 0.1687, + "loss_text": 1.5185, + "ppl": 5.4043, + "step": 7061 + }, + { + "epoch": 0.04, + "global_step": 7062, + "learning_rate": 0.0004713606010016694, + "loss": 1.7004, + "loss_base2": 2.4532, + "loss_pixel": 0.172, + "loss_text": 1.5284, + "ppl": 5.4761, + "step": 7062 + }, + { + "epoch": 0.04, + "global_step": 7063, + "learning_rate": 0.00047135642737896493, + "loss": 1.6607, + "loss_base2": 2.3959, + "loss_pixel": 0.1705, + "loss_text": 1.4902, + "ppl": 5.263, + "step": 7063 + }, + { + "epoch": 0.04, + "global_step": 7064, + "learning_rate": 0.00047135225375626044, + "loss": 1.6777, + "loss_base2": 2.4204, + "loss_pixel": 0.1707, + "loss_text": 1.5069, + "ppl": 5.3532, + "step": 7064 + }, + { + "epoch": 0.04, + "global_step": 7065, + "learning_rate": 0.00047134808013355595, + "loss": 1.6895, + "loss_base2": 2.4374, + "loss_pixel": 0.1714, + "loss_text": 1.5182, + "ppl": 5.4168, + "step": 7065 + }, + { + "epoch": 0.04, + "global_step": 7066, + "learning_rate": 0.0004713439065108514, + "loss": 1.6804, + "loss_base2": 2.4243, + "loss_pixel": 0.1711, + "loss_text": 1.5093, + "ppl": 5.3677, + "step": 7066 + }, + { + "epoch": 0.04, + "global_step": 7067, + "learning_rate": 0.0004713397328881469, + "loss": 1.694, + "loss_base2": 2.4439, + "loss_pixel": 0.1821, + "loss_text": 1.5119, + "ppl": 5.4412, + "step": 7067 + }, + { + "epoch": 0.04, + "global_step": 7068, + "learning_rate": 0.0004713355592654424, + "loss": 1.5924, + "loss_base2": 2.2973, + "loss_pixel": 0.1902, + "loss_text": 1.4022, + "ppl": 4.9155, + "step": 7068 + }, + { + "epoch": 0.04, + "global_step": 7069, + "learning_rate": 0.0004713313856427379, + "loss": 1.4868, + "loss_base2": 2.145, + "loss_pixel": 0.1896, + "loss_text": 1.2972, + "ppl": 4.4229, + "step": 7069 + }, + { + "epoch": 0.04, + "global_step": 7070, + "learning_rate": 0.00047132721202003343, + "loss": 1.4732, + "loss_base2": 2.1254, + "loss_pixel": 0.1733, + "loss_text": 1.2999, + "ppl": 4.3632, + "step": 7070 + }, + { + "epoch": 0.04, + "global_step": 7071, + "learning_rate": 0.0004713230383973289, + "loss": 1.4682, + "loss_base2": 2.1182, + "loss_pixel": 0.1731, + "loss_text": 1.2952, + "ppl": 4.3414, + "step": 7071 + }, + { + "epoch": 0.04, + "global_step": 7072, + "learning_rate": 0.0004713188647746244, + "loss": 1.4698, + "loss_base2": 2.1205, + "loss_pixel": 0.1702, + "loss_text": 1.2996, + "ppl": 4.3484, + "step": 7072 + }, + { + "epoch": 0.04, + "global_step": 7073, + "learning_rate": 0.0004713146911519199, + "loss": 1.4443, + "loss_base2": 2.0837, + "loss_pixel": 0.1707, + "loss_text": 1.2736, + "ppl": 4.2389, + "step": 7073 + }, + { + "epoch": 0.04, + "global_step": 7074, + "learning_rate": 0.0004713105175292154, + "loss": 1.4785, + "loss_base2": 2.133, + "loss_pixel": 0.1723, + "loss_text": 1.3062, + "ppl": 4.3864, + "step": 7074 + }, + { + "epoch": 0.04, + "global_step": 7075, + "learning_rate": 0.00047130634390651086, + "loss": 1.4437, + "loss_base2": 2.0828, + "loss_pixel": 0.172, + "loss_text": 1.2717, + "ppl": 4.2363, + "step": 7075 + }, + { + "epoch": 0.04, + "global_step": 7076, + "learning_rate": 0.00047130217028380636, + "loss": 1.6537, + "loss_base2": 2.3858, + "loss_pixel": 0.1701, + "loss_text": 1.4836, + "ppl": 5.2263, + "step": 7076 + }, + { + "epoch": 0.04, + "global_step": 7077, + "learning_rate": 0.00047129799666110187, + "loss": 1.6996, + "loss_base2": 2.452, + "loss_pixel": 0.1724, + "loss_text": 1.5273, + "ppl": 5.4718, + "step": 7077 + }, + { + "epoch": 0.04, + "global_step": 7078, + "learning_rate": 0.0004712938230383973, + "loss": 1.6932, + "loss_base2": 2.4428, + "loss_pixel": 0.1712, + "loss_text": 1.522, + "ppl": 5.4369, + "step": 7078 + }, + { + "epoch": 0.04, + "global_step": 7079, + "learning_rate": 0.00047128964941569283, + "loss": 1.6935, + "loss_base2": 2.4432, + "loss_pixel": 0.1708, + "loss_text": 1.5227, + "ppl": 5.4385, + "step": 7079 + }, + { + "epoch": 0.04, + "global_step": 7080, + "learning_rate": 0.0004712854757929883, + "loss": 1.6936, + "loss_base2": 2.4433, + "loss_pixel": 0.1717, + "loss_text": 1.5219, + "ppl": 5.439, + "step": 7080 + }, + { + "epoch": 0.04, + "global_step": 7081, + "learning_rate": 0.0004712813021702838, + "loss": 1.6955, + "loss_base2": 2.4461, + "loss_pixel": 0.1721, + "loss_text": 1.5234, + "ppl": 5.4494, + "step": 7081 + }, + { + "epoch": 0.04, + "global_step": 7082, + "learning_rate": 0.0004712771285475793, + "loss": 1.6855, + "loss_base2": 2.4317, + "loss_pixel": 0.1721, + "loss_text": 1.5134, + "ppl": 5.3951, + "step": 7082 + }, + { + "epoch": 0.04, + "global_step": 7083, + "learning_rate": 0.0004712729549248748, + "loss": 1.6721, + "loss_base2": 2.4123, + "loss_pixel": 0.1694, + "loss_text": 1.5027, + "ppl": 5.3233, + "step": 7083 + }, + { + "epoch": 0.04, + "global_step": 7084, + "learning_rate": 0.00047126878130217026, + "loss": 1.6959, + "loss_base2": 2.4467, + "loss_pixel": 0.1699, + "loss_text": 1.526, + "ppl": 5.4516, + "step": 7084 + }, + { + "epoch": 0.04, + "global_step": 7085, + "learning_rate": 0.00047126460767946577, + "loss": 1.6938, + "loss_base2": 2.4436, + "loss_pixel": 0.1717, + "loss_text": 1.5221, + "ppl": 5.4401, + "step": 7085 + }, + { + "epoch": 0.04, + "global_step": 7086, + "learning_rate": 0.0004712604340567613, + "loss": 1.6942, + "loss_base2": 2.4442, + "loss_pixel": 0.1715, + "loss_text": 1.5227, + "ppl": 5.4423, + "step": 7086 + }, + { + "epoch": 0.04, + "global_step": 7087, + "learning_rate": 0.0004712562604340568, + "loss": 1.6883, + "loss_base2": 2.4357, + "loss_pixel": 0.1691, + "loss_text": 1.5192, + "ppl": 5.4103, + "step": 7087 + }, + { + "epoch": 0.04, + "global_step": 7088, + "learning_rate": 0.0004712520868113523, + "loss": 1.6837, + "loss_base2": 2.4291, + "loss_pixel": 0.1791, + "loss_text": 1.5046, + "ppl": 5.3854, + "step": 7088 + }, + { + "epoch": 0.04, + "global_step": 7089, + "learning_rate": 0.00047124791318864774, + "loss": 1.7065, + "loss_base2": 2.462, + "loss_pixel": 0.1893, + "loss_text": 1.5172, + "ppl": 5.5096, + "step": 7089 + }, + { + "epoch": 0.04, + "global_step": 7090, + "learning_rate": 0.00047124373956594325, + "loss": 1.7059, + "loss_base2": 2.4611, + "loss_pixel": 0.1895, + "loss_text": 1.5164, + "ppl": 5.5063, + "step": 7090 + }, + { + "epoch": 0.04, + "global_step": 7091, + "learning_rate": 0.00047123956594323876, + "loss": 1.6964, + "loss_base2": 2.4474, + "loss_pixel": 0.1827, + "loss_text": 1.5137, + "ppl": 5.4543, + "step": 7091 + }, + { + "epoch": 0.04, + "global_step": 7092, + "learning_rate": 0.00047123539232053426, + "loss": 1.6964, + "loss_base2": 2.4474, + "loss_pixel": 0.182, + "loss_text": 1.5143, + "ppl": 5.4543, + "step": 7092 + }, + { + "epoch": 0.04, + "global_step": 7093, + "learning_rate": 0.0004712312186978297, + "loss": 1.6677, + "loss_base2": 2.406, + "loss_pixel": 0.1829, + "loss_text": 1.4848, + "ppl": 5.3, + "step": 7093 + }, + { + "epoch": 0.04, + "global_step": 7094, + "learning_rate": 0.0004712270450751252, + "loss": 1.6774, + "loss_base2": 2.42, + "loss_pixel": 0.1835, + "loss_text": 1.4939, + "ppl": 5.3516, + "step": 7094 + }, + { + "epoch": 0.04, + "global_step": 7095, + "learning_rate": 0.00047122287145242073, + "loss": 1.6969, + "loss_base2": 2.4481, + "loss_pixel": 0.1824, + "loss_text": 1.5145, + "ppl": 5.457, + "step": 7095 + }, + { + "epoch": 0.04, + "global_step": 7096, + "learning_rate": 0.00047121869782971624, + "loss": 1.6841, + "loss_base2": 2.4296, + "loss_pixel": 0.1818, + "loss_text": 1.5023, + "ppl": 5.3876, + "step": 7096 + }, + { + "epoch": 0.04, + "global_step": 7097, + "learning_rate": 0.0004712145242070117, + "loss": 1.6055, + "loss_base2": 2.3162, + "loss_pixel": 0.1825, + "loss_text": 1.423, + "ppl": 4.9803, + "step": 7097 + }, + { + "epoch": 0.04, + "global_step": 7098, + "learning_rate": 0.00047121035058430715, + "loss": 1.4669, + "loss_base2": 2.1163, + "loss_pixel": 0.1842, + "loss_text": 1.2827, + "ppl": 4.3358, + "step": 7098 + }, + { + "epoch": 0.04, + "global_step": 7099, + "learning_rate": 0.00047120617696160265, + "loss": 1.4701, + "loss_base2": 2.1209, + "loss_pixel": 0.1828, + "loss_text": 1.2873, + "ppl": 4.3497, + "step": 7099 + }, + { + "epoch": 0.04, + "global_step": 7100, + "learning_rate": 0.00047120200333889816, + "loss": 1.4887, + "loss_base2": 2.1477, + "loss_pixel": 0.1954, + "loss_text": 1.2933, + "ppl": 4.4313, + "step": 7100 + }, + { + "epoch": 0.04, + "global_step": 7101, + "learning_rate": 0.00047119782971619367, + "loss": 1.4498, + "loss_base2": 2.0916, + "loss_pixel": 0.1927, + "loss_text": 1.2571, + "ppl": 4.2623, + "step": 7101 + }, + { + "epoch": 0.04, + "global_step": 7102, + "learning_rate": 0.0004711936560934891, + "loss": 1.4667, + "loss_base2": 2.116, + "loss_pixel": 0.1947, + "loss_text": 1.2721, + "ppl": 4.3349, + "step": 7102 + }, + { + "epoch": 0.04, + "global_step": 7103, + "learning_rate": 0.00047118948247078463, + "loss": 1.4726, + "loss_base2": 2.1245, + "loss_pixel": 0.1957, + "loss_text": 1.2769, + "ppl": 4.3606, + "step": 7103 + }, + { + "epoch": 0.04, + "global_step": 7104, + "learning_rate": 0.00047118530884808014, + "loss": 1.4811, + "loss_base2": 2.1368, + "loss_pixel": 0.1934, + "loss_text": 1.2877, + "ppl": 4.3978, + "step": 7104 + }, + { + "epoch": 0.04, + "global_step": 7105, + "learning_rate": 0.00047118113522537564, + "loss": 1.5283, + "loss_base2": 2.2049, + "loss_pixel": 0.1911, + "loss_text": 1.3372, + "ppl": 4.6103, + "step": 7105 + }, + { + "epoch": 0.04, + "global_step": 7106, + "learning_rate": 0.00047117696160267115, + "loss": 1.7263, + "loss_base2": 2.4905, + "loss_pixel": 0.1947, + "loss_text": 1.5316, + "ppl": 5.6198, + "step": 7106 + }, + { + "epoch": 0.04, + "global_step": 7107, + "learning_rate": 0.0004711727879799666, + "loss": 1.7248, + "loss_base2": 2.4884, + "loss_pixel": 0.1917, + "loss_text": 1.5331, + "ppl": 5.6114, + "step": 7107 + }, + { + "epoch": 0.04, + "global_step": 7108, + "learning_rate": 0.0004711686143572621, + "loss": 1.7013, + "loss_base2": 2.4545, + "loss_pixel": 0.1897, + "loss_text": 1.5116, + "ppl": 5.4811, + "step": 7108 + }, + { + "epoch": 0.04, + "global_step": 7109, + "learning_rate": 0.0004711644407345576, + "loss": 1.7273, + "loss_base2": 2.492, + "loss_pixel": 0.1885, + "loss_text": 1.5388, + "ppl": 5.6254, + "step": 7109 + }, + { + "epoch": 0.04, + "global_step": 7110, + "learning_rate": 0.0004711602671118531, + "loss": 1.6836, + "loss_base2": 2.4289, + "loss_pixel": 0.1886, + "loss_text": 1.495, + "ppl": 5.3849, + "step": 7110 + }, + { + "epoch": 0.04, + "global_step": 7111, + "learning_rate": 0.00047115609348914863, + "loss": 1.7271, + "loss_base2": 2.4917, + "loss_pixel": 0.1881, + "loss_text": 1.539, + "ppl": 5.6243, + "step": 7111 + }, + { + "epoch": 0.04, + "global_step": 7112, + "learning_rate": 0.0004711519198664441, + "loss": 1.6925, + "loss_base2": 2.4418, + "loss_pixel": 0.1869, + "loss_text": 1.5056, + "ppl": 5.433, + "step": 7112 + }, + { + "epoch": 0.04, + "global_step": 7113, + "learning_rate": 0.0004711477462437396, + "loss": 1.7028, + "loss_base2": 2.4566, + "loss_pixel": 0.1852, + "loss_text": 1.5176, + "ppl": 5.4893, + "step": 7113 + }, + { + "epoch": 0.04, + "global_step": 7114, + "learning_rate": 0.0004711435726210351, + "loss": 1.6793, + "loss_base2": 2.4227, + "loss_pixel": 0.1848, + "loss_text": 1.4945, + "ppl": 5.3618, + "step": 7114 + }, + { + "epoch": 0.04, + "global_step": 7115, + "learning_rate": 0.0004711393989983306, + "loss": 1.7253, + "loss_base2": 2.4891, + "loss_pixel": 0.1875, + "loss_text": 1.5378, + "ppl": 5.6142, + "step": 7115 + }, + { + "epoch": 0.04, + "global_step": 7116, + "learning_rate": 0.000471135225375626, + "loss": 1.6847, + "loss_base2": 2.4305, + "loss_pixel": 0.1839, + "loss_text": 1.5008, + "ppl": 5.3908, + "step": 7116 + }, + { + "epoch": 0.04, + "global_step": 7117, + "learning_rate": 0.0004711310517529215, + "loss": 1.6857, + "loss_base2": 2.432, + "loss_pixel": 0.1842, + "loss_text": 1.5016, + "ppl": 5.3962, + "step": 7117 + }, + { + "epoch": 0.04, + "global_step": 7118, + "learning_rate": 0.000471126878130217, + "loss": 1.6781, + "loss_base2": 2.421, + "loss_pixel": 0.1847, + "loss_text": 1.4934, + "ppl": 5.3554, + "step": 7118 + }, + { + "epoch": 0.04, + "global_step": 7119, + "learning_rate": 0.00047112270450751253, + "loss": 1.6903, + "loss_base2": 2.4386, + "loss_pixel": 0.1824, + "loss_text": 1.5079, + "ppl": 5.4211, + "step": 7119 + }, + { + "epoch": 0.04, + "global_step": 7120, + "learning_rate": 0.00047111853088480804, + "loss": 1.6759, + "loss_base2": 2.4178, + "loss_pixel": 0.1831, + "loss_text": 1.4928, + "ppl": 5.3436, + "step": 7120 + }, + { + "epoch": 0.04, + "global_step": 7121, + "learning_rate": 0.0004711143572621035, + "loss": 1.6904, + "loss_base2": 2.4387, + "loss_pixel": 0.1853, + "loss_text": 1.5051, + "ppl": 5.4216, + "step": 7121 + }, + { + "epoch": 0.04, + "global_step": 7122, + "learning_rate": 0.000471110183639399, + "loss": 1.7009, + "loss_base2": 2.4539, + "loss_pixel": 0.1827, + "loss_text": 1.5182, + "ppl": 5.4789, + "step": 7122 + }, + { + "epoch": 0.04, + "global_step": 7123, + "learning_rate": 0.0004711060100166945, + "loss": 1.6957, + "loss_base2": 2.4464, + "loss_pixel": 0.1819, + "loss_text": 1.5138, + "ppl": 5.4505, + "step": 7123 + }, + { + "epoch": 0.04, + "global_step": 7124, + "learning_rate": 0.00047110183639399, + "loss": 1.701, + "loss_base2": 2.454, + "loss_pixel": 0.1827, + "loss_text": 1.5184, + "ppl": 5.4794, + "step": 7124 + }, + { + "epoch": 0.04, + "global_step": 7125, + "learning_rate": 0.00047109766277128546, + "loss": 1.6934, + "loss_base2": 2.4431, + "loss_pixel": 0.1821, + "loss_text": 1.5114, + "ppl": 5.4379, + "step": 7125 + }, + { + "epoch": 0.04, + "global_step": 7126, + "learning_rate": 0.00047109348914858097, + "loss": 1.6878, + "loss_base2": 2.435, + "loss_pixel": 0.183, + "loss_text": 1.5048, + "ppl": 5.4076, + "step": 7126 + }, + { + "epoch": 0.04, + "global_step": 7127, + "learning_rate": 0.0004710893155258765, + "loss": 1.6926, + "loss_base2": 2.4419, + "loss_pixel": 0.1804, + "loss_text": 1.5122, + "ppl": 5.4336, + "step": 7127 + }, + { + "epoch": 0.04, + "global_step": 7128, + "learning_rate": 0.000471085141903172, + "loss": 1.6923, + "loss_base2": 2.4415, + "loss_pixel": 0.1822, + "loss_text": 1.51, + "ppl": 5.432, + "step": 7128 + }, + { + "epoch": 0.04, + "global_step": 7129, + "learning_rate": 0.0004710809682804675, + "loss": 1.6873, + "loss_base2": 2.4343, + "loss_pixel": 0.1812, + "loss_text": 1.506, + "ppl": 5.4049, + "step": 7129 + }, + { + "epoch": 0.04, + "global_step": 7130, + "learning_rate": 0.00047107679465776295, + "loss": 1.6855, + "loss_base2": 2.4317, + "loss_pixel": 0.1828, + "loss_text": 1.5027, + "ppl": 5.3951, + "step": 7130 + }, + { + "epoch": 0.04, + "global_step": 7131, + "learning_rate": 0.00047107262103505845, + "loss": 1.6949, + "loss_base2": 2.4452, + "loss_pixel": 0.181, + "loss_text": 1.5139, + "ppl": 5.4461, + "step": 7131 + }, + { + "epoch": 0.04, + "global_step": 7132, + "learning_rate": 0.00047106844741235396, + "loss": 1.7064, + "loss_base2": 2.4618, + "loss_pixel": 0.1834, + "loss_text": 1.5231, + "ppl": 5.5091, + "step": 7132 + }, + { + "epoch": 0.04, + "global_step": 7133, + "learning_rate": 0.00047106427378964947, + "loss": 1.6834, + "loss_base2": 2.4286, + "loss_pixel": 0.183, + "loss_text": 1.5003, + "ppl": 5.3838, + "step": 7133 + }, + { + "epoch": 0.04, + "global_step": 7134, + "learning_rate": 0.00047106010016694487, + "loss": 1.6992, + "loss_base2": 2.4514, + "loss_pixel": 0.182, + "loss_text": 1.5172, + "ppl": 5.4696, + "step": 7134 + }, + { + "epoch": 0.04, + "global_step": 7135, + "learning_rate": 0.0004710559265442404, + "loss": 1.6919, + "loss_base2": 2.4409, + "loss_pixel": 0.1815, + "loss_text": 1.5104, + "ppl": 5.4298, + "step": 7135 + }, + { + "epoch": 0.04, + "global_step": 7136, + "learning_rate": 0.0004710517529215359, + "loss": 1.6751, + "loss_base2": 2.4167, + "loss_pixel": 0.1814, + "loss_text": 1.4937, + "ppl": 5.3393, + "step": 7136 + }, + { + "epoch": 0.04, + "global_step": 7137, + "learning_rate": 0.0004710475792988314, + "loss": 1.6839, + "loss_base2": 2.4294, + "loss_pixel": 0.1809, + "loss_text": 1.503, + "ppl": 5.3865, + "step": 7137 + }, + { + "epoch": 0.04, + "global_step": 7138, + "learning_rate": 0.0004710434056761269, + "loss": 1.6802, + "loss_base2": 2.424, + "loss_pixel": 0.1806, + "loss_text": 1.4996, + "ppl": 5.3666, + "step": 7138 + }, + { + "epoch": 0.04, + "global_step": 7139, + "learning_rate": 0.00047103923205342235, + "loss": 1.6889, + "loss_base2": 2.4366, + "loss_pixel": 0.1808, + "loss_text": 1.5081, + "ppl": 5.4135, + "step": 7139 + }, + { + "epoch": 0.04, + "global_step": 7140, + "learning_rate": 0.00047103505843071786, + "loss": 1.6981, + "loss_base2": 2.4498, + "loss_pixel": 0.1804, + "loss_text": 1.5177, + "ppl": 5.4636, + "step": 7140 + }, + { + "epoch": 0.04, + "global_step": 7141, + "learning_rate": 0.00047103088480801336, + "loss": 1.6761, + "loss_base2": 2.4181, + "loss_pixel": 0.1796, + "loss_text": 1.4964, + "ppl": 5.3447, + "step": 7141 + }, + { + "epoch": 0.04, + "global_step": 7142, + "learning_rate": 0.00047102671118530887, + "loss": 1.6819, + "loss_base2": 2.4265, + "loss_pixel": 0.18, + "loss_text": 1.5018, + "ppl": 5.3758, + "step": 7142 + }, + { + "epoch": 0.04, + "global_step": 7143, + "learning_rate": 0.0004710225375626043, + "loss": 1.6976, + "loss_base2": 2.4491, + "loss_pixel": 0.1802, + "loss_text": 1.5174, + "ppl": 5.4608, + "step": 7143 + }, + { + "epoch": 0.04, + "global_step": 7144, + "learning_rate": 0.00047101836393989983, + "loss": 1.7041, + "loss_base2": 2.4585, + "loss_pixel": 0.1802, + "loss_text": 1.5239, + "ppl": 5.4964, + "step": 7144 + }, + { + "epoch": 0.04, + "global_step": 7145, + "learning_rate": 0.00047101419031719534, + "loss": 1.6913, + "loss_base2": 2.44, + "loss_pixel": 0.1797, + "loss_text": 1.5116, + "ppl": 5.4265, + "step": 7145 + }, + { + "epoch": 0.04, + "global_step": 7146, + "learning_rate": 0.00047101001669449085, + "loss": 1.6864, + "loss_base2": 2.433, + "loss_pixel": 0.1783, + "loss_text": 1.5081, + "ppl": 5.4, + "step": 7146 + }, + { + "epoch": 0.04, + "global_step": 7147, + "learning_rate": 0.00047100584307178635, + "loss": 1.6789, + "loss_base2": 2.4221, + "loss_pixel": 0.1793, + "loss_text": 1.4997, + "ppl": 5.3597, + "step": 7147 + }, + { + "epoch": 0.04, + "global_step": 7148, + "learning_rate": 0.0004710016694490818, + "loss": 1.6794, + "loss_base2": 2.4229, + "loss_pixel": 0.1794, + "loss_text": 1.5, + "ppl": 5.3623, + "step": 7148 + }, + { + "epoch": 0.04, + "global_step": 7149, + "learning_rate": 0.0004709974958263773, + "loss": 1.6841, + "loss_base2": 2.4296, + "loss_pixel": 0.1801, + "loss_text": 1.504, + "ppl": 5.3876, + "step": 7149 + }, + { + "epoch": 0.04, + "global_step": 7150, + "learning_rate": 0.0004709933222036728, + "loss": 1.6812, + "loss_base2": 2.4255, + "loss_pixel": 0.1796, + "loss_text": 1.5016, + "ppl": 5.372, + "step": 7150 + }, + { + "epoch": 0.04, + "global_step": 7151, + "learning_rate": 0.00047098914858096833, + "loss": 1.6931, + "loss_base2": 2.4426, + "loss_pixel": 0.1788, + "loss_text": 1.5143, + "ppl": 5.4363, + "step": 7151 + }, + { + "epoch": 0.04, + "global_step": 7152, + "learning_rate": 0.0004709849749582638, + "loss": 1.579, + "loss_base2": 2.278, + "loss_pixel": 0.1802, + "loss_text": 1.3988, + "ppl": 4.8501, + "step": 7152 + }, + { + "epoch": 0.04, + "global_step": 7153, + "learning_rate": 0.00047098080133555924, + "loss": 1.4783, + "loss_base2": 2.1327, + "loss_pixel": 0.1786, + "loss_text": 1.2997, + "ppl": 4.3855, + "step": 7153 + }, + { + "epoch": 0.04, + "global_step": 7154, + "learning_rate": 0.00047097662771285474, + "loss": 1.4766, + "loss_base2": 2.1303, + "loss_pixel": 0.1799, + "loss_text": 1.2966, + "ppl": 4.378, + "step": 7154 + }, + { + "epoch": 0.04, + "global_step": 7155, + "learning_rate": 0.00047097245409015025, + "loss": 1.4598, + "loss_base2": 2.106, + "loss_pixel": 0.1791, + "loss_text": 1.2807, + "ppl": 4.3051, + "step": 7155 + }, + { + "epoch": 0.04, + "global_step": 7156, + "learning_rate": 0.00047096828046744576, + "loss": 1.4643, + "loss_base2": 2.1125, + "loss_pixel": 0.1788, + "loss_text": 1.2855, + "ppl": 4.3245, + "step": 7156 + }, + { + "epoch": 0.04, + "global_step": 7157, + "learning_rate": 0.0004709641068447412, + "loss": 1.4555, + "loss_base2": 2.0998, + "loss_pixel": 0.1786, + "loss_text": 1.2768, + "ppl": 4.2866, + "step": 7157 + }, + { + "epoch": 0.04, + "global_step": 7158, + "learning_rate": 0.0004709599332220367, + "loss": 1.4522, + "loss_base2": 2.0951, + "loss_pixel": 0.1785, + "loss_text": 1.2738, + "ppl": 4.2725, + "step": 7158 + }, + { + "epoch": 0.04, + "global_step": 7159, + "learning_rate": 0.0004709557595993322, + "loss": 1.465, + "loss_base2": 2.1135, + "loss_pixel": 0.1801, + "loss_text": 1.2848, + "ppl": 4.3275, + "step": 7159 + }, + { + "epoch": 0.04, + "global_step": 7160, + "learning_rate": 0.00047095158597662773, + "loss": 1.5552, + "loss_base2": 2.2437, + "loss_pixel": 0.1787, + "loss_text": 1.3766, + "ppl": 4.736, + "step": 7160 + }, + { + "epoch": 0.04, + "global_step": 7161, + "learning_rate": 0.0004709474123539232, + "loss": 1.6821, + "loss_base2": 2.4268, + "loss_pixel": 0.1789, + "loss_text": 1.5032, + "ppl": 5.3768, + "step": 7161 + }, + { + "epoch": 0.04, + "global_step": 7162, + "learning_rate": 0.0004709432387312187, + "loss": 1.707, + "loss_base2": 2.4627, + "loss_pixel": 0.1785, + "loss_text": 1.5285, + "ppl": 5.5124, + "step": 7162 + }, + { + "epoch": 0.04, + "global_step": 7163, + "learning_rate": 0.0004709390651085142, + "loss": 1.6631, + "loss_base2": 2.3993, + "loss_pixel": 0.1788, + "loss_text": 1.4844, + "ppl": 5.2756, + "step": 7163 + }, + { + "epoch": 0.04, + "global_step": 7164, + "learning_rate": 0.0004709348914858097, + "loss": 1.7008, + "loss_base2": 2.4537, + "loss_pixel": 0.1787, + "loss_text": 1.5221, + "ppl": 5.4783, + "step": 7164 + }, + { + "epoch": 0.04, + "global_step": 7165, + "learning_rate": 0.0004709307178631052, + "loss": 1.6925, + "loss_base2": 2.4418, + "loss_pixel": 0.1778, + "loss_text": 1.5147, + "ppl": 5.433, + "step": 7165 + }, + { + "epoch": 0.04, + "global_step": 7166, + "learning_rate": 0.00047092654424040067, + "loss": 1.6868, + "loss_base2": 2.4335, + "loss_pixel": 0.1802, + "loss_text": 1.5066, + "ppl": 5.4022, + "step": 7166 + }, + { + "epoch": 0.04, + "global_step": 7167, + "learning_rate": 0.0004709223706176962, + "loss": 1.6845, + "loss_base2": 2.4302, + "loss_pixel": 0.1791, + "loss_text": 1.5054, + "ppl": 5.3898, + "step": 7167 + }, + { + "epoch": 0.04, + "global_step": 7168, + "learning_rate": 0.0004709181969949917, + "loss": 1.699, + "loss_base2": 2.4511, + "loss_pixel": 0.1808, + "loss_text": 1.5182, + "ppl": 5.4685, + "step": 7168 + }, + { + "epoch": 0.04, + "global_step": 7169, + "learning_rate": 0.0004709140233722872, + "loss": 1.6958, + "loss_base2": 2.4465, + "loss_pixel": 0.1802, + "loss_text": 1.5157, + "ppl": 5.451, + "step": 7169 + }, + { + "epoch": 0.04, + "global_step": 7170, + "learning_rate": 0.0004709098497495827, + "loss": 1.6864, + "loss_base2": 2.433, + "loss_pixel": 0.1795, + "loss_text": 1.5068, + "ppl": 5.4, + "step": 7170 + }, + { + "epoch": 0.04, + "global_step": 7171, + "learning_rate": 0.00047090567612687815, + "loss": 1.7001, + "loss_base2": 2.4527, + "loss_pixel": 0.1785, + "loss_text": 1.5217, + "ppl": 5.4745, + "step": 7171 + }, + { + "epoch": 0.04, + "global_step": 7172, + "learning_rate": 0.0004709015025041736, + "loss": 1.6923, + "loss_base2": 2.4415, + "loss_pixel": 0.1795, + "loss_text": 1.5129, + "ppl": 5.432, + "step": 7172 + }, + { + "epoch": 0.04, + "global_step": 7173, + "learning_rate": 0.0004708973288814691, + "loss": 1.6853, + "loss_base2": 2.4314, + "loss_pixel": 0.1776, + "loss_text": 1.5077, + "ppl": 5.3941, + "step": 7173 + }, + { + "epoch": 0.04, + "global_step": 7174, + "learning_rate": 0.0004708931552587646, + "loss": 1.6886, + "loss_base2": 2.4361, + "loss_pixel": 0.1794, + "loss_text": 1.5092, + "ppl": 5.4119, + "step": 7174 + }, + { + "epoch": 0.04, + "global_step": 7175, + "learning_rate": 0.00047088898163606007, + "loss": 1.6704, + "loss_base2": 2.4099, + "loss_pixel": 0.1786, + "loss_text": 1.4919, + "ppl": 5.3143, + "step": 7175 + }, + { + "epoch": 0.04, + "global_step": 7176, + "learning_rate": 0.0004708848080133556, + "loss": 1.6751, + "loss_base2": 2.4167, + "loss_pixel": 0.1781, + "loss_text": 1.497, + "ppl": 5.3393, + "step": 7176 + }, + { + "epoch": 0.04, + "global_step": 7177, + "learning_rate": 0.0004708806343906511, + "loss": 1.6967, + "loss_base2": 2.4478, + "loss_pixel": 0.1809, + "loss_text": 1.5158, + "ppl": 5.4559, + "step": 7177 + }, + { + "epoch": 0.04, + "global_step": 7178, + "learning_rate": 0.0004708764607679466, + "loss": 1.6791, + "loss_base2": 2.4224, + "loss_pixel": 0.1782, + "loss_text": 1.5009, + "ppl": 5.3607, + "step": 7178 + }, + { + "epoch": 0.04, + "global_step": 7179, + "learning_rate": 0.0004708722871452421, + "loss": 1.668, + "loss_base2": 2.4064, + "loss_pixel": 0.1786, + "loss_text": 1.4894, + "ppl": 5.3016, + "step": 7179 + }, + { + "epoch": 0.04, + "global_step": 7180, + "learning_rate": 0.00047086811352253755, + "loss": 1.6856, + "loss_base2": 2.4318, + "loss_pixel": 0.1797, + "loss_text": 1.5059, + "ppl": 5.3957, + "step": 7180 + }, + { + "epoch": 0.04, + "global_step": 7181, + "learning_rate": 0.00047086393989983306, + "loss": 1.6752, + "loss_base2": 2.4168, + "loss_pixel": 0.1784, + "loss_text": 1.4968, + "ppl": 5.3399, + "step": 7181 + }, + { + "epoch": 0.04, + "global_step": 7182, + "learning_rate": 0.00047085976627712857, + "loss": 1.7033, + "loss_base2": 2.4573, + "loss_pixel": 0.1781, + "loss_text": 1.5253, + "ppl": 5.492, + "step": 7182 + }, + { + "epoch": 0.04, + "global_step": 7183, + "learning_rate": 0.0004708555926544241, + "loss": 1.6904, + "loss_base2": 2.4387, + "loss_pixel": 0.1782, + "loss_text": 1.5122, + "ppl": 5.4216, + "step": 7183 + }, + { + "epoch": 0.04, + "global_step": 7184, + "learning_rate": 0.00047085141903171953, + "loss": 1.6893, + "loss_base2": 2.4371, + "loss_pixel": 0.1779, + "loss_text": 1.5114, + "ppl": 5.4157, + "step": 7184 + }, + { + "epoch": 0.04, + "global_step": 7185, + "learning_rate": 0.00047084724540901504, + "loss": 1.5612, + "loss_base2": 2.2523, + "loss_pixel": 0.1796, + "loss_text": 1.3816, + "ppl": 4.7645, + "step": 7185 + }, + { + "epoch": 0.04, + "global_step": 7186, + "learning_rate": 0.00047084307178631054, + "loss": 1.4644, + "loss_base2": 2.1127, + "loss_pixel": 0.1799, + "loss_text": 1.2845, + "ppl": 4.3249, + "step": 7186 + }, + { + "epoch": 0.04, + "global_step": 7187, + "learning_rate": 0.00047083889816360605, + "loss": 1.4653, + "loss_base2": 2.114, + "loss_pixel": 0.1791, + "loss_text": 1.2862, + "ppl": 4.3288, + "step": 7187 + }, + { + "epoch": 0.04, + "global_step": 7188, + "learning_rate": 0.00047083472454090156, + "loss": 1.462, + "loss_base2": 2.1092, + "loss_pixel": 0.1782, + "loss_text": 1.2839, + "ppl": 4.3146, + "step": 7188 + }, + { + "epoch": 0.04, + "global_step": 7189, + "learning_rate": 0.000470830550918197, + "loss": 1.4675, + "loss_base2": 2.1172, + "loss_pixel": 0.1784, + "loss_text": 1.2891, + "ppl": 4.3384, + "step": 7189 + }, + { + "epoch": 0.04, + "global_step": 7190, + "learning_rate": 0.0004708263772954925, + "loss": 1.4543, + "loss_base2": 2.0981, + "loss_pixel": 0.179, + "loss_text": 1.2753, + "ppl": 4.2815, + "step": 7190 + }, + { + "epoch": 0.04, + "global_step": 7191, + "learning_rate": 0.00047082220367278797, + "loss": 1.4546, + "loss_base2": 2.0985, + "loss_pixel": 0.1796, + "loss_text": 1.2749, + "ppl": 4.2828, + "step": 7191 + }, + { + "epoch": 0.04, + "global_step": 7192, + "learning_rate": 0.0004708180300500835, + "loss": 1.514, + "loss_base2": 2.1842, + "loss_pixel": 0.1789, + "loss_text": 1.3351, + "ppl": 4.5449, + "step": 7192 + }, + { + "epoch": 0.04, + "global_step": 7193, + "learning_rate": 0.00047081385642737893, + "loss": 1.5299, + "loss_base2": 2.2072, + "loss_pixel": 0.179, + "loss_text": 1.3509, + "ppl": 4.6177, + "step": 7193 + }, + { + "epoch": 0.04, + "global_step": 7194, + "learning_rate": 0.00047080968280467444, + "loss": 1.4539, + "loss_base2": 2.0975, + "loss_pixel": 0.1782, + "loss_text": 1.2758, + "ppl": 4.2798, + "step": 7194 + }, + { + "epoch": 0.04, + "global_step": 7195, + "learning_rate": 0.00047080550918196995, + "loss": 1.4294, + "loss_base2": 2.0622, + "loss_pixel": 0.1783, + "loss_text": 1.251, + "ppl": 4.1762, + "step": 7195 + }, + { + "epoch": 0.04, + "global_step": 7196, + "learning_rate": 0.00047080133555926545, + "loss": 1.4488, + "loss_base2": 2.0902, + "loss_pixel": 0.1773, + "loss_text": 1.2715, + "ppl": 4.258, + "step": 7196 + }, + { + "epoch": 0.04, + "global_step": 7197, + "learning_rate": 0.00047079716193656096, + "loss": 1.4593, + "loss_base2": 2.1053, + "loss_pixel": 0.1782, + "loss_text": 1.2811, + "ppl": 4.3029, + "step": 7197 + }, + { + "epoch": 0.04, + "global_step": 7198, + "learning_rate": 0.0004707929883138564, + "loss": 1.4374, + "loss_base2": 2.0737, + "loss_pixel": 0.1782, + "loss_text": 1.2591, + "ppl": 4.2097, + "step": 7198 + }, + { + "epoch": 0.04, + "global_step": 7199, + "learning_rate": 0.0004707888146911519, + "loss": 1.474, + "loss_base2": 2.1265, + "loss_pixel": 0.1797, + "loss_text": 1.2944, + "ppl": 4.3667, + "step": 7199 + }, + { + "epoch": 0.04, + "global_step": 7200, + "learning_rate": 0.00047078464106844743, + "loss": 1.4498, + "loss_base2": 2.0916, + "loss_pixel": 0.178, + "loss_text": 1.2718, + "ppl": 4.2623, + "step": 7200 + }, + { + "epoch": 0.04, + "global_step": 7201, + "learning_rate": 0.00047078046744574294, + "loss": 1.4702, + "loss_base2": 2.1211, + "loss_pixel": 0.1781, + "loss_text": 1.2921, + "ppl": 4.3501, + "step": 7201 + }, + { + "epoch": 0.04, + "global_step": 7202, + "learning_rate": 0.0004707762938230384, + "loss": 1.4687, + "loss_base2": 2.1189, + "loss_pixel": 0.1781, + "loss_text": 1.2907, + "ppl": 4.3436, + "step": 7202 + }, + { + "epoch": 0.04, + "global_step": 7203, + "learning_rate": 0.0004707721202003339, + "loss": 1.4491, + "loss_base2": 2.0906, + "loss_pixel": 0.1772, + "loss_text": 1.2719, + "ppl": 4.2593, + "step": 7203 + }, + { + "epoch": 0.04, + "global_step": 7204, + "learning_rate": 0.0004707679465776294, + "loss": 1.4643, + "loss_base2": 2.1125, + "loss_pixel": 0.1785, + "loss_text": 1.2858, + "ppl": 4.3245, + "step": 7204 + }, + { + "epoch": 0.04, + "global_step": 7205, + "learning_rate": 0.0004707637729549249, + "loss": 1.4308, + "loss_base2": 2.0642, + "loss_pixel": 0.1774, + "loss_text": 1.2534, + "ppl": 4.182, + "step": 7205 + }, + { + "epoch": 0.04, + "global_step": 7206, + "learning_rate": 0.0004707595993322204, + "loss": 1.4536, + "loss_base2": 2.0971, + "loss_pixel": 0.1787, + "loss_text": 1.2749, + "ppl": 4.2785, + "step": 7206 + }, + { + "epoch": 0.04, + "global_step": 7207, + "learning_rate": 0.00047075542570951587, + "loss": 1.4848, + "loss_base2": 2.1421, + "loss_pixel": 0.1805, + "loss_text": 1.3044, + "ppl": 4.4141, + "step": 7207 + }, + { + "epoch": 0.04, + "global_step": 7208, + "learning_rate": 0.0004707512520868114, + "loss": 1.4313, + "loss_base2": 2.0649, + "loss_pixel": 0.1779, + "loss_text": 1.2534, + "ppl": 4.1841, + "step": 7208 + }, + { + "epoch": 0.04, + "global_step": 7209, + "learning_rate": 0.0004707470784641069, + "loss": 1.4769, + "loss_base2": 2.1307, + "loss_pixel": 0.1785, + "loss_text": 1.2984, + "ppl": 4.3793, + "step": 7209 + }, + { + "epoch": 0.04, + "global_step": 7210, + "learning_rate": 0.00047074290484140234, + "loss": 1.4366, + "loss_base2": 2.0726, + "loss_pixel": 0.1783, + "loss_text": 1.2583, + "ppl": 4.2064, + "step": 7210 + }, + { + "epoch": 0.04, + "global_step": 7211, + "learning_rate": 0.0004707387312186978, + "loss": 1.4488, + "loss_base2": 2.0902, + "loss_pixel": 0.1787, + "loss_text": 1.2701, + "ppl": 4.258, + "step": 7211 + }, + { + "epoch": 0.04, + "global_step": 7212, + "learning_rate": 0.0004707345575959933, + "loss": 1.4479, + "loss_base2": 2.0889, + "loss_pixel": 0.1786, + "loss_text": 1.2693, + "ppl": 4.2542, + "step": 7212 + }, + { + "epoch": 0.04, + "global_step": 7213, + "learning_rate": 0.0004707303839732888, + "loss": 1.4434, + "loss_base2": 2.0824, + "loss_pixel": 0.1778, + "loss_text": 1.2656, + "ppl": 4.2351, + "step": 7213 + }, + { + "epoch": 0.04, + "global_step": 7214, + "learning_rate": 0.0004707262103505843, + "loss": 1.4714, + "loss_base2": 2.1228, + "loss_pixel": 0.1785, + "loss_text": 1.2929, + "ppl": 4.3553, + "step": 7214 + }, + { + "epoch": 0.04, + "global_step": 7215, + "learning_rate": 0.0004707220367278798, + "loss": 1.4611, + "loss_base2": 2.1079, + "loss_pixel": 0.1794, + "loss_text": 1.2816, + "ppl": 4.3107, + "step": 7215 + }, + { + "epoch": 0.04, + "global_step": 7216, + "learning_rate": 0.0004707178631051753, + "loss": 1.4387, + "loss_base2": 2.0756, + "loss_pixel": 0.1806, + "loss_text": 1.2581, + "ppl": 4.2152, + "step": 7216 + }, + { + "epoch": 0.04, + "global_step": 7217, + "learning_rate": 0.0004707136894824708, + "loss": 1.5796, + "loss_base2": 2.2789, + "loss_pixel": 0.1794, + "loss_text": 1.4002, + "ppl": 4.853, + "step": 7217 + }, + { + "epoch": 0.04, + "global_step": 7218, + "learning_rate": 0.0004707095158597663, + "loss": 1.6854, + "loss_base2": 2.4315, + "loss_pixel": 0.1795, + "loss_text": 1.5059, + "ppl": 5.3946, + "step": 7218 + }, + { + "epoch": 0.04, + "global_step": 7219, + "learning_rate": 0.0004707053422370618, + "loss": 1.6978, + "loss_base2": 2.4494, + "loss_pixel": 0.1792, + "loss_text": 1.5186, + "ppl": 5.4619, + "step": 7219 + }, + { + "epoch": 0.04, + "global_step": 7220, + "learning_rate": 0.00047070116861435725, + "loss": 1.6988, + "loss_base2": 2.4509, + "loss_pixel": 0.181, + "loss_text": 1.5179, + "ppl": 5.4674, + "step": 7220 + }, + { + "epoch": 0.04, + "global_step": 7221, + "learning_rate": 0.00047069699499165276, + "loss": 1.7086, + "loss_base2": 2.465, + "loss_pixel": 0.1888, + "loss_text": 1.5197, + "ppl": 5.5212, + "step": 7221 + }, + { + "epoch": 0.04, + "global_step": 7222, + "learning_rate": 0.00047069282136894826, + "loss": 1.6993, + "loss_base2": 2.4516, + "loss_pixel": 0.1871, + "loss_text": 1.5122, + "ppl": 5.4701, + "step": 7222 + }, + { + "epoch": 0.04, + "global_step": 7223, + "learning_rate": 0.00047068864774624377, + "loss": 1.6953, + "loss_base2": 2.4458, + "loss_pixel": 0.1806, + "loss_text": 1.5147, + "ppl": 5.4483, + "step": 7223 + }, + { + "epoch": 0.04, + "global_step": 7224, + "learning_rate": 0.0004706844741235393, + "loss": 1.698, + "loss_base2": 2.4497, + "loss_pixel": 0.1739, + "loss_text": 1.5242, + "ppl": 5.463, + "step": 7224 + }, + { + "epoch": 0.04, + "global_step": 7225, + "learning_rate": 0.00047068030050083473, + "loss": 1.7019, + "loss_base2": 2.4553, + "loss_pixel": 0.174, + "loss_text": 1.5279, + "ppl": 5.4844, + "step": 7225 + }, + { + "epoch": 0.04, + "global_step": 7226, + "learning_rate": 0.00047067612687813024, + "loss": 1.6951, + "loss_base2": 2.4455, + "loss_pixel": 0.174, + "loss_text": 1.5211, + "ppl": 5.4472, + "step": 7226 + }, + { + "epoch": 0.04, + "global_step": 7227, + "learning_rate": 0.00047067195325542575, + "loss": 1.6618, + "loss_base2": 2.3975, + "loss_pixel": 0.1729, + "loss_text": 1.4889, + "ppl": 5.2688, + "step": 7227 + }, + { + "epoch": 0.04, + "global_step": 7228, + "learning_rate": 0.0004706677796327212, + "loss": 1.7001, + "loss_base2": 2.4527, + "loss_pixel": 0.1756, + "loss_text": 1.5244, + "ppl": 5.4745, + "step": 7228 + }, + { + "epoch": 0.04, + "global_step": 7229, + "learning_rate": 0.0004706636060100167, + "loss": 1.6874, + "loss_base2": 2.4344, + "loss_pixel": 0.1743, + "loss_text": 1.5131, + "ppl": 5.4054, + "step": 7229 + }, + { + "epoch": 0.04, + "global_step": 7230, + "learning_rate": 0.00047065943238731216, + "loss": 1.6776, + "loss_base2": 2.4203, + "loss_pixel": 0.1719, + "loss_text": 1.5056, + "ppl": 5.3527, + "step": 7230 + }, + { + "epoch": 0.04, + "global_step": 7231, + "learning_rate": 0.00047065525876460767, + "loss": 1.6828, + "loss_base2": 2.4278, + "loss_pixel": 0.1718, + "loss_text": 1.511, + "ppl": 5.3806, + "step": 7231 + }, + { + "epoch": 0.04, + "global_step": 7232, + "learning_rate": 0.0004706510851419032, + "loss": 1.6836, + "loss_base2": 2.4289, + "loss_pixel": 0.1715, + "loss_text": 1.5121, + "ppl": 5.3849, + "step": 7232 + }, + { + "epoch": 0.04, + "global_step": 7233, + "learning_rate": 0.0004706469115191987, + "loss": 1.6768, + "loss_base2": 2.4191, + "loss_pixel": 0.1714, + "loss_text": 1.5054, + "ppl": 5.3484, + "step": 7233 + }, + { + "epoch": 0.04, + "global_step": 7234, + "learning_rate": 0.00047064273789649414, + "loss": 1.6933, + "loss_base2": 2.4429, + "loss_pixel": 0.1714, + "loss_text": 1.5219, + "ppl": 5.4374, + "step": 7234 + }, + { + "epoch": 0.04, + "global_step": 7235, + "learning_rate": 0.00047063856427378964, + "loss": 1.668, + "loss_base2": 2.4064, + "loss_pixel": 0.1686, + "loss_text": 1.4994, + "ppl": 5.3016, + "step": 7235 + }, + { + "epoch": 0.04, + "global_step": 7236, + "learning_rate": 0.00047063439065108515, + "loss": 1.6789, + "loss_base2": 2.4221, + "loss_pixel": 0.1704, + "loss_text": 1.5086, + "ppl": 5.3597, + "step": 7236 + }, + { + "epoch": 0.04, + "global_step": 7237, + "learning_rate": 0.00047063021702838066, + "loss": 1.6665, + "loss_base2": 2.4043, + "loss_pixel": 0.169, + "loss_text": 1.4976, + "ppl": 5.2936, + "step": 7237 + }, + { + "epoch": 0.04, + "global_step": 7238, + "learning_rate": 0.00047062604340567616, + "loss": 1.6855, + "loss_base2": 2.4317, + "loss_pixel": 0.1705, + "loss_text": 1.515, + "ppl": 5.3951, + "step": 7238 + }, + { + "epoch": 0.04, + "global_step": 7239, + "learning_rate": 0.0004706218697829716, + "loss": 1.6749, + "loss_base2": 2.4164, + "loss_pixel": 0.1717, + "loss_text": 1.5033, + "ppl": 5.3383, + "step": 7239 + }, + { + "epoch": 0.04, + "global_step": 7240, + "learning_rate": 0.0004706176961602671, + "loss": 1.5624, + "loss_base2": 2.2541, + "loss_pixel": 0.1719, + "loss_text": 1.3906, + "ppl": 4.7703, + "step": 7240 + }, + { + "epoch": 0.04, + "global_step": 7241, + "learning_rate": 0.00047061352253756263, + "loss": 1.4639, + "loss_base2": 2.112, + "loss_pixel": 0.1709, + "loss_text": 1.293, + "ppl": 4.3228, + "step": 7241 + }, + { + "epoch": 0.04, + "global_step": 7242, + "learning_rate": 0.00047060934891485814, + "loss": 1.4463, + "loss_base2": 2.0866, + "loss_pixel": 0.1714, + "loss_text": 1.2749, + "ppl": 4.2474, + "step": 7242 + }, + { + "epoch": 0.04, + "global_step": 7243, + "learning_rate": 0.0004706051752921536, + "loss": 1.4676, + "loss_base2": 2.1173, + "loss_pixel": 0.1705, + "loss_text": 1.2971, + "ppl": 4.3388, + "step": 7243 + }, + { + "epoch": 0.04, + "global_step": 7244, + "learning_rate": 0.0004706010016694491, + "loss": 1.4624, + "loss_base2": 2.1098, + "loss_pixel": 0.171, + "loss_text": 1.2914, + "ppl": 4.3163, + "step": 7244 + }, + { + "epoch": 0.04, + "global_step": 7245, + "learning_rate": 0.0004705968280467446, + "loss": 1.4377, + "loss_base2": 2.0742, + "loss_pixel": 0.1721, + "loss_text": 1.2655, + "ppl": 4.211, + "step": 7245 + }, + { + "epoch": 0.04, + "global_step": 7246, + "learning_rate": 0.0004705926544240401, + "loss": 1.4474, + "loss_base2": 2.0882, + "loss_pixel": 0.1689, + "loss_text": 1.2785, + "ppl": 4.252, + "step": 7246 + }, + { + "epoch": 0.04, + "global_step": 7247, + "learning_rate": 0.00047058848080133557, + "loss": 1.4223, + "loss_base2": 2.0519, + "loss_pixel": 0.1688, + "loss_text": 1.2535, + "ppl": 4.1466, + "step": 7247 + }, + { + "epoch": 0.04, + "global_step": 7248, + "learning_rate": 0.000470584307178631, + "loss": 1.4261, + "loss_base2": 2.0574, + "loss_pixel": 0.1683, + "loss_text": 1.2579, + "ppl": 4.1624, + "step": 7248 + }, + { + "epoch": 0.04, + "global_step": 7249, + "learning_rate": 0.00047058013355592653, + "loss": 1.4517, + "loss_base2": 2.0944, + "loss_pixel": 0.1707, + "loss_text": 1.281, + "ppl": 4.2704, + "step": 7249 + }, + { + "epoch": 0.04, + "global_step": 7250, + "learning_rate": 0.00047057595993322204, + "loss": 1.43, + "loss_base2": 2.0631, + "loss_pixel": 0.1683, + "loss_text": 1.2617, + "ppl": 4.1787, + "step": 7250 + }, + { + "epoch": 0.04, + "global_step": 7251, + "learning_rate": 0.00047057178631051754, + "loss": 1.4589, + "loss_base2": 2.1047, + "loss_pixel": 0.172, + "loss_text": 1.2869, + "ppl": 4.3012, + "step": 7251 + }, + { + "epoch": 0.04, + "global_step": 7252, + "learning_rate": 0.000470567612687813, + "loss": 1.4461, + "loss_base2": 2.0863, + "loss_pixel": 0.1698, + "loss_text": 1.2763, + "ppl": 4.2465, + "step": 7252 + }, + { + "epoch": 0.04, + "global_step": 7253, + "learning_rate": 0.0004705634390651085, + "loss": 1.4412, + "loss_base2": 2.0792, + "loss_pixel": 0.1699, + "loss_text": 1.2714, + "ppl": 4.2258, + "step": 7253 + }, + { + "epoch": 0.04, + "global_step": 7254, + "learning_rate": 0.000470559265442404, + "loss": 1.4593, + "loss_base2": 2.1053, + "loss_pixel": 0.1812, + "loss_text": 1.2781, + "ppl": 4.3029, + "step": 7254 + }, + { + "epoch": 0.04, + "global_step": 7255, + "learning_rate": 0.0004705550918196995, + "loss": 1.4674, + "loss_base2": 2.117, + "loss_pixel": 0.1889, + "loss_text": 1.2785, + "ppl": 4.3379, + "step": 7255 + }, + { + "epoch": 0.04, + "global_step": 7256, + "learning_rate": 0.000470550918196995, + "loss": 1.5545, + "loss_base2": 2.2427, + "loss_pixel": 0.187, + "loss_text": 1.3675, + "ppl": 4.7327, + "step": 7256 + }, + { + "epoch": 0.04, + "global_step": 7257, + "learning_rate": 0.0004705467445742905, + "loss": 1.675, + "loss_base2": 2.4165, + "loss_pixel": 0.1866, + "loss_text": 1.4884, + "ppl": 5.3388, + "step": 7257 + }, + { + "epoch": 0.04, + "global_step": 7258, + "learning_rate": 0.000470542570951586, + "loss": 1.7321, + "loss_base2": 2.4989, + "loss_pixel": 0.1864, + "loss_text": 1.5457, + "ppl": 5.6525, + "step": 7258 + }, + { + "epoch": 0.04, + "global_step": 7259, + "learning_rate": 0.0004705383973288815, + "loss": 1.6992, + "loss_base2": 2.4514, + "loss_pixel": 0.1873, + "loss_text": 1.5119, + "ppl": 5.4696, + "step": 7259 + }, + { + "epoch": 0.04, + "global_step": 7260, + "learning_rate": 0.000470534223706177, + "loss": 1.7113, + "loss_base2": 2.4689, + "loss_pixel": 0.1872, + "loss_text": 1.5242, + "ppl": 5.5362, + "step": 7260 + }, + { + "epoch": 0.04, + "global_step": 7261, + "learning_rate": 0.00047053005008347245, + "loss": 1.6939, + "loss_base2": 2.4438, + "loss_pixel": 0.1847, + "loss_text": 1.5092, + "ppl": 5.4407, + "step": 7261 + }, + { + "epoch": 0.04, + "global_step": 7262, + "learning_rate": 0.00047052587646076796, + "loss": 1.6971, + "loss_base2": 2.4484, + "loss_pixel": 0.1729, + "loss_text": 1.5242, + "ppl": 5.4581, + "step": 7262 + }, + { + "epoch": 0.04, + "global_step": 7263, + "learning_rate": 0.00047052170283806347, + "loss": 1.6649, + "loss_base2": 2.4019, + "loss_pixel": 0.1713, + "loss_text": 1.4936, + "ppl": 5.2851, + "step": 7263 + }, + { + "epoch": 0.04, + "global_step": 7264, + "learning_rate": 0.000470517529215359, + "loss": 1.6871, + "loss_base2": 2.434, + "loss_pixel": 0.1724, + "loss_text": 1.5146, + "ppl": 5.4038, + "step": 7264 + }, + { + "epoch": 0.04, + "global_step": 7265, + "learning_rate": 0.0004705133555926545, + "loss": 1.6743, + "loss_base2": 2.4155, + "loss_pixel": 0.1722, + "loss_text": 1.5021, + "ppl": 5.3351, + "step": 7265 + }, + { + "epoch": 0.04, + "global_step": 7266, + "learning_rate": 0.0004705091819699499, + "loss": 1.6674, + "loss_base2": 2.4055, + "loss_pixel": 0.1711, + "loss_text": 1.4963, + "ppl": 5.2984, + "step": 7266 + }, + { + "epoch": 0.04, + "global_step": 7267, + "learning_rate": 0.0004705050083472454, + "loss": 1.6607, + "loss_base2": 2.3959, + "loss_pixel": 0.1717, + "loss_text": 1.4891, + "ppl": 5.263, + "step": 7267 + }, + { + "epoch": 0.04, + "global_step": 7268, + "learning_rate": 0.0004705008347245409, + "loss": 1.6706, + "loss_base2": 2.4102, + "loss_pixel": 0.1697, + "loss_text": 1.501, + "ppl": 5.3154, + "step": 7268 + }, + { + "epoch": 0.04, + "global_step": 7269, + "learning_rate": 0.0004704966611018364, + "loss": 1.6787, + "loss_base2": 2.4219, + "loss_pixel": 0.1693, + "loss_text": 1.5094, + "ppl": 5.3586, + "step": 7269 + }, + { + "epoch": 0.04, + "global_step": 7270, + "learning_rate": 0.00047049248747913186, + "loss": 1.6772, + "loss_base2": 2.4197, + "loss_pixel": 0.1701, + "loss_text": 1.5071, + "ppl": 5.3506, + "step": 7270 + }, + { + "epoch": 0.04, + "global_step": 7271, + "learning_rate": 0.00047048831385642736, + "loss": 1.6755, + "loss_base2": 2.4172, + "loss_pixel": 0.1718, + "loss_text": 1.5037, + "ppl": 5.3415, + "step": 7271 + }, + { + "epoch": 0.04, + "global_step": 7272, + "learning_rate": 0.00047048414023372287, + "loss": 1.6707, + "loss_base2": 2.4103, + "loss_pixel": 0.17, + "loss_text": 1.5007, + "ppl": 5.3159, + "step": 7272 + }, + { + "epoch": 0.04, + "global_step": 7273, + "learning_rate": 0.0004704799666110184, + "loss": 1.675, + "loss_base2": 2.4165, + "loss_pixel": 0.17, + "loss_text": 1.505, + "ppl": 5.3388, + "step": 7273 + }, + { + "epoch": 0.04, + "global_step": 7274, + "learning_rate": 0.0004704757929883139, + "loss": 1.6921, + "loss_base2": 2.4412, + "loss_pixel": 0.1695, + "loss_text": 1.5226, + "ppl": 5.4309, + "step": 7274 + }, + { + "epoch": 0.04, + "global_step": 7275, + "learning_rate": 0.00047047161936560934, + "loss": 1.6925, + "loss_base2": 2.4418, + "loss_pixel": 0.1708, + "loss_text": 1.5217, + "ppl": 5.433, + "step": 7275 + }, + { + "epoch": 0.04, + "global_step": 7276, + "learning_rate": 0.00047046744574290485, + "loss": 1.6849, + "loss_base2": 2.4308, + "loss_pixel": 0.1706, + "loss_text": 1.5143, + "ppl": 5.3919, + "step": 7276 + }, + { + "epoch": 0.04, + "global_step": 7277, + "learning_rate": 0.00047046327212020035, + "loss": 1.7064, + "loss_base2": 2.4618, + "loss_pixel": 0.1843, + "loss_text": 1.5221, + "ppl": 5.5091, + "step": 7277 + }, + { + "epoch": 0.04, + "global_step": 7278, + "learning_rate": 0.00047045909849749586, + "loss": 1.6844, + "loss_base2": 2.4301, + "loss_pixel": 0.1821, + "loss_text": 1.5023, + "ppl": 5.3892, + "step": 7278 + }, + { + "epoch": 0.04, + "global_step": 7279, + "learning_rate": 0.0004704549248747913, + "loss": 1.6789, + "loss_base2": 2.4221, + "loss_pixel": 0.1804, + "loss_text": 1.4984, + "ppl": 5.3597, + "step": 7279 + }, + { + "epoch": 0.04, + "global_step": 7280, + "learning_rate": 0.0004704507512520868, + "loss": 1.6628, + "loss_base2": 2.3989, + "loss_pixel": 0.1819, + "loss_text": 1.4809, + "ppl": 5.2741, + "step": 7280 + }, + { + "epoch": 0.04, + "global_step": 7281, + "learning_rate": 0.00047044657762938233, + "loss": 1.4805, + "loss_base2": 2.1359, + "loss_pixel": 0.1804, + "loss_text": 1.3001, + "ppl": 4.3951, + "step": 7281 + }, + { + "epoch": 0.04, + "global_step": 7282, + "learning_rate": 0.00047044240400667784, + "loss": 1.4755, + "loss_base2": 2.1287, + "loss_pixel": 0.179, + "loss_text": 1.2965, + "ppl": 4.3732, + "step": 7282 + }, + { + "epoch": 0.04, + "global_step": 7283, + "learning_rate": 0.00047043823038397334, + "loss": 1.4681, + "loss_base2": 2.118, + "loss_pixel": 0.1795, + "loss_text": 1.2886, + "ppl": 4.341, + "step": 7283 + }, + { + "epoch": 0.04, + "global_step": 7284, + "learning_rate": 0.00047043405676126874, + "loss": 1.439, + "loss_base2": 2.076, + "loss_pixel": 0.1799, + "loss_text": 1.2592, + "ppl": 4.2165, + "step": 7284 + }, + { + "epoch": 0.04, + "global_step": 7285, + "learning_rate": 0.00047042988313856425, + "loss": 1.4408, + "loss_base2": 2.0786, + "loss_pixel": 0.1808, + "loss_text": 1.2599, + "ppl": 4.2241, + "step": 7285 + }, + { + "epoch": 0.04, + "global_step": 7286, + "learning_rate": 0.00047042570951585976, + "loss": 1.4517, + "loss_base2": 2.0944, + "loss_pixel": 0.1802, + "loss_text": 1.2715, + "ppl": 4.2704, + "step": 7286 + }, + { + "epoch": 0.04, + "global_step": 7287, + "learning_rate": 0.00047042153589315526, + "loss": 1.4436, + "loss_base2": 2.0827, + "loss_pixel": 0.1785, + "loss_text": 1.2651, + "ppl": 4.2359, + "step": 7287 + }, + { + "epoch": 0.04, + "global_step": 7288, + "learning_rate": 0.00047041736227045077, + "loss": 1.4605, + "loss_base2": 2.1071, + "loss_pixel": 0.1797, + "loss_text": 1.2808, + "ppl": 4.3081, + "step": 7288 + }, + { + "epoch": 0.04, + "global_step": 7289, + "learning_rate": 0.0004704131886477462, + "loss": 1.5239, + "loss_base2": 2.1985, + "loss_pixel": 0.1803, + "loss_text": 1.3436, + "ppl": 4.5901, + "step": 7289 + }, + { + "epoch": 0.04, + "global_step": 7290, + "learning_rate": 0.00047040901502504173, + "loss": 1.6234, + "loss_base2": 2.3421, + "loss_pixel": 0.1796, + "loss_text": 1.4438, + "ppl": 5.0703, + "step": 7290 + }, + { + "epoch": 0.04, + "global_step": 7291, + "learning_rate": 0.00047040484140233724, + "loss": 1.6172, + "loss_base2": 2.3331, + "loss_pixel": 0.1794, + "loss_text": 1.4378, + "ppl": 5.039, + "step": 7291 + }, + { + "epoch": 0.04, + "global_step": 7292, + "learning_rate": 0.00047040066777963275, + "loss": 1.6227, + "loss_base2": 2.3411, + "loss_pixel": 0.1782, + "loss_text": 1.4446, + "ppl": 5.0668, + "step": 7292 + }, + { + "epoch": 0.04, + "global_step": 7293, + "learning_rate": 0.0004703964941569282, + "loss": 1.5873, + "loss_base2": 2.29, + "loss_pixel": 0.1787, + "loss_text": 1.4085, + "ppl": 4.8905, + "step": 7293 + }, + { + "epoch": 0.04, + "global_step": 7294, + "learning_rate": 0.0004703923205342237, + "loss": 1.4399, + "loss_base2": 2.0773, + "loss_pixel": 0.1781, + "loss_text": 1.2618, + "ppl": 4.2203, + "step": 7294 + }, + { + "epoch": 0.04, + "global_step": 7295, + "learning_rate": 0.0004703881469115192, + "loss": 1.4396, + "loss_base2": 2.0769, + "loss_pixel": 0.1792, + "loss_text": 1.2604, + "ppl": 4.219, + "step": 7295 + }, + { + "epoch": 0.04, + "global_step": 7296, + "learning_rate": 0.0004703839732888147, + "loss": 1.4521, + "loss_base2": 2.0949, + "loss_pixel": 0.178, + "loss_text": 1.2741, + "ppl": 4.2721, + "step": 7296 + }, + { + "epoch": 0.04, + "global_step": 7297, + "learning_rate": 0.00047037979966611023, + "loss": 1.4512, + "loss_base2": 2.0936, + "loss_pixel": 0.1797, + "loss_text": 1.2715, + "ppl": 4.2682, + "step": 7297 + }, + { + "epoch": 0.04, + "global_step": 7298, + "learning_rate": 0.0004703756260434057, + "loss": 1.4586, + "loss_base2": 2.1043, + "loss_pixel": 0.179, + "loss_text": 1.2796, + "ppl": 4.2999, + "step": 7298 + }, + { + "epoch": 0.04, + "global_step": 7299, + "learning_rate": 0.0004703714524207012, + "loss": 1.4447, + "loss_base2": 2.0843, + "loss_pixel": 0.1806, + "loss_text": 1.264, + "ppl": 4.2406, + "step": 7299 + }, + { + "epoch": 0.04, + "global_step": 7300, + "learning_rate": 0.0004703672787979967, + "loss": 1.4701, + "loss_base2": 2.1209, + "loss_pixel": 0.1802, + "loss_text": 1.2899, + "ppl": 4.3497, + "step": 7300 + }, + { + "epoch": 0.04, + "global_step": 7301, + "learning_rate": 0.0004703631051752922, + "loss": 1.4679, + "loss_base2": 2.1177, + "loss_pixel": 0.1792, + "loss_text": 1.2887, + "ppl": 4.3401, + "step": 7301 + }, + { + "epoch": 0.04, + "global_step": 7302, + "learning_rate": 0.00047035893155258766, + "loss": 1.4395, + "loss_base2": 2.0768, + "loss_pixel": 0.1788, + "loss_text": 1.2608, + "ppl": 4.2186, + "step": 7302 + }, + { + "epoch": 0.04, + "global_step": 7303, + "learning_rate": 0.0004703547579298831, + "loss": 1.4516, + "loss_base2": 2.0942, + "loss_pixel": 0.1773, + "loss_text": 1.2743, + "ppl": 4.2699, + "step": 7303 + }, + { + "epoch": 0.04, + "global_step": 7304, + "learning_rate": 0.0004703505843071786, + "loss": 1.4703, + "loss_base2": 2.1212, + "loss_pixel": 0.1778, + "loss_text": 1.2925, + "ppl": 4.3505, + "step": 7304 + }, + { + "epoch": 0.04, + "global_step": 7305, + "learning_rate": 0.0004703464106844741, + "loss": 1.4565, + "loss_base2": 2.1013, + "loss_pixel": 0.1788, + "loss_text": 1.2777, + "ppl": 4.2909, + "step": 7305 + }, + { + "epoch": 0.04, + "global_step": 7306, + "learning_rate": 0.00047034223706176963, + "loss": 1.4528, + "loss_base2": 2.0959, + "loss_pixel": 0.1781, + "loss_text": 1.2746, + "ppl": 4.2751, + "step": 7306 + }, + { + "epoch": 0.04, + "global_step": 7307, + "learning_rate": 0.0004703380634390651, + "loss": 1.4499, + "loss_base2": 2.0918, + "loss_pixel": 0.1781, + "loss_text": 1.2718, + "ppl": 4.2627, + "step": 7307 + }, + { + "epoch": 0.04, + "global_step": 7308, + "learning_rate": 0.0004703338898163606, + "loss": 1.4389, + "loss_base2": 2.0759, + "loss_pixel": 0.1782, + "loss_text": 1.2606, + "ppl": 4.2161, + "step": 7308 + }, + { + "epoch": 0.04, + "global_step": 7309, + "learning_rate": 0.0004703297161936561, + "loss": 1.4934, + "loss_base2": 2.1545, + "loss_pixel": 0.1786, + "loss_text": 1.3148, + "ppl": 4.4522, + "step": 7309 + }, + { + "epoch": 0.04, + "global_step": 7310, + "learning_rate": 0.0004703255425709516, + "loss": 1.665, + "loss_base2": 2.4021, + "loss_pixel": 0.18, + "loss_text": 1.485, + "ppl": 5.2857, + "step": 7310 + }, + { + "epoch": 0.04, + "global_step": 7311, + "learning_rate": 0.00047032136894824706, + "loss": 1.7306, + "loss_base2": 2.4967, + "loss_pixel": 0.1782, + "loss_text": 1.5523, + "ppl": 5.644, + "step": 7311 + }, + { + "epoch": 0.04, + "global_step": 7312, + "learning_rate": 0.00047031719532554257, + "loss": 1.7238, + "loss_base2": 2.4869, + "loss_pixel": 0.1775, + "loss_text": 1.5464, + "ppl": 5.6058, + "step": 7312 + }, + { + "epoch": 0.04, + "global_step": 7313, + "learning_rate": 0.0004703130217028381, + "loss": 1.7102, + "loss_base2": 2.4673, + "loss_pixel": 0.1779, + "loss_text": 1.5323, + "ppl": 5.5301, + "step": 7313 + }, + { + "epoch": 0.04, + "global_step": 7314, + "learning_rate": 0.0004703088480801336, + "loss": 1.7112, + "loss_base2": 2.4687, + "loss_pixel": 0.178, + "loss_text": 1.5332, + "ppl": 5.5356, + "step": 7314 + }, + { + "epoch": 0.04, + "global_step": 7315, + "learning_rate": 0.0004703046744574291, + "loss": 1.6899, + "loss_base2": 2.438, + "loss_pixel": 0.1802, + "loss_text": 1.5097, + "ppl": 5.4189, + "step": 7315 + }, + { + "epoch": 0.04, + "global_step": 7316, + "learning_rate": 0.00047030050083472454, + "loss": 1.6929, + "loss_base2": 2.4423, + "loss_pixel": 0.1796, + "loss_text": 1.5134, + "ppl": 5.4352, + "step": 7316 + }, + { + "epoch": 0.04, + "global_step": 7317, + "learning_rate": 0.00047029632721202005, + "loss": 1.7086, + "loss_base2": 2.465, + "loss_pixel": 0.179, + "loss_text": 1.5295, + "ppl": 5.5212, + "step": 7317 + }, + { + "epoch": 0.04, + "global_step": 7318, + "learning_rate": 0.00047029215358931556, + "loss": 1.6817, + "loss_base2": 2.4262, + "loss_pixel": 0.1772, + "loss_text": 1.5045, + "ppl": 5.3747, + "step": 7318 + }, + { + "epoch": 0.04, + "global_step": 7319, + "learning_rate": 0.00047028797996661107, + "loss": 1.7056, + "loss_base2": 2.4607, + "loss_pixel": 0.1788, + "loss_text": 1.5269, + "ppl": 5.5047, + "step": 7319 + }, + { + "epoch": 0.04, + "global_step": 7320, + "learning_rate": 0.0004702838063439065, + "loss": 1.6857, + "loss_base2": 2.432, + "loss_pixel": 0.1787, + "loss_text": 1.507, + "ppl": 5.3962, + "step": 7320 + }, + { + "epoch": 0.04, + "global_step": 7321, + "learning_rate": 0.000470279632721202, + "loss": 1.7071, + "loss_base2": 2.4628, + "loss_pixel": 0.1788, + "loss_text": 1.5284, + "ppl": 5.513, + "step": 7321 + }, + { + "epoch": 0.04, + "global_step": 7322, + "learning_rate": 0.0004702754590984975, + "loss": 1.692, + "loss_base2": 2.441, + "loss_pixel": 0.1785, + "loss_text": 1.5135, + "ppl": 5.4303, + "step": 7322 + }, + { + "epoch": 0.04, + "global_step": 7323, + "learning_rate": 0.000470271285475793, + "loss": 1.6921, + "loss_base2": 2.4412, + "loss_pixel": 0.1789, + "loss_text": 1.5132, + "ppl": 5.4309, + "step": 7323 + }, + { + "epoch": 0.04, + "global_step": 7324, + "learning_rate": 0.0004702671118530885, + "loss": 1.7019, + "loss_base2": 2.4553, + "loss_pixel": 0.1771, + "loss_text": 1.5248, + "ppl": 5.4844, + "step": 7324 + }, + { + "epoch": 0.04, + "global_step": 7325, + "learning_rate": 0.00047026293823038395, + "loss": 1.7027, + "loss_base2": 2.4565, + "loss_pixel": 0.1777, + "loss_text": 1.525, + "ppl": 5.4887, + "step": 7325 + }, + { + "epoch": 0.04, + "global_step": 7326, + "learning_rate": 0.00047025876460767945, + "loss": 1.708, + "loss_base2": 2.4641, + "loss_pixel": 0.1776, + "loss_text": 1.5304, + "ppl": 5.5179, + "step": 7326 + }, + { + "epoch": 0.04, + "global_step": 7327, + "learning_rate": 0.00047025459098497496, + "loss": 1.7032, + "loss_base2": 2.4572, + "loss_pixel": 0.1788, + "loss_text": 1.5244, + "ppl": 5.4915, + "step": 7327 + }, + { + "epoch": 0.04, + "global_step": 7328, + "learning_rate": 0.00047025041736227047, + "loss": 1.6794, + "loss_base2": 2.4229, + "loss_pixel": 0.1779, + "loss_text": 1.5015, + "ppl": 5.3623, + "step": 7328 + }, + { + "epoch": 0.04, + "global_step": 7329, + "learning_rate": 0.0004702462437395659, + "loss": 1.6979, + "loss_base2": 2.4496, + "loss_pixel": 0.1793, + "loss_text": 1.5186, + "ppl": 5.4625, + "step": 7329 + }, + { + "epoch": 0.04, + "global_step": 7330, + "learning_rate": 0.00047024207011686143, + "loss": 1.692, + "loss_base2": 2.441, + "loss_pixel": 0.1777, + "loss_text": 1.5143, + "ppl": 5.4303, + "step": 7330 + }, + { + "epoch": 0.04, + "global_step": 7331, + "learning_rate": 0.00047023789649415694, + "loss": 1.6853, + "loss_base2": 2.4314, + "loss_pixel": 0.1782, + "loss_text": 1.5071, + "ppl": 5.3941, + "step": 7331 + }, + { + "epoch": 0.04, + "global_step": 7332, + "learning_rate": 0.00047023372287145244, + "loss": 1.6825, + "loss_base2": 2.4273, + "loss_pixel": 0.1786, + "loss_text": 1.5038, + "ppl": 5.379, + "step": 7332 + }, + { + "epoch": 0.04, + "global_step": 7333, + "learning_rate": 0.00047022954924874795, + "loss": 1.6561, + "loss_base2": 2.3892, + "loss_pixel": 0.1768, + "loss_text": 1.4794, + "ppl": 5.2388, + "step": 7333 + }, + { + "epoch": 0.04, + "global_step": 7334, + "learning_rate": 0.0004702253756260434, + "loss": 1.6802, + "loss_base2": 2.424, + "loss_pixel": 0.1783, + "loss_text": 1.5019, + "ppl": 5.3666, + "step": 7334 + }, + { + "epoch": 0.04, + "global_step": 7335, + "learning_rate": 0.0004702212020033389, + "loss": 1.6357, + "loss_base2": 2.3598, + "loss_pixel": 0.1774, + "loss_text": 1.4584, + "ppl": 5.133, + "step": 7335 + }, + { + "epoch": 0.04, + "global_step": 7336, + "learning_rate": 0.0004702170283806344, + "loss": 1.5027, + "loss_base2": 2.1679, + "loss_pixel": 0.1781, + "loss_text": 1.3245, + "ppl": 4.4938, + "step": 7336 + }, + { + "epoch": 0.04, + "global_step": 7337, + "learning_rate": 0.0004702128547579299, + "loss": 1.4669, + "loss_base2": 2.1163, + "loss_pixel": 0.1772, + "loss_text": 1.2897, + "ppl": 4.3358, + "step": 7337 + }, + { + "epoch": 0.04, + "global_step": 7338, + "learning_rate": 0.0004702086811352254, + "loss": 1.4363, + "loss_base2": 2.0721, + "loss_pixel": 0.1769, + "loss_text": 1.2594, + "ppl": 4.2051, + "step": 7338 + }, + { + "epoch": 0.04, + "global_step": 7339, + "learning_rate": 0.0004702045075125209, + "loss": 1.4512, + "loss_base2": 2.0936, + "loss_pixel": 0.1779, + "loss_text": 1.2734, + "ppl": 4.2682, + "step": 7339 + }, + { + "epoch": 0.04, + "global_step": 7340, + "learning_rate": 0.0004702003338898164, + "loss": 1.434, + "loss_base2": 2.0688, + "loss_pixel": 0.1782, + "loss_text": 1.2558, + "ppl": 4.1954, + "step": 7340 + }, + { + "epoch": 0.04, + "global_step": 7341, + "learning_rate": 0.00047019616026711185, + "loss": 1.4484, + "loss_base2": 2.0896, + "loss_pixel": 0.1774, + "loss_text": 1.271, + "ppl": 4.2563, + "step": 7341 + }, + { + "epoch": 0.04, + "global_step": 7342, + "learning_rate": 0.00047019198664440735, + "loss": 1.4358, + "loss_base2": 2.0714, + "loss_pixel": 0.1773, + "loss_text": 1.2585, + "ppl": 4.203, + "step": 7342 + }, + { + "epoch": 0.04, + "global_step": 7343, + "learning_rate": 0.0004701878130217028, + "loss": 1.4306, + "loss_base2": 2.0639, + "loss_pixel": 0.1792, + "loss_text": 1.2514, + "ppl": 4.1812, + "step": 7343 + }, + { + "epoch": 0.04, + "global_step": 7344, + "learning_rate": 0.0004701836393989983, + "loss": 1.4605, + "loss_base2": 2.1071, + "loss_pixel": 0.1757, + "loss_text": 1.2848, + "ppl": 4.3081, + "step": 7344 + }, + { + "epoch": 0.04, + "global_step": 7345, + "learning_rate": 0.0004701794657762938, + "loss": 1.464, + "loss_base2": 2.1121, + "loss_pixel": 0.1765, + "loss_text": 1.2875, + "ppl": 4.3232, + "step": 7345 + }, + { + "epoch": 0.04, + "global_step": 7346, + "learning_rate": 0.00047017529215358933, + "loss": 1.4692, + "loss_base2": 2.1196, + "loss_pixel": 0.177, + "loss_text": 1.2922, + "ppl": 4.3458, + "step": 7346 + }, + { + "epoch": 0.04, + "global_step": 7347, + "learning_rate": 0.00047017111853088484, + "loss": 1.4452, + "loss_base2": 2.085, + "loss_pixel": 0.1768, + "loss_text": 1.2684, + "ppl": 4.2427, + "step": 7347 + }, + { + "epoch": 0.04, + "global_step": 7348, + "learning_rate": 0.0004701669449081803, + "loss": 1.4418, + "loss_base2": 2.0801, + "loss_pixel": 0.1784, + "loss_text": 1.2634, + "ppl": 4.2283, + "step": 7348 + }, + { + "epoch": 0.04, + "global_step": 7349, + "learning_rate": 0.0004701627712854758, + "loss": 1.4616, + "loss_base2": 2.1086, + "loss_pixel": 0.178, + "loss_text": 1.2836, + "ppl": 4.3129, + "step": 7349 + }, + { + "epoch": 0.04, + "global_step": 7350, + "learning_rate": 0.0004701585976627713, + "loss": 1.4369, + "loss_base2": 2.073, + "loss_pixel": 0.1781, + "loss_text": 1.2588, + "ppl": 4.2076, + "step": 7350 + }, + { + "epoch": 0.04, + "global_step": 7351, + "learning_rate": 0.0004701544240400668, + "loss": 1.6991, + "loss_base2": 2.4513, + "loss_pixel": 0.1762, + "loss_text": 1.5229, + "ppl": 5.469, + "step": 7351 + }, + { + "epoch": 0.04, + "global_step": 7352, + "learning_rate": 0.00047015025041736226, + "loss": 1.7057, + "loss_base2": 2.4608, + "loss_pixel": 0.1777, + "loss_text": 1.528, + "ppl": 5.5052, + "step": 7352 + }, + { + "epoch": 0.04, + "global_step": 7353, + "learning_rate": 0.00047014607679465777, + "loss": 1.6929, + "loss_base2": 2.4423, + "loss_pixel": 0.1774, + "loss_text": 1.5156, + "ppl": 5.4352, + "step": 7353 + }, + { + "epoch": 0.04, + "global_step": 7354, + "learning_rate": 0.0004701419031719533, + "loss": 1.7225, + "loss_base2": 2.485, + "loss_pixel": 0.1768, + "loss_text": 1.5457, + "ppl": 5.5985, + "step": 7354 + }, + { + "epoch": 0.04, + "global_step": 7355, + "learning_rate": 0.0004701377295492488, + "loss": 1.695, + "loss_base2": 2.4454, + "loss_pixel": 0.179, + "loss_text": 1.516, + "ppl": 5.4466, + "step": 7355 + }, + { + "epoch": 0.04, + "global_step": 7356, + "learning_rate": 0.0004701335559265443, + "loss": 1.7028, + "loss_base2": 2.4566, + "loss_pixel": 0.1775, + "loss_text": 1.5253, + "ppl": 5.4893, + "step": 7356 + }, + { + "epoch": 0.04, + "global_step": 7357, + "learning_rate": 0.00047012938230383975, + "loss": 1.7007, + "loss_base2": 2.4536, + "loss_pixel": 0.1783, + "loss_text": 1.5223, + "ppl": 5.4778, + "step": 7357 + }, + { + "epoch": 0.04, + "global_step": 7358, + "learning_rate": 0.00047012520868113525, + "loss": 1.7034, + "loss_base2": 2.4575, + "loss_pixel": 0.1785, + "loss_text": 1.5249, + "ppl": 5.4926, + "step": 7358 + }, + { + "epoch": 0.04, + "global_step": 7359, + "learning_rate": 0.00047012103505843076, + "loss": 1.7014, + "loss_base2": 2.4546, + "loss_pixel": 0.1778, + "loss_text": 1.5236, + "ppl": 5.4816, + "step": 7359 + }, + { + "epoch": 0.04, + "global_step": 7360, + "learning_rate": 0.0004701168614357262, + "loss": 1.6947, + "loss_base2": 2.4449, + "loss_pixel": 0.1783, + "loss_text": 1.5164, + "ppl": 5.445, + "step": 7360 + }, + { + "epoch": 0.04, + "global_step": 7361, + "learning_rate": 0.00047011268781302167, + "loss": 1.7018, + "loss_base2": 2.4552, + "loss_pixel": 0.1784, + "loss_text": 1.5234, + "ppl": 5.4838, + "step": 7361 + }, + { + "epoch": 0.04, + "global_step": 7362, + "learning_rate": 0.0004701085141903172, + "loss": 1.6809, + "loss_base2": 2.425, + "loss_pixel": 0.1774, + "loss_text": 1.5035, + "ppl": 5.3704, + "step": 7362 + }, + { + "epoch": 0.04, + "global_step": 7363, + "learning_rate": 0.0004701043405676127, + "loss": 1.6943, + "loss_base2": 2.4444, + "loss_pixel": 0.1766, + "loss_text": 1.5177, + "ppl": 5.4428, + "step": 7363 + }, + { + "epoch": 0.04, + "global_step": 7364, + "learning_rate": 0.0004701001669449082, + "loss": 1.6827, + "loss_base2": 2.4276, + "loss_pixel": 0.178, + "loss_text": 1.5047, + "ppl": 5.3801, + "step": 7364 + }, + { + "epoch": 0.04, + "global_step": 7365, + "learning_rate": 0.0004700959933222037, + "loss": 1.7105, + "loss_base2": 2.4677, + "loss_pixel": 0.1777, + "loss_text": 1.5328, + "ppl": 5.5317, + "step": 7365 + }, + { + "epoch": 0.04, + "global_step": 7366, + "learning_rate": 0.00047009181969949915, + "loss": 1.7023, + "loss_base2": 2.4559, + "loss_pixel": 0.1783, + "loss_text": 1.524, + "ppl": 5.4866, + "step": 7366 + }, + { + "epoch": 0.04, + "global_step": 7367, + "learning_rate": 0.00047008764607679466, + "loss": 1.6856, + "loss_base2": 2.4318, + "loss_pixel": 0.1771, + "loss_text": 1.5085, + "ppl": 5.3957, + "step": 7367 + }, + { + "epoch": 0.04, + "global_step": 7368, + "learning_rate": 0.00047008347245409016, + "loss": 1.6757, + "loss_base2": 2.4175, + "loss_pixel": 0.1789, + "loss_text": 1.4968, + "ppl": 5.3425, + "step": 7368 + }, + { + "epoch": 0.04, + "global_step": 7369, + "learning_rate": 0.00047007929883138567, + "loss": 1.7013, + "loss_base2": 2.4545, + "loss_pixel": 0.1777, + "loss_text": 1.5236, + "ppl": 5.4811, + "step": 7369 + }, + { + "epoch": 0.04, + "global_step": 7370, + "learning_rate": 0.0004700751252086811, + "loss": 1.6814, + "loss_base2": 2.4257, + "loss_pixel": 0.178, + "loss_text": 1.5033, + "ppl": 5.3731, + "step": 7370 + }, + { + "epoch": 0.04, + "global_step": 7371, + "learning_rate": 0.00047007095158597663, + "loss": 1.7016, + "loss_base2": 2.4549, + "loss_pixel": 0.1775, + "loss_text": 1.5241, + "ppl": 5.4827, + "step": 7371 + }, + { + "epoch": 0.04, + "global_step": 7372, + "learning_rate": 0.00047006677796327214, + "loss": 1.6865, + "loss_base2": 2.4331, + "loss_pixel": 0.1759, + "loss_text": 1.5106, + "ppl": 5.4005, + "step": 7372 + }, + { + "epoch": 0.04, + "global_step": 7373, + "learning_rate": 0.00047006260434056765, + "loss": 1.6748, + "loss_base2": 2.4162, + "loss_pixel": 0.1763, + "loss_text": 1.4984, + "ppl": 5.3377, + "step": 7373 + }, + { + "epoch": 0.04, + "global_step": 7374, + "learning_rate": 0.00047005843071786315, + "loss": 1.6762, + "loss_base2": 2.4182, + "loss_pixel": 0.1771, + "loss_text": 1.499, + "ppl": 5.3452, + "step": 7374 + }, + { + "epoch": 0.04, + "global_step": 7375, + "learning_rate": 0.0004700542570951586, + "loss": 1.6772, + "loss_base2": 2.4197, + "loss_pixel": 0.1784, + "loss_text": 1.4988, + "ppl": 5.3506, + "step": 7375 + }, + { + "epoch": 0.04, + "global_step": 7376, + "learning_rate": 0.0004700500834724541, + "loss": 1.6803, + "loss_base2": 2.4242, + "loss_pixel": 0.1779, + "loss_text": 1.5024, + "ppl": 5.3672, + "step": 7376 + }, + { + "epoch": 0.04, + "global_step": 7377, + "learning_rate": 0.0004700459098497496, + "loss": 1.6559, + "loss_base2": 2.389, + "loss_pixel": 0.1761, + "loss_text": 1.4798, + "ppl": 5.2378, + "step": 7377 + }, + { + "epoch": 0.04, + "global_step": 7378, + "learning_rate": 0.00047004173622704513, + "loss": 1.6767, + "loss_base2": 2.419, + "loss_pixel": 0.1765, + "loss_text": 1.5002, + "ppl": 5.3479, + "step": 7378 + }, + { + "epoch": 0.04, + "global_step": 7379, + "learning_rate": 0.00047003756260434053, + "loss": 1.679, + "loss_base2": 2.4223, + "loss_pixel": 0.1772, + "loss_text": 1.5018, + "ppl": 5.3602, + "step": 7379 + }, + { + "epoch": 0.04, + "global_step": 7380, + "learning_rate": 0.00047003338898163604, + "loss": 1.6679, + "loss_base2": 2.4063, + "loss_pixel": 0.1761, + "loss_text": 1.4919, + "ppl": 5.301, + "step": 7380 + }, + { + "epoch": 0.04, + "global_step": 7381, + "learning_rate": 0.00047002921535893154, + "loss": 1.686, + "loss_base2": 2.4324, + "loss_pixel": 0.1768, + "loss_text": 1.5092, + "ppl": 5.3978, + "step": 7381 + }, + { + "epoch": 0.04, + "global_step": 7382, + "learning_rate": 0.00047002504173622705, + "loss": 1.7033, + "loss_base2": 2.4573, + "loss_pixel": 0.1771, + "loss_text": 1.5262, + "ppl": 5.492, + "step": 7382 + }, + { + "epoch": 0.04, + "global_step": 7383, + "learning_rate": 0.00047002086811352256, + "loss": 1.6728, + "loss_base2": 2.4133, + "loss_pixel": 0.1778, + "loss_text": 1.4949, + "ppl": 5.3271, + "step": 7383 + }, + { + "epoch": 0.04, + "global_step": 7384, + "learning_rate": 0.000470016694490818, + "loss": 1.665, + "loss_base2": 2.4021, + "loss_pixel": 0.1762, + "loss_text": 1.4888, + "ppl": 5.2857, + "step": 7384 + }, + { + "epoch": 0.04, + "global_step": 7385, + "learning_rate": 0.0004700125208681135, + "loss": 1.6717, + "loss_base2": 2.4118, + "loss_pixel": 0.177, + "loss_text": 1.4947, + "ppl": 5.3212, + "step": 7385 + }, + { + "epoch": 0.04, + "global_step": 7386, + "learning_rate": 0.000470008347245409, + "loss": 1.6683, + "loss_base2": 2.4068, + "loss_pixel": 0.175, + "loss_text": 1.4933, + "ppl": 5.3031, + "step": 7386 + }, + { + "epoch": 0.04, + "global_step": 7387, + "learning_rate": 0.00047000417362270453, + "loss": 1.6668, + "loss_base2": 2.4047, + "loss_pixel": 0.1779, + "loss_text": 1.489, + "ppl": 5.2952, + "step": 7387 + }, + { + "epoch": 0.04, + "global_step": 7388, + "learning_rate": 0.00047, + "loss": 1.6942, + "loss_base2": 2.4442, + "loss_pixel": 0.1775, + "loss_text": 1.5167, + "ppl": 5.4423, + "step": 7388 + }, + { + "epoch": 0.04, + "global_step": 7389, + "learning_rate": 0.0004699958263772955, + "loss": 1.6806, + "loss_base2": 2.4246, + "loss_pixel": 0.1781, + "loss_text": 1.5025, + "ppl": 5.3688, + "step": 7389 + }, + { + "epoch": 0.04, + "global_step": 7390, + "learning_rate": 0.000469991652754591, + "loss": 1.6788, + "loss_base2": 2.422, + "loss_pixel": 0.1771, + "loss_text": 1.5017, + "ppl": 5.3591, + "step": 7390 + }, + { + "epoch": 0.04, + "global_step": 7391, + "learning_rate": 0.0004699874791318865, + "loss": 1.674, + "loss_base2": 2.4151, + "loss_pixel": 0.1776, + "loss_text": 1.4963, + "ppl": 5.3335, + "step": 7391 + }, + { + "epoch": 0.04, + "global_step": 7392, + "learning_rate": 0.000469983305509182, + "loss": 1.6763, + "loss_base2": 2.4184, + "loss_pixel": 0.1775, + "loss_text": 1.4988, + "ppl": 5.3457, + "step": 7392 + }, + { + "epoch": 0.04, + "global_step": 7393, + "learning_rate": 0.00046997913188647747, + "loss": 1.6727, + "loss_base2": 2.4132, + "loss_pixel": 0.1778, + "loss_text": 1.4949, + "ppl": 5.3265, + "step": 7393 + }, + { + "epoch": 0.04, + "global_step": 7394, + "learning_rate": 0.000469974958263773, + "loss": 1.6749, + "loss_base2": 2.4164, + "loss_pixel": 0.177, + "loss_text": 1.498, + "ppl": 5.3383, + "step": 7394 + }, + { + "epoch": 0.04, + "global_step": 7395, + "learning_rate": 0.0004699707846410685, + "loss": 1.6596, + "loss_base2": 2.3943, + "loss_pixel": 0.1781, + "loss_text": 1.4816, + "ppl": 5.2572, + "step": 7395 + }, + { + "epoch": 0.04, + "global_step": 7396, + "learning_rate": 0.000469966611018364, + "loss": 1.6662, + "loss_base2": 2.4038, + "loss_pixel": 0.1781, + "loss_text": 1.488, + "ppl": 5.292, + "step": 7396 + }, + { + "epoch": 0.04, + "global_step": 7397, + "learning_rate": 0.0004699624373956594, + "loss": 1.6584, + "loss_base2": 2.3926, + "loss_pixel": 0.1767, + "loss_text": 1.4817, + "ppl": 5.2509, + "step": 7397 + }, + { + "epoch": 0.04, + "global_step": 7398, + "learning_rate": 0.0004699582637729549, + "loss": 1.6827, + "loss_base2": 2.4276, + "loss_pixel": 0.1788, + "loss_text": 1.504, + "ppl": 5.3801, + "step": 7398 + }, + { + "epoch": 0.04, + "global_step": 7399, + "learning_rate": 0.0004699540901502504, + "loss": 1.6637, + "loss_base2": 2.4002, + "loss_pixel": 0.1771, + "loss_text": 1.4865, + "ppl": 5.2788, + "step": 7399 + }, + { + "epoch": 0.04, + "global_step": 7400, + "learning_rate": 0.0004699499165275459, + "loss": 1.6886, + "loss_base2": 2.4361, + "loss_pixel": 0.1774, + "loss_text": 1.5112, + "ppl": 5.4119, + "step": 7400 + }, + { + "epoch": 0.04, + "global_step": 7401, + "learning_rate": 0.0004699457429048414, + "loss": 1.6919, + "loss_base2": 2.4409, + "loss_pixel": 0.1778, + "loss_text": 1.5142, + "ppl": 5.4298, + "step": 7401 + }, + { + "epoch": 0.04, + "global_step": 7402, + "learning_rate": 0.00046994156928213687, + "loss": 1.6596, + "loss_base2": 2.3943, + "loss_pixel": 0.1764, + "loss_text": 1.4832, + "ppl": 5.2572, + "step": 7402 + }, + { + "epoch": 0.04, + "global_step": 7403, + "learning_rate": 0.0004699373956594324, + "loss": 1.6933, + "loss_base2": 2.4429, + "loss_pixel": 0.1765, + "loss_text": 1.5167, + "ppl": 5.4374, + "step": 7403 + }, + { + "epoch": 0.04, + "global_step": 7404, + "learning_rate": 0.0004699332220367279, + "loss": 1.6912, + "loss_base2": 2.4399, + "loss_pixel": 0.1771, + "loss_text": 1.514, + "ppl": 5.426, + "step": 7404 + }, + { + "epoch": 0.04, + "global_step": 7405, + "learning_rate": 0.0004699290484140234, + "loss": 1.663, + "loss_base2": 2.3992, + "loss_pixel": 0.1775, + "loss_text": 1.4855, + "ppl": 5.2751, + "step": 7405 + }, + { + "epoch": 0.04, + "global_step": 7406, + "learning_rate": 0.0004699248747913189, + "loss": 1.7027, + "loss_base2": 2.4565, + "loss_pixel": 0.1758, + "loss_text": 1.5269, + "ppl": 5.4887, + "step": 7406 + }, + { + "epoch": 0.04, + "global_step": 7407, + "learning_rate": 0.00046992070116861435, + "loss": 1.6766, + "loss_base2": 2.4188, + "loss_pixel": 0.1754, + "loss_text": 1.5012, + "ppl": 5.3473, + "step": 7407 + }, + { + "epoch": 0.04, + "global_step": 7408, + "learning_rate": 0.00046991652754590986, + "loss": 1.6655, + "loss_base2": 2.4028, + "loss_pixel": 0.1775, + "loss_text": 1.488, + "ppl": 5.2883, + "step": 7408 + }, + { + "epoch": 0.04, + "global_step": 7409, + "learning_rate": 0.00046991235392320537, + "loss": 1.6833, + "loss_base2": 2.4285, + "loss_pixel": 0.1766, + "loss_text": 1.5066, + "ppl": 5.3833, + "step": 7409 + }, + { + "epoch": 0.04, + "global_step": 7410, + "learning_rate": 0.0004699081803005009, + "loss": 1.6785, + "loss_base2": 2.4216, + "loss_pixel": 0.1766, + "loss_text": 1.5019, + "ppl": 5.3575, + "step": 7410 + }, + { + "epoch": 0.04, + "global_step": 7411, + "learning_rate": 0.00046990400667779633, + "loss": 1.6938, + "loss_base2": 2.4436, + "loss_pixel": 0.1766, + "loss_text": 1.5172, + "ppl": 5.4401, + "step": 7411 + }, + { + "epoch": 0.04, + "global_step": 7412, + "learning_rate": 0.00046989983305509184, + "loss": 1.6756, + "loss_base2": 2.4174, + "loss_pixel": 0.1774, + "loss_text": 1.4982, + "ppl": 5.342, + "step": 7412 + }, + { + "epoch": 0.04, + "global_step": 7413, + "learning_rate": 0.00046989565943238734, + "loss": 1.6767, + "loss_base2": 2.419, + "loss_pixel": 0.1781, + "loss_text": 1.4986, + "ppl": 5.3479, + "step": 7413 + }, + { + "epoch": 0.04, + "global_step": 7414, + "learning_rate": 0.00046989148580968285, + "loss": 1.6652, + "loss_base2": 2.4024, + "loss_pixel": 0.178, + "loss_text": 1.4872, + "ppl": 5.2867, + "step": 7414 + }, + { + "epoch": 0.04, + "global_step": 7415, + "learning_rate": 0.00046988731218697836, + "loss": 1.6684, + "loss_base2": 2.407, + "loss_pixel": 0.1764, + "loss_text": 1.492, + "ppl": 5.3037, + "step": 7415 + }, + { + "epoch": 0.04, + "global_step": 7416, + "learning_rate": 0.00046988313856427376, + "loss": 1.6714, + "loss_base2": 2.4113, + "loss_pixel": 0.1766, + "loss_text": 1.4949, + "ppl": 5.3196, + "step": 7416 + }, + { + "epoch": 0.04, + "global_step": 7417, + "learning_rate": 0.00046987896494156926, + "loss": 1.6801, + "loss_base2": 2.4239, + "loss_pixel": 0.1727, + "loss_text": 1.5075, + "ppl": 5.3661, + "step": 7417 + }, + { + "epoch": 0.04, + "global_step": 7418, + "learning_rate": 0.00046987479131886477, + "loss": 1.6713, + "loss_base2": 2.4112, + "loss_pixel": 0.1714, + "loss_text": 1.4999, + "ppl": 5.3191, + "step": 7418 + }, + { + "epoch": 0.04, + "global_step": 7419, + "learning_rate": 0.0004698706176961603, + "loss": 1.6718, + "loss_base2": 2.4119, + "loss_pixel": 0.1727, + "loss_text": 1.499, + "ppl": 5.3217, + "step": 7419 + }, + { + "epoch": 0.04, + "global_step": 7420, + "learning_rate": 0.00046986644407345573, + "loss": 1.6725, + "loss_base2": 2.4129, + "loss_pixel": 0.1712, + "loss_text": 1.5013, + "ppl": 5.3255, + "step": 7420 + }, + { + "epoch": 0.04, + "global_step": 7421, + "learning_rate": 0.00046986227045075124, + "loss": 1.6715, + "loss_base2": 2.4115, + "loss_pixel": 0.1718, + "loss_text": 1.4997, + "ppl": 5.3201, + "step": 7421 + }, + { + "epoch": 0.04, + "global_step": 7422, + "learning_rate": 0.00046985809682804675, + "loss": 1.6743, + "loss_base2": 2.4155, + "loss_pixel": 0.171, + "loss_text": 1.5033, + "ppl": 5.3351, + "step": 7422 + }, + { + "epoch": 0.04, + "global_step": 7423, + "learning_rate": 0.00046985392320534225, + "loss": 1.6805, + "loss_base2": 2.4244, + "loss_pixel": 0.1701, + "loss_text": 1.5105, + "ppl": 5.3682, + "step": 7423 + }, + { + "epoch": 0.04, + "global_step": 7424, + "learning_rate": 0.00046984974958263776, + "loss": 1.6602, + "loss_base2": 2.3952, + "loss_pixel": 0.1733, + "loss_text": 1.4868, + "ppl": 5.2604, + "step": 7424 + }, + { + "epoch": 0.04, + "global_step": 7425, + "learning_rate": 0.0004698455759599332, + "loss": 1.4536, + "loss_base2": 2.0971, + "loss_pixel": 0.1684, + "loss_text": 1.2852, + "ppl": 4.2785, + "step": 7425 + }, + { + "epoch": 0.04, + "global_step": 7426, + "learning_rate": 0.0004698414023372287, + "loss": 1.451, + "loss_base2": 2.0934, + "loss_pixel": 0.1682, + "loss_text": 1.2828, + "ppl": 4.2674, + "step": 7426 + }, + { + "epoch": 0.04, + "global_step": 7427, + "learning_rate": 0.00046983722871452423, + "loss": 1.4432, + "loss_base2": 2.0821, + "loss_pixel": 0.171, + "loss_text": 1.2722, + "ppl": 4.2342, + "step": 7427 + }, + { + "epoch": 0.04, + "global_step": 7428, + "learning_rate": 0.00046983305509181974, + "loss": 1.4545, + "loss_base2": 2.0984, + "loss_pixel": 0.1696, + "loss_text": 1.2849, + "ppl": 4.2823, + "step": 7428 + }, + { + "epoch": 0.04, + "global_step": 7429, + "learning_rate": 0.0004698288814691152, + "loss": 1.4365, + "loss_base2": 2.0724, + "loss_pixel": 0.17, + "loss_text": 1.2664, + "ppl": 4.2059, + "step": 7429 + }, + { + "epoch": 0.04, + "global_step": 7430, + "learning_rate": 0.0004698247078464107, + "loss": 1.4373, + "loss_base2": 2.0736, + "loss_pixel": 0.1697, + "loss_text": 1.2676, + "ppl": 4.2093, + "step": 7430 + }, + { + "epoch": 0.04, + "global_step": 7431, + "learning_rate": 0.0004698205342237062, + "loss": 1.4261, + "loss_base2": 2.0574, + "loss_pixel": 0.1697, + "loss_text": 1.2564, + "ppl": 4.1624, + "step": 7431 + }, + { + "epoch": 0.04, + "global_step": 7432, + "learning_rate": 0.0004698163606010017, + "loss": 1.4671, + "loss_base2": 2.1166, + "loss_pixel": 0.1806, + "loss_text": 1.2865, + "ppl": 4.3366, + "step": 7432 + }, + { + "epoch": 0.04, + "global_step": 7433, + "learning_rate": 0.0004698121869782972, + "loss": 1.7127, + "loss_base2": 2.4709, + "loss_pixel": 0.1793, + "loss_text": 1.5334, + "ppl": 5.5439, + "step": 7433 + }, + { + "epoch": 0.04, + "global_step": 7434, + "learning_rate": 0.00046980801335559267, + "loss": 1.7041, + "loss_base2": 2.4585, + "loss_pixel": 0.1789, + "loss_text": 1.5252, + "ppl": 5.4964, + "step": 7434 + }, + { + "epoch": 0.04, + "global_step": 7435, + "learning_rate": 0.0004698038397328881, + "loss": 1.6832, + "loss_base2": 2.4283, + "loss_pixel": 0.1794, + "loss_text": 1.5038, + "ppl": 5.3828, + "step": 7435 + }, + { + "epoch": 0.04, + "global_step": 7436, + "learning_rate": 0.00046979966611018363, + "loss": 1.6795, + "loss_base2": 2.423, + "loss_pixel": 0.1792, + "loss_text": 1.5003, + "ppl": 5.3629, + "step": 7436 + }, + { + "epoch": 0.04, + "global_step": 7437, + "learning_rate": 0.00046979549248747914, + "loss": 1.6863, + "loss_base2": 2.4328, + "loss_pixel": 0.1784, + "loss_text": 1.5079, + "ppl": 5.3995, + "step": 7437 + }, + { + "epoch": 0.04, + "global_step": 7438, + "learning_rate": 0.0004697913188647746, + "loss": 1.6878, + "loss_base2": 2.435, + "loss_pixel": 0.1796, + "loss_text": 1.5082, + "ppl": 5.4076, + "step": 7438 + }, + { + "epoch": 0.04, + "global_step": 7439, + "learning_rate": 0.0004697871452420701, + "loss": 1.6733, + "loss_base2": 2.4141, + "loss_pixel": 0.1785, + "loss_text": 1.4949, + "ppl": 5.3297, + "step": 7439 + }, + { + "epoch": 0.04, + "global_step": 7440, + "learning_rate": 0.0004697829716193656, + "loss": 1.7011, + "loss_base2": 2.4542, + "loss_pixel": 0.1785, + "loss_text": 1.5226, + "ppl": 5.48, + "step": 7440 + }, + { + "epoch": 0.04, + "global_step": 7441, + "learning_rate": 0.0004697787979966611, + "loss": 1.693, + "loss_base2": 2.4425, + "loss_pixel": 0.1783, + "loss_text": 1.5147, + "ppl": 5.4358, + "step": 7441 + }, + { + "epoch": 0.04, + "global_step": 7442, + "learning_rate": 0.0004697746243739566, + "loss": 1.6666, + "loss_base2": 2.4044, + "loss_pixel": 0.1778, + "loss_text": 1.4887, + "ppl": 5.2941, + "step": 7442 + }, + { + "epoch": 0.04, + "global_step": 7443, + "learning_rate": 0.0004697704507512521, + "loss": 1.6826, + "loss_base2": 2.4275, + "loss_pixel": 0.1777, + "loss_text": 1.5049, + "ppl": 5.3795, + "step": 7443 + }, + { + "epoch": 0.04, + "global_step": 7444, + "learning_rate": 0.0004697662771285476, + "loss": 1.6879, + "loss_base2": 2.4351, + "loss_pixel": 0.1787, + "loss_text": 1.5092, + "ppl": 5.4081, + "step": 7444 + }, + { + "epoch": 0.04, + "global_step": 7445, + "learning_rate": 0.0004697621035058431, + "loss": 1.6997, + "loss_base2": 2.4521, + "loss_pixel": 0.1782, + "loss_text": 1.5215, + "ppl": 5.4723, + "step": 7445 + }, + { + "epoch": 0.04, + "global_step": 7446, + "learning_rate": 0.0004697579298831386, + "loss": 1.6747, + "loss_base2": 2.4161, + "loss_pixel": 0.1785, + "loss_text": 1.4961, + "ppl": 5.3372, + "step": 7446 + }, + { + "epoch": 0.04, + "global_step": 7447, + "learning_rate": 0.00046975375626043405, + "loss": 1.6843, + "loss_base2": 2.4299, + "loss_pixel": 0.178, + "loss_text": 1.5063, + "ppl": 5.3887, + "step": 7447 + }, + { + "epoch": 0.04, + "global_step": 7448, + "learning_rate": 0.00046974958263772956, + "loss": 1.6842, + "loss_base2": 2.4298, + "loss_pixel": 0.1778, + "loss_text": 1.5064, + "ppl": 5.3881, + "step": 7448 + }, + { + "epoch": 0.04, + "global_step": 7449, + "learning_rate": 0.00046974540901502507, + "loss": 1.6896, + "loss_base2": 2.4376, + "loss_pixel": 0.178, + "loss_text": 1.5116, + "ppl": 5.4173, + "step": 7449 + }, + { + "epoch": 0.04, + "global_step": 7450, + "learning_rate": 0.00046974123539232057, + "loss": 1.6815, + "loss_base2": 2.4259, + "loss_pixel": 0.1771, + "loss_text": 1.5043, + "ppl": 5.3736, + "step": 7450 + }, + { + "epoch": 0.04, + "global_step": 7451, + "learning_rate": 0.0004697370617696161, + "loss": 1.6738, + "loss_base2": 2.4148, + "loss_pixel": 0.1782, + "loss_text": 1.4956, + "ppl": 5.3324, + "step": 7451 + }, + { + "epoch": 0.04, + "global_step": 7452, + "learning_rate": 0.00046973288814691153, + "loss": 1.6662, + "loss_base2": 2.4038, + "loss_pixel": 0.1777, + "loss_text": 1.4885, + "ppl": 5.292, + "step": 7452 + }, + { + "epoch": 0.04, + "global_step": 7453, + "learning_rate": 0.000469728714524207, + "loss": 1.6815, + "loss_base2": 2.4259, + "loss_pixel": 0.1774, + "loss_text": 1.5042, + "ppl": 5.3736, + "step": 7453 + }, + { + "epoch": 0.04, + "global_step": 7454, + "learning_rate": 0.0004697245409015025, + "loss": 1.6814, + "loss_base2": 2.4257, + "loss_pixel": 0.1776, + "loss_text": 1.5037, + "ppl": 5.3731, + "step": 7454 + }, + { + "epoch": 0.04, + "global_step": 7455, + "learning_rate": 0.000469720367278798, + "loss": 1.6761, + "loss_base2": 2.4181, + "loss_pixel": 0.1773, + "loss_text": 1.4988, + "ppl": 5.3447, + "step": 7455 + }, + { + "epoch": 0.04, + "global_step": 7456, + "learning_rate": 0.00046971619365609345, + "loss": 1.6676, + "loss_base2": 2.4058, + "loss_pixel": 0.177, + "loss_text": 1.4906, + "ppl": 5.2994, + "step": 7456 + }, + { + "epoch": 0.04, + "global_step": 7457, + "learning_rate": 0.00046971202003338896, + "loss": 1.6791, + "loss_base2": 2.4224, + "loss_pixel": 0.1765, + "loss_text": 1.5026, + "ppl": 5.3607, + "step": 7457 + }, + { + "epoch": 0.04, + "global_step": 7458, + "learning_rate": 0.00046970784641068447, + "loss": 1.6858, + "loss_base2": 2.4321, + "loss_pixel": 0.1762, + "loss_text": 1.5096, + "ppl": 5.3968, + "step": 7458 + }, + { + "epoch": 0.04, + "global_step": 7459, + "learning_rate": 0.00046970367278798, + "loss": 1.6558, + "loss_base2": 2.3888, + "loss_pixel": 0.1774, + "loss_text": 1.4785, + "ppl": 5.2373, + "step": 7459 + }, + { + "epoch": 0.04, + "global_step": 7460, + "learning_rate": 0.0004696994991652755, + "loss": 1.6684, + "loss_base2": 2.407, + "loss_pixel": 0.1762, + "loss_text": 1.4922, + "ppl": 5.3037, + "step": 7460 + }, + { + "epoch": 0.04, + "global_step": 7461, + "learning_rate": 0.00046969532554257094, + "loss": 1.6762, + "loss_base2": 2.4182, + "loss_pixel": 0.1763, + "loss_text": 1.4999, + "ppl": 5.3452, + "step": 7461 + }, + { + "epoch": 0.04, + "global_step": 7462, + "learning_rate": 0.00046969115191986644, + "loss": 1.663, + "loss_base2": 2.3992, + "loss_pixel": 0.1778, + "loss_text": 1.4853, + "ppl": 5.2751, + "step": 7462 + }, + { + "epoch": 0.04, + "global_step": 7463, + "learning_rate": 0.00046968697829716195, + "loss": 1.6795, + "loss_base2": 2.423, + "loss_pixel": 0.1776, + "loss_text": 1.5019, + "ppl": 5.3629, + "step": 7463 + }, + { + "epoch": 0.04, + "global_step": 7464, + "learning_rate": 0.00046968280467445746, + "loss": 1.6856, + "loss_base2": 2.4318, + "loss_pixel": 0.1758, + "loss_text": 1.5098, + "ppl": 5.3957, + "step": 7464 + }, + { + "epoch": 0.04, + "global_step": 7465, + "learning_rate": 0.00046967863105175297, + "loss": 1.6887, + "loss_base2": 2.4363, + "loss_pixel": 0.1761, + "loss_text": 1.5126, + "ppl": 5.4124, + "step": 7465 + }, + { + "epoch": 0.04, + "global_step": 7466, + "learning_rate": 0.0004696744574290484, + "loss": 1.6539, + "loss_base2": 2.3861, + "loss_pixel": 0.1767, + "loss_text": 1.4772, + "ppl": 5.2273, + "step": 7466 + }, + { + "epoch": 0.04, + "global_step": 7467, + "learning_rate": 0.0004696702838063439, + "loss": 1.67, + "loss_base2": 2.4093, + "loss_pixel": 0.1755, + "loss_text": 1.4945, + "ppl": 5.3122, + "step": 7467 + }, + { + "epoch": 0.04, + "global_step": 7468, + "learning_rate": 0.00046966611018363943, + "loss": 1.6948, + "loss_base2": 2.4451, + "loss_pixel": 0.1766, + "loss_text": 1.5182, + "ppl": 5.4456, + "step": 7468 + }, + { + "epoch": 0.04, + "global_step": 7469, + "learning_rate": 0.00046966193656093494, + "loss": 1.6646, + "loss_base2": 2.4015, + "loss_pixel": 0.1764, + "loss_text": 1.4882, + "ppl": 5.2836, + "step": 7469 + }, + { + "epoch": 0.04, + "global_step": 7470, + "learning_rate": 0.0004696577629382304, + "loss": 1.6554, + "loss_base2": 2.3882, + "loss_pixel": 0.1773, + "loss_text": 1.4781, + "ppl": 5.2352, + "step": 7470 + }, + { + "epoch": 0.04, + "global_step": 7471, + "learning_rate": 0.0004696535893155259, + "loss": 1.6821, + "loss_base2": 2.4268, + "loss_pixel": 0.1759, + "loss_text": 1.5062, + "ppl": 5.3768, + "step": 7471 + }, + { + "epoch": 0.04, + "global_step": 7472, + "learning_rate": 0.00046964941569282135, + "loss": 1.6738, + "loss_base2": 2.4148, + "loss_pixel": 0.178, + "loss_text": 1.4958, + "ppl": 5.3324, + "step": 7472 + }, + { + "epoch": 0.04, + "global_step": 7473, + "learning_rate": 0.00046964524207011686, + "loss": 1.6821, + "loss_base2": 2.4268, + "loss_pixel": 0.1758, + "loss_text": 1.5063, + "ppl": 5.3768, + "step": 7473 + }, + { + "epoch": 0.04, + "global_step": 7474, + "learning_rate": 0.00046964106844741237, + "loss": 1.669, + "loss_base2": 2.4079, + "loss_pixel": 0.1759, + "loss_text": 1.4931, + "ppl": 5.3069, + "step": 7474 + }, + { + "epoch": 0.04, + "global_step": 7475, + "learning_rate": 0.0004696368948247078, + "loss": 1.685, + "loss_base2": 2.4309, + "loss_pixel": 0.1764, + "loss_text": 1.5086, + "ppl": 5.3925, + "step": 7475 + }, + { + "epoch": 0.04, + "global_step": 7476, + "learning_rate": 0.00046963272120200333, + "loss": 1.6825, + "loss_base2": 2.4273, + "loss_pixel": 0.1781, + "loss_text": 1.5044, + "ppl": 5.379, + "step": 7476 + }, + { + "epoch": 0.04, + "global_step": 7477, + "learning_rate": 0.00046962854757929884, + "loss": 1.6605, + "loss_base2": 2.3956, + "loss_pixel": 0.1765, + "loss_text": 1.4839, + "ppl": 5.2619, + "step": 7477 + }, + { + "epoch": 0.04, + "global_step": 7478, + "learning_rate": 0.00046962437395659434, + "loss": 1.6728, + "loss_base2": 2.4133, + "loss_pixel": 0.1773, + "loss_text": 1.4955, + "ppl": 5.3271, + "step": 7478 + }, + { + "epoch": 0.04, + "global_step": 7479, + "learning_rate": 0.0004696202003338898, + "loss": 1.6698, + "loss_base2": 2.409, + "loss_pixel": 0.1778, + "loss_text": 1.492, + "ppl": 5.3111, + "step": 7479 + }, + { + "epoch": 0.04, + "global_step": 7480, + "learning_rate": 0.0004696160267111853, + "loss": 1.6796, + "loss_base2": 2.4232, + "loss_pixel": 0.1766, + "loss_text": 1.5029, + "ppl": 5.3634, + "step": 7480 + }, + { + "epoch": 0.04, + "global_step": 7481, + "learning_rate": 0.0004696118530884808, + "loss": 1.6756, + "loss_base2": 2.4174, + "loss_pixel": 0.1769, + "loss_text": 1.4988, + "ppl": 5.342, + "step": 7481 + }, + { + "epoch": 0.04, + "global_step": 7482, + "learning_rate": 0.0004696076794657763, + "loss": 1.6551, + "loss_base2": 2.3878, + "loss_pixel": 0.176, + "loss_text": 1.4791, + "ppl": 5.2336, + "step": 7482 + }, + { + "epoch": 0.04, + "global_step": 7483, + "learning_rate": 0.0004696035058430718, + "loss": 1.6653, + "loss_base2": 2.4025, + "loss_pixel": 0.1788, + "loss_text": 1.4865, + "ppl": 5.2873, + "step": 7483 + }, + { + "epoch": 0.04, + "global_step": 7484, + "learning_rate": 0.0004695993322203673, + "loss": 1.6648, + "loss_base2": 2.4018, + "loss_pixel": 0.1765, + "loss_text": 1.4882, + "ppl": 5.2846, + "step": 7484 + }, + { + "epoch": 0.04, + "global_step": 7485, + "learning_rate": 0.0004695951585976628, + "loss": 1.6606, + "loss_base2": 2.3957, + "loss_pixel": 0.1774, + "loss_text": 1.4832, + "ppl": 5.2625, + "step": 7485 + }, + { + "epoch": 0.04, + "global_step": 7486, + "learning_rate": 0.0004695909849749583, + "loss": 1.6847, + "loss_base2": 2.4305, + "loss_pixel": 0.1772, + "loss_text": 1.5074, + "ppl": 5.3908, + "step": 7486 + }, + { + "epoch": 0.04, + "global_step": 7487, + "learning_rate": 0.0004695868113522538, + "loss": 1.6674, + "loss_base2": 2.4055, + "loss_pixel": 0.1772, + "loss_text": 1.4901, + "ppl": 5.2984, + "step": 7487 + }, + { + "epoch": 0.04, + "global_step": 7488, + "learning_rate": 0.00046958263772954925, + "loss": 1.6666, + "loss_base2": 2.4044, + "loss_pixel": 0.1777, + "loss_text": 1.4889, + "ppl": 5.2941, + "step": 7488 + }, + { + "epoch": 0.04, + "global_step": 7489, + "learning_rate": 0.00046957846410684476, + "loss": 1.6758, + "loss_base2": 2.4177, + "loss_pixel": 0.1776, + "loss_text": 1.4981, + "ppl": 5.3431, + "step": 7489 + }, + { + "epoch": 0.04, + "global_step": 7490, + "learning_rate": 0.00046957429048414027, + "loss": 1.6527, + "loss_base2": 2.3843, + "loss_pixel": 0.1769, + "loss_text": 1.4757, + "ppl": 5.2211, + "step": 7490 + }, + { + "epoch": 0.04, + "global_step": 7491, + "learning_rate": 0.0004695701168614357, + "loss": 1.6796, + "loss_base2": 2.4232, + "loss_pixel": 0.179, + "loss_text": 1.5007, + "ppl": 5.3634, + "step": 7491 + }, + { + "epoch": 0.04, + "global_step": 7492, + "learning_rate": 0.00046956594323873123, + "loss": 1.6905, + "loss_base2": 2.4389, + "loss_pixel": 0.1847, + "loss_text": 1.5058, + "ppl": 5.4222, + "step": 7492 + }, + { + "epoch": 0.04, + "global_step": 7493, + "learning_rate": 0.0004695617696160267, + "loss": 1.6798, + "loss_base2": 2.4234, + "loss_pixel": 0.1851, + "loss_text": 1.4947, + "ppl": 5.3645, + "step": 7493 + }, + { + "epoch": 0.04, + "global_step": 7494, + "learning_rate": 0.0004695575959933222, + "loss": 1.6606, + "loss_base2": 2.3957, + "loss_pixel": 0.1812, + "loss_text": 1.4794, + "ppl": 5.2625, + "step": 7494 + }, + { + "epoch": 0.04, + "global_step": 7495, + "learning_rate": 0.0004695534223706177, + "loss": 1.6609, + "loss_base2": 2.3962, + "loss_pixel": 0.1757, + "loss_text": 1.4852, + "ppl": 5.264, + "step": 7495 + }, + { + "epoch": 0.04, + "global_step": 7496, + "learning_rate": 0.0004695492487479132, + "loss": 1.6674, + "loss_base2": 2.4055, + "loss_pixel": 0.1772, + "loss_text": 1.4903, + "ppl": 5.2984, + "step": 7496 + }, + { + "epoch": 0.04, + "global_step": 7497, + "learning_rate": 0.00046954507512520866, + "loss": 1.6669, + "loss_base2": 2.4048, + "loss_pixel": 0.1778, + "loss_text": 1.4892, + "ppl": 5.2957, + "step": 7497 + }, + { + "epoch": 0.04, + "global_step": 7498, + "learning_rate": 0.00046954090150250416, + "loss": 1.6741, + "loss_base2": 2.4152, + "loss_pixel": 0.1779, + "loss_text": 1.4963, + "ppl": 5.334, + "step": 7498 + }, + { + "epoch": 0.04, + "global_step": 7499, + "learning_rate": 0.00046953672787979967, + "loss": 1.6704, + "loss_base2": 2.4099, + "loss_pixel": 0.1768, + "loss_text": 1.4936, + "ppl": 5.3143, + "step": 7499 + }, + { + "epoch": 0.04, + "global_step": 7500, + "learning_rate": 0.0004695325542570952, + "loss": 1.6587, + "loss_base2": 2.393, + "loss_pixel": 0.1759, + "loss_text": 1.4827, + "ppl": 5.2525, + "step": 7500 + }, + { + "epoch": 0.04, + "global_step": 7501, + "learning_rate": 0.0004695283806343907, + "loss": 1.6752, + "loss_base2": 2.4168, + "loss_pixel": 0.1773, + "loss_text": 1.498, + "ppl": 5.3399, + "step": 7501 + }, + { + "epoch": 0.04, + "global_step": 7502, + "learning_rate": 0.00046952420701168614, + "loss": 1.6695, + "loss_base2": 2.4086, + "loss_pixel": 0.176, + "loss_text": 1.4935, + "ppl": 5.3095, + "step": 7502 + }, + { + "epoch": 0.04, + "global_step": 7503, + "learning_rate": 0.00046952003338898165, + "loss": 1.6526, + "loss_base2": 2.3842, + "loss_pixel": 0.1772, + "loss_text": 1.4754, + "ppl": 5.2205, + "step": 7503 + }, + { + "epoch": 0.04, + "global_step": 7504, + "learning_rate": 0.00046951585976627715, + "loss": 1.6757, + "loss_base2": 2.4175, + "loss_pixel": 0.1755, + "loss_text": 1.5001, + "ppl": 5.3425, + "step": 7504 + }, + { + "epoch": 0.04, + "global_step": 7505, + "learning_rate": 0.00046951168614357266, + "loss": 1.6619, + "loss_base2": 2.3976, + "loss_pixel": 0.1764, + "loss_text": 1.4855, + "ppl": 5.2693, + "step": 7505 + }, + { + "epoch": 0.04, + "global_step": 7506, + "learning_rate": 0.0004695075125208681, + "loss": 1.6744, + "loss_base2": 2.4156, + "loss_pixel": 0.1768, + "loss_text": 1.4975, + "ppl": 5.3356, + "step": 7506 + }, + { + "epoch": 0.04, + "global_step": 7507, + "learning_rate": 0.0004695033388981636, + "loss": 1.6703, + "loss_base2": 2.4097, + "loss_pixel": 0.1761, + "loss_text": 1.4943, + "ppl": 5.3138, + "step": 7507 + }, + { + "epoch": 0.04, + "global_step": 7508, + "learning_rate": 0.00046949916527545913, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.1759, + "loss_text": 1.4922, + "ppl": 5.3021, + "step": 7508 + }, + { + "epoch": 0.04, + "global_step": 7509, + "learning_rate": 0.00046949499165275464, + "loss": 1.645, + "loss_base2": 2.3732, + "loss_pixel": 0.1771, + "loss_text": 1.4679, + "ppl": 5.181, + "step": 7509 + }, + { + "epoch": 0.04, + "global_step": 7510, + "learning_rate": 0.0004694908180300501, + "loss": 1.6448, + "loss_base2": 2.3729, + "loss_pixel": 0.1762, + "loss_text": 1.4686, + "ppl": 5.18, + "step": 7510 + }, + { + "epoch": 0.04, + "global_step": 7511, + "learning_rate": 0.00046948664440734554, + "loss": 1.6827, + "loss_base2": 2.4276, + "loss_pixel": 0.1756, + "loss_text": 1.5071, + "ppl": 5.3801, + "step": 7511 + }, + { + "epoch": 0.04, + "global_step": 7512, + "learning_rate": 0.00046948247078464105, + "loss": 1.6708, + "loss_base2": 2.4105, + "loss_pixel": 0.1768, + "loss_text": 1.4941, + "ppl": 5.3164, + "step": 7512 + }, + { + "epoch": 0.04, + "global_step": 7513, + "learning_rate": 0.00046947829716193656, + "loss": 1.6535, + "loss_base2": 2.3855, + "loss_pixel": 0.1765, + "loss_text": 1.477, + "ppl": 5.2252, + "step": 7513 + }, + { + "epoch": 0.04, + "global_step": 7514, + "learning_rate": 0.00046947412353923206, + "loss": 1.6737, + "loss_base2": 2.4146, + "loss_pixel": 0.1752, + "loss_text": 1.4985, + "ppl": 5.3319, + "step": 7514 + }, + { + "epoch": 0.04, + "global_step": 7515, + "learning_rate": 0.00046946994991652757, + "loss": 1.6673, + "loss_base2": 2.4054, + "loss_pixel": 0.1764, + "loss_text": 1.4909, + "ppl": 5.2978, + "step": 7515 + }, + { + "epoch": 0.04, + "global_step": 7516, + "learning_rate": 0.000469465776293823, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.1753, + "loss_text": 1.4927, + "ppl": 5.3021, + "step": 7516 + }, + { + "epoch": 0.04, + "global_step": 7517, + "learning_rate": 0.00046946160267111853, + "loss": 1.6662, + "loss_base2": 2.4038, + "loss_pixel": 0.175, + "loss_text": 1.4912, + "ppl": 5.292, + "step": 7517 + }, + { + "epoch": 0.04, + "global_step": 7518, + "learning_rate": 0.00046945742904841404, + "loss": 1.6817, + "loss_base2": 2.4262, + "loss_pixel": 0.1755, + "loss_text": 1.5062, + "ppl": 5.3747, + "step": 7518 + }, + { + "epoch": 0.04, + "global_step": 7519, + "learning_rate": 0.00046945325542570955, + "loss": 1.6635, + "loss_base2": 2.3999, + "loss_pixel": 0.1745, + "loss_text": 1.489, + "ppl": 5.2778, + "step": 7519 + }, + { + "epoch": 0.04, + "global_step": 7520, + "learning_rate": 0.000469449081803005, + "loss": 1.6737, + "loss_base2": 2.4146, + "loss_pixel": 0.1762, + "loss_text": 1.4975, + "ppl": 5.3319, + "step": 7520 + }, + { + "epoch": 0.04, + "global_step": 7521, + "learning_rate": 0.0004694449081803005, + "loss": 1.6531, + "loss_base2": 2.3849, + "loss_pixel": 0.1766, + "loss_text": 1.4765, + "ppl": 5.2231, + "step": 7521 + }, + { + "epoch": 0.04, + "global_step": 7522, + "learning_rate": 0.000469440734557596, + "loss": 1.6499, + "loss_base2": 2.3803, + "loss_pixel": 0.175, + "loss_text": 1.4749, + "ppl": 5.2065, + "step": 7522 + }, + { + "epoch": 0.04, + "global_step": 7523, + "learning_rate": 0.0004694365609348915, + "loss": 1.6584, + "loss_base2": 2.3926, + "loss_pixel": 0.1759, + "loss_text": 1.4825, + "ppl": 5.2509, + "step": 7523 + }, + { + "epoch": 0.04, + "global_step": 7524, + "learning_rate": 0.00046943238731218703, + "loss": 1.6864, + "loss_base2": 2.433, + "loss_pixel": 0.1752, + "loss_text": 1.5112, + "ppl": 5.4, + "step": 7524 + }, + { + "epoch": 0.04, + "global_step": 7525, + "learning_rate": 0.0004694282136894825, + "loss": 1.5853, + "loss_base2": 2.2871, + "loss_pixel": 0.1765, + "loss_text": 1.4088, + "ppl": 4.8808, + "step": 7525 + }, + { + "epoch": 0.04, + "global_step": 7526, + "learning_rate": 0.000469424040066778, + "loss": 1.4412, + "loss_base2": 2.0792, + "loss_pixel": 0.1754, + "loss_text": 1.2657, + "ppl": 4.2258, + "step": 7526 + }, + { + "epoch": 0.04, + "global_step": 7527, + "learning_rate": 0.0004694198664440735, + "loss": 1.4667, + "loss_base2": 2.116, + "loss_pixel": 0.1761, + "loss_text": 1.2906, + "ppl": 4.3349, + "step": 7527 + }, + { + "epoch": 0.04, + "global_step": 7528, + "learning_rate": 0.000469415692821369, + "loss": 1.4484, + "loss_base2": 2.0896, + "loss_pixel": 0.1765, + "loss_text": 1.2719, + "ppl": 4.2563, + "step": 7528 + }, + { + "epoch": 0.04, + "global_step": 7529, + "learning_rate": 0.0004694115191986644, + "loss": 1.4554, + "loss_base2": 2.0997, + "loss_pixel": 0.177, + "loss_text": 1.2785, + "ppl": 4.2862, + "step": 7529 + }, + { + "epoch": 0.04, + "global_step": 7530, + "learning_rate": 0.0004694073455759599, + "loss": 1.4619, + "loss_base2": 2.1091, + "loss_pixel": 0.1751, + "loss_text": 1.2868, + "ppl": 4.3141, + "step": 7530 + }, + { + "epoch": 0.04, + "global_step": 7531, + "learning_rate": 0.0004694031719532554, + "loss": 1.4742, + "loss_base2": 2.1268, + "loss_pixel": 0.1767, + "loss_text": 1.2975, + "ppl": 4.3675, + "step": 7531 + }, + { + "epoch": 0.04, + "global_step": 7532, + "learning_rate": 0.0004693989983305509, + "loss": 1.4671, + "loss_base2": 2.1166, + "loss_pixel": 0.1753, + "loss_text": 1.2919, + "ppl": 4.3366, + "step": 7532 + }, + { + "epoch": 0.04, + "global_step": 7533, + "learning_rate": 0.00046939482470784643, + "loss": 1.4476, + "loss_base2": 2.0884, + "loss_pixel": 0.1775, + "loss_text": 1.27, + "ppl": 4.2529, + "step": 7533 + }, + { + "epoch": 0.04, + "global_step": 7534, + "learning_rate": 0.0004693906510851419, + "loss": 1.4512, + "loss_base2": 2.0936, + "loss_pixel": 0.1775, + "loss_text": 1.2737, + "ppl": 4.2682, + "step": 7534 + }, + { + "epoch": 0.04, + "global_step": 7535, + "learning_rate": 0.0004693864774624374, + "loss": 1.4656, + "loss_base2": 2.1144, + "loss_pixel": 0.1753, + "loss_text": 1.2903, + "ppl": 4.3301, + "step": 7535 + }, + { + "epoch": 0.04, + "global_step": 7536, + "learning_rate": 0.0004693823038397329, + "loss": 1.4382, + "loss_base2": 2.0749, + "loss_pixel": 0.1753, + "loss_text": 1.2629, + "ppl": 4.2131, + "step": 7536 + }, + { + "epoch": 0.04, + "global_step": 7537, + "learning_rate": 0.0004693781302170284, + "loss": 1.4365, + "loss_base2": 2.0724, + "loss_pixel": 0.1759, + "loss_text": 1.2607, + "ppl": 4.2059, + "step": 7537 + }, + { + "epoch": 0.04, + "global_step": 7538, + "learning_rate": 0.00046937395659432386, + "loss": 1.4459, + "loss_base2": 2.086, + "loss_pixel": 0.177, + "loss_text": 1.2689, + "ppl": 4.2457, + "step": 7538 + }, + { + "epoch": 0.04, + "global_step": 7539, + "learning_rate": 0.00046936978297161937, + "loss": 1.4318, + "loss_base2": 2.0657, + "loss_pixel": 0.1772, + "loss_text": 1.2546, + "ppl": 4.1862, + "step": 7539 + }, + { + "epoch": 0.04, + "global_step": 7540, + "learning_rate": 0.0004693656093489149, + "loss": 1.4317, + "loss_base2": 2.0655, + "loss_pixel": 0.1769, + "loss_text": 1.2548, + "ppl": 4.1858, + "step": 7540 + }, + { + "epoch": 0.04, + "global_step": 7541, + "learning_rate": 0.0004693614357262104, + "loss": 1.4378, + "loss_base2": 2.0743, + "loss_pixel": 0.1768, + "loss_text": 1.2611, + "ppl": 4.2114, + "step": 7541 + }, + { + "epoch": 0.04, + "global_step": 7542, + "learning_rate": 0.0004693572621035059, + "loss": 1.5245, + "loss_base2": 2.1994, + "loss_pixel": 0.177, + "loss_text": 1.3475, + "ppl": 4.5928, + "step": 7542 + }, + { + "epoch": 0.04, + "global_step": 7543, + "learning_rate": 0.00046935308848080134, + "loss": 1.6471, + "loss_base2": 2.3763, + "loss_pixel": 0.1763, + "loss_text": 1.4708, + "ppl": 5.1919, + "step": 7543 + }, + { + "epoch": 0.04, + "global_step": 7544, + "learning_rate": 0.00046934891485809685, + "loss": 1.6754, + "loss_base2": 2.4171, + "loss_pixel": 0.1765, + "loss_text": 1.4989, + "ppl": 5.3409, + "step": 7544 + }, + { + "epoch": 0.04, + "global_step": 7545, + "learning_rate": 0.00046934474123539236, + "loss": 1.6563, + "loss_base2": 2.3895, + "loss_pixel": 0.1759, + "loss_text": 1.4804, + "ppl": 5.2399, + "step": 7545 + }, + { + "epoch": 0.04, + "global_step": 7546, + "learning_rate": 0.00046934056761268787, + "loss": 1.6827, + "loss_base2": 2.4276, + "loss_pixel": 0.1778, + "loss_text": 1.505, + "ppl": 5.3801, + "step": 7546 + }, + { + "epoch": 0.04, + "global_step": 7547, + "learning_rate": 0.00046933639398998326, + "loss": 1.6785, + "loss_base2": 2.4216, + "loss_pixel": 0.1757, + "loss_text": 1.5027, + "ppl": 5.3575, + "step": 7547 + }, + { + "epoch": 0.04, + "global_step": 7548, + "learning_rate": 0.00046933222036727877, + "loss": 1.6818, + "loss_base2": 2.4263, + "loss_pixel": 0.1767, + "loss_text": 1.5051, + "ppl": 5.3752, + "step": 7548 + }, + { + "epoch": 0.04, + "global_step": 7549, + "learning_rate": 0.0004693280467445743, + "loss": 1.686, + "loss_base2": 2.4324, + "loss_pixel": 0.1767, + "loss_text": 1.5093, + "ppl": 5.3978, + "step": 7549 + }, + { + "epoch": 0.04, + "global_step": 7550, + "learning_rate": 0.0004693238731218698, + "loss": 1.67, + "loss_base2": 2.4093, + "loss_pixel": 0.1771, + "loss_text": 1.4928, + "ppl": 5.3122, + "step": 7550 + }, + { + "epoch": 0.04, + "global_step": 7551, + "learning_rate": 0.0004693196994991653, + "loss": 1.6721, + "loss_base2": 2.4123, + "loss_pixel": 0.1777, + "loss_text": 1.4945, + "ppl": 5.3233, + "step": 7551 + }, + { + "epoch": 0.04, + "global_step": 7552, + "learning_rate": 0.00046931552587646075, + "loss": 1.672, + "loss_base2": 2.4122, + "loss_pixel": 0.1774, + "loss_text": 1.4946, + "ppl": 5.3228, + "step": 7552 + }, + { + "epoch": 0.04, + "global_step": 7553, + "learning_rate": 0.00046931135225375625, + "loss": 1.6798, + "loss_base2": 2.4234, + "loss_pixel": 0.1753, + "loss_text": 1.5045, + "ppl": 5.3645, + "step": 7553 + }, + { + "epoch": 0.04, + "global_step": 7554, + "learning_rate": 0.00046930717863105176, + "loss": 1.6708, + "loss_base2": 2.4105, + "loss_pixel": 0.1763, + "loss_text": 1.4945, + "ppl": 5.3164, + "step": 7554 + }, + { + "epoch": 0.04, + "global_step": 7555, + "learning_rate": 0.00046930300500834727, + "loss": 1.6855, + "loss_base2": 2.4317, + "loss_pixel": 0.1772, + "loss_text": 1.5083, + "ppl": 5.3951, + "step": 7555 + }, + { + "epoch": 0.04, + "global_step": 7556, + "learning_rate": 0.0004692988313856427, + "loss": 1.6666, + "loss_base2": 2.4044, + "loss_pixel": 0.1753, + "loss_text": 1.4913, + "ppl": 5.2941, + "step": 7556 + }, + { + "epoch": 0.04, + "global_step": 7557, + "learning_rate": 0.00046929465776293823, + "loss": 1.6851, + "loss_base2": 2.4311, + "loss_pixel": 0.1757, + "loss_text": 1.5093, + "ppl": 5.393, + "step": 7557 + }, + { + "epoch": 0.04, + "global_step": 7558, + "learning_rate": 0.00046929048414023374, + "loss": 1.6724, + "loss_base2": 2.4128, + "loss_pixel": 0.1766, + "loss_text": 1.4958, + "ppl": 5.3249, + "step": 7558 + }, + { + "epoch": 0.04, + "global_step": 7559, + "learning_rate": 0.00046928631051752924, + "loss": 1.6904, + "loss_base2": 2.4387, + "loss_pixel": 0.1766, + "loss_text": 1.5137, + "ppl": 5.4216, + "step": 7559 + }, + { + "epoch": 0.04, + "global_step": 7560, + "learning_rate": 0.00046928213689482475, + "loss": 1.6755, + "loss_base2": 2.4172, + "loss_pixel": 0.1749, + "loss_text": 1.5005, + "ppl": 5.3415, + "step": 7560 + }, + { + "epoch": 0.04, + "global_step": 7561, + "learning_rate": 0.0004692779632721202, + "loss": 1.6789, + "loss_base2": 2.4221, + "loss_pixel": 0.1752, + "loss_text": 1.5037, + "ppl": 5.3597, + "step": 7561 + }, + { + "epoch": 0.04, + "global_step": 7562, + "learning_rate": 0.0004692737896494157, + "loss": 1.6717, + "loss_base2": 2.4118, + "loss_pixel": 0.1756, + "loss_text": 1.4961, + "ppl": 5.3212, + "step": 7562 + }, + { + "epoch": 0.04, + "global_step": 7563, + "learning_rate": 0.0004692696160267112, + "loss": 1.6566, + "loss_base2": 2.39, + "loss_pixel": 0.1786, + "loss_text": 1.4779, + "ppl": 5.2415, + "step": 7563 + }, + { + "epoch": 0.04, + "global_step": 7564, + "learning_rate": 0.0004692654424040067, + "loss": 1.6623, + "loss_base2": 2.3982, + "loss_pixel": 0.1755, + "loss_text": 1.4868, + "ppl": 5.2714, + "step": 7564 + }, + { + "epoch": 0.04, + "global_step": 7565, + "learning_rate": 0.0004692612687813022, + "loss": 1.6768, + "loss_base2": 2.4191, + "loss_pixel": 0.1777, + "loss_text": 1.499, + "ppl": 5.3484, + "step": 7565 + }, + { + "epoch": 0.04, + "global_step": 7566, + "learning_rate": 0.00046925709515859763, + "loss": 1.6673, + "loss_base2": 2.4054, + "loss_pixel": 0.1756, + "loss_text": 1.4916, + "ppl": 5.2978, + "step": 7566 + }, + { + "epoch": 0.04, + "global_step": 7567, + "learning_rate": 0.00046925292153589314, + "loss": 1.6887, + "loss_base2": 2.4363, + "loss_pixel": 0.175, + "loss_text": 1.5136, + "ppl": 5.4124, + "step": 7567 + }, + { + "epoch": 0.04, + "global_step": 7568, + "learning_rate": 0.00046924874791318865, + "loss": 1.6697, + "loss_base2": 2.4089, + "loss_pixel": 0.1747, + "loss_text": 1.4949, + "ppl": 5.3106, + "step": 7568 + }, + { + "epoch": 0.04, + "global_step": 7569, + "learning_rate": 0.00046924457429048415, + "loss": 1.6649, + "loss_base2": 2.4019, + "loss_pixel": 0.1761, + "loss_text": 1.4887, + "ppl": 5.2851, + "step": 7569 + }, + { + "epoch": 0.04, + "global_step": 7570, + "learning_rate": 0.0004692404006677796, + "loss": 1.6705, + "loss_base2": 2.41, + "loss_pixel": 0.1773, + "loss_text": 1.4932, + "ppl": 5.3148, + "step": 7570 + }, + { + "epoch": 0.04, + "global_step": 7571, + "learning_rate": 0.0004692362270450751, + "loss": 1.6745, + "loss_base2": 2.4158, + "loss_pixel": 0.1754, + "loss_text": 1.4992, + "ppl": 5.3361, + "step": 7571 + }, + { + "epoch": 0.04, + "global_step": 7572, + "learning_rate": 0.0004692320534223706, + "loss": 1.6923, + "loss_base2": 2.4415, + "loss_pixel": 0.1778, + "loss_text": 1.5145, + "ppl": 5.432, + "step": 7572 + }, + { + "epoch": 0.04, + "global_step": 7573, + "learning_rate": 0.00046922787979966613, + "loss": 1.6641, + "loss_base2": 2.4008, + "loss_pixel": 0.1764, + "loss_text": 1.4877, + "ppl": 5.2809, + "step": 7573 + }, + { + "epoch": 0.04, + "global_step": 7574, + "learning_rate": 0.00046922370617696164, + "loss": 1.6762, + "loss_base2": 2.4182, + "loss_pixel": 0.1762, + "loss_text": 1.5, + "ppl": 5.3452, + "step": 7574 + }, + { + "epoch": 0.04, + "global_step": 7575, + "learning_rate": 0.0004692195325542571, + "loss": 1.6691, + "loss_base2": 2.408, + "loss_pixel": 0.1779, + "loss_text": 1.4911, + "ppl": 5.3074, + "step": 7575 + }, + { + "epoch": 0.04, + "global_step": 7576, + "learning_rate": 0.0004692153589315526, + "loss": 1.6673, + "loss_base2": 2.4054, + "loss_pixel": 0.1761, + "loss_text": 1.4912, + "ppl": 5.2978, + "step": 7576 + }, + { + "epoch": 0.04, + "global_step": 7577, + "learning_rate": 0.0004692111853088481, + "loss": 1.6408, + "loss_base2": 2.3672, + "loss_pixel": 0.1747, + "loss_text": 1.4661, + "ppl": 5.1593, + "step": 7577 + }, + { + "epoch": 0.04, + "global_step": 7578, + "learning_rate": 0.0004692070116861436, + "loss": 1.6796, + "loss_base2": 2.4232, + "loss_pixel": 0.1756, + "loss_text": 1.504, + "ppl": 5.3634, + "step": 7578 + }, + { + "epoch": 0.04, + "global_step": 7579, + "learning_rate": 0.00046920283806343906, + "loss": 1.6772, + "loss_base2": 2.4197, + "loss_pixel": 0.1762, + "loss_text": 1.5009, + "ppl": 5.3506, + "step": 7579 + }, + { + "epoch": 0.04, + "global_step": 7580, + "learning_rate": 0.00046919866444073457, + "loss": 1.6628, + "loss_base2": 2.3989, + "loss_pixel": 0.176, + "loss_text": 1.4869, + "ppl": 5.2741, + "step": 7580 + }, + { + "epoch": 0.04, + "global_step": 7581, + "learning_rate": 0.0004691944908180301, + "loss": 1.6611, + "loss_base2": 2.3965, + "loss_pixel": 0.1768, + "loss_text": 1.4843, + "ppl": 5.2651, + "step": 7581 + }, + { + "epoch": 0.04, + "global_step": 7582, + "learning_rate": 0.0004691903171953256, + "loss": 1.6797, + "loss_base2": 2.4233, + "loss_pixel": 0.176, + "loss_text": 1.5037, + "ppl": 5.3639, + "step": 7582 + }, + { + "epoch": 0.04, + "global_step": 7583, + "learning_rate": 0.0004691861435726211, + "loss": 1.6455, + "loss_base2": 2.374, + "loss_pixel": 0.1751, + "loss_text": 1.4704, + "ppl": 5.1836, + "step": 7583 + }, + { + "epoch": 0.04, + "global_step": 7584, + "learning_rate": 0.00046918196994991655, + "loss": 1.6802, + "loss_base2": 2.424, + "loss_pixel": 0.176, + "loss_text": 1.5043, + "ppl": 5.3666, + "step": 7584 + }, + { + "epoch": 0.04, + "global_step": 7585, + "learning_rate": 0.000469177796327212, + "loss": 1.6693, + "loss_base2": 2.4083, + "loss_pixel": 0.1753, + "loss_text": 1.494, + "ppl": 5.3085, + "step": 7585 + }, + { + "epoch": 0.04, + "global_step": 7586, + "learning_rate": 0.0004691736227045075, + "loss": 1.6714, + "loss_base2": 2.4113, + "loss_pixel": 0.1762, + "loss_text": 1.4952, + "ppl": 5.3196, + "step": 7586 + }, + { + "epoch": 0.04, + "global_step": 7587, + "learning_rate": 0.000469169449081803, + "loss": 1.6659, + "loss_base2": 2.4034, + "loss_pixel": 0.1748, + "loss_text": 1.4911, + "ppl": 5.2904, + "step": 7587 + }, + { + "epoch": 0.04, + "global_step": 7588, + "learning_rate": 0.00046916527545909847, + "loss": 1.6659, + "loss_base2": 2.4034, + "loss_pixel": 0.1762, + "loss_text": 1.4897, + "ppl": 5.2904, + "step": 7588 + }, + { + "epoch": 0.04, + "global_step": 7589, + "learning_rate": 0.000469161101836394, + "loss": 1.6667, + "loss_base2": 2.4045, + "loss_pixel": 0.1739, + "loss_text": 1.4928, + "ppl": 5.2947, + "step": 7589 + }, + { + "epoch": 0.04, + "global_step": 7590, + "learning_rate": 0.0004691569282136895, + "loss": 1.5511, + "loss_base2": 2.2378, + "loss_pixel": 0.1756, + "loss_text": 1.3755, + "ppl": 4.7167, + "step": 7590 + }, + { + "epoch": 0.04, + "global_step": 7591, + "learning_rate": 0.000469152754590985, + "loss": 1.4563, + "loss_base2": 2.101, + "loss_pixel": 0.1776, + "loss_text": 1.2787, + "ppl": 4.2901, + "step": 7591 + }, + { + "epoch": 0.04, + "global_step": 7592, + "learning_rate": 0.0004691485809682805, + "loss": 1.4542, + "loss_base2": 2.098, + "loss_pixel": 0.1757, + "loss_text": 1.2785, + "ppl": 4.2811, + "step": 7592 + }, + { + "epoch": 0.04, + "global_step": 7593, + "learning_rate": 0.00046914440734557595, + "loss": 1.4409, + "loss_base2": 2.0788, + "loss_pixel": 0.1763, + "loss_text": 1.2646, + "ppl": 4.2245, + "step": 7593 + }, + { + "epoch": 0.04, + "global_step": 7594, + "learning_rate": 0.00046914023372287146, + "loss": 1.4564, + "loss_base2": 2.1011, + "loss_pixel": 0.1761, + "loss_text": 1.2802, + "ppl": 4.2905, + "step": 7594 + }, + { + "epoch": 0.04, + "global_step": 7595, + "learning_rate": 0.00046913606010016697, + "loss": 1.4563, + "loss_base2": 2.101, + "loss_pixel": 0.1774, + "loss_text": 1.2788, + "ppl": 4.2901, + "step": 7595 + }, + { + "epoch": 0.04, + "global_step": 7596, + "learning_rate": 0.00046913188647746247, + "loss": 1.4528, + "loss_base2": 2.0959, + "loss_pixel": 0.1756, + "loss_text": 1.2772, + "ppl": 4.2751, + "step": 7596 + }, + { + "epoch": 0.04, + "global_step": 7597, + "learning_rate": 0.0004691277128547579, + "loss": 1.4537, + "loss_base2": 2.0972, + "loss_pixel": 0.1751, + "loss_text": 1.2786, + "ppl": 4.2789, + "step": 7597 + }, + { + "epoch": 0.04, + "global_step": 7598, + "learning_rate": 0.00046912353923205343, + "loss": 1.6988, + "loss_base2": 2.4509, + "loss_pixel": 0.1763, + "loss_text": 1.5226, + "ppl": 5.4674, + "step": 7598 + }, + { + "epoch": 0.04, + "global_step": 7599, + "learning_rate": 0.00046911936560934894, + "loss": 1.6892, + "loss_base2": 2.437, + "loss_pixel": 0.1749, + "loss_text": 1.5143, + "ppl": 5.4151, + "step": 7599 + }, + { + "epoch": 0.04, + "global_step": 7600, + "learning_rate": 0.00046911519198664445, + "loss": 1.6873, + "loss_base2": 2.4343, + "loss_pixel": 0.1767, + "loss_text": 1.5105, + "ppl": 5.4049, + "step": 7600 + }, + { + "epoch": 0.04, + "global_step": 7601, + "learning_rate": 0.00046911101836393995, + "loss": 1.6911, + "loss_base2": 2.4397, + "loss_pixel": 0.1777, + "loss_text": 1.5134, + "ppl": 5.4254, + "step": 7601 + }, + { + "epoch": 0.04, + "global_step": 7602, + "learning_rate": 0.0004691068447412354, + "loss": 1.6935, + "loss_base2": 2.4432, + "loss_pixel": 0.1756, + "loss_text": 1.5178, + "ppl": 5.4385, + "step": 7602 + }, + { + "epoch": 0.04, + "global_step": 7603, + "learning_rate": 0.0004691026711185309, + "loss": 1.6868, + "loss_base2": 2.4335, + "loss_pixel": 0.176, + "loss_text": 1.5108, + "ppl": 5.4022, + "step": 7603 + }, + { + "epoch": 0.04, + "global_step": 7604, + "learning_rate": 0.00046909849749582637, + "loss": 1.6666, + "loss_base2": 2.4044, + "loss_pixel": 0.1777, + "loss_text": 1.4889, + "ppl": 5.2941, + "step": 7604 + }, + { + "epoch": 0.04, + "global_step": 7605, + "learning_rate": 0.0004690943238731219, + "loss": 1.6852, + "loss_base2": 2.4312, + "loss_pixel": 0.1752, + "loss_text": 1.51, + "ppl": 5.3935, + "step": 7605 + }, + { + "epoch": 0.04, + "global_step": 7606, + "learning_rate": 0.00046909015025041733, + "loss": 1.6807, + "loss_base2": 2.4247, + "loss_pixel": 0.1748, + "loss_text": 1.5059, + "ppl": 5.3693, + "step": 7606 + }, + { + "epoch": 0.04, + "global_step": 7607, + "learning_rate": 0.00046908597662771284, + "loss": 1.6888, + "loss_base2": 2.4364, + "loss_pixel": 0.1765, + "loss_text": 1.5123, + "ppl": 5.413, + "step": 7607 + }, + { + "epoch": 0.04, + "global_step": 7608, + "learning_rate": 0.00046908180300500834, + "loss": 1.6673, + "loss_base2": 2.4054, + "loss_pixel": 0.1749, + "loss_text": 1.4924, + "ppl": 5.2978, + "step": 7608 + }, + { + "epoch": 0.04, + "global_step": 7609, + "learning_rate": 0.00046907762938230385, + "loss": 1.6891, + "loss_base2": 2.4369, + "loss_pixel": 0.1748, + "loss_text": 1.5142, + "ppl": 5.4146, + "step": 7609 + }, + { + "epoch": 0.04, + "global_step": 7610, + "learning_rate": 0.00046907345575959936, + "loss": 1.6819, + "loss_base2": 2.4265, + "loss_pixel": 0.1764, + "loss_text": 1.5056, + "ppl": 5.3758, + "step": 7610 + }, + { + "epoch": 0.04, + "global_step": 7611, + "learning_rate": 0.0004690692821368948, + "loss": 1.6749, + "loss_base2": 2.4164, + "loss_pixel": 0.1747, + "loss_text": 1.5003, + "ppl": 5.3383, + "step": 7611 + }, + { + "epoch": 0.04, + "global_step": 7612, + "learning_rate": 0.0004690651085141903, + "loss": 1.6579, + "loss_base2": 2.3918, + "loss_pixel": 0.1749, + "loss_text": 1.483, + "ppl": 5.2483, + "step": 7612 + }, + { + "epoch": 0.04, + "global_step": 7613, + "learning_rate": 0.0004690609348914858, + "loss": 1.6716, + "loss_base2": 2.4116, + "loss_pixel": 0.1751, + "loss_text": 1.4965, + "ppl": 5.3207, + "step": 7613 + }, + { + "epoch": 0.04, + "global_step": 7614, + "learning_rate": 0.00046905676126878133, + "loss": 1.6641, + "loss_base2": 2.4008, + "loss_pixel": 0.1751, + "loss_text": 1.489, + "ppl": 5.2809, + "step": 7614 + }, + { + "epoch": 0.04, + "global_step": 7615, + "learning_rate": 0.0004690525876460768, + "loss": 1.67, + "loss_base2": 2.4093, + "loss_pixel": 0.1757, + "loss_text": 1.4942, + "ppl": 5.3122, + "step": 7615 + }, + { + "epoch": 0.04, + "global_step": 7616, + "learning_rate": 0.0004690484140233723, + "loss": 1.6826, + "loss_base2": 2.4275, + "loss_pixel": 0.1767, + "loss_text": 1.5059, + "ppl": 5.3795, + "step": 7616 + }, + { + "epoch": 0.04, + "global_step": 7617, + "learning_rate": 0.0004690442404006678, + "loss": 1.67, + "loss_base2": 2.4093, + "loss_pixel": 0.1739, + "loss_text": 1.4961, + "ppl": 5.3122, + "step": 7617 + }, + { + "epoch": 0.04, + "global_step": 7618, + "learning_rate": 0.0004690400667779633, + "loss": 1.6709, + "loss_base2": 2.4106, + "loss_pixel": 0.1766, + "loss_text": 1.4944, + "ppl": 5.317, + "step": 7618 + }, + { + "epoch": 0.04, + "global_step": 7619, + "learning_rate": 0.0004690358931552588, + "loss": 1.6077, + "loss_base2": 2.3194, + "loss_pixel": 0.1757, + "loss_text": 1.4319, + "ppl": 4.9913, + "step": 7619 + }, + { + "epoch": 0.04, + "global_step": 7620, + "learning_rate": 0.00046903171953255427, + "loss": 1.6782, + "loss_base2": 2.4211, + "loss_pixel": 0.1755, + "loss_text": 1.5027, + "ppl": 5.3559, + "step": 7620 + }, + { + "epoch": 0.04, + "global_step": 7621, + "learning_rate": 0.0004690275459098498, + "loss": 1.6848, + "loss_base2": 2.4307, + "loss_pixel": 0.1773, + "loss_text": 1.5075, + "ppl": 5.3914, + "step": 7621 + }, + { + "epoch": 0.04, + "global_step": 7622, + "learning_rate": 0.00046902337228714523, + "loss": 1.6601, + "loss_base2": 2.395, + "loss_pixel": 0.1762, + "loss_text": 1.4839, + "ppl": 5.2598, + "step": 7622 + }, + { + "epoch": 0.04, + "global_step": 7623, + "learning_rate": 0.00046901919866444074, + "loss": 1.6619, + "loss_base2": 2.3976, + "loss_pixel": 0.1746, + "loss_text": 1.4874, + "ppl": 5.2693, + "step": 7623 + }, + { + "epoch": 0.04, + "global_step": 7624, + "learning_rate": 0.0004690150250417362, + "loss": 1.6853, + "loss_base2": 2.4314, + "loss_pixel": 0.1754, + "loss_text": 1.5099, + "ppl": 5.3941, + "step": 7624 + }, + { + "epoch": 0.04, + "global_step": 7625, + "learning_rate": 0.0004690108514190317, + "loss": 1.6625, + "loss_base2": 2.3985, + "loss_pixel": 0.1753, + "loss_text": 1.4872, + "ppl": 5.2725, + "step": 7625 + }, + { + "epoch": 0.04, + "global_step": 7626, + "learning_rate": 0.0004690066777963272, + "loss": 1.667, + "loss_base2": 2.405, + "loss_pixel": 0.175, + "loss_text": 1.492, + "ppl": 5.2963, + "step": 7626 + }, + { + "epoch": 0.04, + "global_step": 7627, + "learning_rate": 0.0004690025041736227, + "loss": 1.6717, + "loss_base2": 2.4118, + "loss_pixel": 0.1755, + "loss_text": 1.4961, + "ppl": 5.3212, + "step": 7627 + }, + { + "epoch": 0.04, + "global_step": 7628, + "learning_rate": 0.0004689983305509182, + "loss": 1.6506, + "loss_base2": 2.3813, + "loss_pixel": 0.1758, + "loss_text": 1.4749, + "ppl": 5.2101, + "step": 7628 + }, + { + "epoch": 0.04, + "global_step": 7629, + "learning_rate": 0.00046899415692821367, + "loss": 1.6573, + "loss_base2": 2.391, + "loss_pixel": 0.1753, + "loss_text": 1.482, + "ppl": 5.2451, + "step": 7629 + }, + { + "epoch": 0.04, + "global_step": 7630, + "learning_rate": 0.0004689899833055092, + "loss": 1.6784, + "loss_base2": 2.4214, + "loss_pixel": 0.1747, + "loss_text": 1.5037, + "ppl": 5.357, + "step": 7630 + }, + { + "epoch": 0.04, + "global_step": 7631, + "learning_rate": 0.0004689858096828047, + "loss": 1.6462, + "loss_base2": 2.375, + "loss_pixel": 0.1749, + "loss_text": 1.4712, + "ppl": 5.1872, + "step": 7631 + }, + { + "epoch": 0.04, + "global_step": 7632, + "learning_rate": 0.0004689816360601002, + "loss": 1.6675, + "loss_base2": 2.4057, + "loss_pixel": 0.1747, + "loss_text": 1.4928, + "ppl": 5.2989, + "step": 7632 + }, + { + "epoch": 0.04, + "global_step": 7633, + "learning_rate": 0.0004689774624373957, + "loss": 1.6587, + "loss_base2": 2.393, + "loss_pixel": 0.1761, + "loss_text": 1.4826, + "ppl": 5.2525, + "step": 7633 + }, + { + "epoch": 0.04, + "global_step": 7634, + "learning_rate": 0.00046897328881469115, + "loss": 1.6633, + "loss_base2": 2.3996, + "loss_pixel": 0.1754, + "loss_text": 1.4879, + "ppl": 5.2767, + "step": 7634 + }, + { + "epoch": 0.04, + "global_step": 7635, + "learning_rate": 0.00046896911519198666, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.1753, + "loss_text": 1.4928, + "ppl": 5.3021, + "step": 7635 + }, + { + "epoch": 0.04, + "global_step": 7636, + "learning_rate": 0.00046896494156928217, + "loss": 1.6674, + "loss_base2": 2.4055, + "loss_pixel": 0.1735, + "loss_text": 1.494, + "ppl": 5.2984, + "step": 7636 + }, + { + "epoch": 0.04, + "global_step": 7637, + "learning_rate": 0.0004689607679465777, + "loss": 1.6771, + "loss_base2": 2.4195, + "loss_pixel": 0.176, + "loss_text": 1.5011, + "ppl": 5.35, + "step": 7637 + }, + { + "epoch": 0.04, + "global_step": 7638, + "learning_rate": 0.00046895659432387313, + "loss": 1.6729, + "loss_base2": 2.4135, + "loss_pixel": 0.1758, + "loss_text": 1.497, + "ppl": 5.3276, + "step": 7638 + }, + { + "epoch": 0.04, + "global_step": 7639, + "learning_rate": 0.00046895242070116864, + "loss": 1.6639, + "loss_base2": 2.4005, + "loss_pixel": 0.1762, + "loss_text": 1.4878, + "ppl": 5.2799, + "step": 7639 + }, + { + "epoch": 0.04, + "global_step": 7640, + "learning_rate": 0.00046894824707846414, + "loss": 1.6578, + "loss_base2": 2.3917, + "loss_pixel": 0.1763, + "loss_text": 1.4815, + "ppl": 5.2478, + "step": 7640 + }, + { + "epoch": 0.04, + "global_step": 7641, + "learning_rate": 0.0004689440734557596, + "loss": 1.5309, + "loss_base2": 2.2086, + "loss_pixel": 0.1765, + "loss_text": 1.3543, + "ppl": 4.6223, + "step": 7641 + }, + { + "epoch": 0.04, + "global_step": 7642, + "learning_rate": 0.0004689398998330551, + "loss": 1.4652, + "loss_base2": 2.1138, + "loss_pixel": 0.1755, + "loss_text": 1.2897, + "ppl": 4.3284, + "step": 7642 + }, + { + "epoch": 0.04, + "global_step": 7643, + "learning_rate": 0.00046893572621035056, + "loss": 1.442, + "loss_base2": 2.0804, + "loss_pixel": 0.1752, + "loss_text": 1.2668, + "ppl": 4.2291, + "step": 7643 + }, + { + "epoch": 0.04, + "global_step": 7644, + "learning_rate": 0.00046893155258764606, + "loss": 1.4564, + "loss_base2": 2.1011, + "loss_pixel": 0.1751, + "loss_text": 1.2812, + "ppl": 4.2905, + "step": 7644 + }, + { + "epoch": 0.04, + "global_step": 7645, + "learning_rate": 0.00046892737896494157, + "loss": 1.4483, + "loss_base2": 2.0895, + "loss_pixel": 0.1761, + "loss_text": 1.2722, + "ppl": 4.2559, + "step": 7645 + }, + { + "epoch": 0.04, + "global_step": 7646, + "learning_rate": 0.0004689232053422371, + "loss": 1.4624, + "loss_base2": 2.1098, + "loss_pixel": 0.1765, + "loss_text": 1.286, + "ppl": 4.3163, + "step": 7646 + }, + { + "epoch": 0.04, + "global_step": 7647, + "learning_rate": 0.00046891903171953253, + "loss": 1.4484, + "loss_base2": 2.0896, + "loss_pixel": 0.176, + "loss_text": 1.2725, + "ppl": 4.2563, + "step": 7647 + }, + { + "epoch": 0.04, + "global_step": 7648, + "learning_rate": 0.00046891485809682804, + "loss": 1.4547, + "loss_base2": 2.0987, + "loss_pixel": 0.1757, + "loss_text": 1.279, + "ppl": 4.2832, + "step": 7648 + }, + { + "epoch": 0.04, + "global_step": 7649, + "learning_rate": 0.00046891068447412355, + "loss": 1.484, + "loss_base2": 2.141, + "loss_pixel": 0.1781, + "loss_text": 1.3059, + "ppl": 4.4106, + "step": 7649 + }, + { + "epoch": 0.04, + "global_step": 7650, + "learning_rate": 0.00046890651085141905, + "loss": 1.5796, + "loss_base2": 2.2789, + "loss_pixel": 0.1769, + "loss_text": 1.4026, + "ppl": 4.853, + "step": 7650 + }, + { + "epoch": 0.04, + "global_step": 7651, + "learning_rate": 0.00046890233722871456, + "loss": 1.426, + "loss_base2": 2.0573, + "loss_pixel": 0.1763, + "loss_text": 1.2496, + "ppl": 4.162, + "step": 7651 + }, + { + "epoch": 0.04, + "global_step": 7652, + "learning_rate": 0.00046889816360601, + "loss": 1.4304, + "loss_base2": 2.0636, + "loss_pixel": 0.1748, + "loss_text": 1.2556, + "ppl": 4.1804, + "step": 7652 + }, + { + "epoch": 0.04, + "global_step": 7653, + "learning_rate": 0.0004688939899833055, + "loss": 1.448, + "loss_base2": 2.089, + "loss_pixel": 0.1759, + "loss_text": 1.2721, + "ppl": 4.2546, + "step": 7653 + }, + { + "epoch": 0.04, + "global_step": 7654, + "learning_rate": 0.00046888981636060103, + "loss": 1.4579, + "loss_base2": 2.1033, + "loss_pixel": 0.1743, + "loss_text": 1.2836, + "ppl": 4.2969, + "step": 7654 + }, + { + "epoch": 0.04, + "global_step": 7655, + "learning_rate": 0.00046888564273789654, + "loss": 1.4477, + "loss_base2": 2.0886, + "loss_pixel": 0.1762, + "loss_text": 1.2715, + "ppl": 4.2533, + "step": 7655 + }, + { + "epoch": 0.04, + "global_step": 7656, + "learning_rate": 0.000468881469115192, + "loss": 1.4319, + "loss_base2": 2.0658, + "loss_pixel": 0.1747, + "loss_text": 1.2573, + "ppl": 4.1866, + "step": 7656 + }, + { + "epoch": 0.04, + "global_step": 7657, + "learning_rate": 0.0004688772954924875, + "loss": 1.4363, + "loss_base2": 2.0721, + "loss_pixel": 0.1755, + "loss_text": 1.2608, + "ppl": 4.2051, + "step": 7657 + }, + { + "epoch": 0.04, + "global_step": 7658, + "learning_rate": 0.000468873121869783, + "loss": 1.4705, + "loss_base2": 2.1215, + "loss_pixel": 0.1763, + "loss_text": 1.2942, + "ppl": 4.3514, + "step": 7658 + }, + { + "epoch": 0.04, + "global_step": 7659, + "learning_rate": 0.0004688689482470785, + "loss": 1.5281, + "loss_base2": 2.2046, + "loss_pixel": 0.1753, + "loss_text": 1.3528, + "ppl": 4.6094, + "step": 7659 + }, + { + "epoch": 0.04, + "global_step": 7660, + "learning_rate": 0.00046886477462437397, + "loss": 1.6591, + "loss_base2": 2.3936, + "loss_pixel": 0.174, + "loss_text": 1.4851, + "ppl": 5.2546, + "step": 7660 + }, + { + "epoch": 0.04, + "global_step": 7661, + "learning_rate": 0.0004688606010016694, + "loss": 1.6827, + "loss_base2": 2.4276, + "loss_pixel": 0.1745, + "loss_text": 1.5082, + "ppl": 5.3801, + "step": 7661 + }, + { + "epoch": 0.04, + "global_step": 7662, + "learning_rate": 0.0004688564273789649, + "loss": 1.7022, + "loss_base2": 2.4558, + "loss_pixel": 0.1751, + "loss_text": 1.5271, + "ppl": 5.486, + "step": 7662 + }, + { + "epoch": 0.04, + "global_step": 7663, + "learning_rate": 0.00046885225375626043, + "loss": 1.6807, + "loss_base2": 2.4247, + "loss_pixel": 0.1746, + "loss_text": 1.5061, + "ppl": 5.3693, + "step": 7663 + }, + { + "epoch": 0.04, + "global_step": 7664, + "learning_rate": 0.00046884808013355594, + "loss": 1.6801, + "loss_base2": 2.4239, + "loss_pixel": 0.1759, + "loss_text": 1.5042, + "ppl": 5.3661, + "step": 7664 + }, + { + "epoch": 0.04, + "global_step": 7665, + "learning_rate": 0.0004688439065108514, + "loss": 1.6808, + "loss_base2": 2.4249, + "loss_pixel": 0.1763, + "loss_text": 1.5044, + "ppl": 5.3699, + "step": 7665 + }, + { + "epoch": 0.04, + "global_step": 7666, + "learning_rate": 0.0004688397328881469, + "loss": 1.6708, + "loss_base2": 2.4105, + "loss_pixel": 0.1759, + "loss_text": 1.4949, + "ppl": 5.3164, + "step": 7666 + }, + { + "epoch": 0.04, + "global_step": 7667, + "learning_rate": 0.0004688355592654424, + "loss": 1.7064, + "loss_base2": 2.4618, + "loss_pixel": 0.1752, + "loss_text": 1.5312, + "ppl": 5.5091, + "step": 7667 + }, + { + "epoch": 0.04, + "global_step": 7668, + "learning_rate": 0.0004688313856427379, + "loss": 1.6777, + "loss_base2": 2.4204, + "loss_pixel": 0.1748, + "loss_text": 1.5029, + "ppl": 5.3532, + "step": 7668 + }, + { + "epoch": 0.04, + "global_step": 7669, + "learning_rate": 0.0004688272120200334, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.1761, + "loss_text": 1.4921, + "ppl": 5.3021, + "step": 7669 + }, + { + "epoch": 0.04, + "global_step": 7670, + "learning_rate": 0.0004688230383973289, + "loss": 1.6818, + "loss_base2": 2.4263, + "loss_pixel": 0.1742, + "loss_text": 1.5076, + "ppl": 5.3752, + "step": 7670 + }, + { + "epoch": 0.04, + "global_step": 7671, + "learning_rate": 0.0004688188647746244, + "loss": 1.6865, + "loss_base2": 2.4331, + "loss_pixel": 0.1746, + "loss_text": 1.5119, + "ppl": 5.4005, + "step": 7671 + }, + { + "epoch": 0.04, + "global_step": 7672, + "learning_rate": 0.0004688146911519199, + "loss": 1.6849, + "loss_base2": 2.4308, + "loss_pixel": 0.1754, + "loss_text": 1.5094, + "ppl": 5.3919, + "step": 7672 + }, + { + "epoch": 0.04, + "global_step": 7673, + "learning_rate": 0.0004688105175292154, + "loss": 1.6805, + "loss_base2": 2.4244, + "loss_pixel": 0.1763, + "loss_text": 1.5042, + "ppl": 5.3682, + "step": 7673 + }, + { + "epoch": 0.04, + "global_step": 7674, + "learning_rate": 0.00046880634390651085, + "loss": 1.6793, + "loss_base2": 2.4227, + "loss_pixel": 0.1747, + "loss_text": 1.5046, + "ppl": 5.3618, + "step": 7674 + }, + { + "epoch": 0.04, + "global_step": 7675, + "learning_rate": 0.00046880217028380636, + "loss": 1.6753, + "loss_base2": 2.4169, + "loss_pixel": 0.1759, + "loss_text": 1.4994, + "ppl": 5.3404, + "step": 7675 + }, + { + "epoch": 0.04, + "global_step": 7676, + "learning_rate": 0.00046879799666110187, + "loss": 1.6845, + "loss_base2": 2.4302, + "loss_pixel": 0.1757, + "loss_text": 1.5088, + "ppl": 5.3898, + "step": 7676 + }, + { + "epoch": 0.04, + "global_step": 7677, + "learning_rate": 0.00046879382303839737, + "loss": 1.6635, + "loss_base2": 2.3999, + "loss_pixel": 0.176, + "loss_text": 1.4875, + "ppl": 5.2778, + "step": 7677 + }, + { + "epoch": 0.04, + "global_step": 7678, + "learning_rate": 0.0004687896494156929, + "loss": 1.6904, + "loss_base2": 2.4387, + "loss_pixel": 0.1823, + "loss_text": 1.5082, + "ppl": 5.4216, + "step": 7678 + }, + { + "epoch": 0.04, + "global_step": 7679, + "learning_rate": 0.0004687854757929883, + "loss": 1.6966, + "loss_base2": 2.4477, + "loss_pixel": 0.1832, + "loss_text": 1.5134, + "ppl": 5.4554, + "step": 7679 + }, + { + "epoch": 0.04, + "global_step": 7680, + "learning_rate": 0.0004687813021702838, + "loss": 1.6627, + "loss_base2": 2.3988, + "loss_pixel": 0.1835, + "loss_text": 1.4791, + "ppl": 5.2735, + "step": 7680 + }, + { + "epoch": 0.04, + "global_step": 7681, + "learning_rate": 0.0004687771285475793, + "loss": 1.6761, + "loss_base2": 2.4181, + "loss_pixel": 0.1833, + "loss_text": 1.4927, + "ppl": 5.3447, + "step": 7681 + }, + { + "epoch": 0.04, + "global_step": 7682, + "learning_rate": 0.0004687729549248748, + "loss": 1.6765, + "loss_base2": 2.4187, + "loss_pixel": 0.1827, + "loss_text": 1.4938, + "ppl": 5.3468, + "step": 7682 + }, + { + "epoch": 0.04, + "global_step": 7683, + "learning_rate": 0.00046876878130217025, + "loss": 1.6104, + "loss_base2": 2.3233, + "loss_pixel": 0.1779, + "loss_text": 1.4325, + "ppl": 5.0048, + "step": 7683 + }, + { + "epoch": 0.04, + "global_step": 7684, + "learning_rate": 0.00046876460767946576, + "loss": 1.4617, + "loss_base2": 2.1088, + "loss_pixel": 0.175, + "loss_text": 1.2867, + "ppl": 4.3133, + "step": 7684 + }, + { + "epoch": 0.04, + "global_step": 7685, + "learning_rate": 0.00046876043405676127, + "loss": 1.4416, + "loss_base2": 2.0798, + "loss_pixel": 0.1758, + "loss_text": 1.2658, + "ppl": 4.2275, + "step": 7685 + }, + { + "epoch": 0.04, + "global_step": 7686, + "learning_rate": 0.0004687562604340568, + "loss": 1.443, + "loss_base2": 2.0818, + "loss_pixel": 0.1756, + "loss_text": 1.2674, + "ppl": 4.2334, + "step": 7686 + }, + { + "epoch": 0.04, + "global_step": 7687, + "learning_rate": 0.0004687520868113523, + "loss": 1.4765, + "loss_base2": 2.1301, + "loss_pixel": 0.1758, + "loss_text": 1.3008, + "ppl": 4.3776, + "step": 7687 + }, + { + "epoch": 0.04, + "global_step": 7688, + "learning_rate": 0.00046874791318864774, + "loss": 1.4563, + "loss_base2": 2.101, + "loss_pixel": 0.1741, + "loss_text": 1.2823, + "ppl": 4.2901, + "step": 7688 + }, + { + "epoch": 0.04, + "global_step": 7689, + "learning_rate": 0.00046874373956594324, + "loss": 1.443, + "loss_base2": 2.0818, + "loss_pixel": 0.1765, + "loss_text": 1.2665, + "ppl": 4.2334, + "step": 7689 + }, + { + "epoch": 0.04, + "global_step": 7690, + "learning_rate": 0.00046873956594323875, + "loss": 1.4709, + "loss_base2": 2.1221, + "loss_pixel": 0.1792, + "loss_text": 1.2917, + "ppl": 4.3532, + "step": 7690 + }, + { + "epoch": 0.04, + "global_step": 7691, + "learning_rate": 0.00046873539232053426, + "loss": 1.4566, + "loss_base2": 2.1014, + "loss_pixel": 0.1776, + "loss_text": 1.2789, + "ppl": 4.2913, + "step": 7691 + }, + { + "epoch": 0.04, + "global_step": 7692, + "learning_rate": 0.00046873121869782977, + "loss": 1.4336, + "loss_base2": 2.0682, + "loss_pixel": 0.1764, + "loss_text": 1.2572, + "ppl": 4.1938, + "step": 7692 + }, + { + "epoch": 0.04, + "global_step": 7693, + "learning_rate": 0.0004687270450751252, + "loss": 1.4387, + "loss_base2": 2.0756, + "loss_pixel": 0.1754, + "loss_text": 1.2633, + "ppl": 4.2152, + "step": 7693 + }, + { + "epoch": 0.04, + "global_step": 7694, + "learning_rate": 0.0004687228714524207, + "loss": 1.4349, + "loss_base2": 2.0701, + "loss_pixel": 0.1775, + "loss_text": 1.2574, + "ppl": 4.1992, + "step": 7694 + }, + { + "epoch": 0.04, + "global_step": 7695, + "learning_rate": 0.00046871869782971623, + "loss": 1.4493, + "loss_base2": 2.0909, + "loss_pixel": 0.1753, + "loss_text": 1.274, + "ppl": 4.2601, + "step": 7695 + }, + { + "epoch": 0.04, + "global_step": 7696, + "learning_rate": 0.00046871452420701174, + "loss": 1.4475, + "loss_base2": 2.0883, + "loss_pixel": 0.1771, + "loss_text": 1.2704, + "ppl": 4.2525, + "step": 7696 + }, + { + "epoch": 0.04, + "global_step": 7697, + "learning_rate": 0.00046871035058430714, + "loss": 1.4568, + "loss_base2": 2.1017, + "loss_pixel": 0.1751, + "loss_text": 1.2817, + "ppl": 4.2922, + "step": 7697 + }, + { + "epoch": 0.04, + "global_step": 7698, + "learning_rate": 0.00046870617696160265, + "loss": 1.4407, + "loss_base2": 2.0785, + "loss_pixel": 0.1748, + "loss_text": 1.2659, + "ppl": 4.2237, + "step": 7698 + }, + { + "epoch": 0.04, + "global_step": 7699, + "learning_rate": 0.00046870200333889815, + "loss": 1.4527, + "loss_base2": 2.0958, + "loss_pixel": 0.1759, + "loss_text": 1.2767, + "ppl": 4.2746, + "step": 7699 + }, + { + "epoch": 0.04, + "global_step": 7700, + "learning_rate": 0.00046869782971619366, + "loss": 1.4455, + "loss_base2": 2.0854, + "loss_pixel": 0.1756, + "loss_text": 1.2699, + "ppl": 4.244, + "step": 7700 + }, + { + "epoch": 0.04, + "global_step": 7701, + "learning_rate": 0.00046869365609348917, + "loss": 1.5977, + "loss_base2": 2.305, + "loss_pixel": 0.1758, + "loss_text": 1.4219, + "ppl": 4.9417, + "step": 7701 + }, + { + "epoch": 0.04, + "global_step": 7702, + "learning_rate": 0.0004686894824707846, + "loss": 1.7084, + "loss_base2": 2.4647, + "loss_pixel": 0.1759, + "loss_text": 1.5325, + "ppl": 5.5201, + "step": 7702 + }, + { + "epoch": 0.04, + "global_step": 7703, + "learning_rate": 0.00046868530884808013, + "loss": 1.7078, + "loss_base2": 2.4638, + "loss_pixel": 0.1764, + "loss_text": 1.5315, + "ppl": 5.5168, + "step": 7703 + }, + { + "epoch": 0.04, + "global_step": 7704, + "learning_rate": 0.00046868113522537564, + "loss": 1.6791, + "loss_base2": 2.4224, + "loss_pixel": 0.1752, + "loss_text": 1.5038, + "ppl": 5.3607, + "step": 7704 + }, + { + "epoch": 0.04, + "global_step": 7705, + "learning_rate": 0.00046867696160267114, + "loss": 1.6746, + "loss_base2": 2.4159, + "loss_pixel": 0.1754, + "loss_text": 1.4993, + "ppl": 5.3367, + "step": 7705 + }, + { + "epoch": 0.04, + "global_step": 7706, + "learning_rate": 0.0004686727879799666, + "loss": 1.6869, + "loss_base2": 2.4337, + "loss_pixel": 0.1755, + "loss_text": 1.5114, + "ppl": 5.4027, + "step": 7706 + }, + { + "epoch": 0.04, + "global_step": 7707, + "learning_rate": 0.0004686686143572621, + "loss": 1.6817, + "loss_base2": 2.4262, + "loss_pixel": 0.1751, + "loss_text": 1.5066, + "ppl": 5.3747, + "step": 7707 + }, + { + "epoch": 0.04, + "global_step": 7708, + "learning_rate": 0.0004686644407345576, + "loss": 1.6946, + "loss_base2": 2.4448, + "loss_pixel": 0.1754, + "loss_text": 1.5192, + "ppl": 5.4445, + "step": 7708 + }, + { + "epoch": 0.04, + "global_step": 7709, + "learning_rate": 0.0004686602671118531, + "loss": 1.6939, + "loss_base2": 2.4438, + "loss_pixel": 0.1762, + "loss_text": 1.5178, + "ppl": 5.4407, + "step": 7709 + }, + { + "epoch": 0.04, + "global_step": 7710, + "learning_rate": 0.0004686560934891486, + "loss": 1.6757, + "loss_base2": 2.4175, + "loss_pixel": 0.1754, + "loss_text": 1.5003, + "ppl": 5.3425, + "step": 7710 + }, + { + "epoch": 0.04, + "global_step": 7711, + "learning_rate": 0.0004686519198664441, + "loss": 1.6762, + "loss_base2": 2.4182, + "loss_pixel": 0.1746, + "loss_text": 1.5016, + "ppl": 5.3452, + "step": 7711 + }, + { + "epoch": 0.04, + "global_step": 7712, + "learning_rate": 0.0004686477462437396, + "loss": 1.6862, + "loss_base2": 2.4327, + "loss_pixel": 0.1767, + "loss_text": 1.5095, + "ppl": 5.3989, + "step": 7712 + }, + { + "epoch": 0.04, + "global_step": 7713, + "learning_rate": 0.0004686435726210351, + "loss": 1.6424, + "loss_base2": 2.3695, + "loss_pixel": 0.1756, + "loss_text": 1.4668, + "ppl": 5.1676, + "step": 7713 + }, + { + "epoch": 0.04, + "global_step": 7714, + "learning_rate": 0.0004686393989983306, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.1747, + "loss_text": 1.4934, + "ppl": 5.3021, + "step": 7714 + }, + { + "epoch": 0.04, + "global_step": 7715, + "learning_rate": 0.00046863522537562605, + "loss": 1.6929, + "loss_base2": 2.4423, + "loss_pixel": 0.1758, + "loss_text": 1.5171, + "ppl": 5.4352, + "step": 7715 + }, + { + "epoch": 0.04, + "global_step": 7716, + "learning_rate": 0.0004686310517529215, + "loss": 1.6623, + "loss_base2": 2.3982, + "loss_pixel": 0.1744, + "loss_text": 1.4879, + "ppl": 5.2714, + "step": 7716 + }, + { + "epoch": 0.04, + "global_step": 7717, + "learning_rate": 0.000468626878130217, + "loss": 1.6734, + "loss_base2": 2.4142, + "loss_pixel": 0.1743, + "loss_text": 1.4991, + "ppl": 5.3303, + "step": 7717 + }, + { + "epoch": 0.04, + "global_step": 7718, + "learning_rate": 0.0004686227045075125, + "loss": 1.6752, + "loss_base2": 2.4168, + "loss_pixel": 0.1744, + "loss_text": 1.5009, + "ppl": 5.3399, + "step": 7718 + }, + { + "epoch": 0.04, + "global_step": 7719, + "learning_rate": 0.00046861853088480803, + "loss": 1.6676, + "loss_base2": 2.4058, + "loss_pixel": 0.1749, + "loss_text": 1.4928, + "ppl": 5.2994, + "step": 7719 + }, + { + "epoch": 0.04, + "global_step": 7720, + "learning_rate": 0.0004686143572621035, + "loss": 1.6548, + "loss_base2": 2.3874, + "loss_pixel": 0.1746, + "loss_text": 1.4802, + "ppl": 5.232, + "step": 7720 + }, + { + "epoch": 0.04, + "global_step": 7721, + "learning_rate": 0.000468610183639399, + "loss": 1.6662, + "loss_base2": 2.4038, + "loss_pixel": 0.1751, + "loss_text": 1.4912, + "ppl": 5.292, + "step": 7721 + }, + { + "epoch": 0.04, + "global_step": 7722, + "learning_rate": 0.0004686060100166945, + "loss": 1.674, + "loss_base2": 2.4151, + "loss_pixel": 0.1763, + "loss_text": 1.4977, + "ppl": 5.3335, + "step": 7722 + }, + { + "epoch": 0.04, + "global_step": 7723, + "learning_rate": 0.00046860183639399, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.1752, + "loss_text": 1.493, + "ppl": 5.3021, + "step": 7723 + }, + { + "epoch": 0.04, + "global_step": 7724, + "learning_rate": 0.00046859766277128546, + "loss": 1.6885, + "loss_base2": 2.436, + "loss_pixel": 0.1748, + "loss_text": 1.5138, + "ppl": 5.4114, + "step": 7724 + }, + { + "epoch": 0.04, + "global_step": 7725, + "learning_rate": 0.00046859348914858097, + "loss": 1.6773, + "loss_base2": 2.4198, + "loss_pixel": 0.1736, + "loss_text": 1.5037, + "ppl": 5.3511, + "step": 7725 + }, + { + "epoch": 0.04, + "global_step": 7726, + "learning_rate": 0.00046858931552587647, + "loss": 1.6571, + "loss_base2": 2.3907, + "loss_pixel": 0.1747, + "loss_text": 1.4825, + "ppl": 5.2441, + "step": 7726 + }, + { + "epoch": 0.04, + "global_step": 7727, + "learning_rate": 0.000468585141903172, + "loss": 1.6458, + "loss_base2": 2.3744, + "loss_pixel": 0.1755, + "loss_text": 1.4703, + "ppl": 5.1852, + "step": 7727 + }, + { + "epoch": 0.04, + "global_step": 7728, + "learning_rate": 0.0004685809682804675, + "loss": 1.6615, + "loss_base2": 2.397, + "loss_pixel": 0.1764, + "loss_text": 1.4852, + "ppl": 5.2672, + "step": 7728 + }, + { + "epoch": 0.04, + "global_step": 7729, + "learning_rate": 0.00046857679465776294, + "loss": 1.6642, + "loss_base2": 2.4009, + "loss_pixel": 0.1766, + "loss_text": 1.4876, + "ppl": 5.2814, + "step": 7729 + }, + { + "epoch": 0.04, + "global_step": 7730, + "learning_rate": 0.00046857262103505845, + "loss": 1.6642, + "loss_base2": 2.4009, + "loss_pixel": 0.1774, + "loss_text": 1.4867, + "ppl": 5.2814, + "step": 7730 + }, + { + "epoch": 0.04, + "global_step": 7731, + "learning_rate": 0.00046856844741235395, + "loss": 1.6734, + "loss_base2": 2.4142, + "loss_pixel": 0.1746, + "loss_text": 1.4988, + "ppl": 5.3303, + "step": 7731 + }, + { + "epoch": 0.04, + "global_step": 7732, + "learning_rate": 0.00046856427378964946, + "loss": 1.6913, + "loss_base2": 2.44, + "loss_pixel": 0.176, + "loss_text": 1.5153, + "ppl": 5.4265, + "step": 7732 + }, + { + "epoch": 0.04, + "global_step": 7733, + "learning_rate": 0.0004685601001669449, + "loss": 1.6599, + "loss_base2": 2.3947, + "loss_pixel": 0.1755, + "loss_text": 1.4844, + "ppl": 5.2588, + "step": 7733 + }, + { + "epoch": 0.04, + "global_step": 7734, + "learning_rate": 0.0004685559265442404, + "loss": 1.6303, + "loss_base2": 2.352, + "loss_pixel": 0.1763, + "loss_text": 1.454, + "ppl": 5.1054, + "step": 7734 + }, + { + "epoch": 0.04, + "global_step": 7735, + "learning_rate": 0.0004685517529215359, + "loss": 1.6862, + "loss_base2": 2.4327, + "loss_pixel": 0.175, + "loss_text": 1.5113, + "ppl": 5.3989, + "step": 7735 + }, + { + "epoch": 0.04, + "global_step": 7736, + "learning_rate": 0.0004685475792988314, + "loss": 1.6859, + "loss_base2": 2.4322, + "loss_pixel": 0.1757, + "loss_text": 1.5102, + "ppl": 5.3973, + "step": 7736 + }, + { + "epoch": 0.04, + "global_step": 7737, + "learning_rate": 0.0004685434056761269, + "loss": 1.6644, + "loss_base2": 2.4012, + "loss_pixel": 0.1751, + "loss_text": 1.4893, + "ppl": 5.2825, + "step": 7737 + }, + { + "epoch": 0.04, + "global_step": 7738, + "learning_rate": 0.00046853923205342234, + "loss": 1.6743, + "loss_base2": 2.4155, + "loss_pixel": 0.1737, + "loss_text": 1.5005, + "ppl": 5.3351, + "step": 7738 + }, + { + "epoch": 0.04, + "global_step": 7739, + "learning_rate": 0.00046853505843071785, + "loss": 1.671, + "loss_base2": 2.4107, + "loss_pixel": 0.1772, + "loss_text": 1.4938, + "ppl": 5.3175, + "step": 7739 + }, + { + "epoch": 0.04, + "global_step": 7740, + "learning_rate": 0.00046853088480801336, + "loss": 1.6641, + "loss_base2": 2.4008, + "loss_pixel": 0.1738, + "loss_text": 1.4903, + "ppl": 5.2809, + "step": 7740 + }, + { + "epoch": 0.04, + "global_step": 7741, + "learning_rate": 0.00046852671118530887, + "loss": 1.6738, + "loss_base2": 2.4148, + "loss_pixel": 0.1741, + "loss_text": 1.4996, + "ppl": 5.3324, + "step": 7741 + }, + { + "epoch": 0.04, + "global_step": 7742, + "learning_rate": 0.0004685225375626043, + "loss": 1.6553, + "loss_base2": 2.3881, + "loss_pixel": 0.1754, + "loss_text": 1.4798, + "ppl": 5.2347, + "step": 7742 + }, + { + "epoch": 0.04, + "global_step": 7743, + "learning_rate": 0.0004685183639398998, + "loss": 1.6675, + "loss_base2": 2.4057, + "loss_pixel": 0.1746, + "loss_text": 1.4929, + "ppl": 5.2989, + "step": 7743 + }, + { + "epoch": 0.04, + "global_step": 7744, + "learning_rate": 0.00046851419031719533, + "loss": 1.6693, + "loss_base2": 2.4083, + "loss_pixel": 0.1755, + "loss_text": 1.4939, + "ppl": 5.3085, + "step": 7744 + }, + { + "epoch": 0.04, + "global_step": 7745, + "learning_rate": 0.00046851001669449084, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.1756, + "loss_text": 1.4508, + "ppl": 5.0855, + "step": 7745 + }, + { + "epoch": 0.04, + "global_step": 7746, + "learning_rate": 0.00046850584307178635, + "loss": 1.6606, + "loss_base2": 2.3957, + "loss_pixel": 0.1796, + "loss_text": 1.4811, + "ppl": 5.2625, + "step": 7746 + }, + { + "epoch": 0.04, + "global_step": 7747, + "learning_rate": 0.0004685016694490818, + "loss": 1.667, + "loss_base2": 2.405, + "loss_pixel": 0.1815, + "loss_text": 1.4855, + "ppl": 5.2963, + "step": 7747 + }, + { + "epoch": 0.04, + "global_step": 7748, + "learning_rate": 0.0004684974958263773, + "loss": 1.6881, + "loss_base2": 2.4354, + "loss_pixel": 0.1821, + "loss_text": 1.5059, + "ppl": 5.4092, + "step": 7748 + }, + { + "epoch": 0.04, + "global_step": 7749, + "learning_rate": 0.0004684933222036728, + "loss": 1.6558, + "loss_base2": 2.3888, + "loss_pixel": 0.1759, + "loss_text": 1.4799, + "ppl": 5.2373, + "step": 7749 + }, + { + "epoch": 0.04, + "global_step": 7750, + "learning_rate": 0.0004684891485809683, + "loss": 1.6704, + "loss_base2": 2.4099, + "loss_pixel": 0.1717, + "loss_text": 1.4987, + "ppl": 5.3143, + "step": 7750 + }, + { + "epoch": 0.04, + "global_step": 7751, + "learning_rate": 0.00046848497495826383, + "loss": 1.6551, + "loss_base2": 2.3878, + "loss_pixel": 0.1713, + "loss_text": 1.4839, + "ppl": 5.2336, + "step": 7751 + }, + { + "epoch": 0.04, + "global_step": 7752, + "learning_rate": 0.0004684808013355593, + "loss": 1.6722, + "loss_base2": 2.4125, + "loss_pixel": 0.1728, + "loss_text": 1.4994, + "ppl": 5.3239, + "step": 7752 + }, + { + "epoch": 0.04, + "global_step": 7753, + "learning_rate": 0.0004684766277128548, + "loss": 1.6619, + "loss_base2": 2.3976, + "loss_pixel": 0.1714, + "loss_text": 1.4905, + "ppl": 5.2693, + "step": 7753 + }, + { + "epoch": 0.04, + "global_step": 7754, + "learning_rate": 0.00046847245409015024, + "loss": 1.6569, + "loss_base2": 2.3904, + "loss_pixel": 0.1726, + "loss_text": 1.4842, + "ppl": 5.243, + "step": 7754 + }, + { + "epoch": 0.04, + "global_step": 7755, + "learning_rate": 0.00046846828046744575, + "loss": 1.6497, + "loss_base2": 2.38, + "loss_pixel": 0.1683, + "loss_text": 1.4814, + "ppl": 5.2054, + "step": 7755 + }, + { + "epoch": 0.04, + "global_step": 7756, + "learning_rate": 0.0004684641068447412, + "loss": 1.6404, + "loss_base2": 2.3666, + "loss_pixel": 0.1717, + "loss_text": 1.4686, + "ppl": 5.1572, + "step": 7756 + }, + { + "epoch": 0.04, + "global_step": 7757, + "learning_rate": 0.0004684599332220367, + "loss": 1.6541, + "loss_base2": 2.3864, + "loss_pixel": 0.1703, + "loss_text": 1.4838, + "ppl": 5.2284, + "step": 7757 + }, + { + "epoch": 0.04, + "global_step": 7758, + "learning_rate": 0.0004684557595993322, + "loss": 1.6686, + "loss_base2": 2.4073, + "loss_pixel": 0.1715, + "loss_text": 1.4971, + "ppl": 5.3047, + "step": 7758 + }, + { + "epoch": 0.04, + "global_step": 7759, + "learning_rate": 0.0004684515859766277, + "loss": 1.6447, + "loss_base2": 2.3728, + "loss_pixel": 0.1685, + "loss_text": 1.4761, + "ppl": 5.1795, + "step": 7759 + }, + { + "epoch": 0.04, + "global_step": 7760, + "learning_rate": 0.00046844741235392323, + "loss": 1.6749, + "loss_base2": 2.4164, + "loss_pixel": 0.1707, + "loss_text": 1.5042, + "ppl": 5.3383, + "step": 7760 + }, + { + "epoch": 0.04, + "global_step": 7761, + "learning_rate": 0.0004684432387312187, + "loss": 1.6718, + "loss_base2": 2.4119, + "loss_pixel": 0.1715, + "loss_text": 1.5002, + "ppl": 5.3217, + "step": 7761 + }, + { + "epoch": 0.04, + "global_step": 7762, + "learning_rate": 0.0004684390651085142, + "loss": 1.6587, + "loss_base2": 2.393, + "loss_pixel": 0.1721, + "loss_text": 1.4866, + "ppl": 5.2525, + "step": 7762 + }, + { + "epoch": 0.04, + "global_step": 7763, + "learning_rate": 0.0004684348914858097, + "loss": 1.6615, + "loss_base2": 2.397, + "loss_pixel": 0.1705, + "loss_text": 1.491, + "ppl": 5.2672, + "step": 7763 + }, + { + "epoch": 0.04, + "global_step": 7764, + "learning_rate": 0.0004684307178631052, + "loss": 1.6752, + "loss_base2": 2.4168, + "loss_pixel": 0.17, + "loss_text": 1.5053, + "ppl": 5.3399, + "step": 7764 + }, + { + "epoch": 0.04, + "global_step": 7765, + "learning_rate": 0.00046842654424040066, + "loss": 1.6667, + "loss_base2": 2.4045, + "loss_pixel": 0.1696, + "loss_text": 1.4971, + "ppl": 5.2947, + "step": 7765 + }, + { + "epoch": 0.04, + "global_step": 7766, + "learning_rate": 0.00046842237061769617, + "loss": 1.6458, + "loss_base2": 2.3744, + "loss_pixel": 0.1714, + "loss_text": 1.4744, + "ppl": 5.1852, + "step": 7766 + }, + { + "epoch": 0.04, + "global_step": 7767, + "learning_rate": 0.0004684181969949917, + "loss": 1.6705, + "loss_base2": 2.41, + "loss_pixel": 0.1783, + "loss_text": 1.4922, + "ppl": 5.3148, + "step": 7767 + }, + { + "epoch": 0.04, + "global_step": 7768, + "learning_rate": 0.0004684140233722872, + "loss": 1.6722, + "loss_base2": 2.4125, + "loss_pixel": 0.1788, + "loss_text": 1.4934, + "ppl": 5.3239, + "step": 7768 + }, + { + "epoch": 0.04, + "global_step": 7769, + "learning_rate": 0.0004684098497495827, + "loss": 1.6473, + "loss_base2": 2.3766, + "loss_pixel": 0.1778, + "loss_text": 1.4695, + "ppl": 5.1929, + "step": 7769 + }, + { + "epoch": 0.04, + "global_step": 7770, + "learning_rate": 0.00046840567612687814, + "loss": 1.6021, + "loss_base2": 2.3113, + "loss_pixel": 0.1756, + "loss_text": 1.4265, + "ppl": 4.9634, + "step": 7770 + }, + { + "epoch": 0.04, + "global_step": 7771, + "learning_rate": 0.00046840150250417365, + "loss": 1.6612, + "loss_base2": 2.3966, + "loss_pixel": 0.1772, + "loss_text": 1.484, + "ppl": 5.2656, + "step": 7771 + }, + { + "epoch": 0.04, + "global_step": 7772, + "learning_rate": 0.0004683973288814691, + "loss": 1.6628, + "loss_base2": 2.3989, + "loss_pixel": 0.1763, + "loss_text": 1.4865, + "ppl": 5.2741, + "step": 7772 + }, + { + "epoch": 0.04, + "global_step": 7773, + "learning_rate": 0.0004683931552587646, + "loss": 1.6482, + "loss_base2": 2.3778, + "loss_pixel": 0.1767, + "loss_text": 1.4715, + "ppl": 5.1976, + "step": 7773 + }, + { + "epoch": 0.04, + "global_step": 7774, + "learning_rate": 0.00046838898163606006, + "loss": 1.6647, + "loss_base2": 2.4017, + "loss_pixel": 0.1783, + "loss_text": 1.4864, + "ppl": 5.2841, + "step": 7774 + }, + { + "epoch": 0.04, + "global_step": 7775, + "learning_rate": 0.00046838480801335557, + "loss": 1.6635, + "loss_base2": 2.3999, + "loss_pixel": 0.1756, + "loss_text": 1.488, + "ppl": 5.2778, + "step": 7775 + }, + { + "epoch": 0.04, + "global_step": 7776, + "learning_rate": 0.0004683806343906511, + "loss": 1.6709, + "loss_base2": 2.4106, + "loss_pixel": 0.1771, + "loss_text": 1.4937, + "ppl": 5.317, + "step": 7776 + }, + { + "epoch": 0.04, + "global_step": 7777, + "learning_rate": 0.0004683764607679466, + "loss": 1.6705, + "loss_base2": 2.41, + "loss_pixel": 0.1763, + "loss_text": 1.4942, + "ppl": 5.3148, + "step": 7777 + }, + { + "epoch": 0.04, + "global_step": 7778, + "learning_rate": 0.0004683722871452421, + "loss": 1.6694, + "loss_base2": 2.4084, + "loss_pixel": 0.1765, + "loss_text": 1.4929, + "ppl": 5.309, + "step": 7778 + }, + { + "epoch": 0.04, + "global_step": 7779, + "learning_rate": 0.00046836811352253755, + "loss": 1.6748, + "loss_base2": 2.4162, + "loss_pixel": 0.1755, + "loss_text": 1.4993, + "ppl": 5.3377, + "step": 7779 + }, + { + "epoch": 0.04, + "global_step": 7780, + "learning_rate": 0.00046836393989983305, + "loss": 1.6634, + "loss_base2": 2.3998, + "loss_pixel": 0.1749, + "loss_text": 1.4885, + "ppl": 5.2772, + "step": 7780 + }, + { + "epoch": 0.04, + "global_step": 7781, + "learning_rate": 0.00046835976627712856, + "loss": 1.6759, + "loss_base2": 2.4178, + "loss_pixel": 0.1754, + "loss_text": 1.5005, + "ppl": 5.3436, + "step": 7781 + }, + { + "epoch": 0.04, + "global_step": 7782, + "learning_rate": 0.00046835559265442407, + "loss": 1.6672, + "loss_base2": 2.4053, + "loss_pixel": 0.1756, + "loss_text": 1.4916, + "ppl": 5.2973, + "step": 7782 + }, + { + "epoch": 0.04, + "global_step": 7783, + "learning_rate": 0.0004683514190317195, + "loss": 1.6814, + "loss_base2": 2.4257, + "loss_pixel": 0.1749, + "loss_text": 1.5065, + "ppl": 5.3731, + "step": 7783 + }, + { + "epoch": 0.04, + "global_step": 7784, + "learning_rate": 0.00046834724540901503, + "loss": 1.668, + "loss_base2": 2.4064, + "loss_pixel": 0.1764, + "loss_text": 1.4916, + "ppl": 5.3016, + "step": 7784 + }, + { + "epoch": 0.04, + "global_step": 7785, + "learning_rate": 0.00046834307178631054, + "loss": 1.6622, + "loss_base2": 2.398, + "loss_pixel": 0.175, + "loss_text": 1.4872, + "ppl": 5.2709, + "step": 7785 + }, + { + "epoch": 0.04, + "global_step": 7786, + "learning_rate": 0.00046833889816360604, + "loss": 1.6718, + "loss_base2": 2.4119, + "loss_pixel": 0.1755, + "loss_text": 1.4963, + "ppl": 5.3217, + "step": 7786 + }, + { + "epoch": 0.04, + "global_step": 7787, + "learning_rate": 0.00046833472454090155, + "loss": 1.6831, + "loss_base2": 2.4282, + "loss_pixel": 0.1741, + "loss_text": 1.509, + "ppl": 5.3822, + "step": 7787 + }, + { + "epoch": 0.04, + "global_step": 7788, + "learning_rate": 0.000468330550918197, + "loss": 1.673, + "loss_base2": 2.4136, + "loss_pixel": 0.1748, + "loss_text": 1.4982, + "ppl": 5.3281, + "step": 7788 + }, + { + "epoch": 0.04, + "global_step": 7789, + "learning_rate": 0.0004683263772954925, + "loss": 1.6885, + "loss_base2": 2.436, + "loss_pixel": 0.1765, + "loss_text": 1.512, + "ppl": 5.4114, + "step": 7789 + }, + { + "epoch": 0.04, + "global_step": 7790, + "learning_rate": 0.000468322203672788, + "loss": 1.6707, + "loss_base2": 2.4103, + "loss_pixel": 0.1753, + "loss_text": 1.4953, + "ppl": 5.3159, + "step": 7790 + }, + { + "epoch": 0.04, + "global_step": 7791, + "learning_rate": 0.00046831803005008347, + "loss": 1.6622, + "loss_base2": 2.398, + "loss_pixel": 0.1748, + "loss_text": 1.4874, + "ppl": 5.2709, + "step": 7791 + }, + { + "epoch": 0.04, + "global_step": 7792, + "learning_rate": 0.0004683138564273789, + "loss": 1.6593, + "loss_base2": 2.3939, + "loss_pixel": 0.1743, + "loss_text": 1.485, + "ppl": 5.2556, + "step": 7792 + }, + { + "epoch": 0.04, + "global_step": 7793, + "learning_rate": 0.00046830968280467443, + "loss": 1.6618, + "loss_base2": 2.3975, + "loss_pixel": 0.1746, + "loss_text": 1.4872, + "ppl": 5.2688, + "step": 7793 + }, + { + "epoch": 0.04, + "global_step": 7794, + "learning_rate": 0.00046830550918196994, + "loss": 1.6592, + "loss_base2": 2.3937, + "loss_pixel": 0.1747, + "loss_text": 1.4846, + "ppl": 5.2551, + "step": 7794 + }, + { + "epoch": 0.04, + "global_step": 7795, + "learning_rate": 0.00046830133555926545, + "loss": 1.6746, + "loss_base2": 2.4159, + "loss_pixel": 0.1748, + "loss_text": 1.4998, + "ppl": 5.3367, + "step": 7795 + }, + { + "epoch": 0.04, + "global_step": 7796, + "learning_rate": 0.00046829716193656095, + "loss": 1.6685, + "loss_base2": 2.4071, + "loss_pixel": 0.1737, + "loss_text": 1.4948, + "ppl": 5.3042, + "step": 7796 + }, + { + "epoch": 0.04, + "global_step": 7797, + "learning_rate": 0.0004682929883138564, + "loss": 1.6359, + "loss_base2": 2.3601, + "loss_pixel": 0.1737, + "loss_text": 1.4622, + "ppl": 5.1341, + "step": 7797 + }, + { + "epoch": 0.04, + "global_step": 7798, + "learning_rate": 0.0004682888146911519, + "loss": 1.6862, + "loss_base2": 2.4327, + "loss_pixel": 0.1733, + "loss_text": 1.5128, + "ppl": 5.3989, + "step": 7798 + }, + { + "epoch": 0.04, + "global_step": 7799, + "learning_rate": 0.0004682846410684474, + "loss": 1.648, + "loss_base2": 2.3776, + "loss_pixel": 0.1749, + "loss_text": 1.4731, + "ppl": 5.1966, + "step": 7799 + }, + { + "epoch": 0.04, + "global_step": 7800, + "learning_rate": 0.00046828046744574293, + "loss": 1.6781, + "loss_base2": 2.421, + "loss_pixel": 0.1744, + "loss_text": 1.5036, + "ppl": 5.3554, + "step": 7800 + }, + { + "epoch": 0.04, + "global_step": 7801, + "learning_rate": 0.0004682762938230384, + "loss": 1.6559, + "loss_base2": 2.389, + "loss_pixel": 0.1749, + "loss_text": 1.481, + "ppl": 5.2378, + "step": 7801 + }, + { + "epoch": 0.04, + "global_step": 7802, + "learning_rate": 0.0004682721202003339, + "loss": 1.6663, + "loss_base2": 2.404, + "loss_pixel": 0.1743, + "loss_text": 1.4921, + "ppl": 5.2925, + "step": 7802 + }, + { + "epoch": 0.04, + "global_step": 7803, + "learning_rate": 0.0004682679465776294, + "loss": 1.6582, + "loss_base2": 2.3923, + "loss_pixel": 0.1739, + "loss_text": 1.4843, + "ppl": 5.2499, + "step": 7803 + }, + { + "epoch": 0.04, + "global_step": 7804, + "learning_rate": 0.0004682637729549249, + "loss": 1.6705, + "loss_base2": 2.41, + "loss_pixel": 0.1759, + "loss_text": 1.4946, + "ppl": 5.3148, + "step": 7804 + }, + { + "epoch": 0.04, + "global_step": 7805, + "learning_rate": 0.0004682595993322204, + "loss": 1.6622, + "loss_base2": 2.398, + "loss_pixel": 0.174, + "loss_text": 1.4882, + "ppl": 5.2709, + "step": 7805 + }, + { + "epoch": 0.04, + "global_step": 7806, + "learning_rate": 0.00046825542570951587, + "loss": 1.669, + "loss_base2": 2.4079, + "loss_pixel": 0.1745, + "loss_text": 1.4945, + "ppl": 5.3069, + "step": 7806 + }, + { + "epoch": 0.04, + "global_step": 7807, + "learning_rate": 0.00046825125208681137, + "loss": 1.6502, + "loss_base2": 2.3807, + "loss_pixel": 0.1752, + "loss_text": 1.4751, + "ppl": 5.208, + "step": 7807 + }, + { + "epoch": 0.04, + "global_step": 7808, + "learning_rate": 0.0004682470784641069, + "loss": 1.6471, + "loss_base2": 2.3763, + "loss_pixel": 0.1747, + "loss_text": 1.4724, + "ppl": 5.1919, + "step": 7808 + }, + { + "epoch": 0.04, + "global_step": 7809, + "learning_rate": 0.0004682429048414024, + "loss": 1.6627, + "loss_base2": 2.3988, + "loss_pixel": 0.1752, + "loss_text": 1.4875, + "ppl": 5.2735, + "step": 7809 + }, + { + "epoch": 0.04, + "global_step": 7810, + "learning_rate": 0.00046823873121869784, + "loss": 1.6595, + "loss_base2": 2.3942, + "loss_pixel": 0.177, + "loss_text": 1.4825, + "ppl": 5.2567, + "step": 7810 + }, + { + "epoch": 0.04, + "global_step": 7811, + "learning_rate": 0.0004682345575959933, + "loss": 1.6691, + "loss_base2": 2.408, + "loss_pixel": 0.1782, + "loss_text": 1.4909, + "ppl": 5.3074, + "step": 7811 + }, + { + "epoch": 0.04, + "global_step": 7812, + "learning_rate": 0.0004682303839732888, + "loss": 1.6675, + "loss_base2": 2.4057, + "loss_pixel": 0.1771, + "loss_text": 1.4904, + "ppl": 5.2989, + "step": 7812 + }, + { + "epoch": 0.04, + "global_step": 7813, + "learning_rate": 0.0004682262103505843, + "loss": 1.6748, + "loss_base2": 2.4162, + "loss_pixel": 0.1787, + "loss_text": 1.496, + "ppl": 5.3377, + "step": 7813 + }, + { + "epoch": 0.04, + "global_step": 7814, + "learning_rate": 0.0004682220367278798, + "loss": 1.6828, + "loss_base2": 2.4278, + "loss_pixel": 0.179, + "loss_text": 1.5038, + "ppl": 5.3806, + "step": 7814 + }, + { + "epoch": 0.04, + "global_step": 7815, + "learning_rate": 0.00046821786310517527, + "loss": 1.6623, + "loss_base2": 2.3982, + "loss_pixel": 0.1786, + "loss_text": 1.4837, + "ppl": 5.2714, + "step": 7815 + }, + { + "epoch": 0.04, + "global_step": 7816, + "learning_rate": 0.0004682136894824708, + "loss": 1.6587, + "loss_base2": 2.393, + "loss_pixel": 0.1791, + "loss_text": 1.4796, + "ppl": 5.2525, + "step": 7816 + }, + { + "epoch": 0.04, + "global_step": 7817, + "learning_rate": 0.0004682095158597663, + "loss": 1.492, + "loss_base2": 2.1525, + "loss_pixel": 0.1779, + "loss_text": 1.3141, + "ppl": 4.446, + "step": 7817 + }, + { + "epoch": 0.04, + "global_step": 7818, + "learning_rate": 0.0004682053422370618, + "loss": 1.4527, + "loss_base2": 2.0958, + "loss_pixel": 0.1778, + "loss_text": 1.2749, + "ppl": 4.2746, + "step": 7818 + }, + { + "epoch": 0.04, + "global_step": 7819, + "learning_rate": 0.0004682011686143573, + "loss": 1.4702, + "loss_base2": 2.1211, + "loss_pixel": 0.1787, + "loss_text": 1.2915, + "ppl": 4.3501, + "step": 7819 + }, + { + "epoch": 0.04, + "global_step": 7820, + "learning_rate": 0.00046819699499165275, + "loss": 1.4465, + "loss_base2": 2.0869, + "loss_pixel": 0.1781, + "loss_text": 1.2684, + "ppl": 4.2482, + "step": 7820 + }, + { + "epoch": 0.04, + "global_step": 7821, + "learning_rate": 0.00046819282136894826, + "loss": 1.4339, + "loss_base2": 2.0687, + "loss_pixel": 0.1778, + "loss_text": 1.2561, + "ppl": 4.195, + "step": 7821 + }, + { + "epoch": 0.04, + "global_step": 7822, + "learning_rate": 0.00046818864774624377, + "loss": 1.4418, + "loss_base2": 2.0801, + "loss_pixel": 0.1774, + "loss_text": 1.2644, + "ppl": 4.2283, + "step": 7822 + }, + { + "epoch": 0.04, + "global_step": 7823, + "learning_rate": 0.00046818447412353927, + "loss": 1.4725, + "loss_base2": 2.1244, + "loss_pixel": 0.1787, + "loss_text": 1.2938, + "ppl": 4.3601, + "step": 7823 + }, + { + "epoch": 0.04, + "global_step": 7824, + "learning_rate": 0.0004681803005008347, + "loss": 1.4486, + "loss_base2": 2.0899, + "loss_pixel": 0.177, + "loss_text": 1.2715, + "ppl": 4.2572, + "step": 7824 + }, + { + "epoch": 0.04, + "global_step": 7825, + "learning_rate": 0.00046817612687813023, + "loss": 1.6794, + "loss_base2": 2.4229, + "loss_pixel": 0.177, + "loss_text": 1.5024, + "ppl": 5.3623, + "step": 7825 + }, + { + "epoch": 0.04, + "global_step": 7826, + "learning_rate": 0.00046817195325542574, + "loss": 1.7099, + "loss_base2": 2.4669, + "loss_pixel": 0.1808, + "loss_text": 1.5291, + "ppl": 5.5284, + "step": 7826 + }, + { + "epoch": 0.04, + "global_step": 7827, + "learning_rate": 0.00046816777963272125, + "loss": 1.6935, + "loss_base2": 2.4432, + "loss_pixel": 0.18, + "loss_text": 1.5135, + "ppl": 5.4385, + "step": 7827 + }, + { + "epoch": 0.04, + "global_step": 7828, + "learning_rate": 0.00046816360601001676, + "loss": 1.7077, + "loss_base2": 2.4637, + "loss_pixel": 0.1778, + "loss_text": 1.5299, + "ppl": 5.5163, + "step": 7828 + }, + { + "epoch": 0.04, + "global_step": 7829, + "learning_rate": 0.00046815943238731215, + "loss": 1.6714, + "loss_base2": 2.4113, + "loss_pixel": 0.1776, + "loss_text": 1.4938, + "ppl": 5.3196, + "step": 7829 + }, + { + "epoch": 0.04, + "global_step": 7830, + "learning_rate": 0.00046815525876460766, + "loss": 1.668, + "loss_base2": 2.4064, + "loss_pixel": 0.1781, + "loss_text": 1.4898, + "ppl": 5.3016, + "step": 7830 + }, + { + "epoch": 0.04, + "global_step": 7831, + "learning_rate": 0.00046815108514190317, + "loss": 1.677, + "loss_base2": 2.4194, + "loss_pixel": 0.1778, + "loss_text": 1.4992, + "ppl": 5.3495, + "step": 7831 + }, + { + "epoch": 0.04, + "global_step": 7832, + "learning_rate": 0.0004681469115191987, + "loss": 1.6757, + "loss_base2": 2.4175, + "loss_pixel": 0.1765, + "loss_text": 1.4991, + "ppl": 5.3425, + "step": 7832 + }, + { + "epoch": 0.04, + "global_step": 7833, + "learning_rate": 0.00046814273789649413, + "loss": 1.6836, + "loss_base2": 2.4289, + "loss_pixel": 0.1759, + "loss_text": 1.5076, + "ppl": 5.3849, + "step": 7833 + }, + { + "epoch": 0.04, + "global_step": 7834, + "learning_rate": 0.00046813856427378964, + "loss": 1.6699, + "loss_base2": 2.4092, + "loss_pixel": 0.1741, + "loss_text": 1.4958, + "ppl": 5.3116, + "step": 7834 + }, + { + "epoch": 0.04, + "global_step": 7835, + "learning_rate": 0.00046813439065108514, + "loss": 1.661, + "loss_base2": 2.3963, + "loss_pixel": 0.1727, + "loss_text": 1.4883, + "ppl": 5.2646, + "step": 7835 + }, + { + "epoch": 0.04, + "global_step": 7836, + "learning_rate": 0.00046813021702838065, + "loss": 1.6824, + "loss_base2": 2.4272, + "loss_pixel": 0.1752, + "loss_text": 1.5072, + "ppl": 5.3784, + "step": 7836 + }, + { + "epoch": 0.04, + "global_step": 7837, + "learning_rate": 0.00046812604340567616, + "loss": 1.6717, + "loss_base2": 2.4118, + "loss_pixel": 0.1731, + "loss_text": 1.4986, + "ppl": 5.3212, + "step": 7837 + }, + { + "epoch": 0.04, + "global_step": 7838, + "learning_rate": 0.0004681218697829716, + "loss": 1.6672, + "loss_base2": 2.4053, + "loss_pixel": 0.1725, + "loss_text": 1.4947, + "ppl": 5.2973, + "step": 7838 + }, + { + "epoch": 0.04, + "global_step": 7839, + "learning_rate": 0.0004681176961602671, + "loss": 1.6558, + "loss_base2": 2.3888, + "loss_pixel": 0.1696, + "loss_text": 1.4863, + "ppl": 5.2373, + "step": 7839 + }, + { + "epoch": 0.04, + "global_step": 7840, + "learning_rate": 0.0004681135225375626, + "loss": 1.6598, + "loss_base2": 2.3946, + "loss_pixel": 0.1705, + "loss_text": 1.4894, + "ppl": 5.2583, + "step": 7840 + }, + { + "epoch": 0.04, + "global_step": 7841, + "learning_rate": 0.00046810934891485813, + "loss": 1.6753, + "loss_base2": 2.4169, + "loss_pixel": 0.1688, + "loss_text": 1.5066, + "ppl": 5.3404, + "step": 7841 + }, + { + "epoch": 0.04, + "global_step": 7842, + "learning_rate": 0.0004681051752921536, + "loss": 1.6637, + "loss_base2": 2.4002, + "loss_pixel": 0.1682, + "loss_text": 1.4955, + "ppl": 5.2788, + "step": 7842 + }, + { + "epoch": 0.04, + "global_step": 7843, + "learning_rate": 0.0004681010016694491, + "loss": 1.6801, + "loss_base2": 2.4239, + "loss_pixel": 0.1706, + "loss_text": 1.5095, + "ppl": 5.3661, + "step": 7843 + }, + { + "epoch": 0.04, + "global_step": 7844, + "learning_rate": 0.0004680968280467446, + "loss": 1.6621, + "loss_base2": 2.3979, + "loss_pixel": 0.1688, + "loss_text": 1.4934, + "ppl": 5.2704, + "step": 7844 + }, + { + "epoch": 0.04, + "global_step": 7845, + "learning_rate": 0.0004680926544240401, + "loss": 1.6527, + "loss_base2": 2.3843, + "loss_pixel": 0.1705, + "loss_text": 1.4822, + "ppl": 5.2211, + "step": 7845 + }, + { + "epoch": 0.04, + "global_step": 7846, + "learning_rate": 0.0004680884808013356, + "loss": 1.6481, + "loss_base2": 2.3777, + "loss_pixel": 0.1686, + "loss_text": 1.4795, + "ppl": 5.1971, + "step": 7846 + }, + { + "epoch": 0.04, + "global_step": 7847, + "learning_rate": 0.000468084307178631, + "loss": 1.4593, + "loss_base2": 2.1053, + "loss_pixel": 0.168, + "loss_text": 1.2913, + "ppl": 4.3029, + "step": 7847 + }, + { + "epoch": 0.04, + "global_step": 7848, + "learning_rate": 0.0004680801335559265, + "loss": 1.457, + "loss_base2": 2.102, + "loss_pixel": 0.1685, + "loss_text": 1.2885, + "ppl": 4.2931, + "step": 7848 + }, + { + "epoch": 0.04, + "global_step": 7849, + "learning_rate": 0.00046807595993322203, + "loss": 1.4458, + "loss_base2": 2.0858, + "loss_pixel": 0.1712, + "loss_text": 1.2746, + "ppl": 4.2452, + "step": 7849 + }, + { + "epoch": 0.04, + "global_step": 7850, + "learning_rate": 0.00046807178631051754, + "loss": 1.4308, + "loss_base2": 2.0642, + "loss_pixel": 0.1774, + "loss_text": 1.2534, + "ppl": 4.182, + "step": 7850 + }, + { + "epoch": 0.04, + "global_step": 7851, + "learning_rate": 0.000468067612687813, + "loss": 1.4492, + "loss_base2": 2.0908, + "loss_pixel": 0.1778, + "loss_text": 1.2715, + "ppl": 4.2597, + "step": 7851 + }, + { + "epoch": 0.04, + "global_step": 7852, + "learning_rate": 0.0004680634390651085, + "loss": 1.4348, + "loss_base2": 2.07, + "loss_pixel": 0.1758, + "loss_text": 1.259, + "ppl": 4.1988, + "step": 7852 + }, + { + "epoch": 0.04, + "global_step": 7853, + "learning_rate": 0.000468059265442404, + "loss": 1.4377, + "loss_base2": 2.0742, + "loss_pixel": 0.175, + "loss_text": 1.2627, + "ppl": 4.211, + "step": 7853 + }, + { + "epoch": 0.04, + "global_step": 7854, + "learning_rate": 0.0004680550918196995, + "loss": 1.4358, + "loss_base2": 2.0714, + "loss_pixel": 0.1762, + "loss_text": 1.2596, + "ppl": 4.203, + "step": 7854 + }, + { + "epoch": 0.04, + "global_step": 7855, + "learning_rate": 0.000468050918196995, + "loss": 1.4497, + "loss_base2": 2.0915, + "loss_pixel": 0.1772, + "loss_text": 1.2724, + "ppl": 4.2618, + "step": 7855 + }, + { + "epoch": 0.04, + "global_step": 7856, + "learning_rate": 0.00046804674457429047, + "loss": 1.4453, + "loss_base2": 2.0851, + "loss_pixel": 0.1758, + "loss_text": 1.2695, + "ppl": 4.2431, + "step": 7856 + }, + { + "epoch": 0.04, + "global_step": 7857, + "learning_rate": 0.000468042570951586, + "loss": 1.4373, + "loss_base2": 2.0736, + "loss_pixel": 0.1758, + "loss_text": 1.2615, + "ppl": 4.2093, + "step": 7857 + }, + { + "epoch": 0.04, + "global_step": 7858, + "learning_rate": 0.0004680383973288815, + "loss": 1.4527, + "loss_base2": 2.0958, + "loss_pixel": 0.1754, + "loss_text": 1.2773, + "ppl": 4.2746, + "step": 7858 + }, + { + "epoch": 0.04, + "global_step": 7859, + "learning_rate": 0.000468034223706177, + "loss": 1.4501, + "loss_base2": 2.0921, + "loss_pixel": 0.1752, + "loss_text": 1.2749, + "ppl": 4.2635, + "step": 7859 + }, + { + "epoch": 0.04, + "global_step": 7860, + "learning_rate": 0.00046803005008347245, + "loss": 1.4333, + "loss_base2": 2.0678, + "loss_pixel": 0.175, + "loss_text": 1.2583, + "ppl": 4.1925, + "step": 7860 + }, + { + "epoch": 0.04, + "global_step": 7861, + "learning_rate": 0.00046802587646076795, + "loss": 1.4594, + "loss_base2": 2.1055, + "loss_pixel": 0.1737, + "loss_text": 1.2857, + "ppl": 4.3034, + "step": 7861 + }, + { + "epoch": 0.04, + "global_step": 7862, + "learning_rate": 0.00046802170283806346, + "loss": 1.4488, + "loss_base2": 2.0902, + "loss_pixel": 0.1761, + "loss_text": 1.2727, + "ppl": 4.258, + "step": 7862 + }, + { + "epoch": 0.04, + "global_step": 7863, + "learning_rate": 0.00046801752921535897, + "loss": 1.6388, + "loss_base2": 2.3643, + "loss_pixel": 0.176, + "loss_text": 1.4628, + "ppl": 5.149, + "step": 7863 + }, + { + "epoch": 0.04, + "global_step": 7864, + "learning_rate": 0.0004680133555926545, + "loss": 1.6779, + "loss_base2": 2.4207, + "loss_pixel": 0.177, + "loss_text": 1.5009, + "ppl": 5.3543, + "step": 7864 + }, + { + "epoch": 0.04, + "global_step": 7865, + "learning_rate": 0.00046800918196994993, + "loss": 1.6729, + "loss_base2": 2.4135, + "loss_pixel": 0.1757, + "loss_text": 1.4973, + "ppl": 5.3276, + "step": 7865 + }, + { + "epoch": 0.04, + "global_step": 7866, + "learning_rate": 0.0004680050083472454, + "loss": 1.6547, + "loss_base2": 2.3872, + "loss_pixel": 0.1767, + "loss_text": 1.478, + "ppl": 5.2315, + "step": 7866 + }, + { + "epoch": 0.04, + "global_step": 7867, + "learning_rate": 0.0004680008347245409, + "loss": 1.6762, + "loss_base2": 2.4182, + "loss_pixel": 0.1757, + "loss_text": 1.5004, + "ppl": 5.3452, + "step": 7867 + }, + { + "epoch": 0.04, + "global_step": 7868, + "learning_rate": 0.0004679966611018364, + "loss": 1.672, + "loss_base2": 2.4122, + "loss_pixel": 0.1752, + "loss_text": 1.4968, + "ppl": 5.3228, + "step": 7868 + }, + { + "epoch": 0.04, + "global_step": 7869, + "learning_rate": 0.0004679924874791319, + "loss": 1.6762, + "loss_base2": 2.4182, + "loss_pixel": 0.1752, + "loss_text": 1.5011, + "ppl": 5.3452, + "step": 7869 + }, + { + "epoch": 0.04, + "global_step": 7870, + "learning_rate": 0.00046798831385642736, + "loss": 1.6633, + "loss_base2": 2.3996, + "loss_pixel": 0.1756, + "loss_text": 1.4876, + "ppl": 5.2767, + "step": 7870 + }, + { + "epoch": 0.04, + "global_step": 7871, + "learning_rate": 0.00046798414023372287, + "loss": 1.6725, + "loss_base2": 2.4129, + "loss_pixel": 0.1761, + "loss_text": 1.4964, + "ppl": 5.3255, + "step": 7871 + }, + { + "epoch": 0.04, + "global_step": 7872, + "learning_rate": 0.00046797996661101837, + "loss": 1.6849, + "loss_base2": 2.4308, + "loss_pixel": 0.1751, + "loss_text": 1.5098, + "ppl": 5.3919, + "step": 7872 + }, + { + "epoch": 0.04, + "global_step": 7873, + "learning_rate": 0.0004679757929883139, + "loss": 1.6809, + "loss_base2": 2.425, + "loss_pixel": 0.1765, + "loss_text": 1.5044, + "ppl": 5.3704, + "step": 7873 + }, + { + "epoch": 0.04, + "global_step": 7874, + "learning_rate": 0.00046797161936560933, + "loss": 1.691, + "loss_base2": 2.4396, + "loss_pixel": 0.176, + "loss_text": 1.515, + "ppl": 5.4249, + "step": 7874 + }, + { + "epoch": 0.04, + "global_step": 7875, + "learning_rate": 0.00046796744574290484, + "loss": 1.6763, + "loss_base2": 2.4184, + "loss_pixel": 0.1771, + "loss_text": 1.4992, + "ppl": 5.3457, + "step": 7875 + }, + { + "epoch": 0.04, + "global_step": 7876, + "learning_rate": 0.00046796327212020035, + "loss": 1.6541, + "loss_base2": 2.3864, + "loss_pixel": 0.1758, + "loss_text": 1.4783, + "ppl": 5.2284, + "step": 7876 + }, + { + "epoch": 0.04, + "global_step": 7877, + "learning_rate": 0.00046795909849749585, + "loss": 1.6688, + "loss_base2": 2.4076, + "loss_pixel": 0.1762, + "loss_text": 1.4926, + "ppl": 5.3058, + "step": 7877 + }, + { + "epoch": 0.04, + "global_step": 7878, + "learning_rate": 0.00046795492487479136, + "loss": 1.6684, + "loss_base2": 2.407, + "loss_pixel": 0.1761, + "loss_text": 1.4923, + "ppl": 5.3037, + "step": 7878 + }, + { + "epoch": 0.04, + "global_step": 7879, + "learning_rate": 0.0004679507512520868, + "loss": 1.6703, + "loss_base2": 2.4097, + "loss_pixel": 0.1746, + "loss_text": 1.4956, + "ppl": 5.3138, + "step": 7879 + }, + { + "epoch": 0.04, + "global_step": 7880, + "learning_rate": 0.0004679465776293823, + "loss": 1.6606, + "loss_base2": 2.3957, + "loss_pixel": 0.1763, + "loss_text": 1.4843, + "ppl": 5.2625, + "step": 7880 + }, + { + "epoch": 0.04, + "global_step": 7881, + "learning_rate": 0.00046794240400667783, + "loss": 1.6722, + "loss_base2": 2.4125, + "loss_pixel": 0.1762, + "loss_text": 1.496, + "ppl": 5.3239, + "step": 7881 + }, + { + "epoch": 0.04, + "global_step": 7882, + "learning_rate": 0.00046793823038397334, + "loss": 1.6667, + "loss_base2": 2.4045, + "loss_pixel": 0.1752, + "loss_text": 1.4915, + "ppl": 5.2947, + "step": 7882 + }, + { + "epoch": 0.04, + "global_step": 7883, + "learning_rate": 0.0004679340567612688, + "loss": 1.6551, + "loss_base2": 2.3878, + "loss_pixel": 0.1744, + "loss_text": 1.4806, + "ppl": 5.2336, + "step": 7883 + }, + { + "epoch": 0.04, + "global_step": 7884, + "learning_rate": 0.0004679298831385643, + "loss": 1.6588, + "loss_base2": 2.3931, + "loss_pixel": 0.1744, + "loss_text": 1.4845, + "ppl": 5.253, + "step": 7884 + }, + { + "epoch": 0.04, + "global_step": 7885, + "learning_rate": 0.00046792570951585975, + "loss": 1.6832, + "loss_base2": 2.4283, + "loss_pixel": 0.1749, + "loss_text": 1.5083, + "ppl": 5.3828, + "step": 7885 + }, + { + "epoch": 0.04, + "global_step": 7886, + "learning_rate": 0.00046792153589315526, + "loss": 1.669, + "loss_base2": 2.4079, + "loss_pixel": 0.1754, + "loss_text": 1.4936, + "ppl": 5.3069, + "step": 7886 + }, + { + "epoch": 0.04, + "global_step": 7887, + "learning_rate": 0.00046791736227045077, + "loss": 1.6502, + "loss_base2": 2.3807, + "loss_pixel": 0.176, + "loss_text": 1.4742, + "ppl": 5.208, + "step": 7887 + }, + { + "epoch": 0.04, + "global_step": 7888, + "learning_rate": 0.0004679131886477462, + "loss": 1.6725, + "loss_base2": 2.4129, + "loss_pixel": 0.1756, + "loss_text": 1.4969, + "ppl": 5.3255, + "step": 7888 + }, + { + "epoch": 0.04, + "global_step": 7889, + "learning_rate": 0.0004679090150250417, + "loss": 1.6678, + "loss_base2": 2.4061, + "loss_pixel": 0.1755, + "loss_text": 1.4923, + "ppl": 5.3005, + "step": 7889 + }, + { + "epoch": 0.04, + "global_step": 7890, + "learning_rate": 0.00046790484140233723, + "loss": 1.6492, + "loss_base2": 2.3793, + "loss_pixel": 0.175, + "loss_text": 1.4742, + "ppl": 5.2028, + "step": 7890 + }, + { + "epoch": 0.04, + "global_step": 7891, + "learning_rate": 0.00046790066777963274, + "loss": 1.6657, + "loss_base2": 2.4031, + "loss_pixel": 0.174, + "loss_text": 1.4917, + "ppl": 5.2894, + "step": 7891 + }, + { + "epoch": 0.04, + "global_step": 7892, + "learning_rate": 0.0004678964941569282, + "loss": 1.6588, + "loss_base2": 2.3931, + "loss_pixel": 0.1753, + "loss_text": 1.4835, + "ppl": 5.253, + "step": 7892 + }, + { + "epoch": 0.04, + "global_step": 7893, + "learning_rate": 0.0004678923205342237, + "loss": 1.669, + "loss_base2": 2.4079, + "loss_pixel": 0.1759, + "loss_text": 1.493, + "ppl": 5.3069, + "step": 7893 + }, + { + "epoch": 0.04, + "global_step": 7894, + "learning_rate": 0.0004678881469115192, + "loss": 1.664, + "loss_base2": 2.4006, + "loss_pixel": 0.1751, + "loss_text": 1.4889, + "ppl": 5.2804, + "step": 7894 + }, + { + "epoch": 0.04, + "global_step": 7895, + "learning_rate": 0.0004678839732888147, + "loss": 1.657, + "loss_base2": 2.3905, + "loss_pixel": 0.175, + "loss_text": 1.482, + "ppl": 5.2436, + "step": 7895 + }, + { + "epoch": 0.04, + "global_step": 7896, + "learning_rate": 0.0004678797996661102, + "loss": 1.6689, + "loss_base2": 2.4077, + "loss_pixel": 0.1747, + "loss_text": 1.4942, + "ppl": 5.3063, + "step": 7896 + }, + { + "epoch": 0.04, + "global_step": 7897, + "learning_rate": 0.0004678756260434057, + "loss": 1.644, + "loss_base2": 2.3718, + "loss_pixel": 0.1742, + "loss_text": 1.4698, + "ppl": 5.1758, + "step": 7897 + }, + { + "epoch": 0.04, + "global_step": 7898, + "learning_rate": 0.0004678714524207012, + "loss": 1.6689, + "loss_base2": 2.4077, + "loss_pixel": 0.1738, + "loss_text": 1.4951, + "ppl": 5.3063, + "step": 7898 + }, + { + "epoch": 0.04, + "global_step": 7899, + "learning_rate": 0.0004678672787979967, + "loss": 1.6508, + "loss_base2": 2.3816, + "loss_pixel": 0.1746, + "loss_text": 1.4762, + "ppl": 5.2111, + "step": 7899 + }, + { + "epoch": 0.04, + "global_step": 7900, + "learning_rate": 0.0004678631051752922, + "loss": 1.6549, + "loss_base2": 2.3875, + "loss_pixel": 0.1732, + "loss_text": 1.4817, + "ppl": 5.2326, + "step": 7900 + }, + { + "epoch": 0.04, + "global_step": 7901, + "learning_rate": 0.00046785893155258765, + "loss": 1.6557, + "loss_base2": 2.3887, + "loss_pixel": 0.1746, + "loss_text": 1.4811, + "ppl": 5.2367, + "step": 7901 + }, + { + "epoch": 0.04, + "global_step": 7902, + "learning_rate": 0.00046785475792988316, + "loss": 1.6672, + "loss_base2": 2.4053, + "loss_pixel": 0.1739, + "loss_text": 1.4933, + "ppl": 5.2973, + "step": 7902 + }, + { + "epoch": 0.04, + "global_step": 7903, + "learning_rate": 0.00046785058430717867, + "loss": 1.6573, + "loss_base2": 2.391, + "loss_pixel": 0.1752, + "loss_text": 1.4822, + "ppl": 5.2451, + "step": 7903 + }, + { + "epoch": 0.04, + "global_step": 7904, + "learning_rate": 0.0004678464106844741, + "loss": 1.6618, + "loss_base2": 2.3975, + "loss_pixel": 0.1745, + "loss_text": 1.4873, + "ppl": 5.2688, + "step": 7904 + }, + { + "epoch": 0.04, + "global_step": 7905, + "learning_rate": 0.0004678422370617696, + "loss": 1.6869, + "loss_base2": 2.4337, + "loss_pixel": 0.1746, + "loss_text": 1.5123, + "ppl": 5.4027, + "step": 7905 + }, + { + "epoch": 0.04, + "global_step": 7906, + "learning_rate": 0.0004678380634390651, + "loss": 1.6652, + "loss_base2": 2.4024, + "loss_pixel": 0.1754, + "loss_text": 1.4898, + "ppl": 5.2867, + "step": 7906 + }, + { + "epoch": 0.04, + "global_step": 7907, + "learning_rate": 0.0004678338898163606, + "loss": 1.6682, + "loss_base2": 2.4067, + "loss_pixel": 0.1756, + "loss_text": 1.4926, + "ppl": 5.3026, + "step": 7907 + }, + { + "epoch": 0.04, + "global_step": 7908, + "learning_rate": 0.0004678297161936561, + "loss": 1.5407, + "loss_base2": 2.2228, + "loss_pixel": 0.1756, + "loss_text": 1.3651, + "ppl": 4.6679, + "step": 7908 + }, + { + "epoch": 0.04, + "global_step": 7909, + "learning_rate": 0.0004678255425709516, + "loss": 1.4261, + "loss_base2": 2.0574, + "loss_pixel": 0.1694, + "loss_text": 1.2567, + "ppl": 4.1624, + "step": 7909 + }, + { + "epoch": 0.04, + "global_step": 7910, + "learning_rate": 0.00046782136894824705, + "loss": 1.4369, + "loss_base2": 2.073, + "loss_pixel": 0.1692, + "loss_text": 1.2677, + "ppl": 4.2076, + "step": 7910 + }, + { + "epoch": 0.04, + "global_step": 7911, + "learning_rate": 0.00046781719532554256, + "loss": 1.4363, + "loss_base2": 2.0721, + "loss_pixel": 0.1709, + "loss_text": 1.2653, + "ppl": 4.2051, + "step": 7911 + }, + { + "epoch": 0.04, + "global_step": 7912, + "learning_rate": 0.00046781302170283807, + "loss": 1.4404, + "loss_base2": 2.0781, + "loss_pixel": 0.1681, + "loss_text": 1.2723, + "ppl": 4.2224, + "step": 7912 + }, + { + "epoch": 0.04, + "global_step": 7913, + "learning_rate": 0.0004678088480801336, + "loss": 1.4495, + "loss_base2": 2.0912, + "loss_pixel": 0.1686, + "loss_text": 1.2808, + "ppl": 4.261, + "step": 7913 + }, + { + "epoch": 0.04, + "global_step": 7914, + "learning_rate": 0.0004678046744574291, + "loss": 1.4237, + "loss_base2": 2.054, + "loss_pixel": 0.1686, + "loss_text": 1.2551, + "ppl": 4.1525, + "step": 7914 + }, + { + "epoch": 0.04, + "global_step": 7915, + "learning_rate": 0.00046780050083472454, + "loss": 1.3973, + "loss_base2": 2.0159, + "loss_pixel": 0.1674, + "loss_text": 1.2299, + "ppl": 4.0443, + "step": 7915 + }, + { + "epoch": 0.04, + "global_step": 7916, + "learning_rate": 0.00046779632721202004, + "loss": 1.6861, + "loss_base2": 2.4325, + "loss_pixel": 0.17, + "loss_text": 1.5161, + "ppl": 5.3984, + "step": 7916 + }, + { + "epoch": 0.04, + "global_step": 7917, + "learning_rate": 0.00046779215358931555, + "loss": 1.6901, + "loss_base2": 2.4383, + "loss_pixel": 0.1686, + "loss_text": 1.5215, + "ppl": 5.42, + "step": 7917 + }, + { + "epoch": 0.04, + "global_step": 7918, + "learning_rate": 0.00046778797996661106, + "loss": 1.6316, + "loss_base2": 2.3539, + "loss_pixel": 0.1683, + "loss_text": 1.4633, + "ppl": 5.112, + "step": 7918 + }, + { + "epoch": 0.04, + "global_step": 7919, + "learning_rate": 0.00046778380634390657, + "loss": 1.6748, + "loss_base2": 2.4162, + "loss_pixel": 0.1686, + "loss_text": 1.5062, + "ppl": 5.3377, + "step": 7919 + }, + { + "epoch": 0.04, + "global_step": 7920, + "learning_rate": 0.000467779632721202, + "loss": 1.6586, + "loss_base2": 2.3929, + "loss_pixel": 0.1667, + "loss_text": 1.492, + "ppl": 5.252, + "step": 7920 + }, + { + "epoch": 0.04, + "global_step": 7921, + "learning_rate": 0.0004677754590984975, + "loss": 1.6638, + "loss_base2": 2.4004, + "loss_pixel": 0.169, + "loss_text": 1.4948, + "ppl": 5.2793, + "step": 7921 + }, + { + "epoch": 0.04, + "global_step": 7922, + "learning_rate": 0.00046777128547579303, + "loss": 1.6608, + "loss_base2": 2.396, + "loss_pixel": 0.1687, + "loss_text": 1.4921, + "ppl": 5.2635, + "step": 7922 + }, + { + "epoch": 0.04, + "global_step": 7923, + "learning_rate": 0.0004677671118530885, + "loss": 1.6649, + "loss_base2": 2.4019, + "loss_pixel": 0.1666, + "loss_text": 1.4984, + "ppl": 5.2851, + "step": 7923 + }, + { + "epoch": 0.04, + "global_step": 7924, + "learning_rate": 0.00046776293823038394, + "loss": 1.6578, + "loss_base2": 2.3917, + "loss_pixel": 0.1716, + "loss_text": 1.4862, + "ppl": 5.2478, + "step": 7924 + }, + { + "epoch": 0.04, + "global_step": 7925, + "learning_rate": 0.00046775876460767945, + "loss": 1.6714, + "loss_base2": 2.4113, + "loss_pixel": 0.1759, + "loss_text": 1.4955, + "ppl": 5.3196, + "step": 7925 + }, + { + "epoch": 0.04, + "global_step": 7926, + "learning_rate": 0.00046775459098497495, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.1767, + "loss_text": 1.4913, + "ppl": 5.3021, + "step": 7926 + }, + { + "epoch": 0.04, + "global_step": 7927, + "learning_rate": 0.00046775041736227046, + "loss": 1.6744, + "loss_base2": 2.4156, + "loss_pixel": 0.1758, + "loss_text": 1.4986, + "ppl": 5.3356, + "step": 7927 + }, + { + "epoch": 0.04, + "global_step": 7928, + "learning_rate": 0.00046774624373956597, + "loss": 1.6577, + "loss_base2": 2.3916, + "loss_pixel": 0.1752, + "loss_text": 1.4825, + "ppl": 5.2472, + "step": 7928 + }, + { + "epoch": 0.04, + "global_step": 7929, + "learning_rate": 0.0004677420701168614, + "loss": 1.6725, + "loss_base2": 2.4129, + "loss_pixel": 0.1744, + "loss_text": 1.498, + "ppl": 5.3255, + "step": 7929 + }, + { + "epoch": 0.04, + "global_step": 7930, + "learning_rate": 0.00046773789649415693, + "loss": 1.6824, + "loss_base2": 2.4272, + "loss_pixel": 0.1749, + "loss_text": 1.5075, + "ppl": 5.3784, + "step": 7930 + }, + { + "epoch": 0.04, + "global_step": 7931, + "learning_rate": 0.00046773372287145244, + "loss": 1.6616, + "loss_base2": 2.3972, + "loss_pixel": 0.1758, + "loss_text": 1.4859, + "ppl": 5.2677, + "step": 7931 + }, + { + "epoch": 0.04, + "global_step": 7932, + "learning_rate": 0.00046772954924874794, + "loss": 1.6879, + "loss_base2": 2.4351, + "loss_pixel": 0.1757, + "loss_text": 1.5121, + "ppl": 5.4081, + "step": 7932 + }, + { + "epoch": 0.04, + "global_step": 7933, + "learning_rate": 0.0004677253756260434, + "loss": 1.6688, + "loss_base2": 2.4076, + "loss_pixel": 0.1752, + "loss_text": 1.4936, + "ppl": 5.3058, + "step": 7933 + }, + { + "epoch": 0.04, + "global_step": 7934, + "learning_rate": 0.0004677212020033389, + "loss": 1.6608, + "loss_base2": 2.396, + "loss_pixel": 0.1746, + "loss_text": 1.4863, + "ppl": 5.2635, + "step": 7934 + }, + { + "epoch": 0.04, + "global_step": 7935, + "learning_rate": 0.0004677170283806344, + "loss": 1.6636, + "loss_base2": 2.4001, + "loss_pixel": 0.1739, + "loss_text": 1.4897, + "ppl": 5.2783, + "step": 7935 + }, + { + "epoch": 0.04, + "global_step": 7936, + "learning_rate": 0.0004677128547579299, + "loss": 1.6644, + "loss_base2": 2.4012, + "loss_pixel": 0.1738, + "loss_text": 1.4906, + "ppl": 5.2825, + "step": 7936 + }, + { + "epoch": 0.04, + "global_step": 7937, + "learning_rate": 0.0004677086811352254, + "loss": 1.5682, + "loss_base2": 2.2624, + "loss_pixel": 0.1737, + "loss_text": 1.3945, + "ppl": 4.798, + "step": 7937 + }, + { + "epoch": 0.04, + "global_step": 7938, + "learning_rate": 0.0004677045075125209, + "loss": 1.4453, + "loss_base2": 2.0851, + "loss_pixel": 0.1758, + "loss_text": 1.2695, + "ppl": 4.2431, + "step": 7938 + }, + { + "epoch": 0.04, + "global_step": 7939, + "learning_rate": 0.0004677003338898164, + "loss": 1.4337, + "loss_base2": 2.0684, + "loss_pixel": 0.1731, + "loss_text": 1.2606, + "ppl": 4.1942, + "step": 7939 + }, + { + "epoch": 0.04, + "global_step": 7940, + "learning_rate": 0.0004676961602671119, + "loss": 1.4206, + "loss_base2": 2.0495, + "loss_pixel": 0.174, + "loss_text": 1.2465, + "ppl": 4.1396, + "step": 7940 + }, + { + "epoch": 0.04, + "global_step": 7941, + "learning_rate": 0.00046769198664440735, + "loss": 1.4423, + "loss_base2": 2.0808, + "loss_pixel": 0.1746, + "loss_text": 1.2676, + "ppl": 4.2304, + "step": 7941 + }, + { + "epoch": 0.04, + "global_step": 7942, + "learning_rate": 0.0004676878130217028, + "loss": 1.4302, + "loss_base2": 2.0633, + "loss_pixel": 0.1729, + "loss_text": 1.2574, + "ppl": 4.1795, + "step": 7942 + }, + { + "epoch": 0.04, + "global_step": 7943, + "learning_rate": 0.0004676836393989983, + "loss": 1.44, + "loss_base2": 2.0775, + "loss_pixel": 0.1724, + "loss_text": 1.2676, + "ppl": 4.2207, + "step": 7943 + }, + { + "epoch": 0.04, + "global_step": 7944, + "learning_rate": 0.0004676794657762938, + "loss": 1.4371, + "loss_base2": 2.0733, + "loss_pixel": 0.1732, + "loss_text": 1.2639, + "ppl": 4.2085, + "step": 7944 + }, + { + "epoch": 0.04, + "global_step": 7945, + "learning_rate": 0.0004676752921535893, + "loss": 1.4252, + "loss_base2": 2.0561, + "loss_pixel": 0.1742, + "loss_text": 1.251, + "ppl": 4.1587, + "step": 7945 + }, + { + "epoch": 0.04, + "global_step": 7946, + "learning_rate": 0.00046767111853088483, + "loss": 1.4329, + "loss_base2": 2.0672, + "loss_pixel": 0.1744, + "loss_text": 1.2585, + "ppl": 4.1908, + "step": 7946 + }, + { + "epoch": 0.04, + "global_step": 7947, + "learning_rate": 0.0004676669449081803, + "loss": 1.4339, + "loss_base2": 2.0687, + "loss_pixel": 0.1743, + "loss_text": 1.2596, + "ppl": 4.195, + "step": 7947 + }, + { + "epoch": 0.04, + "global_step": 7948, + "learning_rate": 0.0004676627712854758, + "loss": 1.4354, + "loss_base2": 2.0708, + "loss_pixel": 0.1733, + "loss_text": 1.2621, + "ppl": 4.2013, + "step": 7948 + }, + { + "epoch": 0.04, + "global_step": 7949, + "learning_rate": 0.0004676585976627713, + "loss": 1.4365, + "loss_base2": 2.0724, + "loss_pixel": 0.1733, + "loss_text": 1.2633, + "ppl": 4.2059, + "step": 7949 + }, + { + "epoch": 0.04, + "global_step": 7950, + "learning_rate": 0.0004676544240400668, + "loss": 1.4471, + "loss_base2": 2.0877, + "loss_pixel": 0.1736, + "loss_text": 1.2735, + "ppl": 4.2508, + "step": 7950 + }, + { + "epoch": 0.04, + "global_step": 7951, + "learning_rate": 0.00046765025041736226, + "loss": 1.434, + "loss_base2": 2.0688, + "loss_pixel": 0.1742, + "loss_text": 1.2599, + "ppl": 4.1954, + "step": 7951 + }, + { + "epoch": 0.04, + "global_step": 7952, + "learning_rate": 0.00046764607679465777, + "loss": 1.4268, + "loss_base2": 2.0584, + "loss_pixel": 0.1747, + "loss_text": 1.2521, + "ppl": 4.1653, + "step": 7952 + }, + { + "epoch": 0.04, + "global_step": 7953, + "learning_rate": 0.00046764190317195327, + "loss": 1.5856, + "loss_base2": 2.2875, + "loss_pixel": 0.1736, + "loss_text": 1.412, + "ppl": 4.8822, + "step": 7953 + }, + { + "epoch": 0.04, + "global_step": 7954, + "learning_rate": 0.0004676377295492488, + "loss": 1.4272, + "loss_base2": 2.059, + "loss_pixel": 0.1727, + "loss_text": 1.2546, + "ppl": 4.167, + "step": 7954 + }, + { + "epoch": 0.04, + "global_step": 7955, + "learning_rate": 0.0004676335559265443, + "loss": 1.444, + "loss_base2": 2.0833, + "loss_pixel": 0.1731, + "loss_text": 1.2709, + "ppl": 4.2376, + "step": 7955 + }, + { + "epoch": 0.04, + "global_step": 7956, + "learning_rate": 0.00046762938230383974, + "loss": 1.4433, + "loss_base2": 2.0822, + "loss_pixel": 0.1727, + "loss_text": 1.2706, + "ppl": 4.2346, + "step": 7956 + }, + { + "epoch": 0.04, + "global_step": 7957, + "learning_rate": 0.00046762520868113525, + "loss": 1.4352, + "loss_base2": 2.0706, + "loss_pixel": 0.1756, + "loss_text": 1.2596, + "ppl": 4.2005, + "step": 7957 + }, + { + "epoch": 0.04, + "global_step": 7958, + "learning_rate": 0.00046762103505843076, + "loss": 1.4155, + "loss_base2": 2.0421, + "loss_pixel": 0.1746, + "loss_text": 1.2408, + "ppl": 4.1185, + "step": 7958 + }, + { + "epoch": 0.04, + "global_step": 7959, + "learning_rate": 0.00046761686143572626, + "loss": 1.4287, + "loss_base2": 2.0612, + "loss_pixel": 0.1759, + "loss_text": 1.2528, + "ppl": 4.1733, + "step": 7959 + }, + { + "epoch": 0.04, + "global_step": 7960, + "learning_rate": 0.00046761268781302166, + "loss": 1.4389, + "loss_base2": 2.0759, + "loss_pixel": 0.1749, + "loss_text": 1.2639, + "ppl": 4.2161, + "step": 7960 + }, + { + "epoch": 0.04, + "global_step": 7961, + "learning_rate": 0.00046760851419031717, + "loss": 1.4312, + "loss_base2": 2.0648, + "loss_pixel": 0.1729, + "loss_text": 1.2583, + "ppl": 4.1837, + "step": 7961 + }, + { + "epoch": 0.04, + "global_step": 7962, + "learning_rate": 0.0004676043405676127, + "loss": 1.4433, + "loss_base2": 2.0822, + "loss_pixel": 0.1743, + "loss_text": 1.2691, + "ppl": 4.2346, + "step": 7962 + }, + { + "epoch": 0.04, + "global_step": 7963, + "learning_rate": 0.0004676001669449082, + "loss": 1.4429, + "loss_base2": 2.0817, + "loss_pixel": 0.1739, + "loss_text": 1.269, + "ppl": 4.233, + "step": 7963 + }, + { + "epoch": 0.04, + "global_step": 7964, + "learning_rate": 0.0004675959933222037, + "loss": 1.4206, + "loss_base2": 2.0495, + "loss_pixel": 0.1724, + "loss_text": 1.2482, + "ppl": 4.1396, + "step": 7964 + }, + { + "epoch": 0.04, + "global_step": 7965, + "learning_rate": 0.00046759181969949914, + "loss": 1.4333, + "loss_base2": 2.0678, + "loss_pixel": 0.1735, + "loss_text": 1.2599, + "ppl": 4.1925, + "step": 7965 + }, + { + "epoch": 0.04, + "global_step": 7966, + "learning_rate": 0.00046758764607679465, + "loss": 1.4173, + "loss_base2": 2.0447, + "loss_pixel": 0.1742, + "loss_text": 1.2431, + "ppl": 4.126, + "step": 7966 + }, + { + "epoch": 0.04, + "global_step": 7967, + "learning_rate": 0.00046758347245409016, + "loss": 1.4474, + "loss_base2": 2.0882, + "loss_pixel": 0.1735, + "loss_text": 1.2739, + "ppl": 4.252, + "step": 7967 + }, + { + "epoch": 0.04, + "global_step": 7968, + "learning_rate": 0.00046757929883138567, + "loss": 1.4455, + "loss_base2": 2.0854, + "loss_pixel": 0.173, + "loss_text": 1.2725, + "ppl": 4.244, + "step": 7968 + }, + { + "epoch": 0.04, + "global_step": 7969, + "learning_rate": 0.0004675751252086811, + "loss": 1.7027, + "loss_base2": 2.4565, + "loss_pixel": 0.1735, + "loss_text": 1.5292, + "ppl": 5.4887, + "step": 7969 + }, + { + "epoch": 0.04, + "global_step": 7970, + "learning_rate": 0.0004675709515859766, + "loss": 1.6832, + "loss_base2": 2.4283, + "loss_pixel": 0.1734, + "loss_text": 1.5098, + "ppl": 5.3828, + "step": 7970 + }, + { + "epoch": 0.04, + "global_step": 7971, + "learning_rate": 0.00046756677796327213, + "loss": 1.6514, + "loss_base2": 2.3825, + "loss_pixel": 0.1735, + "loss_text": 1.478, + "ppl": 5.2143, + "step": 7971 + }, + { + "epoch": 0.04, + "global_step": 7972, + "learning_rate": 0.00046756260434056764, + "loss": 1.6677, + "loss_base2": 2.406, + "loss_pixel": 0.1748, + "loss_text": 1.4929, + "ppl": 5.3, + "step": 7972 + }, + { + "epoch": 0.04, + "global_step": 7973, + "learning_rate": 0.00046755843071786315, + "loss": 1.6779, + "loss_base2": 2.4207, + "loss_pixel": 0.1744, + "loss_text": 1.5035, + "ppl": 5.3543, + "step": 7973 + }, + { + "epoch": 0.04, + "global_step": 7974, + "learning_rate": 0.0004675542570951586, + "loss": 1.6725, + "loss_base2": 2.4129, + "loss_pixel": 0.1741, + "loss_text": 1.4984, + "ppl": 5.3255, + "step": 7974 + }, + { + "epoch": 0.04, + "global_step": 7975, + "learning_rate": 0.0004675500834724541, + "loss": 1.6584, + "loss_base2": 2.3926, + "loss_pixel": 0.173, + "loss_text": 1.4854, + "ppl": 5.2509, + "step": 7975 + }, + { + "epoch": 0.04, + "global_step": 7976, + "learning_rate": 0.0004675459098497496, + "loss": 1.6741, + "loss_base2": 2.4152, + "loss_pixel": 0.1754, + "loss_text": 1.4987, + "ppl": 5.334, + "step": 7976 + }, + { + "epoch": 0.04, + "global_step": 7977, + "learning_rate": 0.0004675417362270451, + "loss": 1.6904, + "loss_base2": 2.4387, + "loss_pixel": 0.1734, + "loss_text": 1.5169, + "ppl": 5.4216, + "step": 7977 + }, + { + "epoch": 0.04, + "global_step": 7978, + "learning_rate": 0.00046753756260434063, + "loss": 1.6687, + "loss_base2": 2.4074, + "loss_pixel": 0.1734, + "loss_text": 1.4953, + "ppl": 5.3053, + "step": 7978 + }, + { + "epoch": 0.04, + "global_step": 7979, + "learning_rate": 0.00046753338898163603, + "loss": 1.6737, + "loss_base2": 2.4146, + "loss_pixel": 0.1737, + "loss_text": 1.5, + "ppl": 5.3319, + "step": 7979 + }, + { + "epoch": 0.04, + "global_step": 7980, + "learning_rate": 0.00046752921535893154, + "loss": 1.6626, + "loss_base2": 2.3986, + "loss_pixel": 0.174, + "loss_text": 1.4886, + "ppl": 5.273, + "step": 7980 + }, + { + "epoch": 0.04, + "global_step": 7981, + "learning_rate": 0.00046752504173622704, + "loss": 1.677, + "loss_base2": 2.4194, + "loss_pixel": 0.1739, + "loss_text": 1.5031, + "ppl": 5.3495, + "step": 7981 + }, + { + "epoch": 0.04, + "global_step": 7982, + "learning_rate": 0.00046752086811352255, + "loss": 1.6516, + "loss_base2": 2.3828, + "loss_pixel": 0.1752, + "loss_text": 1.4763, + "ppl": 5.2153, + "step": 7982 + }, + { + "epoch": 0.04, + "global_step": 7983, + "learning_rate": 0.000467516694490818, + "loss": 1.6701, + "loss_base2": 2.4094, + "loss_pixel": 0.174, + "loss_text": 1.4962, + "ppl": 5.3127, + "step": 7983 + }, + { + "epoch": 0.04, + "global_step": 7984, + "learning_rate": 0.0004675125208681135, + "loss": 1.6485, + "loss_base2": 2.3783, + "loss_pixel": 0.1727, + "loss_text": 1.4758, + "ppl": 5.1992, + "step": 7984 + }, + { + "epoch": 0.04, + "global_step": 7985, + "learning_rate": 0.000467508347245409, + "loss": 1.6952, + "loss_base2": 2.4457, + "loss_pixel": 0.1737, + "loss_text": 1.5216, + "ppl": 5.4477, + "step": 7985 + }, + { + "epoch": 0.04, + "global_step": 7986, + "learning_rate": 0.0004675041736227045, + "loss": 1.6557, + "loss_base2": 2.3887, + "loss_pixel": 0.1734, + "loss_text": 1.4823, + "ppl": 5.2367, + "step": 7986 + }, + { + "epoch": 0.04, + "global_step": 7987, + "learning_rate": 0.00046750000000000003, + "loss": 1.6633, + "loss_base2": 2.3996, + "loss_pixel": 0.1757, + "loss_text": 1.4876, + "ppl": 5.2767, + "step": 7987 + }, + { + "epoch": 0.04, + "global_step": 7988, + "learning_rate": 0.0004674958263772955, + "loss": 1.6639, + "loss_base2": 2.4005, + "loss_pixel": 0.1734, + "loss_text": 1.4906, + "ppl": 5.2799, + "step": 7988 + }, + { + "epoch": 0.04, + "global_step": 7989, + "learning_rate": 0.000467491652754591, + "loss": 1.6655, + "loss_base2": 2.4028, + "loss_pixel": 0.1736, + "loss_text": 1.4919, + "ppl": 5.2883, + "step": 7989 + }, + { + "epoch": 0.04, + "global_step": 7990, + "learning_rate": 0.0004674874791318865, + "loss": 1.6642, + "loss_base2": 2.4009, + "loss_pixel": 0.1724, + "loss_text": 1.4918, + "ppl": 5.2814, + "step": 7990 + }, + { + "epoch": 0.04, + "global_step": 7991, + "learning_rate": 0.000467483305509182, + "loss": 1.672, + "loss_base2": 2.4122, + "loss_pixel": 0.1738, + "loss_text": 1.4982, + "ppl": 5.3228, + "step": 7991 + }, + { + "epoch": 0.04, + "global_step": 7992, + "learning_rate": 0.00046747913188647746, + "loss": 1.67, + "loss_base2": 2.4093, + "loss_pixel": 0.1733, + "loss_text": 1.4967, + "ppl": 5.3122, + "step": 7992 + }, + { + "epoch": 0.04, + "global_step": 7993, + "learning_rate": 0.00046747495826377297, + "loss": 1.6213, + "loss_base2": 2.339, + "loss_pixel": 0.1735, + "loss_text": 1.4478, + "ppl": 5.0597, + "step": 7993 + }, + { + "epoch": 0.04, + "global_step": 7994, + "learning_rate": 0.0004674707846410685, + "loss": 1.6214, + "loss_base2": 2.3392, + "loss_pixel": 0.1751, + "loss_text": 1.4463, + "ppl": 5.0602, + "step": 7994 + }, + { + "epoch": 0.04, + "global_step": 7995, + "learning_rate": 0.000467466611018364, + "loss": 1.666, + "loss_base2": 2.4035, + "loss_pixel": 0.1726, + "loss_text": 1.4935, + "ppl": 5.291, + "step": 7995 + }, + { + "epoch": 0.04, + "global_step": 7996, + "learning_rate": 0.0004674624373956595, + "loss": 1.6489, + "loss_base2": 2.3789, + "loss_pixel": 0.1731, + "loss_text": 1.4759, + "ppl": 5.2013, + "step": 7996 + }, + { + "epoch": 0.04, + "global_step": 7997, + "learning_rate": 0.0004674582637729549, + "loss": 1.645, + "loss_base2": 2.3732, + "loss_pixel": 0.1735, + "loss_text": 1.4715, + "ppl": 5.181, + "step": 7997 + }, + { + "epoch": 0.04, + "global_step": 7998, + "learning_rate": 0.0004674540901502504, + "loss": 1.6779, + "loss_base2": 2.4207, + "loss_pixel": 0.1731, + "loss_text": 1.5048, + "ppl": 5.3543, + "step": 7998 + }, + { + "epoch": 0.04, + "global_step": 7999, + "learning_rate": 0.0004674499165275459, + "loss": 1.6836, + "loss_base2": 2.4289, + "loss_pixel": 0.1737, + "loss_text": 1.5099, + "ppl": 5.3849, + "step": 7999 + }, + { + "epoch": 0.04, + "global_step": 8000, + "learning_rate": 0.0004674457429048414, + "loss": 1.6642, + "loss_base2": 2.4009, + "loss_pixel": 0.1731, + "loss_text": 1.4911, + "ppl": 5.2814, + "step": 8000 + }, + { + "epoch": 0.04, + "global_step": 8001, + "learning_rate": 0.00046744156928213686, + "loss": 1.6674, + "loss_base2": 2.4055, + "loss_pixel": 0.1728, + "loss_text": 1.4946, + "ppl": 5.2984, + "step": 8001 + }, + { + "epoch": 0.04, + "global_step": 8002, + "learning_rate": 0.00046743739565943237, + "loss": 1.656, + "loss_base2": 2.3891, + "loss_pixel": 0.174, + "loss_text": 1.4821, + "ppl": 5.2383, + "step": 8002 + }, + { + "epoch": 0.04, + "global_step": 8003, + "learning_rate": 0.0004674332220367279, + "loss": 1.6657, + "loss_base2": 2.4031, + "loss_pixel": 0.1737, + "loss_text": 1.4919, + "ppl": 5.2894, + "step": 8003 + }, + { + "epoch": 0.04, + "global_step": 8004, + "learning_rate": 0.0004674290484140234, + "loss": 1.6667, + "loss_base2": 2.4045, + "loss_pixel": 0.1727, + "loss_text": 1.494, + "ppl": 5.2947, + "step": 8004 + }, + { + "epoch": 0.04, + "global_step": 8005, + "learning_rate": 0.0004674248747913189, + "loss": 1.6777, + "loss_base2": 2.4204, + "loss_pixel": 0.1743, + "loss_text": 1.5035, + "ppl": 5.3532, + "step": 8005 + }, + { + "epoch": 0.04, + "global_step": 8006, + "learning_rate": 0.00046742070116861435, + "loss": 1.6601, + "loss_base2": 2.395, + "loss_pixel": 0.1732, + "loss_text": 1.4869, + "ppl": 5.2598, + "step": 8006 + }, + { + "epoch": 0.04, + "global_step": 8007, + "learning_rate": 0.00046741652754590985, + "loss": 1.6637, + "loss_base2": 2.4002, + "loss_pixel": 0.1724, + "loss_text": 1.4913, + "ppl": 5.2788, + "step": 8007 + }, + { + "epoch": 0.04, + "global_step": 8008, + "learning_rate": 0.00046741235392320536, + "loss": 1.6725, + "loss_base2": 2.4129, + "loss_pixel": 0.1742, + "loss_text": 1.4983, + "ppl": 5.3255, + "step": 8008 + }, + { + "epoch": 0.04, + "global_step": 8009, + "learning_rate": 0.00046740818030050087, + "loss": 1.6667, + "loss_base2": 2.4045, + "loss_pixel": 0.1727, + "loss_text": 1.494, + "ppl": 5.2947, + "step": 8009 + }, + { + "epoch": 0.04, + "global_step": 8010, + "learning_rate": 0.0004674040066777963, + "loss": 1.6745, + "loss_base2": 2.4158, + "loss_pixel": 0.1741, + "loss_text": 1.5003, + "ppl": 5.3361, + "step": 8010 + }, + { + "epoch": 0.04, + "global_step": 8011, + "learning_rate": 0.00046739983305509183, + "loss": 1.6718, + "loss_base2": 2.4119, + "loss_pixel": 0.1741, + "loss_text": 1.4977, + "ppl": 5.3217, + "step": 8011 + }, + { + "epoch": 0.04, + "global_step": 8012, + "learning_rate": 0.00046739565943238734, + "loss": 1.6473, + "loss_base2": 2.3766, + "loss_pixel": 0.1735, + "loss_text": 1.4738, + "ppl": 5.1929, + "step": 8012 + }, + { + "epoch": 0.04, + "global_step": 8013, + "learning_rate": 0.00046739148580968284, + "loss": 1.6536, + "loss_base2": 2.3856, + "loss_pixel": 0.1723, + "loss_text": 1.4813, + "ppl": 5.2258, + "step": 8013 + }, + { + "epoch": 0.04, + "global_step": 8014, + "learning_rate": 0.00046738731218697835, + "loss": 1.6554, + "loss_base2": 2.3882, + "loss_pixel": 0.1721, + "loss_text": 1.4832, + "ppl": 5.2352, + "step": 8014 + }, + { + "epoch": 0.04, + "global_step": 8015, + "learning_rate": 0.0004673831385642738, + "loss": 1.6598, + "loss_base2": 2.3946, + "loss_pixel": 0.1719, + "loss_text": 1.4879, + "ppl": 5.2583, + "step": 8015 + }, + { + "epoch": 0.04, + "global_step": 8016, + "learning_rate": 0.00046737896494156926, + "loss": 1.6538, + "loss_base2": 2.3859, + "loss_pixel": 0.1723, + "loss_text": 1.4815, + "ppl": 5.2268, + "step": 8016 + }, + { + "epoch": 0.04, + "global_step": 8017, + "learning_rate": 0.00046737479131886477, + "loss": 1.6538, + "loss_base2": 2.3859, + "loss_pixel": 0.1723, + "loss_text": 1.4816, + "ppl": 5.2268, + "step": 8017 + }, + { + "epoch": 0.04, + "global_step": 8018, + "learning_rate": 0.00046737061769616027, + "loss": 1.5963, + "loss_base2": 2.303, + "loss_pixel": 0.1712, + "loss_text": 1.4251, + "ppl": 4.9347, + "step": 8018 + }, + { + "epoch": 0.04, + "global_step": 8019, + "learning_rate": 0.0004673664440734557, + "loss": 1.6632, + "loss_base2": 2.3995, + "loss_pixel": 0.1721, + "loss_text": 1.4911, + "ppl": 5.2762, + "step": 8019 + }, + { + "epoch": 0.04, + "global_step": 8020, + "learning_rate": 0.00046736227045075123, + "loss": 1.6574, + "loss_base2": 2.3911, + "loss_pixel": 0.1731, + "loss_text": 1.4843, + "ppl": 5.2457, + "step": 8020 + }, + { + "epoch": 0.04, + "global_step": 8021, + "learning_rate": 0.00046735809682804674, + "loss": 1.6577, + "loss_base2": 2.3916, + "loss_pixel": 0.1728, + "loss_text": 1.4849, + "ppl": 5.2472, + "step": 8021 + }, + { + "epoch": 0.04, + "global_step": 8022, + "learning_rate": 0.00046735392320534225, + "loss": 1.6397, + "loss_base2": 2.3656, + "loss_pixel": 0.1735, + "loss_text": 1.4662, + "ppl": 5.1536, + "step": 8022 + }, + { + "epoch": 0.04, + "global_step": 8023, + "learning_rate": 0.00046734974958263775, + "loss": 1.6592, + "loss_base2": 2.3937, + "loss_pixel": 0.1733, + "loss_text": 1.4858, + "ppl": 5.2551, + "step": 8023 + }, + { + "epoch": 0.04, + "global_step": 8024, + "learning_rate": 0.0004673455759599332, + "loss": 1.6265, + "loss_base2": 2.3465, + "loss_pixel": 0.1735, + "loss_text": 1.453, + "ppl": 5.086, + "step": 8024 + }, + { + "epoch": 0.04, + "global_step": 8025, + "learning_rate": 0.0004673414023372287, + "loss": 1.6562, + "loss_base2": 2.3894, + "loss_pixel": 0.1735, + "loss_text": 1.4826, + "ppl": 5.2394, + "step": 8025 + }, + { + "epoch": 0.04, + "global_step": 8026, + "learning_rate": 0.0004673372287145242, + "loss": 1.6585, + "loss_base2": 2.3927, + "loss_pixel": 0.1732, + "loss_text": 1.4853, + "ppl": 5.2514, + "step": 8026 + }, + { + "epoch": 0.04, + "global_step": 8027, + "learning_rate": 0.00046733305509181973, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.1741, + "loss_text": 1.4941, + "ppl": 5.3021, + "step": 8027 + }, + { + "epoch": 0.04, + "global_step": 8028, + "learning_rate": 0.0004673288814691152, + "loss": 1.6786, + "loss_base2": 2.4217, + "loss_pixel": 0.1744, + "loss_text": 1.5042, + "ppl": 5.358, + "step": 8028 + }, + { + "epoch": 0.04, + "global_step": 8029, + "learning_rate": 0.0004673247078464107, + "loss": 1.6697, + "loss_base2": 2.4089, + "loss_pixel": 0.173, + "loss_text": 1.4967, + "ppl": 5.3106, + "step": 8029 + }, + { + "epoch": 0.04, + "global_step": 8030, + "learning_rate": 0.0004673205342237062, + "loss": 1.653, + "loss_base2": 2.3848, + "loss_pixel": 0.173, + "loss_text": 1.48, + "ppl": 5.2226, + "step": 8030 + }, + { + "epoch": 0.04, + "global_step": 8031, + "learning_rate": 0.0004673163606010017, + "loss": 1.6724, + "loss_base2": 2.4128, + "loss_pixel": 0.1757, + "loss_text": 1.4967, + "ppl": 5.3249, + "step": 8031 + }, + { + "epoch": 0.04, + "global_step": 8032, + "learning_rate": 0.0004673121869782972, + "loss": 1.665, + "loss_base2": 2.4021, + "loss_pixel": 0.174, + "loss_text": 1.491, + "ppl": 5.2857, + "step": 8032 + }, + { + "epoch": 0.04, + "global_step": 8033, + "learning_rate": 0.00046730801335559267, + "loss": 1.6496, + "loss_base2": 2.3799, + "loss_pixel": 0.1745, + "loss_text": 1.4751, + "ppl": 5.2049, + "step": 8033 + }, + { + "epoch": 0.04, + "global_step": 8034, + "learning_rate": 0.00046730383973288817, + "loss": 1.6589, + "loss_base2": 2.3933, + "loss_pixel": 0.1727, + "loss_text": 1.4862, + "ppl": 5.2535, + "step": 8034 + }, + { + "epoch": 0.04, + "global_step": 8035, + "learning_rate": 0.0004672996661101836, + "loss": 1.6722, + "loss_base2": 2.4125, + "loss_pixel": 0.1744, + "loss_text": 1.4978, + "ppl": 5.3239, + "step": 8035 + }, + { + "epoch": 0.04, + "global_step": 8036, + "learning_rate": 0.00046729549248747913, + "loss": 1.6645, + "loss_base2": 2.4014, + "loss_pixel": 0.1745, + "loss_text": 1.49, + "ppl": 5.283, + "step": 8036 + }, + { + "epoch": 0.04, + "global_step": 8037, + "learning_rate": 0.00046729131886477464, + "loss": 1.6482, + "loss_base2": 2.3778, + "loss_pixel": 0.1737, + "loss_text": 1.4745, + "ppl": 5.1976, + "step": 8037 + }, + { + "epoch": 0.04, + "global_step": 8038, + "learning_rate": 0.0004672871452420701, + "loss": 1.6516, + "loss_base2": 2.3828, + "loss_pixel": 0.1719, + "loss_text": 1.4798, + "ppl": 5.2153, + "step": 8038 + }, + { + "epoch": 0.04, + "global_step": 8039, + "learning_rate": 0.0004672829716193656, + "loss": 1.6584, + "loss_base2": 2.3926, + "loss_pixel": 0.1739, + "loss_text": 1.4845, + "ppl": 5.2509, + "step": 8039 + }, + { + "epoch": 0.04, + "global_step": 8040, + "learning_rate": 0.0004672787979966611, + "loss": 1.6274, + "loss_base2": 2.3478, + "loss_pixel": 0.1744, + "loss_text": 1.453, + "ppl": 5.0906, + "step": 8040 + }, + { + "epoch": 0.04, + "global_step": 8041, + "learning_rate": 0.0004672746243739566, + "loss": 1.6552, + "loss_base2": 2.3879, + "loss_pixel": 0.1728, + "loss_text": 1.4824, + "ppl": 5.2341, + "step": 8041 + }, + { + "epoch": 0.04, + "global_step": 8042, + "learning_rate": 0.00046727045075125207, + "loss": 1.6646, + "loss_base2": 2.4015, + "loss_pixel": 0.1742, + "loss_text": 1.4904, + "ppl": 5.2836, + "step": 8042 + }, + { + "epoch": 0.04, + "global_step": 8043, + "learning_rate": 0.0004672662771285476, + "loss": 1.6536, + "loss_base2": 2.3856, + "loss_pixel": 0.1742, + "loss_text": 1.4794, + "ppl": 5.2258, + "step": 8043 + }, + { + "epoch": 0.04, + "global_step": 8044, + "learning_rate": 0.0004672621035058431, + "loss": 1.4602, + "loss_base2": 2.1066, + "loss_pixel": 0.1741, + "loss_text": 1.2862, + "ppl": 4.3068, + "step": 8044 + }, + { + "epoch": 0.04, + "global_step": 8045, + "learning_rate": 0.0004672579298831386, + "loss": 1.4282, + "loss_base2": 2.0605, + "loss_pixel": 0.1726, + "loss_text": 1.2556, + "ppl": 4.1712, + "step": 8045 + }, + { + "epoch": 0.04, + "global_step": 8046, + "learning_rate": 0.0004672537562604341, + "loss": 1.4454, + "loss_base2": 2.0853, + "loss_pixel": 0.1736, + "loss_text": 1.2719, + "ppl": 4.2435, + "step": 8046 + }, + { + "epoch": 0.04, + "global_step": 8047, + "learning_rate": 0.00046724958263772955, + "loss": 1.4397, + "loss_base2": 2.077, + "loss_pixel": 0.173, + "loss_text": 1.2667, + "ppl": 4.2194, + "step": 8047 + }, + { + "epoch": 0.04, + "global_step": 8048, + "learning_rate": 0.00046724540901502506, + "loss": 1.4426, + "loss_base2": 2.0812, + "loss_pixel": 0.1735, + "loss_text": 1.2691, + "ppl": 4.2317, + "step": 8048 + }, + { + "epoch": 0.04, + "global_step": 8049, + "learning_rate": 0.00046724123539232057, + "loss": 1.4199, + "loss_base2": 2.0485, + "loss_pixel": 0.1723, + "loss_text": 1.2476, + "ppl": 4.1367, + "step": 8049 + }, + { + "epoch": 0.04, + "global_step": 8050, + "learning_rate": 0.0004672370617696161, + "loss": 1.432, + "loss_base2": 2.0659, + "loss_pixel": 0.171, + "loss_text": 1.261, + "ppl": 4.1871, + "step": 8050 + }, + { + "epoch": 0.05, + "global_step": 8051, + "learning_rate": 0.0004672328881469115, + "loss": 1.4333, + "loss_base2": 2.0678, + "loss_pixel": 0.1727, + "loss_text": 1.2605, + "ppl": 4.1925, + "step": 8051 + }, + { + "epoch": 0.05, + "global_step": 8052, + "learning_rate": 0.00046722871452420703, + "loss": 1.4907, + "loss_base2": 2.1506, + "loss_pixel": 0.1726, + "loss_text": 1.3181, + "ppl": 4.4402, + "step": 8052 + }, + { + "epoch": 0.05, + "global_step": 8053, + "learning_rate": 0.00046722454090150254, + "loss": 1.5958, + "loss_base2": 2.3023, + "loss_pixel": 0.1726, + "loss_text": 1.4232, + "ppl": 4.9323, + "step": 8053 + }, + { + "epoch": 0.05, + "global_step": 8054, + "learning_rate": 0.000467220367278798, + "loss": 1.5072, + "loss_base2": 2.1744, + "loss_pixel": 0.172, + "loss_text": 1.3352, + "ppl": 4.5141, + "step": 8054 + }, + { + "epoch": 0.05, + "global_step": 8055, + "learning_rate": 0.0004672161936560935, + "loss": 1.4305, + "loss_base2": 2.0638, + "loss_pixel": 0.1729, + "loss_text": 1.2576, + "ppl": 4.1808, + "step": 8055 + }, + { + "epoch": 0.05, + "global_step": 8056, + "learning_rate": 0.00046721202003338895, + "loss": 1.4375, + "loss_base2": 2.0739, + "loss_pixel": 0.1712, + "loss_text": 1.2663, + "ppl": 4.2102, + "step": 8056 + }, + { + "epoch": 0.05, + "global_step": 8057, + "learning_rate": 0.00046720784641068446, + "loss": 1.4399, + "loss_base2": 2.0773, + "loss_pixel": 0.1735, + "loss_text": 1.2663, + "ppl": 4.2203, + "step": 8057 + }, + { + "epoch": 0.05, + "global_step": 8058, + "learning_rate": 0.00046720367278797997, + "loss": 1.4405, + "loss_base2": 2.0782, + "loss_pixel": 0.1718, + "loss_text": 1.2687, + "ppl": 4.2228, + "step": 8058 + }, + { + "epoch": 0.05, + "global_step": 8059, + "learning_rate": 0.0004671994991652755, + "loss": 1.4243, + "loss_base2": 2.0548, + "loss_pixel": 0.1721, + "loss_text": 1.2522, + "ppl": 4.1549, + "step": 8059 + }, + { + "epoch": 0.05, + "global_step": 8060, + "learning_rate": 0.00046719532554257093, + "loss": 1.4155, + "loss_base2": 2.0421, + "loss_pixel": 0.1732, + "loss_text": 1.2423, + "ppl": 4.1185, + "step": 8060 + }, + { + "epoch": 0.05, + "global_step": 8061, + "learning_rate": 0.00046719115191986644, + "loss": 1.4394, + "loss_base2": 2.0766, + "loss_pixel": 0.173, + "loss_text": 1.2664, + "ppl": 4.2182, + "step": 8061 + }, + { + "epoch": 0.05, + "global_step": 8062, + "learning_rate": 0.00046718697829716194, + "loss": 1.5521, + "loss_base2": 2.2392, + "loss_pixel": 0.1736, + "loss_text": 1.3785, + "ppl": 4.7214, + "step": 8062 + }, + { + "epoch": 0.05, + "global_step": 8063, + "learning_rate": 0.00046718280467445745, + "loss": 1.6608, + "loss_base2": 2.396, + "loss_pixel": 0.1742, + "loss_text": 1.4866, + "ppl": 5.2635, + "step": 8063 + }, + { + "epoch": 0.05, + "global_step": 8064, + "learning_rate": 0.00046717863105175296, + "loss": 1.6962, + "loss_base2": 2.4471, + "loss_pixel": 0.1735, + "loss_text": 1.5227, + "ppl": 5.4532, + "step": 8064 + }, + { + "epoch": 0.05, + "global_step": 8065, + "learning_rate": 0.0004671744574290484, + "loss": 1.6924, + "loss_base2": 2.4416, + "loss_pixel": 0.1737, + "loss_text": 1.5187, + "ppl": 5.4325, + "step": 8065 + }, + { + "epoch": 0.05, + "global_step": 8066, + "learning_rate": 0.0004671702838063439, + "loss": 1.6959, + "loss_base2": 2.4467, + "loss_pixel": 0.1739, + "loss_text": 1.522, + "ppl": 5.4516, + "step": 8066 + }, + { + "epoch": 0.05, + "global_step": 8067, + "learning_rate": 0.0004671661101836394, + "loss": 1.6642, + "loss_base2": 2.4009, + "loss_pixel": 0.1729, + "loss_text": 1.4914, + "ppl": 5.2814, + "step": 8067 + }, + { + "epoch": 0.05, + "global_step": 8068, + "learning_rate": 0.00046716193656093493, + "loss": 1.6741, + "loss_base2": 2.4152, + "loss_pixel": 0.1734, + "loss_text": 1.5007, + "ppl": 5.334, + "step": 8068 + }, + { + "epoch": 0.05, + "global_step": 8069, + "learning_rate": 0.0004671577629382304, + "loss": 1.664, + "loss_base2": 2.4006, + "loss_pixel": 0.1727, + "loss_text": 1.4912, + "ppl": 5.2804, + "step": 8069 + }, + { + "epoch": 0.05, + "global_step": 8070, + "learning_rate": 0.0004671535893155259, + "loss": 1.6795, + "loss_base2": 2.423, + "loss_pixel": 0.1729, + "loss_text": 1.5066, + "ppl": 5.3629, + "step": 8070 + }, + { + "epoch": 0.05, + "global_step": 8071, + "learning_rate": 0.0004671494156928214, + "loss": 1.664, + "loss_base2": 2.4006, + "loss_pixel": 0.1739, + "loss_text": 1.4901, + "ppl": 5.2804, + "step": 8071 + }, + { + "epoch": 0.05, + "global_step": 8072, + "learning_rate": 0.0004671452420701169, + "loss": 1.6649, + "loss_base2": 2.4019, + "loss_pixel": 0.1747, + "loss_text": 1.4902, + "ppl": 5.2851, + "step": 8072 + }, + { + "epoch": 0.05, + "global_step": 8073, + "learning_rate": 0.00046714106844741236, + "loss": 1.6737, + "loss_base2": 2.4146, + "loss_pixel": 0.1727, + "loss_text": 1.501, + "ppl": 5.3319, + "step": 8073 + }, + { + "epoch": 0.05, + "global_step": 8074, + "learning_rate": 0.0004671368948247078, + "loss": 1.6774, + "loss_base2": 2.42, + "loss_pixel": 0.1731, + "loss_text": 1.5042, + "ppl": 5.3516, + "step": 8074 + }, + { + "epoch": 0.05, + "global_step": 8075, + "learning_rate": 0.0004671327212020033, + "loss": 1.6813, + "loss_base2": 2.4256, + "loss_pixel": 0.1728, + "loss_text": 1.5085, + "ppl": 5.3725, + "step": 8075 + }, + { + "epoch": 0.05, + "global_step": 8076, + "learning_rate": 0.00046712854757929883, + "loss": 1.6665, + "loss_base2": 2.4043, + "loss_pixel": 0.1731, + "loss_text": 1.4934, + "ppl": 5.2936, + "step": 8076 + }, + { + "epoch": 0.05, + "global_step": 8077, + "learning_rate": 0.00046712437395659434, + "loss": 1.6727, + "loss_base2": 2.4132, + "loss_pixel": 0.1724, + "loss_text": 1.5002, + "ppl": 5.3265, + "step": 8077 + }, + { + "epoch": 0.05, + "global_step": 8078, + "learning_rate": 0.0004671202003338898, + "loss": 1.665, + "loss_base2": 2.4021, + "loss_pixel": 0.1731, + "loss_text": 1.4919, + "ppl": 5.2857, + "step": 8078 + }, + { + "epoch": 0.05, + "global_step": 8079, + "learning_rate": 0.0004671160267111853, + "loss": 1.6498, + "loss_base2": 2.3802, + "loss_pixel": 0.1729, + "loss_text": 1.4769, + "ppl": 5.2059, + "step": 8079 + }, + { + "epoch": 0.05, + "global_step": 8080, + "learning_rate": 0.0004671118530884808, + "loss": 1.6521, + "loss_base2": 2.3835, + "loss_pixel": 0.1734, + "loss_text": 1.4787, + "ppl": 5.2179, + "step": 8080 + }, + { + "epoch": 0.05, + "global_step": 8081, + "learning_rate": 0.0004671076794657763, + "loss": 1.6628, + "loss_base2": 2.3989, + "loss_pixel": 0.1729, + "loss_text": 1.4899, + "ppl": 5.2741, + "step": 8081 + }, + { + "epoch": 0.05, + "global_step": 8082, + "learning_rate": 0.0004671035058430718, + "loss": 1.667, + "loss_base2": 2.405, + "loss_pixel": 0.1721, + "loss_text": 1.4949, + "ppl": 5.2963, + "step": 8082 + }, + { + "epoch": 0.05, + "global_step": 8083, + "learning_rate": 0.00046709933222036727, + "loss": 1.6692, + "loss_base2": 2.4081, + "loss_pixel": 0.174, + "loss_text": 1.4952, + "ppl": 5.3079, + "step": 8083 + }, + { + "epoch": 0.05, + "global_step": 8084, + "learning_rate": 0.0004670951585976628, + "loss": 1.6647, + "loss_base2": 2.4017, + "loss_pixel": 0.1728, + "loss_text": 1.4919, + "ppl": 5.2841, + "step": 8084 + }, + { + "epoch": 0.05, + "global_step": 8085, + "learning_rate": 0.0004670909849749583, + "loss": 1.6582, + "loss_base2": 2.3923, + "loss_pixel": 0.177, + "loss_text": 1.4812, + "ppl": 5.2499, + "step": 8085 + }, + { + "epoch": 0.05, + "global_step": 8086, + "learning_rate": 0.0004670868113522538, + "loss": 1.6769, + "loss_base2": 2.4193, + "loss_pixel": 0.1736, + "loss_text": 1.5033, + "ppl": 5.3489, + "step": 8086 + }, + { + "epoch": 0.05, + "global_step": 8087, + "learning_rate": 0.00046708263772954925, + "loss": 1.6659, + "loss_base2": 2.4034, + "loss_pixel": 0.1746, + "loss_text": 1.4913, + "ppl": 5.2904, + "step": 8087 + }, + { + "epoch": 0.05, + "global_step": 8088, + "learning_rate": 0.00046707846410684475, + "loss": 1.6664, + "loss_base2": 2.4041, + "loss_pixel": 0.1757, + "loss_text": 1.4907, + "ppl": 5.2931, + "step": 8088 + }, + { + "epoch": 0.05, + "global_step": 8089, + "learning_rate": 0.00046707429048414026, + "loss": 1.6591, + "loss_base2": 2.3936, + "loss_pixel": 0.172, + "loss_text": 1.4871, + "ppl": 5.2546, + "step": 8089 + }, + { + "epoch": 0.05, + "global_step": 8090, + "learning_rate": 0.00046707011686143577, + "loss": 1.6563, + "loss_base2": 2.3895, + "loss_pixel": 0.1725, + "loss_text": 1.4838, + "ppl": 5.2399, + "step": 8090 + }, + { + "epoch": 0.05, + "global_step": 8091, + "learning_rate": 0.0004670659432387313, + "loss": 1.6713, + "loss_base2": 2.4112, + "loss_pixel": 0.1726, + "loss_text": 1.4987, + "ppl": 5.3191, + "step": 8091 + }, + { + "epoch": 0.05, + "global_step": 8092, + "learning_rate": 0.0004670617696160267, + "loss": 1.664, + "loss_base2": 2.4006, + "loss_pixel": 0.1722, + "loss_text": 1.4917, + "ppl": 5.2804, + "step": 8092 + }, + { + "epoch": 0.05, + "global_step": 8093, + "learning_rate": 0.0004670575959933222, + "loss": 1.6431, + "loss_base2": 2.3705, + "loss_pixel": 0.1733, + "loss_text": 1.4698, + "ppl": 5.1712, + "step": 8093 + }, + { + "epoch": 0.05, + "global_step": 8094, + "learning_rate": 0.0004670534223706177, + "loss": 1.661, + "loss_base2": 2.3963, + "loss_pixel": 0.1752, + "loss_text": 1.4858, + "ppl": 5.2646, + "step": 8094 + }, + { + "epoch": 0.05, + "global_step": 8095, + "learning_rate": 0.0004670492487479132, + "loss": 1.6496, + "loss_base2": 2.3799, + "loss_pixel": 0.1741, + "loss_text": 1.4755, + "ppl": 5.2049, + "step": 8095 + }, + { + "epoch": 0.05, + "global_step": 8096, + "learning_rate": 0.0004670450751252087, + "loss": 1.6643, + "loss_base2": 2.4011, + "loss_pixel": 0.1724, + "loss_text": 1.4919, + "ppl": 5.282, + "step": 8096 + }, + { + "epoch": 0.05, + "global_step": 8097, + "learning_rate": 0.00046704090150250416, + "loss": 1.6668, + "loss_base2": 2.4047, + "loss_pixel": 0.1722, + "loss_text": 1.4945, + "ppl": 5.2952, + "step": 8097 + }, + { + "epoch": 0.05, + "global_step": 8098, + "learning_rate": 0.00046703672787979967, + "loss": 1.6679, + "loss_base2": 2.4063, + "loss_pixel": 0.1722, + "loss_text": 1.4957, + "ppl": 5.301, + "step": 8098 + }, + { + "epoch": 0.05, + "global_step": 8099, + "learning_rate": 0.00046703255425709517, + "loss": 1.6595, + "loss_base2": 2.3942, + "loss_pixel": 0.1732, + "loss_text": 1.4863, + "ppl": 5.2567, + "step": 8099 + }, + { + "epoch": 0.05, + "global_step": 8100, + "learning_rate": 0.0004670283806343907, + "loss": 1.6657, + "loss_base2": 2.4031, + "loss_pixel": 0.1732, + "loss_text": 1.4925, + "ppl": 5.2894, + "step": 8100 + }, + { + "epoch": 0.05, + "global_step": 8101, + "learning_rate": 0.00046702420701168613, + "loss": 1.6489, + "loss_base2": 2.3789, + "loss_pixel": 0.1731, + "loss_text": 1.4758, + "ppl": 5.2013, + "step": 8101 + }, + { + "epoch": 0.05, + "global_step": 8102, + "learning_rate": 0.00046702003338898164, + "loss": 1.6679, + "loss_base2": 2.4063, + "loss_pixel": 0.1732, + "loss_text": 1.4946, + "ppl": 5.301, + "step": 8102 + }, + { + "epoch": 0.05, + "global_step": 8103, + "learning_rate": 0.00046701585976627715, + "loss": 1.6543, + "loss_base2": 2.3867, + "loss_pixel": 0.1717, + "loss_text": 1.4826, + "ppl": 5.2294, + "step": 8103 + }, + { + "epoch": 0.05, + "global_step": 8104, + "learning_rate": 0.00046701168614357266, + "loss": 1.6576, + "loss_base2": 2.3914, + "loss_pixel": 0.172, + "loss_text": 1.4856, + "ppl": 5.2467, + "step": 8104 + }, + { + "epoch": 0.05, + "global_step": 8105, + "learning_rate": 0.00046700751252086816, + "loss": 1.6553, + "loss_base2": 2.3881, + "loss_pixel": 0.1716, + "loss_text": 1.4837, + "ppl": 5.2347, + "step": 8105 + }, + { + "epoch": 0.05, + "global_step": 8106, + "learning_rate": 0.0004670033388981636, + "loss": 1.6588, + "loss_base2": 2.3931, + "loss_pixel": 0.1723, + "loss_text": 1.4865, + "ppl": 5.253, + "step": 8106 + }, + { + "epoch": 0.05, + "global_step": 8107, + "learning_rate": 0.0004669991652754591, + "loss": 1.6412, + "loss_base2": 2.3678, + "loss_pixel": 0.1724, + "loss_text": 1.4688, + "ppl": 5.1614, + "step": 8107 + }, + { + "epoch": 0.05, + "global_step": 8108, + "learning_rate": 0.00046699499165275463, + "loss": 1.6594, + "loss_base2": 2.394, + "loss_pixel": 0.1725, + "loss_text": 1.4869, + "ppl": 5.2562, + "step": 8108 + }, + { + "epoch": 0.05, + "global_step": 8109, + "learning_rate": 0.00046699081803005014, + "loss": 1.6621, + "loss_base2": 2.3979, + "loss_pixel": 0.1722, + "loss_text": 1.4899, + "ppl": 5.2704, + "step": 8109 + }, + { + "epoch": 0.05, + "global_step": 8110, + "learning_rate": 0.00046698664440734554, + "loss": 1.6563, + "loss_base2": 2.3895, + "loss_pixel": 0.1714, + "loss_text": 1.485, + "ppl": 5.2399, + "step": 8110 + }, + { + "epoch": 0.05, + "global_step": 8111, + "learning_rate": 0.00046698247078464104, + "loss": 1.6535, + "loss_base2": 2.3855, + "loss_pixel": 0.1734, + "loss_text": 1.4801, + "ppl": 5.2252, + "step": 8111 + }, + { + "epoch": 0.05, + "global_step": 8112, + "learning_rate": 0.00046697829716193655, + "loss": 1.6569, + "loss_base2": 2.3904, + "loss_pixel": 0.1718, + "loss_text": 1.4851, + "ppl": 5.243, + "step": 8112 + }, + { + "epoch": 0.05, + "global_step": 8113, + "learning_rate": 0.00046697412353923206, + "loss": 1.6819, + "loss_base2": 2.4265, + "loss_pixel": 0.1729, + "loss_text": 1.509, + "ppl": 5.3758, + "step": 8113 + }, + { + "epoch": 0.05, + "global_step": 8114, + "learning_rate": 0.00046696994991652757, + "loss": 1.654, + "loss_base2": 2.3862, + "loss_pixel": 0.1714, + "loss_text": 1.4825, + "ppl": 5.2278, + "step": 8114 + }, + { + "epoch": 0.05, + "global_step": 8115, + "learning_rate": 0.000466965776293823, + "loss": 1.6633, + "loss_base2": 2.3996, + "loss_pixel": 0.1734, + "loss_text": 1.4899, + "ppl": 5.2767, + "step": 8115 + }, + { + "epoch": 0.05, + "global_step": 8116, + "learning_rate": 0.0004669616026711185, + "loss": 1.6602, + "loss_base2": 2.3952, + "loss_pixel": 0.1713, + "loss_text": 1.4888, + "ppl": 5.2604, + "step": 8116 + }, + { + "epoch": 0.05, + "global_step": 8117, + "learning_rate": 0.00046695742904841403, + "loss": 1.6581, + "loss_base2": 2.3921, + "loss_pixel": 0.1724, + "loss_text": 1.4857, + "ppl": 5.2493, + "step": 8117 + }, + { + "epoch": 0.05, + "global_step": 8118, + "learning_rate": 0.00046695325542570954, + "loss": 1.654, + "loss_base2": 2.3862, + "loss_pixel": 0.1758, + "loss_text": 1.4782, + "ppl": 5.2278, + "step": 8118 + }, + { + "epoch": 0.05, + "global_step": 8119, + "learning_rate": 0.000466949081803005, + "loss": 1.6577, + "loss_base2": 2.3916, + "loss_pixel": 0.1731, + "loss_text": 1.4846, + "ppl": 5.2472, + "step": 8119 + }, + { + "epoch": 0.05, + "global_step": 8120, + "learning_rate": 0.0004669449081803005, + "loss": 1.6565, + "loss_base2": 2.3898, + "loss_pixel": 0.1747, + "loss_text": 1.4819, + "ppl": 5.2409, + "step": 8120 + }, + { + "epoch": 0.05, + "global_step": 8121, + "learning_rate": 0.000466940734557596, + "loss": 1.6639, + "loss_base2": 2.4005, + "loss_pixel": 0.1731, + "loss_text": 1.4908, + "ppl": 5.2799, + "step": 8121 + }, + { + "epoch": 0.05, + "global_step": 8122, + "learning_rate": 0.0004669365609348915, + "loss": 1.6664, + "loss_base2": 2.4041, + "loss_pixel": 0.1737, + "loss_text": 1.4927, + "ppl": 5.2931, + "step": 8122 + }, + { + "epoch": 0.05, + "global_step": 8123, + "learning_rate": 0.000466932387312187, + "loss": 1.6628, + "loss_base2": 2.3989, + "loss_pixel": 0.1718, + "loss_text": 1.491, + "ppl": 5.2741, + "step": 8123 + }, + { + "epoch": 0.05, + "global_step": 8124, + "learning_rate": 0.0004669282136894825, + "loss": 1.6652, + "loss_base2": 2.4024, + "loss_pixel": 0.1709, + "loss_text": 1.4943, + "ppl": 5.2867, + "step": 8124 + }, + { + "epoch": 0.05, + "global_step": 8125, + "learning_rate": 0.000466924040066778, + "loss": 1.6465, + "loss_base2": 2.3754, + "loss_pixel": 0.1724, + "loss_text": 1.4741, + "ppl": 5.1888, + "step": 8125 + }, + { + "epoch": 0.05, + "global_step": 8126, + "learning_rate": 0.0004669198664440735, + "loss": 1.6622, + "loss_base2": 2.398, + "loss_pixel": 0.1708, + "loss_text": 1.4914, + "ppl": 5.2709, + "step": 8126 + }, + { + "epoch": 0.05, + "global_step": 8127, + "learning_rate": 0.000466915692821369, + "loss": 1.6602, + "loss_base2": 2.3952, + "loss_pixel": 0.1719, + "loss_text": 1.4883, + "ppl": 5.2604, + "step": 8127 + }, + { + "epoch": 0.05, + "global_step": 8128, + "learning_rate": 0.00046691151919866445, + "loss": 1.6653, + "loss_base2": 2.4025, + "loss_pixel": 0.1717, + "loss_text": 1.4936, + "ppl": 5.2873, + "step": 8128 + }, + { + "epoch": 0.05, + "global_step": 8129, + "learning_rate": 0.0004669073455759599, + "loss": 1.639, + "loss_base2": 2.3646, + "loss_pixel": 0.1731, + "loss_text": 1.4659, + "ppl": 5.15, + "step": 8129 + }, + { + "epoch": 0.05, + "global_step": 8130, + "learning_rate": 0.0004669031719532554, + "loss": 1.6719, + "loss_base2": 2.412, + "loss_pixel": 0.1709, + "loss_text": 1.501, + "ppl": 5.3223, + "step": 8130 + }, + { + "epoch": 0.05, + "global_step": 8131, + "learning_rate": 0.0004668989983305509, + "loss": 1.6564, + "loss_base2": 2.3897, + "loss_pixel": 0.1715, + "loss_text": 1.4849, + "ppl": 5.2404, + "step": 8131 + }, + { + "epoch": 0.05, + "global_step": 8132, + "learning_rate": 0.0004668948247078464, + "loss": 1.465, + "loss_base2": 2.1135, + "loss_pixel": 0.1726, + "loss_text": 1.2924, + "ppl": 4.3275, + "step": 8132 + }, + { + "epoch": 0.05, + "global_step": 8133, + "learning_rate": 0.0004668906510851419, + "loss": 1.4325, + "loss_base2": 2.0667, + "loss_pixel": 0.1727, + "loss_text": 1.2598, + "ppl": 4.1892, + "step": 8133 + }, + { + "epoch": 0.05, + "global_step": 8134, + "learning_rate": 0.0004668864774624374, + "loss": 1.4399, + "loss_base2": 2.0773, + "loss_pixel": 0.1711, + "loss_text": 1.2688, + "ppl": 4.2203, + "step": 8134 + }, + { + "epoch": 0.05, + "global_step": 8135, + "learning_rate": 0.0004668823038397329, + "loss": 1.43, + "loss_base2": 2.0631, + "loss_pixel": 0.1723, + "loss_text": 1.2577, + "ppl": 4.1787, + "step": 8135 + }, + { + "epoch": 0.05, + "global_step": 8136, + "learning_rate": 0.0004668781302170284, + "loss": 1.425, + "loss_base2": 2.0558, + "loss_pixel": 0.1725, + "loss_text": 1.2525, + "ppl": 4.1579, + "step": 8136 + }, + { + "epoch": 0.05, + "global_step": 8137, + "learning_rate": 0.00046687395659432385, + "loss": 1.4293, + "loss_base2": 2.062, + "loss_pixel": 0.172, + "loss_text": 1.2573, + "ppl": 4.1758, + "step": 8137 + }, + { + "epoch": 0.05, + "global_step": 8138, + "learning_rate": 0.00046686978297161936, + "loss": 1.4408, + "loss_base2": 2.0786, + "loss_pixel": 0.1722, + "loss_text": 1.2686, + "ppl": 4.2241, + "step": 8138 + }, + { + "epoch": 0.05, + "global_step": 8139, + "learning_rate": 0.00046686560934891487, + "loss": 1.5194, + "loss_base2": 2.192, + "loss_pixel": 0.1711, + "loss_text": 1.3483, + "ppl": 4.5695, + "step": 8139 + }, + { + "epoch": 0.05, + "global_step": 8140, + "learning_rate": 0.0004668614357262104, + "loss": 1.587, + "loss_base2": 2.2896, + "loss_pixel": 0.1729, + "loss_text": 1.414, + "ppl": 4.8891, + "step": 8140 + }, + { + "epoch": 0.05, + "global_step": 8141, + "learning_rate": 0.0004668572621035059, + "loss": 1.4876, + "loss_base2": 2.1462, + "loss_pixel": 0.1722, + "loss_text": 1.3154, + "ppl": 4.4265, + "step": 8141 + }, + { + "epoch": 0.05, + "global_step": 8142, + "learning_rate": 0.00046685308848080134, + "loss": 1.4304, + "loss_base2": 2.0636, + "loss_pixel": 0.1742, + "loss_text": 1.2562, + "ppl": 4.1804, + "step": 8142 + }, + { + "epoch": 0.05, + "global_step": 8143, + "learning_rate": 0.00046684891485809684, + "loss": 1.4249, + "loss_base2": 2.0557, + "loss_pixel": 0.1752, + "loss_text": 1.2496, + "ppl": 4.1574, + "step": 8143 + }, + { + "epoch": 0.05, + "global_step": 8144, + "learning_rate": 0.00046684474123539235, + "loss": 1.4267, + "loss_base2": 2.0583, + "loss_pixel": 0.1722, + "loss_text": 1.2545, + "ppl": 4.1649, + "step": 8144 + }, + { + "epoch": 0.05, + "global_step": 8145, + "learning_rate": 0.00046684056761268786, + "loss": 1.4509, + "loss_base2": 2.0932, + "loss_pixel": 0.173, + "loss_text": 1.278, + "ppl": 4.267, + "step": 8145 + }, + { + "epoch": 0.05, + "global_step": 8146, + "learning_rate": 0.0004668363939899833, + "loss": 1.4502, + "loss_base2": 2.0922, + "loss_pixel": 0.173, + "loss_text": 1.2772, + "ppl": 4.264, + "step": 8146 + }, + { + "epoch": 0.05, + "global_step": 8147, + "learning_rate": 0.0004668322203672788, + "loss": 1.4356, + "loss_base2": 2.0711, + "loss_pixel": 0.1733, + "loss_text": 1.2623, + "ppl": 4.2022, + "step": 8147 + }, + { + "epoch": 0.05, + "global_step": 8148, + "learning_rate": 0.00046682804674457427, + "loss": 1.4344, + "loss_base2": 2.0694, + "loss_pixel": 0.1738, + "loss_text": 1.2606, + "ppl": 4.1971, + "step": 8148 + }, + { + "epoch": 0.05, + "global_step": 8149, + "learning_rate": 0.0004668238731218698, + "loss": 1.4456, + "loss_base2": 2.0856, + "loss_pixel": 0.1738, + "loss_text": 1.2718, + "ppl": 4.2444, + "step": 8149 + }, + { + "epoch": 0.05, + "global_step": 8150, + "learning_rate": 0.0004668196994991653, + "loss": 1.4491, + "loss_base2": 2.0906, + "loss_pixel": 0.1743, + "loss_text": 1.2748, + "ppl": 4.2593, + "step": 8150 + }, + { + "epoch": 0.05, + "global_step": 8151, + "learning_rate": 0.00046681552587646074, + "loss": 1.4295, + "loss_base2": 2.0623, + "loss_pixel": 0.1727, + "loss_text": 1.2568, + "ppl": 4.1766, + "step": 8151 + }, + { + "epoch": 0.05, + "global_step": 8152, + "learning_rate": 0.00046681135225375625, + "loss": 1.4439, + "loss_base2": 2.0831, + "loss_pixel": 0.1762, + "loss_text": 1.2677, + "ppl": 4.2372, + "step": 8152 + }, + { + "epoch": 0.05, + "global_step": 8153, + "learning_rate": 0.00046680717863105175, + "loss": 1.4409, + "loss_base2": 2.0788, + "loss_pixel": 0.1718, + "loss_text": 1.2691, + "ppl": 4.2245, + "step": 8153 + }, + { + "epoch": 0.05, + "global_step": 8154, + "learning_rate": 0.00046680300500834726, + "loss": 1.4561, + "loss_base2": 2.1007, + "loss_pixel": 0.1722, + "loss_text": 1.2839, + "ppl": 4.2892, + "step": 8154 + }, + { + "epoch": 0.05, + "global_step": 8155, + "learning_rate": 0.00046679883138564277, + "loss": 1.4351, + "loss_base2": 2.0704, + "loss_pixel": 0.1727, + "loss_text": 1.2624, + "ppl": 4.2001, + "step": 8155 + }, + { + "epoch": 0.05, + "global_step": 8156, + "learning_rate": 0.0004667946577629382, + "loss": 1.5298, + "loss_base2": 2.207, + "loss_pixel": 0.173, + "loss_text": 1.3568, + "ppl": 4.6173, + "step": 8156 + }, + { + "epoch": 0.05, + "global_step": 8157, + "learning_rate": 0.00046679048414023373, + "loss": 1.6883, + "loss_base2": 2.4357, + "loss_pixel": 0.1719, + "loss_text": 1.5164, + "ppl": 5.4103, + "step": 8157 + }, + { + "epoch": 0.05, + "global_step": 8158, + "learning_rate": 0.00046678631051752924, + "loss": 1.6935, + "loss_base2": 2.4432, + "loss_pixel": 0.1731, + "loss_text": 1.5204, + "ppl": 5.4385, + "step": 8158 + }, + { + "epoch": 0.05, + "global_step": 8159, + "learning_rate": 0.00046678213689482474, + "loss": 1.678, + "loss_base2": 2.4208, + "loss_pixel": 0.1721, + "loss_text": 1.5058, + "ppl": 5.3548, + "step": 8159 + }, + { + "epoch": 0.05, + "global_step": 8160, + "learning_rate": 0.0004667779632721202, + "loss": 1.6632, + "loss_base2": 2.3995, + "loss_pixel": 0.1735, + "loss_text": 1.4897, + "ppl": 5.2762, + "step": 8160 + }, + { + "epoch": 0.05, + "global_step": 8161, + "learning_rate": 0.0004667737896494157, + "loss": 1.6835, + "loss_base2": 2.4288, + "loss_pixel": 0.1713, + "loss_text": 1.5121, + "ppl": 5.3844, + "step": 8161 + }, + { + "epoch": 0.05, + "global_step": 8162, + "learning_rate": 0.0004667696160267112, + "loss": 1.6665, + "loss_base2": 2.4043, + "loss_pixel": 0.1716, + "loss_text": 1.495, + "ppl": 5.2936, + "step": 8162 + }, + { + "epoch": 0.05, + "global_step": 8163, + "learning_rate": 0.0004667654424040067, + "loss": 1.6642, + "loss_base2": 2.4009, + "loss_pixel": 0.1736, + "loss_text": 1.4906, + "ppl": 5.2814, + "step": 8163 + }, + { + "epoch": 0.05, + "global_step": 8164, + "learning_rate": 0.0004667612687813022, + "loss": 1.6686, + "loss_base2": 2.4073, + "loss_pixel": 0.1715, + "loss_text": 1.4971, + "ppl": 5.3047, + "step": 8164 + }, + { + "epoch": 0.05, + "global_step": 8165, + "learning_rate": 0.0004667570951585977, + "loss": 1.6725, + "loss_base2": 2.4129, + "loss_pixel": 0.1715, + "loss_text": 1.501, + "ppl": 5.3255, + "step": 8165 + }, + { + "epoch": 0.05, + "global_step": 8166, + "learning_rate": 0.00046675292153589313, + "loss": 1.6443, + "loss_base2": 2.3722, + "loss_pixel": 0.1718, + "loss_text": 1.4725, + "ppl": 5.1774, + "step": 8166 + }, + { + "epoch": 0.05, + "global_step": 8167, + "learning_rate": 0.00046674874791318864, + "loss": 1.6654, + "loss_base2": 2.4027, + "loss_pixel": 0.172, + "loss_text": 1.4934, + "ppl": 5.2878, + "step": 8167 + }, + { + "epoch": 0.05, + "global_step": 8168, + "learning_rate": 0.00046674457429048415, + "loss": 1.6619, + "loss_base2": 2.3976, + "loss_pixel": 0.1727, + "loss_text": 1.4892, + "ppl": 5.2693, + "step": 8168 + }, + { + "epoch": 0.05, + "global_step": 8169, + "learning_rate": 0.0004667404006677796, + "loss": 1.6372, + "loss_base2": 2.362, + "loss_pixel": 0.1708, + "loss_text": 1.4664, + "ppl": 5.1408, + "step": 8169 + }, + { + "epoch": 0.05, + "global_step": 8170, + "learning_rate": 0.0004667362270450751, + "loss": 1.6526, + "loss_base2": 2.3842, + "loss_pixel": 0.173, + "loss_text": 1.4796, + "ppl": 5.2205, + "step": 8170 + }, + { + "epoch": 0.05, + "global_step": 8171, + "learning_rate": 0.0004667320534223706, + "loss": 1.6613, + "loss_base2": 2.3967, + "loss_pixel": 0.1717, + "loss_text": 1.4895, + "ppl": 5.2662, + "step": 8171 + }, + { + "epoch": 0.05, + "global_step": 8172, + "learning_rate": 0.0004667278797996661, + "loss": 1.6699, + "loss_base2": 2.4092, + "loss_pixel": 0.171, + "loss_text": 1.499, + "ppl": 5.3116, + "step": 8172 + }, + { + "epoch": 0.05, + "global_step": 8173, + "learning_rate": 0.00046672370617696163, + "loss": 1.6725, + "loss_base2": 2.4129, + "loss_pixel": 0.1736, + "loss_text": 1.4989, + "ppl": 5.3255, + "step": 8173 + }, + { + "epoch": 0.05, + "global_step": 8174, + "learning_rate": 0.0004667195325542571, + "loss": 1.6694, + "loss_base2": 2.4084, + "loss_pixel": 0.1802, + "loss_text": 1.4891, + "ppl": 5.309, + "step": 8174 + }, + { + "epoch": 0.05, + "global_step": 8175, + "learning_rate": 0.0004667153589315526, + "loss": 1.6755, + "loss_base2": 2.4172, + "loss_pixel": 0.1806, + "loss_text": 1.4949, + "ppl": 5.3415, + "step": 8175 + }, + { + "epoch": 0.05, + "global_step": 8176, + "learning_rate": 0.0004667111853088481, + "loss": 1.6628, + "loss_base2": 2.3989, + "loss_pixel": 0.1739, + "loss_text": 1.4889, + "ppl": 5.2741, + "step": 8176 + }, + { + "epoch": 0.05, + "global_step": 8177, + "learning_rate": 0.0004667070116861436, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.173, + "loss_text": 1.4667, + "ppl": 5.1531, + "step": 8177 + }, + { + "epoch": 0.05, + "global_step": 8178, + "learning_rate": 0.00046670283806343906, + "loss": 1.6418, + "loss_base2": 2.3686, + "loss_pixel": 0.1721, + "loss_text": 1.4698, + "ppl": 5.1645, + "step": 8178 + }, + { + "epoch": 0.05, + "global_step": 8179, + "learning_rate": 0.00046669866444073457, + "loss": 1.6672, + "loss_base2": 2.4053, + "loss_pixel": 0.1719, + "loss_text": 1.4954, + "ppl": 5.2973, + "step": 8179 + }, + { + "epoch": 0.05, + "global_step": 8180, + "learning_rate": 0.0004666944908180301, + "loss": 1.6666, + "loss_base2": 2.4044, + "loss_pixel": 0.1714, + "loss_text": 1.4953, + "ppl": 5.2941, + "step": 8180 + }, + { + "epoch": 0.05, + "global_step": 8181, + "learning_rate": 0.0004666903171953256, + "loss": 1.6609, + "loss_base2": 2.3962, + "loss_pixel": 0.1718, + "loss_text": 1.4891, + "ppl": 5.264, + "step": 8181 + }, + { + "epoch": 0.05, + "global_step": 8182, + "learning_rate": 0.0004666861435726211, + "loss": 1.5583, + "loss_base2": 2.2482, + "loss_pixel": 0.1721, + "loss_text": 1.3862, + "ppl": 4.7507, + "step": 8182 + }, + { + "epoch": 0.05, + "global_step": 8183, + "learning_rate": 0.00046668196994991654, + "loss": 1.4547, + "loss_base2": 2.0987, + "loss_pixel": 0.1713, + "loss_text": 1.2834, + "ppl": 4.2832, + "step": 8183 + }, + { + "epoch": 0.05, + "global_step": 8184, + "learning_rate": 0.00046667779632721205, + "loss": 1.4315, + "loss_base2": 2.0652, + "loss_pixel": 0.1723, + "loss_text": 1.2592, + "ppl": 4.185, + "step": 8184 + }, + { + "epoch": 0.05, + "global_step": 8185, + "learning_rate": 0.0004666736227045075, + "loss": 1.422, + "loss_base2": 2.0515, + "loss_pixel": 0.1729, + "loss_text": 1.2491, + "ppl": 4.1454, + "step": 8185 + }, + { + "epoch": 0.05, + "global_step": 8186, + "learning_rate": 0.000466669449081803, + "loss": 1.4383, + "loss_base2": 2.075, + "loss_pixel": 0.173, + "loss_text": 1.2653, + "ppl": 4.2135, + "step": 8186 + }, + { + "epoch": 0.05, + "global_step": 8187, + "learning_rate": 0.00046666527545909846, + "loss": 1.4355, + "loss_base2": 2.071, + "loss_pixel": 0.1726, + "loss_text": 1.2628, + "ppl": 4.2017, + "step": 8187 + }, + { + "epoch": 0.05, + "global_step": 8188, + "learning_rate": 0.00046666110183639397, + "loss": 1.4182, + "loss_base2": 2.046, + "loss_pixel": 0.1718, + "loss_text": 1.2464, + "ppl": 4.1297, + "step": 8188 + }, + { + "epoch": 0.05, + "global_step": 8189, + "learning_rate": 0.0004666569282136895, + "loss": 1.4289, + "loss_base2": 2.0615, + "loss_pixel": 0.1726, + "loss_text": 1.2563, + "ppl": 4.1741, + "step": 8189 + }, + { + "epoch": 0.05, + "global_step": 8190, + "learning_rate": 0.000466652754590985, + "loss": 1.511, + "loss_base2": 2.1799, + "loss_pixel": 0.1748, + "loss_text": 1.3362, + "ppl": 4.5313, + "step": 8190 + }, + { + "epoch": 0.05, + "global_step": 8191, + "learning_rate": 0.0004666485809682805, + "loss": 1.6862, + "loss_base2": 2.4327, + "loss_pixel": 0.1721, + "loss_text": 1.5141, + "ppl": 5.3989, + "step": 8191 + }, + { + "epoch": 0.05, + "global_step": 8192, + "learning_rate": 0.00046664440734557594, + "loss": 1.6799, + "loss_base2": 2.4236, + "loss_pixel": 0.1723, + "loss_text": 1.5076, + "ppl": 5.365, + "step": 8192 + }, + { + "epoch": 0.05, + "global_step": 8193, + "learning_rate": 0.00046664023372287145, + "loss": 1.682, + "loss_base2": 2.4266, + "loss_pixel": 0.1713, + "loss_text": 1.5107, + "ppl": 5.3763, + "step": 8193 + }, + { + "epoch": 0.05, + "global_step": 8194, + "learning_rate": 0.00046663606010016696, + "loss": 1.6721, + "loss_base2": 2.4123, + "loss_pixel": 0.172, + "loss_text": 1.5002, + "ppl": 5.3233, + "step": 8194 + }, + { + "epoch": 0.05, + "global_step": 8195, + "learning_rate": 0.00046663188647746247, + "loss": 1.6566, + "loss_base2": 2.39, + "loss_pixel": 0.1722, + "loss_text": 1.4843, + "ppl": 5.2415, + "step": 8195 + }, + { + "epoch": 0.05, + "global_step": 8196, + "learning_rate": 0.0004666277128547579, + "loss": 1.6715, + "loss_base2": 2.4115, + "loss_pixel": 0.1731, + "loss_text": 1.4984, + "ppl": 5.3201, + "step": 8196 + }, + { + "epoch": 0.05, + "global_step": 8197, + "learning_rate": 0.0004666235392320534, + "loss": 1.6548, + "loss_base2": 2.3874, + "loss_pixel": 0.1714, + "loss_text": 1.4833, + "ppl": 5.232, + "step": 8197 + }, + { + "epoch": 0.05, + "global_step": 8198, + "learning_rate": 0.00046661936560934893, + "loss": 1.6397, + "loss_base2": 2.3656, + "loss_pixel": 0.1716, + "loss_text": 1.4681, + "ppl": 5.1536, + "step": 8198 + }, + { + "epoch": 0.05, + "global_step": 8199, + "learning_rate": 0.00046661519198664444, + "loss": 1.6776, + "loss_base2": 2.4203, + "loss_pixel": 0.1713, + "loss_text": 1.5064, + "ppl": 5.3527, + "step": 8199 + }, + { + "epoch": 0.05, + "global_step": 8200, + "learning_rate": 0.00046661101836393995, + "loss": 1.6665, + "loss_base2": 2.4043, + "loss_pixel": 0.1721, + "loss_text": 1.4944, + "ppl": 5.2936, + "step": 8200 + }, + { + "epoch": 0.05, + "global_step": 8201, + "learning_rate": 0.0004666068447412354, + "loss": 1.6595, + "loss_base2": 2.3942, + "loss_pixel": 0.1717, + "loss_text": 1.4878, + "ppl": 5.2567, + "step": 8201 + }, + { + "epoch": 0.05, + "global_step": 8202, + "learning_rate": 0.0004666026711185309, + "loss": 1.6597, + "loss_base2": 2.3944, + "loss_pixel": 0.1712, + "loss_text": 1.4885, + "ppl": 5.2577, + "step": 8202 + }, + { + "epoch": 0.05, + "global_step": 8203, + "learning_rate": 0.0004665984974958264, + "loss": 1.6569, + "loss_base2": 2.3904, + "loss_pixel": 0.1718, + "loss_text": 1.4851, + "ppl": 5.243, + "step": 8203 + }, + { + "epoch": 0.05, + "global_step": 8204, + "learning_rate": 0.00046659432387312187, + "loss": 1.6546, + "loss_base2": 2.3871, + "loss_pixel": 0.1712, + "loss_text": 1.4834, + "ppl": 5.231, + "step": 8204 + }, + { + "epoch": 0.05, + "global_step": 8205, + "learning_rate": 0.0004665901502504173, + "loss": 1.6542, + "loss_base2": 2.3865, + "loss_pixel": 0.171, + "loss_text": 1.4832, + "ppl": 5.2289, + "step": 8205 + }, + { + "epoch": 0.05, + "global_step": 8206, + "learning_rate": 0.00046658597662771283, + "loss": 1.6721, + "loss_base2": 2.4123, + "loss_pixel": 0.1714, + "loss_text": 1.5007, + "ppl": 5.3233, + "step": 8206 + }, + { + "epoch": 0.05, + "global_step": 8207, + "learning_rate": 0.00046658180300500834, + "loss": 1.6686, + "loss_base2": 2.4073, + "loss_pixel": 0.1717, + "loss_text": 1.4969, + "ppl": 5.3047, + "step": 8207 + }, + { + "epoch": 0.05, + "global_step": 8208, + "learning_rate": 0.00046657762938230384, + "loss": 1.6646, + "loss_base2": 2.4015, + "loss_pixel": 0.1714, + "loss_text": 1.4932, + "ppl": 5.2836, + "step": 8208 + }, + { + "epoch": 0.05, + "global_step": 8209, + "learning_rate": 0.00046657345575959935, + "loss": 1.6606, + "loss_base2": 2.3957, + "loss_pixel": 0.1734, + "loss_text": 1.4871, + "ppl": 5.2625, + "step": 8209 + }, + { + "epoch": 0.05, + "global_step": 8210, + "learning_rate": 0.0004665692821368948, + "loss": 1.6506, + "loss_base2": 2.3813, + "loss_pixel": 0.1711, + "loss_text": 1.4794, + "ppl": 5.2101, + "step": 8210 + }, + { + "epoch": 0.05, + "global_step": 8211, + "learning_rate": 0.0004665651085141903, + "loss": 1.666, + "loss_base2": 2.4035, + "loss_pixel": 0.1718, + "loss_text": 1.4942, + "ppl": 5.291, + "step": 8211 + }, + { + "epoch": 0.05, + "global_step": 8212, + "learning_rate": 0.0004665609348914858, + "loss": 1.6404, + "loss_base2": 2.3666, + "loss_pixel": 0.1709, + "loss_text": 1.4694, + "ppl": 5.1572, + "step": 8212 + }, + { + "epoch": 0.05, + "global_step": 8213, + "learning_rate": 0.0004665567612687813, + "loss": 1.6714, + "loss_base2": 2.4113, + "loss_pixel": 0.1707, + "loss_text": 1.5007, + "ppl": 5.3196, + "step": 8213 + }, + { + "epoch": 0.05, + "global_step": 8214, + "learning_rate": 0.00046655258764607683, + "loss": 1.6619, + "loss_base2": 2.3976, + "loss_pixel": 0.1709, + "loss_text": 1.491, + "ppl": 5.2693, + "step": 8214 + }, + { + "epoch": 0.05, + "global_step": 8215, + "learning_rate": 0.0004665484140233723, + "loss": 1.4879, + "loss_base2": 2.1466, + "loss_pixel": 0.173, + "loss_text": 1.3149, + "ppl": 4.4278, + "step": 8215 + }, + { + "epoch": 0.05, + "global_step": 8216, + "learning_rate": 0.0004665442404006678, + "loss": 1.4436, + "loss_base2": 2.0827, + "loss_pixel": 0.1713, + "loss_text": 1.2722, + "ppl": 4.2359, + "step": 8216 + }, + { + "epoch": 0.05, + "global_step": 8217, + "learning_rate": 0.0004665400667779633, + "loss": 1.4329, + "loss_base2": 2.0672, + "loss_pixel": 0.1714, + "loss_text": 1.2616, + "ppl": 4.1908, + "step": 8217 + }, + { + "epoch": 0.05, + "global_step": 8218, + "learning_rate": 0.0004665358931552588, + "loss": 1.4242, + "loss_base2": 2.0547, + "loss_pixel": 0.171, + "loss_text": 1.2533, + "ppl": 4.1545, + "step": 8218 + }, + { + "epoch": 0.05, + "global_step": 8219, + "learning_rate": 0.00046653171953255426, + "loss": 1.4274, + "loss_base2": 2.0593, + "loss_pixel": 0.1713, + "loss_text": 1.2561, + "ppl": 4.1678, + "step": 8219 + }, + { + "epoch": 0.05, + "global_step": 8220, + "learning_rate": 0.00046652754590984977, + "loss": 1.426, + "loss_base2": 2.0573, + "loss_pixel": 0.1715, + "loss_text": 1.2544, + "ppl": 4.162, + "step": 8220 + }, + { + "epoch": 0.05, + "global_step": 8221, + "learning_rate": 0.0004665233722871453, + "loss": 1.4259, + "loss_base2": 2.0571, + "loss_pixel": 0.1713, + "loss_text": 1.2547, + "ppl": 4.1616, + "step": 8221 + }, + { + "epoch": 0.05, + "global_step": 8222, + "learning_rate": 0.0004665191986644408, + "loss": 1.416, + "loss_base2": 2.0429, + "loss_pixel": 0.1704, + "loss_text": 1.2456, + "ppl": 4.1206, + "step": 8222 + }, + { + "epoch": 0.05, + "global_step": 8223, + "learning_rate": 0.00046651502504173624, + "loss": 1.5045, + "loss_base2": 2.1705, + "loss_pixel": 0.1698, + "loss_text": 1.3347, + "ppl": 4.5019, + "step": 8223 + }, + { + "epoch": 0.05, + "global_step": 8224, + "learning_rate": 0.0004665108514190317, + "loss": 1.6405, + "loss_base2": 2.3667, + "loss_pixel": 0.1734, + "loss_text": 1.4671, + "ppl": 5.1577, + "step": 8224 + }, + { + "epoch": 0.05, + "global_step": 8225, + "learning_rate": 0.0004665066777963272, + "loss": 1.6572, + "loss_base2": 2.3908, + "loss_pixel": 0.1712, + "loss_text": 1.486, + "ppl": 5.2446, + "step": 8225 + }, + { + "epoch": 0.05, + "global_step": 8226, + "learning_rate": 0.0004665025041736227, + "loss": 1.6772, + "loss_base2": 2.4197, + "loss_pixel": 0.1692, + "loss_text": 1.508, + "ppl": 5.3506, + "step": 8226 + }, + { + "epoch": 0.05, + "global_step": 8227, + "learning_rate": 0.0004664983305509182, + "loss": 1.6815, + "loss_base2": 2.4259, + "loss_pixel": 0.1707, + "loss_text": 1.5108, + "ppl": 5.3736, + "step": 8227 + }, + { + "epoch": 0.05, + "global_step": 8228, + "learning_rate": 0.00046649415692821367, + "loss": 1.6783, + "loss_base2": 2.4213, + "loss_pixel": 0.1704, + "loss_text": 1.5079, + "ppl": 5.3564, + "step": 8228 + }, + { + "epoch": 0.05, + "global_step": 8229, + "learning_rate": 0.00046648998330550917, + "loss": 1.6616, + "loss_base2": 2.3972, + "loss_pixel": 0.1713, + "loss_text": 1.4903, + "ppl": 5.2677, + "step": 8229 + }, + { + "epoch": 0.05, + "global_step": 8230, + "learning_rate": 0.0004664858096828047, + "loss": 1.6594, + "loss_base2": 2.394, + "loss_pixel": 0.1719, + "loss_text": 1.4875, + "ppl": 5.2562, + "step": 8230 + }, + { + "epoch": 0.05, + "global_step": 8231, + "learning_rate": 0.0004664816360601002, + "loss": 1.6647, + "loss_base2": 2.4017, + "loss_pixel": 0.1724, + "loss_text": 1.4923, + "ppl": 5.2841, + "step": 8231 + }, + { + "epoch": 0.05, + "global_step": 8232, + "learning_rate": 0.0004664774624373957, + "loss": 1.6713, + "loss_base2": 2.4112, + "loss_pixel": 0.1716, + "loss_text": 1.4997, + "ppl": 5.3191, + "step": 8232 + }, + { + "epoch": 0.05, + "global_step": 8233, + "learning_rate": 0.00046647328881469115, + "loss": 1.6761, + "loss_base2": 2.4181, + "loss_pixel": 0.1714, + "loss_text": 1.5047, + "ppl": 5.3447, + "step": 8233 + }, + { + "epoch": 0.05, + "global_step": 8234, + "learning_rate": 0.00046646911519198666, + "loss": 1.662, + "loss_base2": 2.3978, + "loss_pixel": 0.1705, + "loss_text": 1.4915, + "ppl": 5.2698, + "step": 8234 + }, + { + "epoch": 0.05, + "global_step": 8235, + "learning_rate": 0.00046646494156928216, + "loss": 1.6697, + "loss_base2": 2.4089, + "loss_pixel": 0.17, + "loss_text": 1.4996, + "ppl": 5.3106, + "step": 8235 + }, + { + "epoch": 0.05, + "global_step": 8236, + "learning_rate": 0.00046646076794657767, + "loss": 1.6475, + "loss_base2": 2.3768, + "loss_pixel": 0.17, + "loss_text": 1.4775, + "ppl": 5.194, + "step": 8236 + }, + { + "epoch": 0.05, + "global_step": 8237, + "learning_rate": 0.0004664565943238731, + "loss": 1.6579, + "loss_base2": 2.3918, + "loss_pixel": 0.1715, + "loss_text": 1.4864, + "ppl": 5.2483, + "step": 8237 + }, + { + "epoch": 0.05, + "global_step": 8238, + "learning_rate": 0.00046645242070116863, + "loss": 1.6698, + "loss_base2": 2.409, + "loss_pixel": 0.1702, + "loss_text": 1.4996, + "ppl": 5.3111, + "step": 8238 + }, + { + "epoch": 0.05, + "global_step": 8239, + "learning_rate": 0.00046644824707846414, + "loss": 1.6521, + "loss_base2": 2.3835, + "loss_pixel": 0.1698, + "loss_text": 1.4823, + "ppl": 5.2179, + "step": 8239 + }, + { + "epoch": 0.05, + "global_step": 8240, + "learning_rate": 0.00046644407345575964, + "loss": 1.6632, + "loss_base2": 2.3995, + "loss_pixel": 0.1705, + "loss_text": 1.4927, + "ppl": 5.2762, + "step": 8240 + }, + { + "epoch": 0.05, + "global_step": 8241, + "learning_rate": 0.00046643989983305515, + "loss": 1.6602, + "loss_base2": 2.3952, + "loss_pixel": 0.1714, + "loss_text": 1.4889, + "ppl": 5.2604, + "step": 8241 + }, + { + "epoch": 0.05, + "global_step": 8242, + "learning_rate": 0.00046643572621035055, + "loss": 1.6527, + "loss_base2": 2.3843, + "loss_pixel": 0.1721, + "loss_text": 1.4807, + "ppl": 5.2211, + "step": 8242 + }, + { + "epoch": 0.05, + "global_step": 8243, + "learning_rate": 0.00046643155258764606, + "loss": 1.6511, + "loss_base2": 2.382, + "loss_pixel": 0.1718, + "loss_text": 1.4793, + "ppl": 5.2127, + "step": 8243 + }, + { + "epoch": 0.05, + "global_step": 8244, + "learning_rate": 0.00046642737896494157, + "loss": 1.6664, + "loss_base2": 2.4041, + "loss_pixel": 0.171, + "loss_text": 1.4955, + "ppl": 5.2931, + "step": 8244 + }, + { + "epoch": 0.05, + "global_step": 8245, + "learning_rate": 0.00046642320534223707, + "loss": 1.6463, + "loss_base2": 2.3751, + "loss_pixel": 0.1704, + "loss_text": 1.4758, + "ppl": 5.1877, + "step": 8245 + }, + { + "epoch": 0.05, + "global_step": 8246, + "learning_rate": 0.0004664190317195325, + "loss": 1.6726, + "loss_base2": 2.4131, + "loss_pixel": 0.1712, + "loss_text": 1.5014, + "ppl": 5.326, + "step": 8246 + }, + { + "epoch": 0.05, + "global_step": 8247, + "learning_rate": 0.00046641485809682803, + "loss": 1.6657, + "loss_base2": 2.4031, + "loss_pixel": 0.1718, + "loss_text": 1.494, + "ppl": 5.2894, + "step": 8247 + }, + { + "epoch": 0.05, + "global_step": 8248, + "learning_rate": 0.00046641068447412354, + "loss": 1.6588, + "loss_base2": 2.3931, + "loss_pixel": 0.1715, + "loss_text": 1.4873, + "ppl": 5.253, + "step": 8248 + }, + { + "epoch": 0.05, + "global_step": 8249, + "learning_rate": 0.00046640651085141905, + "loss": 1.6473, + "loss_base2": 2.3766, + "loss_pixel": 0.1707, + "loss_text": 1.4766, + "ppl": 5.1929, + "step": 8249 + }, + { + "epoch": 0.05, + "global_step": 8250, + "learning_rate": 0.00046640233722871456, + "loss": 1.6431, + "loss_base2": 2.3705, + "loss_pixel": 0.1708, + "loss_text": 1.4722, + "ppl": 5.1712, + "step": 8250 + }, + { + "epoch": 0.05, + "global_step": 8251, + "learning_rate": 0.00046639816360601, + "loss": 1.657, + "loss_base2": 2.3905, + "loss_pixel": 0.172, + "loss_text": 1.4849, + "ppl": 5.2436, + "step": 8251 + }, + { + "epoch": 0.05, + "global_step": 8252, + "learning_rate": 0.0004663939899833055, + "loss": 1.6549, + "loss_base2": 2.3875, + "loss_pixel": 0.171, + "loss_text": 1.4838, + "ppl": 5.2326, + "step": 8252 + }, + { + "epoch": 0.05, + "global_step": 8253, + "learning_rate": 0.000466389816360601, + "loss": 1.6705, + "loss_base2": 2.41, + "loss_pixel": 0.1724, + "loss_text": 1.4982, + "ppl": 5.3148, + "step": 8253 + }, + { + "epoch": 0.05, + "global_step": 8254, + "learning_rate": 0.00046638564273789653, + "loss": 1.6578, + "loss_base2": 2.3917, + "loss_pixel": 0.1705, + "loss_text": 1.4873, + "ppl": 5.2478, + "step": 8254 + }, + { + "epoch": 0.05, + "global_step": 8255, + "learning_rate": 0.000466381469115192, + "loss": 1.6447, + "loss_base2": 2.3728, + "loss_pixel": 0.1705, + "loss_text": 1.4741, + "ppl": 5.1795, + "step": 8255 + }, + { + "epoch": 0.05, + "global_step": 8256, + "learning_rate": 0.0004663772954924875, + "loss": 1.668, + "loss_base2": 2.4064, + "loss_pixel": 0.1712, + "loss_text": 1.4968, + "ppl": 5.3016, + "step": 8256 + }, + { + "epoch": 0.05, + "global_step": 8257, + "learning_rate": 0.000466373121869783, + "loss": 1.6467, + "loss_base2": 2.3757, + "loss_pixel": 0.1713, + "loss_text": 1.4754, + "ppl": 5.1898, + "step": 8257 + }, + { + "epoch": 0.05, + "global_step": 8258, + "learning_rate": 0.0004663689482470785, + "loss": 1.6487, + "loss_base2": 2.3786, + "loss_pixel": 0.1719, + "loss_text": 1.4769, + "ppl": 5.2002, + "step": 8258 + }, + { + "epoch": 0.05, + "global_step": 8259, + "learning_rate": 0.000466364774624374, + "loss": 1.6515, + "loss_base2": 2.3826, + "loss_pixel": 0.171, + "loss_text": 1.4805, + "ppl": 5.2148, + "step": 8259 + }, + { + "epoch": 0.05, + "global_step": 8260, + "learning_rate": 0.0004663606010016694, + "loss": 1.6741, + "loss_base2": 2.4152, + "loss_pixel": 0.172, + "loss_text": 1.5021, + "ppl": 5.334, + "step": 8260 + }, + { + "epoch": 0.05, + "global_step": 8261, + "learning_rate": 0.0004663564273789649, + "loss": 1.6561, + "loss_base2": 2.3892, + "loss_pixel": 0.1719, + "loss_text": 1.4841, + "ppl": 5.2388, + "step": 8261 + }, + { + "epoch": 0.05, + "global_step": 8262, + "learning_rate": 0.0004663522537562604, + "loss": 1.6676, + "loss_base2": 2.4058, + "loss_pixel": 0.1714, + "loss_text": 1.4963, + "ppl": 5.2994, + "step": 8262 + }, + { + "epoch": 0.05, + "global_step": 8263, + "learning_rate": 0.00046634808013355593, + "loss": 1.6402, + "loss_base2": 2.3663, + "loss_pixel": 0.1714, + "loss_text": 1.4688, + "ppl": 5.1562, + "step": 8263 + }, + { + "epoch": 0.05, + "global_step": 8264, + "learning_rate": 0.0004663439065108514, + "loss": 1.6615, + "loss_base2": 2.397, + "loss_pixel": 0.1705, + "loss_text": 1.491, + "ppl": 5.2672, + "step": 8264 + }, + { + "epoch": 0.05, + "global_step": 8265, + "learning_rate": 0.0004663397328881469, + "loss": 1.6534, + "loss_base2": 2.3854, + "loss_pixel": 0.1708, + "loss_text": 1.4826, + "ppl": 5.2247, + "step": 8265 + }, + { + "epoch": 0.05, + "global_step": 8266, + "learning_rate": 0.0004663355592654424, + "loss": 1.6503, + "loss_base2": 2.3809, + "loss_pixel": 0.171, + "loss_text": 1.4793, + "ppl": 5.2085, + "step": 8266 + }, + { + "epoch": 0.05, + "global_step": 8267, + "learning_rate": 0.0004663313856427379, + "loss": 1.6572, + "loss_base2": 2.3908, + "loss_pixel": 0.1724, + "loss_text": 1.4849, + "ppl": 5.2446, + "step": 8267 + }, + { + "epoch": 0.05, + "global_step": 8268, + "learning_rate": 0.0004663272120200334, + "loss": 1.6549, + "loss_base2": 2.3875, + "loss_pixel": 0.1751, + "loss_text": 1.4797, + "ppl": 5.2326, + "step": 8268 + }, + { + "epoch": 0.05, + "global_step": 8269, + "learning_rate": 0.00046632303839732887, + "loss": 1.6272, + "loss_base2": 2.3476, + "loss_pixel": 0.1715, + "loss_text": 1.4557, + "ppl": 5.0896, + "step": 8269 + }, + { + "epoch": 0.05, + "global_step": 8270, + "learning_rate": 0.0004663188647746244, + "loss": 1.6294, + "loss_base2": 2.3507, + "loss_pixel": 0.1709, + "loss_text": 1.4585, + "ppl": 5.1008, + "step": 8270 + }, + { + "epoch": 0.05, + "global_step": 8271, + "learning_rate": 0.0004663146911519199, + "loss": 1.5819, + "loss_base2": 2.2822, + "loss_pixel": 0.1713, + "loss_text": 1.4106, + "ppl": 4.8642, + "step": 8271 + }, + { + "epoch": 0.05, + "global_step": 8272, + "learning_rate": 0.0004663105175292154, + "loss": 1.6596, + "loss_base2": 2.3943, + "loss_pixel": 0.1718, + "loss_text": 1.4877, + "ppl": 5.2572, + "step": 8272 + }, + { + "epoch": 0.05, + "global_step": 8273, + "learning_rate": 0.0004663063439065109, + "loss": 1.6586, + "loss_base2": 2.3929, + "loss_pixel": 0.1706, + "loss_text": 1.488, + "ppl": 5.252, + "step": 8273 + }, + { + "epoch": 0.05, + "global_step": 8274, + "learning_rate": 0.00046630217028380635, + "loss": 1.6562, + "loss_base2": 2.3894, + "loss_pixel": 0.1692, + "loss_text": 1.487, + "ppl": 5.2394, + "step": 8274 + }, + { + "epoch": 0.05, + "global_step": 8275, + "learning_rate": 0.00046629799666110186, + "loss": 1.6584, + "loss_base2": 2.3926, + "loss_pixel": 0.1718, + "loss_text": 1.4866, + "ppl": 5.2509, + "step": 8275 + }, + { + "epoch": 0.05, + "global_step": 8276, + "learning_rate": 0.00046629382303839737, + "loss": 1.6592, + "loss_base2": 2.3937, + "loss_pixel": 0.1699, + "loss_text": 1.4892, + "ppl": 5.2551, + "step": 8276 + }, + { + "epoch": 0.05, + "global_step": 8277, + "learning_rate": 0.0004662896494156929, + "loss": 1.6474, + "loss_base2": 2.3767, + "loss_pixel": 0.1684, + "loss_text": 1.479, + "ppl": 5.1935, + "step": 8277 + }, + { + "epoch": 0.05, + "global_step": 8278, + "learning_rate": 0.0004662854757929883, + "loss": 1.6562, + "loss_base2": 2.3894, + "loss_pixel": 0.1697, + "loss_text": 1.4865, + "ppl": 5.2394, + "step": 8278 + }, + { + "epoch": 0.05, + "global_step": 8279, + "learning_rate": 0.0004662813021702838, + "loss": 1.6766, + "loss_base2": 2.4188, + "loss_pixel": 0.1704, + "loss_text": 1.5062, + "ppl": 5.3473, + "step": 8279 + }, + { + "epoch": 0.05, + "global_step": 8280, + "learning_rate": 0.0004662771285475793, + "loss": 1.6562, + "loss_base2": 2.3894, + "loss_pixel": 0.1708, + "loss_text": 1.4855, + "ppl": 5.2394, + "step": 8280 + }, + { + "epoch": 0.05, + "global_step": 8281, + "learning_rate": 0.0004662729549248748, + "loss": 1.6456, + "loss_base2": 2.3741, + "loss_pixel": 0.1714, + "loss_text": 1.4742, + "ppl": 5.1841, + "step": 8281 + }, + { + "epoch": 0.05, + "global_step": 8282, + "learning_rate": 0.0004662687813021703, + "loss": 1.6375, + "loss_base2": 2.3624, + "loss_pixel": 0.172, + "loss_text": 1.4656, + "ppl": 5.1423, + "step": 8282 + }, + { + "epoch": 0.05, + "global_step": 8283, + "learning_rate": 0.00046626460767946575, + "loss": 1.6543, + "loss_base2": 2.3867, + "loss_pixel": 0.1709, + "loss_text": 1.4834, + "ppl": 5.2294, + "step": 8283 + }, + { + "epoch": 0.05, + "global_step": 8284, + "learning_rate": 0.00046626043405676126, + "loss": 1.648, + "loss_base2": 2.3776, + "loss_pixel": 0.1705, + "loss_text": 1.4775, + "ppl": 5.1966, + "step": 8284 + }, + { + "epoch": 0.05, + "global_step": 8285, + "learning_rate": 0.00046625626043405677, + "loss": 1.6337, + "loss_base2": 2.3569, + "loss_pixel": 0.1711, + "loss_text": 1.4626, + "ppl": 5.1228, + "step": 8285 + }, + { + "epoch": 0.05, + "global_step": 8286, + "learning_rate": 0.0004662520868113523, + "loss": 1.631, + "loss_base2": 2.353, + "loss_pixel": 0.1705, + "loss_text": 1.4605, + "ppl": 5.109, + "step": 8286 + }, + { + "epoch": 0.05, + "global_step": 8287, + "learning_rate": 0.00046624791318864773, + "loss": 1.6576, + "loss_base2": 2.3914, + "loss_pixel": 0.171, + "loss_text": 1.4866, + "ppl": 5.2467, + "step": 8287 + }, + { + "epoch": 0.05, + "global_step": 8288, + "learning_rate": 0.00046624373956594324, + "loss": 1.6504, + "loss_base2": 2.381, + "loss_pixel": 0.1759, + "loss_text": 1.4745, + "ppl": 5.2091, + "step": 8288 + }, + { + "epoch": 0.05, + "global_step": 8289, + "learning_rate": 0.00046623956594323874, + "loss": 1.6451, + "loss_base2": 2.3734, + "loss_pixel": 0.1718, + "loss_text": 1.4734, + "ppl": 5.1815, + "step": 8289 + }, + { + "epoch": 0.05, + "global_step": 8290, + "learning_rate": 0.00046623539232053425, + "loss": 1.6402, + "loss_base2": 2.3663, + "loss_pixel": 0.1708, + "loss_text": 1.4694, + "ppl": 5.1562, + "step": 8290 + }, + { + "epoch": 0.05, + "global_step": 8291, + "learning_rate": 0.00046623121869782976, + "loss": 1.6458, + "loss_base2": 2.3744, + "loss_pixel": 0.1708, + "loss_text": 1.4749, + "ppl": 5.1852, + "step": 8291 + }, + { + "epoch": 0.05, + "global_step": 8292, + "learning_rate": 0.0004662270450751252, + "loss": 1.6593, + "loss_base2": 2.3939, + "loss_pixel": 0.1706, + "loss_text": 1.4887, + "ppl": 5.2556, + "step": 8292 + }, + { + "epoch": 0.05, + "global_step": 8293, + "learning_rate": 0.0004662228714524207, + "loss": 1.6559, + "loss_base2": 2.389, + "loss_pixel": 0.1714, + "loss_text": 1.4845, + "ppl": 5.2378, + "step": 8293 + }, + { + "epoch": 0.05, + "global_step": 8294, + "learning_rate": 0.0004662186978297162, + "loss": 1.6625, + "loss_base2": 2.3985, + "loss_pixel": 0.1722, + "loss_text": 1.4902, + "ppl": 5.2725, + "step": 8294 + }, + { + "epoch": 0.05, + "global_step": 8295, + "learning_rate": 0.00046621452420701173, + "loss": 1.6612, + "loss_base2": 2.3966, + "loss_pixel": 0.1692, + "loss_text": 1.492, + "ppl": 5.2656, + "step": 8295 + }, + { + "epoch": 0.05, + "global_step": 8296, + "learning_rate": 0.0004662103505843072, + "loss": 1.6421, + "loss_base2": 2.369, + "loss_pixel": 0.1712, + "loss_text": 1.4709, + "ppl": 5.166, + "step": 8296 + }, + { + "epoch": 0.05, + "global_step": 8297, + "learning_rate": 0.0004662061769616027, + "loss": 1.452, + "loss_base2": 2.0948, + "loss_pixel": 0.1693, + "loss_text": 1.2828, + "ppl": 4.2716, + "step": 8297 + }, + { + "epoch": 0.05, + "global_step": 8298, + "learning_rate": 0.00046620200333889815, + "loss": 1.4753, + "loss_base2": 2.1284, + "loss_pixel": 0.1701, + "loss_text": 1.3052, + "ppl": 4.3723, + "step": 8298 + }, + { + "epoch": 0.05, + "global_step": 8299, + "learning_rate": 0.00046619782971619365, + "loss": 1.4527, + "loss_base2": 2.0958, + "loss_pixel": 0.17, + "loss_text": 1.2827, + "ppl": 4.2746, + "step": 8299 + }, + { + "epoch": 0.05, + "global_step": 8300, + "learning_rate": 0.00046619365609348916, + "loss": 1.4426, + "loss_base2": 2.0812, + "loss_pixel": 0.1706, + "loss_text": 1.272, + "ppl": 4.2317, + "step": 8300 + }, + { + "epoch": 0.05, + "global_step": 8301, + "learning_rate": 0.0004661894824707846, + "loss": 1.4468, + "loss_base2": 2.0873, + "loss_pixel": 0.1706, + "loss_text": 1.2762, + "ppl": 4.2495, + "step": 8301 + }, + { + "epoch": 0.05, + "global_step": 8302, + "learning_rate": 0.0004661853088480801, + "loss": 1.4392, + "loss_base2": 2.0763, + "loss_pixel": 0.1699, + "loss_text": 1.2693, + "ppl": 4.2173, + "step": 8302 + }, + { + "epoch": 0.05, + "global_step": 8303, + "learning_rate": 0.00046618113522537563, + "loss": 1.4358, + "loss_base2": 2.0714, + "loss_pixel": 0.1696, + "loss_text": 1.2662, + "ppl": 4.203, + "step": 8303 + }, + { + "epoch": 0.05, + "global_step": 8304, + "learning_rate": 0.00046617696160267114, + "loss": 1.429, + "loss_base2": 2.0616, + "loss_pixel": 0.1702, + "loss_text": 1.2588, + "ppl": 4.1745, + "step": 8304 + }, + { + "epoch": 0.05, + "global_step": 8305, + "learning_rate": 0.0004661727879799666, + "loss": 1.431, + "loss_base2": 2.0645, + "loss_pixel": 0.1688, + "loss_text": 1.2623, + "ppl": 4.1829, + "step": 8305 + }, + { + "epoch": 0.05, + "global_step": 8306, + "learning_rate": 0.0004661686143572621, + "loss": 1.4456, + "loss_base2": 2.0856, + "loss_pixel": 0.1728, + "loss_text": 1.2728, + "ppl": 4.2444, + "step": 8306 + }, + { + "epoch": 0.05, + "global_step": 8307, + "learning_rate": 0.0004661644407345576, + "loss": 1.4442, + "loss_base2": 2.0835, + "loss_pixel": 0.1706, + "loss_text": 1.2736, + "ppl": 4.2385, + "step": 8307 + }, + { + "epoch": 0.05, + "global_step": 8308, + "learning_rate": 0.0004661602671118531, + "loss": 1.4279, + "loss_base2": 2.06, + "loss_pixel": 0.1696, + "loss_text": 1.2583, + "ppl": 4.1699, + "step": 8308 + }, + { + "epoch": 0.05, + "global_step": 8309, + "learning_rate": 0.0004661560934891486, + "loss": 1.4281, + "loss_base2": 2.0603, + "loss_pixel": 0.1697, + "loss_text": 1.2584, + "ppl": 4.1708, + "step": 8309 + }, + { + "epoch": 0.05, + "global_step": 8310, + "learning_rate": 0.00046615191986644407, + "loss": 1.4209, + "loss_base2": 2.0499, + "loss_pixel": 0.1716, + "loss_text": 1.2493, + "ppl": 4.1408, + "step": 8310 + }, + { + "epoch": 0.05, + "global_step": 8311, + "learning_rate": 0.0004661477462437396, + "loss": 1.4174, + "loss_base2": 2.0449, + "loss_pixel": 0.1714, + "loss_text": 1.246, + "ppl": 4.1264, + "step": 8311 + }, + { + "epoch": 0.05, + "global_step": 8312, + "learning_rate": 0.0004661435726210351, + "loss": 1.4172, + "loss_base2": 2.0446, + "loss_pixel": 0.171, + "loss_text": 1.2462, + "ppl": 4.1256, + "step": 8312 + }, + { + "epoch": 0.05, + "global_step": 8313, + "learning_rate": 0.0004661393989983306, + "loss": 1.6503, + "loss_base2": 2.3809, + "loss_pixel": 0.1734, + "loss_text": 1.4769, + "ppl": 5.2085, + "step": 8313 + }, + { + "epoch": 0.05, + "global_step": 8314, + "learning_rate": 0.00046613522537562605, + "loss": 1.657, + "loss_base2": 2.3905, + "loss_pixel": 0.171, + "loss_text": 1.486, + "ppl": 5.2436, + "step": 8314 + }, + { + "epoch": 0.05, + "global_step": 8315, + "learning_rate": 0.00046613105175292156, + "loss": 1.6673, + "loss_base2": 2.4054, + "loss_pixel": 0.1704, + "loss_text": 1.497, + "ppl": 5.2978, + "step": 8315 + }, + { + "epoch": 0.05, + "global_step": 8316, + "learning_rate": 0.00046612687813021706, + "loss": 1.6587, + "loss_base2": 2.393, + "loss_pixel": 0.1704, + "loss_text": 1.4884, + "ppl": 5.2525, + "step": 8316 + }, + { + "epoch": 0.05, + "global_step": 8317, + "learning_rate": 0.0004661227045075125, + "loss": 1.6757, + "loss_base2": 2.4175, + "loss_pixel": 0.1706, + "loss_text": 1.5051, + "ppl": 5.3425, + "step": 8317 + }, + { + "epoch": 0.05, + "global_step": 8318, + "learning_rate": 0.000466118530884808, + "loss": 1.6651, + "loss_base2": 2.4022, + "loss_pixel": 0.1709, + "loss_text": 1.4942, + "ppl": 5.2862, + "step": 8318 + }, + { + "epoch": 0.05, + "global_step": 8319, + "learning_rate": 0.0004661143572621035, + "loss": 1.6653, + "loss_base2": 2.4025, + "loss_pixel": 0.1715, + "loss_text": 1.4938, + "ppl": 5.2873, + "step": 8319 + }, + { + "epoch": 0.05, + "global_step": 8320, + "learning_rate": 0.000466110183639399, + "loss": 1.6758, + "loss_base2": 2.4177, + "loss_pixel": 0.171, + "loss_text": 1.5048, + "ppl": 5.3431, + "step": 8320 + }, + { + "epoch": 0.05, + "global_step": 8321, + "learning_rate": 0.0004661060100166945, + "loss": 1.6675, + "loss_base2": 2.4057, + "loss_pixel": 0.1721, + "loss_text": 1.4954, + "ppl": 5.2989, + "step": 8321 + }, + { + "epoch": 0.05, + "global_step": 8322, + "learning_rate": 0.00046610183639399, + "loss": 1.6549, + "loss_base2": 2.3875, + "loss_pixel": 0.1713, + "loss_text": 1.4836, + "ppl": 5.2326, + "step": 8322 + }, + { + "epoch": 0.05, + "global_step": 8323, + "learning_rate": 0.00046609766277128545, + "loss": 1.6532, + "loss_base2": 2.3851, + "loss_pixel": 0.1706, + "loss_text": 1.4826, + "ppl": 5.2237, + "step": 8323 + }, + { + "epoch": 0.05, + "global_step": 8324, + "learning_rate": 0.00046609348914858096, + "loss": 1.656, + "loss_base2": 2.3891, + "loss_pixel": 0.1697, + "loss_text": 1.4864, + "ppl": 5.2383, + "step": 8324 + }, + { + "epoch": 0.05, + "global_step": 8325, + "learning_rate": 0.00046608931552587647, + "loss": 1.6774, + "loss_base2": 2.42, + "loss_pixel": 0.1724, + "loss_text": 1.505, + "ppl": 5.3516, + "step": 8325 + }, + { + "epoch": 0.05, + "global_step": 8326, + "learning_rate": 0.000466085141903172, + "loss": 1.6617, + "loss_base2": 2.3973, + "loss_pixel": 0.1716, + "loss_text": 1.49, + "ppl": 5.2683, + "step": 8326 + }, + { + "epoch": 0.05, + "global_step": 8327, + "learning_rate": 0.0004660809682804675, + "loss": 1.651, + "loss_base2": 2.3819, + "loss_pixel": 0.1718, + "loss_text": 1.4792, + "ppl": 5.2122, + "step": 8327 + }, + { + "epoch": 0.05, + "global_step": 8328, + "learning_rate": 0.00046607679465776293, + "loss": 1.6639, + "loss_base2": 2.4005, + "loss_pixel": 0.1716, + "loss_text": 1.4923, + "ppl": 5.2799, + "step": 8328 + }, + { + "epoch": 0.05, + "global_step": 8329, + "learning_rate": 0.00046607262103505844, + "loss": 1.6574, + "loss_base2": 2.3911, + "loss_pixel": 0.17, + "loss_text": 1.4874, + "ppl": 5.2457, + "step": 8329 + }, + { + "epoch": 0.05, + "global_step": 8330, + "learning_rate": 0.00046606844741235395, + "loss": 1.6655, + "loss_base2": 2.4028, + "loss_pixel": 0.1709, + "loss_text": 1.4945, + "ppl": 5.2883, + "step": 8330 + }, + { + "epoch": 0.05, + "global_step": 8331, + "learning_rate": 0.00046606427378964946, + "loss": 1.6439, + "loss_base2": 2.3716, + "loss_pixel": 0.1708, + "loss_text": 1.4731, + "ppl": 5.1753, + "step": 8331 + }, + { + "epoch": 0.05, + "global_step": 8332, + "learning_rate": 0.00046606010016694496, + "loss": 1.6326, + "loss_base2": 2.3553, + "loss_pixel": 0.1707, + "loss_text": 1.4619, + "ppl": 5.1172, + "step": 8332 + }, + { + "epoch": 0.05, + "global_step": 8333, + "learning_rate": 0.0004660559265442404, + "loss": 1.6538, + "loss_base2": 2.3859, + "loss_pixel": 0.1694, + "loss_text": 1.4844, + "ppl": 5.2268, + "step": 8333 + }, + { + "epoch": 0.05, + "global_step": 8334, + "learning_rate": 0.0004660517529215359, + "loss": 1.6537, + "loss_base2": 2.3858, + "loss_pixel": 0.169, + "loss_text": 1.4847, + "ppl": 5.2263, + "step": 8334 + }, + { + "epoch": 0.05, + "global_step": 8335, + "learning_rate": 0.0004660475792988314, + "loss": 1.6544, + "loss_base2": 2.3868, + "loss_pixel": 0.1694, + "loss_text": 1.4851, + "ppl": 5.2299, + "step": 8335 + }, + { + "epoch": 0.05, + "global_step": 8336, + "learning_rate": 0.0004660434056761269, + "loss": 1.6353, + "loss_base2": 2.3592, + "loss_pixel": 0.1705, + "loss_text": 1.4648, + "ppl": 5.131, + "step": 8336 + }, + { + "epoch": 0.05, + "global_step": 8337, + "learning_rate": 0.00046603923205342234, + "loss": 1.6584, + "loss_base2": 2.3926, + "loss_pixel": 0.171, + "loss_text": 1.4874, + "ppl": 5.2509, + "step": 8337 + }, + { + "epoch": 0.05, + "global_step": 8338, + "learning_rate": 0.00046603505843071784, + "loss": 1.6637, + "loss_base2": 2.4002, + "loss_pixel": 0.1699, + "loss_text": 1.4938, + "ppl": 5.2788, + "step": 8338 + }, + { + "epoch": 0.05, + "global_step": 8339, + "learning_rate": 0.00046603088480801335, + "loss": 1.6402, + "loss_base2": 2.3663, + "loss_pixel": 0.1708, + "loss_text": 1.4694, + "ppl": 5.1562, + "step": 8339 + }, + { + "epoch": 0.05, + "global_step": 8340, + "learning_rate": 0.00046602671118530886, + "loss": 1.6595, + "loss_base2": 2.3942, + "loss_pixel": 0.1716, + "loss_text": 1.4879, + "ppl": 5.2567, + "step": 8340 + }, + { + "epoch": 0.05, + "global_step": 8341, + "learning_rate": 0.00046602253756260437, + "loss": 1.6648, + "loss_base2": 2.4018, + "loss_pixel": 0.1692, + "loss_text": 1.4955, + "ppl": 5.2846, + "step": 8341 + }, + { + "epoch": 0.05, + "global_step": 8342, + "learning_rate": 0.0004660183639398998, + "loss": 1.6476, + "loss_base2": 2.377, + "loss_pixel": 0.1695, + "loss_text": 1.4781, + "ppl": 5.1945, + "step": 8342 + }, + { + "epoch": 0.05, + "global_step": 8343, + "learning_rate": 0.0004660141903171953, + "loss": 1.6518, + "loss_base2": 2.383, + "loss_pixel": 0.1704, + "loss_text": 1.4814, + "ppl": 5.2164, + "step": 8343 + }, + { + "epoch": 0.05, + "global_step": 8344, + "learning_rate": 0.00046601001669449083, + "loss": 1.6538, + "loss_base2": 2.3859, + "loss_pixel": 0.1706, + "loss_text": 1.4833, + "ppl": 5.2268, + "step": 8344 + }, + { + "epoch": 0.05, + "global_step": 8345, + "learning_rate": 0.00046600584307178634, + "loss": 1.6546, + "loss_base2": 2.3871, + "loss_pixel": 0.1693, + "loss_text": 1.4853, + "ppl": 5.231, + "step": 8345 + }, + { + "epoch": 0.05, + "global_step": 8346, + "learning_rate": 0.0004660016694490818, + "loss": 1.6581, + "loss_base2": 2.3921, + "loss_pixel": 0.1695, + "loss_text": 1.4886, + "ppl": 5.2493, + "step": 8346 + }, + { + "epoch": 0.05, + "global_step": 8347, + "learning_rate": 0.0004659974958263773, + "loss": 1.6696, + "loss_base2": 2.4087, + "loss_pixel": 0.1691, + "loss_text": 1.5006, + "ppl": 5.31, + "step": 8347 + }, + { + "epoch": 0.05, + "global_step": 8348, + "learning_rate": 0.0004659933222036728, + "loss": 1.6436, + "loss_base2": 2.3712, + "loss_pixel": 0.1698, + "loss_text": 1.4738, + "ppl": 5.1738, + "step": 8348 + }, + { + "epoch": 0.05, + "global_step": 8349, + "learning_rate": 0.0004659891485809683, + "loss": 1.6533, + "loss_base2": 2.3852, + "loss_pixel": 0.1689, + "loss_text": 1.4844, + "ppl": 5.2242, + "step": 8349 + }, + { + "epoch": 0.05, + "global_step": 8350, + "learning_rate": 0.0004659849749582638, + "loss": 1.6428, + "loss_base2": 2.3701, + "loss_pixel": 0.171, + "loss_text": 1.4718, + "ppl": 5.1696, + "step": 8350 + }, + { + "epoch": 0.05, + "global_step": 8351, + "learning_rate": 0.0004659808013355593, + "loss": 1.6442, + "loss_base2": 2.3721, + "loss_pixel": 0.1693, + "loss_text": 1.4749, + "ppl": 5.1769, + "step": 8351 + }, + { + "epoch": 0.05, + "global_step": 8352, + "learning_rate": 0.0004659766277128548, + "loss": 1.6417, + "loss_base2": 2.3685, + "loss_pixel": 0.1697, + "loss_text": 1.4719, + "ppl": 5.1639, + "step": 8352 + }, + { + "epoch": 0.05, + "global_step": 8353, + "learning_rate": 0.0004659724540901503, + "loss": 1.6414, + "loss_base2": 2.368, + "loss_pixel": 0.1688, + "loss_text": 1.4726, + "ppl": 5.1624, + "step": 8353 + }, + { + "epoch": 0.05, + "global_step": 8354, + "learning_rate": 0.00046596828046744574, + "loss": 1.6501, + "loss_base2": 2.3806, + "loss_pixel": 0.1707, + "loss_text": 1.4794, + "ppl": 5.2075, + "step": 8354 + }, + { + "epoch": 0.05, + "global_step": 8355, + "learning_rate": 0.0004659641068447412, + "loss": 1.654, + "loss_base2": 2.3862, + "loss_pixel": 0.1687, + "loss_text": 1.4853, + "ppl": 5.2278, + "step": 8355 + }, + { + "epoch": 0.05, + "global_step": 8356, + "learning_rate": 0.0004659599332220367, + "loss": 1.6444, + "loss_base2": 2.3724, + "loss_pixel": 0.1695, + "loss_text": 1.4749, + "ppl": 5.1779, + "step": 8356 + }, + { + "epoch": 0.05, + "global_step": 8357, + "learning_rate": 0.0004659557595993322, + "loss": 1.6459, + "loss_base2": 2.3745, + "loss_pixel": 0.1713, + "loss_text": 1.4746, + "ppl": 5.1857, + "step": 8357 + }, + { + "epoch": 0.05, + "global_step": 8358, + "learning_rate": 0.0004659515859766277, + "loss": 1.663, + "loss_base2": 2.3992, + "loss_pixel": 0.1675, + "loss_text": 1.4955, + "ppl": 5.2751, + "step": 8358 + }, + { + "epoch": 0.05, + "global_step": 8359, + "learning_rate": 0.0004659474123539232, + "loss": 1.6542, + "loss_base2": 2.3865, + "loss_pixel": 0.169, + "loss_text": 1.4853, + "ppl": 5.2289, + "step": 8359 + }, + { + "epoch": 0.05, + "global_step": 8360, + "learning_rate": 0.0004659432387312187, + "loss": 1.6493, + "loss_base2": 2.3794, + "loss_pixel": 0.1677, + "loss_text": 1.4815, + "ppl": 5.2033, + "step": 8360 + }, + { + "epoch": 0.05, + "global_step": 8361, + "learning_rate": 0.0004659390651085142, + "loss": 1.6328, + "loss_base2": 2.3556, + "loss_pixel": 0.1683, + "loss_text": 1.4645, + "ppl": 5.1182, + "step": 8361 + }, + { + "epoch": 0.05, + "global_step": 8362, + "learning_rate": 0.0004659348914858097, + "loss": 1.6548, + "loss_base2": 2.3874, + "loss_pixel": 0.1681, + "loss_text": 1.4867, + "ppl": 5.232, + "step": 8362 + }, + { + "epoch": 0.05, + "global_step": 8363, + "learning_rate": 0.0004659307178631052, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.1669, + "loss_text": 1.4614, + "ppl": 5.0952, + "step": 8363 + }, + { + "epoch": 0.05, + "global_step": 8364, + "learning_rate": 0.00046592654424040065, + "loss": 1.6461, + "loss_base2": 2.3748, + "loss_pixel": 0.1658, + "loss_text": 1.4803, + "ppl": 5.1867, + "step": 8364 + }, + { + "epoch": 0.05, + "global_step": 8365, + "learning_rate": 0.00046592237061769616, + "loss": 1.6674, + "loss_base2": 2.4055, + "loss_pixel": 0.1678, + "loss_text": 1.4996, + "ppl": 5.2984, + "step": 8365 + }, + { + "epoch": 0.05, + "global_step": 8366, + "learning_rate": 0.00046591819699499167, + "loss": 1.6406, + "loss_base2": 2.3669, + "loss_pixel": 0.1646, + "loss_text": 1.476, + "ppl": 5.1583, + "step": 8366 + }, + { + "epoch": 0.05, + "global_step": 8367, + "learning_rate": 0.0004659140233722872, + "loss": 1.6373, + "loss_base2": 2.3621, + "loss_pixel": 0.1646, + "loss_text": 1.4727, + "ppl": 5.1413, + "step": 8367 + }, + { + "epoch": 0.05, + "global_step": 8368, + "learning_rate": 0.0004659098497495827, + "loss": 1.6593, + "loss_base2": 2.3939, + "loss_pixel": 0.1641, + "loss_text": 1.4951, + "ppl": 5.2556, + "step": 8368 + }, + { + "epoch": 0.05, + "global_step": 8369, + "learning_rate": 0.00046590567612687814, + "loss": 1.6468, + "loss_base2": 2.3758, + "loss_pixel": 0.1643, + "loss_text": 1.4825, + "ppl": 5.1903, + "step": 8369 + }, + { + "epoch": 0.05, + "global_step": 8370, + "learning_rate": 0.00046590150250417364, + "loss": 1.6555, + "loss_base2": 2.3884, + "loss_pixel": 0.1654, + "loss_text": 1.4901, + "ppl": 5.2357, + "step": 8370 + }, + { + "epoch": 0.05, + "global_step": 8371, + "learning_rate": 0.00046589732888146915, + "loss": 1.6499, + "loss_base2": 2.3803, + "loss_pixel": 0.1643, + "loss_text": 1.4856, + "ppl": 5.2065, + "step": 8371 + }, + { + "epoch": 0.05, + "global_step": 8372, + "learning_rate": 0.00046589315525876466, + "loss": 1.6272, + "loss_base2": 2.3476, + "loss_pixel": 0.1659, + "loss_text": 1.4613, + "ppl": 5.0896, + "step": 8372 + }, + { + "epoch": 0.05, + "global_step": 8373, + "learning_rate": 0.00046588898163606006, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.1634, + "loss_text": 1.4761, + "ppl": 5.1531, + "step": 8373 + }, + { + "epoch": 0.05, + "global_step": 8374, + "learning_rate": 0.00046588480801335557, + "loss": 1.6335, + "loss_base2": 2.3566, + "loss_pixel": 0.1661, + "loss_text": 1.4674, + "ppl": 5.1218, + "step": 8374 + }, + { + "epoch": 0.05, + "global_step": 8375, + "learning_rate": 0.00046588063439065107, + "loss": 1.6365, + "loss_base2": 2.361, + "loss_pixel": 0.163, + "loss_text": 1.4734, + "ppl": 5.1372, + "step": 8375 + }, + { + "epoch": 0.05, + "global_step": 8376, + "learning_rate": 0.0004658764607679466, + "loss": 1.6473, + "loss_base2": 2.3766, + "loss_pixel": 0.1633, + "loss_text": 1.484, + "ppl": 5.1929, + "step": 8376 + }, + { + "epoch": 0.05, + "global_step": 8377, + "learning_rate": 0.0004658722871452421, + "loss": 1.654, + "loss_base2": 2.3862, + "loss_pixel": 0.1631, + "loss_text": 1.4909, + "ppl": 5.2278, + "step": 8377 + }, + { + "epoch": 0.05, + "global_step": 8378, + "learning_rate": 0.00046586811352253754, + "loss": 1.6438, + "loss_base2": 2.3715, + "loss_pixel": 0.163, + "loss_text": 1.4808, + "ppl": 5.1748, + "step": 8378 + }, + { + "epoch": 0.05, + "global_step": 8379, + "learning_rate": 0.00046586393989983305, + "loss": 1.6401, + "loss_base2": 2.3662, + "loss_pixel": 0.1639, + "loss_text": 1.4762, + "ppl": 5.1557, + "step": 8379 + }, + { + "epoch": 0.05, + "global_step": 8380, + "learning_rate": 0.00046585976627712856, + "loss": 1.6456, + "loss_base2": 2.3741, + "loss_pixel": 0.1629, + "loss_text": 1.4828, + "ppl": 5.1841, + "step": 8380 + }, + { + "epoch": 0.05, + "global_step": 8381, + "learning_rate": 0.00046585559265442406, + "loss": 1.6434, + "loss_base2": 2.3709, + "loss_pixel": 0.1628, + "loss_text": 1.4806, + "ppl": 5.1727, + "step": 8381 + }, + { + "epoch": 0.05, + "global_step": 8382, + "learning_rate": 0.00046585141903171957, + "loss": 1.6593, + "loss_base2": 2.3939, + "loss_pixel": 0.1637, + "loss_text": 1.4956, + "ppl": 5.2556, + "step": 8382 + }, + { + "epoch": 0.05, + "global_step": 8383, + "learning_rate": 0.000465847245409015, + "loss": 1.6494, + "loss_base2": 2.3796, + "loss_pixel": 0.1616, + "loss_text": 1.4878, + "ppl": 5.2039, + "step": 8383 + }, + { + "epoch": 0.05, + "global_step": 8384, + "learning_rate": 0.00046584307178631053, + "loss": 1.6388, + "loss_base2": 2.3643, + "loss_pixel": 0.1624, + "loss_text": 1.4764, + "ppl": 5.149, + "step": 8384 + }, + { + "epoch": 0.05, + "global_step": 8385, + "learning_rate": 0.00046583889816360604, + "loss": 1.649, + "loss_base2": 2.379, + "loss_pixel": 0.1666, + "loss_text": 1.4824, + "ppl": 5.2018, + "step": 8385 + }, + { + "epoch": 0.05, + "global_step": 8386, + "learning_rate": 0.00046583472454090154, + "loss": 1.632, + "loss_base2": 2.3545, + "loss_pixel": 0.1722, + "loss_text": 1.4598, + "ppl": 5.1141, + "step": 8386 + }, + { + "epoch": 0.05, + "global_step": 8387, + "learning_rate": 0.000465830550918197, + "loss": 1.6455, + "loss_base2": 2.374, + "loss_pixel": 0.1727, + "loss_text": 1.4728, + "ppl": 5.1836, + "step": 8387 + }, + { + "epoch": 0.05, + "global_step": 8388, + "learning_rate": 0.0004658263772954925, + "loss": 1.6493, + "loss_base2": 2.3794, + "loss_pixel": 0.1722, + "loss_text": 1.4771, + "ppl": 5.2033, + "step": 8388 + }, + { + "epoch": 0.05, + "global_step": 8389, + "learning_rate": 0.000465822203672788, + "loss": 1.6391, + "loss_base2": 2.3647, + "loss_pixel": 0.1711, + "loss_text": 1.468, + "ppl": 5.1505, + "step": 8389 + }, + { + "epoch": 0.05, + "global_step": 8390, + "learning_rate": 0.0004658180300500835, + "loss": 1.6722, + "loss_base2": 2.4125, + "loss_pixel": 0.1712, + "loss_text": 1.501, + "ppl": 5.3239, + "step": 8390 + }, + { + "epoch": 0.05, + "global_step": 8391, + "learning_rate": 0.00046581385642737903, + "loss": 1.6371, + "loss_base2": 2.3618, + "loss_pixel": 0.1718, + "loss_text": 1.4653, + "ppl": 5.1402, + "step": 8391 + }, + { + "epoch": 0.05, + "global_step": 8392, + "learning_rate": 0.0004658096828046744, + "loss": 1.6373, + "loss_base2": 2.3621, + "loss_pixel": 0.1719, + "loss_text": 1.4653, + "ppl": 5.1413, + "step": 8392 + }, + { + "epoch": 0.05, + "global_step": 8393, + "learning_rate": 0.00046580550918196993, + "loss": 1.6616, + "loss_base2": 2.3972, + "loss_pixel": 0.1729, + "loss_text": 1.4886, + "ppl": 5.2677, + "step": 8393 + }, + { + "epoch": 0.05, + "global_step": 8394, + "learning_rate": 0.00046580133555926544, + "loss": 1.6471, + "loss_base2": 2.3763, + "loss_pixel": 0.1716, + "loss_text": 1.4755, + "ppl": 5.1919, + "step": 8394 + }, + { + "epoch": 0.05, + "global_step": 8395, + "learning_rate": 0.00046579716193656095, + "loss": 1.6476, + "loss_base2": 2.377, + "loss_pixel": 0.1701, + "loss_text": 1.4776, + "ppl": 5.1945, + "step": 8395 + }, + { + "epoch": 0.05, + "global_step": 8396, + "learning_rate": 0.0004657929883138564, + "loss": 1.614, + "loss_base2": 2.3285, + "loss_pixel": 0.1705, + "loss_text": 1.4436, + "ppl": 5.0229, + "step": 8396 + }, + { + "epoch": 0.05, + "global_step": 8397, + "learning_rate": 0.0004657888146911519, + "loss": 1.6544, + "loss_base2": 2.3868, + "loss_pixel": 0.1707, + "loss_text": 1.4838, + "ppl": 5.2299, + "step": 8397 + }, + { + "epoch": 0.05, + "global_step": 8398, + "learning_rate": 0.0004657846410684474, + "loss": 1.6438, + "loss_base2": 2.3715, + "loss_pixel": 0.1708, + "loss_text": 1.473, + "ppl": 5.1748, + "step": 8398 + }, + { + "epoch": 0.05, + "global_step": 8399, + "learning_rate": 0.0004657804674457429, + "loss": 1.6548, + "loss_base2": 2.3874, + "loss_pixel": 0.1698, + "loss_text": 1.485, + "ppl": 5.232, + "step": 8399 + }, + { + "epoch": 0.05, + "global_step": 8400, + "learning_rate": 0.00046577629382303843, + "loss": 1.6552, + "loss_base2": 2.3879, + "loss_pixel": 0.1701, + "loss_text": 1.4851, + "ppl": 5.2341, + "step": 8400 + }, + { + "epoch": 0.05, + "global_step": 8401, + "learning_rate": 0.0004657721202003339, + "loss": 1.649, + "loss_base2": 2.379, + "loss_pixel": 0.171, + "loss_text": 1.478, + "ppl": 5.2018, + "step": 8401 + }, + { + "epoch": 0.05, + "global_step": 8402, + "learning_rate": 0.0004657679465776294, + "loss": 1.6657, + "loss_base2": 2.4031, + "loss_pixel": 0.1719, + "loss_text": 1.4938, + "ppl": 5.2894, + "step": 8402 + }, + { + "epoch": 0.05, + "global_step": 8403, + "learning_rate": 0.0004657637729549249, + "loss": 1.6641, + "loss_base2": 2.4008, + "loss_pixel": 0.1721, + "loss_text": 1.4919, + "ppl": 5.2809, + "step": 8403 + }, + { + "epoch": 0.05, + "global_step": 8404, + "learning_rate": 0.0004657595993322204, + "loss": 1.6562, + "loss_base2": 2.3894, + "loss_pixel": 0.1704, + "loss_text": 1.4858, + "ppl": 5.2394, + "step": 8404 + }, + { + "epoch": 0.05, + "global_step": 8405, + "learning_rate": 0.00046575542570951586, + "loss": 1.6519, + "loss_base2": 2.3832, + "loss_pixel": 0.1709, + "loss_text": 1.481, + "ppl": 5.2169, + "step": 8405 + }, + { + "epoch": 0.05, + "global_step": 8406, + "learning_rate": 0.00046575125208681137, + "loss": 1.6509, + "loss_base2": 2.3817, + "loss_pixel": 0.1731, + "loss_text": 1.4777, + "ppl": 5.2117, + "step": 8406 + }, + { + "epoch": 0.05, + "global_step": 8407, + "learning_rate": 0.0004657470784641069, + "loss": 1.6506, + "loss_base2": 2.3813, + "loss_pixel": 0.1707, + "loss_text": 1.4799, + "ppl": 5.2101, + "step": 8407 + }, + { + "epoch": 0.05, + "global_step": 8408, + "learning_rate": 0.0004657429048414024, + "loss": 1.6377, + "loss_base2": 2.3627, + "loss_pixel": 0.1717, + "loss_text": 1.4659, + "ppl": 5.1433, + "step": 8408 + }, + { + "epoch": 0.05, + "global_step": 8409, + "learning_rate": 0.0004657387312186979, + "loss": 1.6502, + "loss_base2": 2.3807, + "loss_pixel": 0.1715, + "loss_text": 1.4787, + "ppl": 5.208, + "step": 8409 + }, + { + "epoch": 0.05, + "global_step": 8410, + "learning_rate": 0.0004657345575959933, + "loss": 1.6347, + "loss_base2": 2.3584, + "loss_pixel": 0.1709, + "loss_text": 1.4638, + "ppl": 5.1279, + "step": 8410 + }, + { + "epoch": 0.05, + "global_step": 8411, + "learning_rate": 0.0004657303839732888, + "loss": 1.6542, + "loss_base2": 2.3865, + "loss_pixel": 0.174, + "loss_text": 1.4802, + "ppl": 5.2289, + "step": 8411 + }, + { + "epoch": 0.05, + "global_step": 8412, + "learning_rate": 0.0004657262103505843, + "loss": 1.6444, + "loss_base2": 2.3724, + "loss_pixel": 0.1714, + "loss_text": 1.473, + "ppl": 5.1779, + "step": 8412 + }, + { + "epoch": 0.05, + "global_step": 8413, + "learning_rate": 0.0004657220367278798, + "loss": 1.6384, + "loss_base2": 2.3637, + "loss_pixel": 0.1702, + "loss_text": 1.4683, + "ppl": 5.1469, + "step": 8413 + }, + { + "epoch": 0.05, + "global_step": 8414, + "learning_rate": 0.00046571786310517526, + "loss": 1.6433, + "loss_base2": 2.3708, + "loss_pixel": 0.1696, + "loss_text": 1.4737, + "ppl": 5.1722, + "step": 8414 + }, + { + "epoch": 0.05, + "global_step": 8415, + "learning_rate": 0.00046571368948247077, + "loss": 1.6694, + "loss_base2": 2.4084, + "loss_pixel": 0.171, + "loss_text": 1.4983, + "ppl": 5.309, + "step": 8415 + }, + { + "epoch": 0.05, + "global_step": 8416, + "learning_rate": 0.0004657095158597663, + "loss": 1.6659, + "loss_base2": 2.4034, + "loss_pixel": 0.17, + "loss_text": 1.4959, + "ppl": 5.2904, + "step": 8416 + }, + { + "epoch": 0.05, + "global_step": 8417, + "learning_rate": 0.0004657053422370618, + "loss": 1.646, + "loss_base2": 2.3747, + "loss_pixel": 0.1706, + "loss_text": 1.4754, + "ppl": 5.1862, + "step": 8417 + }, + { + "epoch": 0.05, + "global_step": 8418, + "learning_rate": 0.0004657011686143573, + "loss": 1.6587, + "loss_base2": 2.393, + "loss_pixel": 0.1698, + "loss_text": 1.489, + "ppl": 5.2525, + "step": 8418 + }, + { + "epoch": 0.05, + "global_step": 8419, + "learning_rate": 0.00046569699499165274, + "loss": 1.6483, + "loss_base2": 2.378, + "loss_pixel": 0.1701, + "loss_text": 1.4782, + "ppl": 5.1981, + "step": 8419 + }, + { + "epoch": 0.05, + "global_step": 8420, + "learning_rate": 0.00046569282136894825, + "loss": 1.6532, + "loss_base2": 2.3851, + "loss_pixel": 0.1707, + "loss_text": 1.4825, + "ppl": 5.2237, + "step": 8420 + }, + { + "epoch": 0.05, + "global_step": 8421, + "learning_rate": 0.00046568864774624376, + "loss": 1.64, + "loss_base2": 2.366, + "loss_pixel": 0.1708, + "loss_text": 1.4692, + "ppl": 5.1552, + "step": 8421 + }, + { + "epoch": 0.05, + "global_step": 8422, + "learning_rate": 0.00046568447412353927, + "loss": 1.64, + "loss_base2": 2.366, + "loss_pixel": 0.1711, + "loss_text": 1.4689, + "ppl": 5.1552, + "step": 8422 + }, + { + "epoch": 0.05, + "global_step": 8423, + "learning_rate": 0.0004656803005008347, + "loss": 1.6474, + "loss_base2": 2.3767, + "loss_pixel": 0.1698, + "loss_text": 1.4775, + "ppl": 5.1935, + "step": 8423 + }, + { + "epoch": 0.05, + "global_step": 8424, + "learning_rate": 0.0004656761268781302, + "loss": 1.6393, + "loss_base2": 2.365, + "loss_pixel": 0.1714, + "loss_text": 1.4679, + "ppl": 5.1516, + "step": 8424 + }, + { + "epoch": 0.05, + "global_step": 8425, + "learning_rate": 0.00046567195325542573, + "loss": 1.6576, + "loss_base2": 2.3914, + "loss_pixel": 0.1706, + "loss_text": 1.4869, + "ppl": 5.2467, + "step": 8425 + }, + { + "epoch": 0.05, + "global_step": 8426, + "learning_rate": 0.00046566777963272124, + "loss": 1.6629, + "loss_base2": 2.3991, + "loss_pixel": 0.1706, + "loss_text": 1.4922, + "ppl": 5.2746, + "step": 8426 + }, + { + "epoch": 0.05, + "global_step": 8427, + "learning_rate": 0.00046566360601001675, + "loss": 1.6637, + "loss_base2": 2.4002, + "loss_pixel": 0.1694, + "loss_text": 1.4943, + "ppl": 5.2788, + "step": 8427 + }, + { + "epoch": 0.05, + "global_step": 8428, + "learning_rate": 0.0004656594323873122, + "loss": 1.647, + "loss_base2": 2.3761, + "loss_pixel": 0.17, + "loss_text": 1.4771, + "ppl": 5.1914, + "step": 8428 + }, + { + "epoch": 0.05, + "global_step": 8429, + "learning_rate": 0.00046565525876460765, + "loss": 1.6453, + "loss_base2": 2.3737, + "loss_pixel": 0.1711, + "loss_text": 1.4742, + "ppl": 5.1826, + "step": 8429 + }, + { + "epoch": 0.05, + "global_step": 8430, + "learning_rate": 0.00046565108514190316, + "loss": 1.6631, + "loss_base2": 2.3993, + "loss_pixel": 0.1709, + "loss_text": 1.4922, + "ppl": 5.2756, + "step": 8430 + }, + { + "epoch": 0.05, + "global_step": 8431, + "learning_rate": 0.00046564691151919867, + "loss": 1.6406, + "loss_base2": 2.3669, + "loss_pixel": 0.1698, + "loss_text": 1.4707, + "ppl": 5.1583, + "step": 8431 + }, + { + "epoch": 0.05, + "global_step": 8432, + "learning_rate": 0.0004656427378964941, + "loss": 1.6507, + "loss_base2": 2.3815, + "loss_pixel": 0.171, + "loss_text": 1.4797, + "ppl": 5.2106, + "step": 8432 + }, + { + "epoch": 0.05, + "global_step": 8433, + "learning_rate": 0.00046563856427378963, + "loss": 1.6033, + "loss_base2": 2.3131, + "loss_pixel": 0.1739, + "loss_text": 1.4295, + "ppl": 4.9694, + "step": 8433 + }, + { + "epoch": 0.05, + "global_step": 8434, + "learning_rate": 0.00046563439065108514, + "loss": 1.515, + "loss_base2": 2.1857, + "loss_pixel": 0.1888, + "loss_text": 1.3262, + "ppl": 4.5494, + "step": 8434 + }, + { + "epoch": 0.05, + "global_step": 8435, + "learning_rate": 0.00046563021702838064, + "loss": 1.4675, + "loss_base2": 2.1172, + "loss_pixel": 0.2101, + "loss_text": 1.2575, + "ppl": 4.3384, + "step": 8435 + }, + { + "epoch": 0.05, + "global_step": 8436, + "learning_rate": 0.00046562604340567615, + "loss": 1.4778, + "loss_base2": 2.132, + "loss_pixel": 0.2215, + "loss_text": 1.2563, + "ppl": 4.3833, + "step": 8436 + }, + { + "epoch": 0.05, + "global_step": 8437, + "learning_rate": 0.0004656218697829716, + "loss": 1.5245, + "loss_base2": 2.1994, + "loss_pixel": 0.2297, + "loss_text": 1.2948, + "ppl": 4.5928, + "step": 8437 + }, + { + "epoch": 0.05, + "global_step": 8438, + "learning_rate": 0.0004656176961602671, + "loss": 1.4835, + "loss_base2": 2.1402, + "loss_pixel": 0.2272, + "loss_text": 1.2563, + "ppl": 4.4083, + "step": 8438 + }, + { + "epoch": 0.05, + "global_step": 8439, + "learning_rate": 0.0004656135225375626, + "loss": 1.4786, + "loss_base2": 2.1332, + "loss_pixel": 0.234, + "loss_text": 1.2447, + "ppl": 4.3868, + "step": 8439 + }, + { + "epoch": 0.05, + "global_step": 8440, + "learning_rate": 0.0004656093489148581, + "loss": 1.503, + "loss_base2": 2.1684, + "loss_pixel": 0.2476, + "loss_text": 1.2554, + "ppl": 4.4952, + "step": 8440 + }, + { + "epoch": 0.05, + "global_step": 8441, + "learning_rate": 0.00046560517529215363, + "loss": 1.5908, + "loss_base2": 2.295, + "loss_pixel": 0.2482, + "loss_text": 1.3426, + "ppl": 4.9077, + "step": 8441 + }, + { + "epoch": 0.05, + "global_step": 8442, + "learning_rate": 0.0004656010016694491, + "loss": 1.7292, + "loss_base2": 2.4947, + "loss_pixel": 0.2387, + "loss_text": 1.4905, + "ppl": 5.6361, + "step": 8442 + }, + { + "epoch": 0.05, + "global_step": 8443, + "learning_rate": 0.0004655968280467446, + "loss": 1.7406, + "loss_base2": 2.5112, + "loss_pixel": 0.2396, + "loss_text": 1.501, + "ppl": 5.7008, + "step": 8443 + }, + { + "epoch": 0.05, + "global_step": 8444, + "learning_rate": 0.0004655926544240401, + "loss": 1.7239, + "loss_base2": 2.4871, + "loss_pixel": 0.2328, + "loss_text": 1.4911, + "ppl": 5.6064, + "step": 8444 + }, + { + "epoch": 0.05, + "global_step": 8445, + "learning_rate": 0.0004655884808013356, + "loss": 1.7225, + "loss_base2": 2.485, + "loss_pixel": 0.225, + "loss_text": 1.4975, + "ppl": 5.5985, + "step": 8445 + }, + { + "epoch": 0.05, + "global_step": 8446, + "learning_rate": 0.00046558430717863106, + "loss": 1.7172, + "loss_base2": 2.4774, + "loss_pixel": 0.2212, + "loss_text": 1.496, + "ppl": 5.5689, + "step": 8446 + }, + { + "epoch": 0.05, + "global_step": 8447, + "learning_rate": 0.00046558013355592657, + "loss": 1.7226, + "loss_base2": 2.4852, + "loss_pixel": 0.2178, + "loss_text": 1.5048, + "ppl": 5.5991, + "step": 8447 + }, + { + "epoch": 0.05, + "global_step": 8448, + "learning_rate": 0.000465575959933222, + "loss": 1.7125, + "loss_base2": 2.4706, + "loss_pixel": 0.2259, + "loss_text": 1.4867, + "ppl": 5.5428, + "step": 8448 + }, + { + "epoch": 0.05, + "global_step": 8449, + "learning_rate": 0.00046557178631051753, + "loss": 1.7599, + "loss_base2": 2.539, + "loss_pixel": 0.2621, + "loss_text": 1.4978, + "ppl": 5.8119, + "step": 8449 + }, + { + "epoch": 0.05, + "global_step": 8450, + "learning_rate": 0.00046556761268781304, + "loss": 1.727, + "loss_base2": 2.4915, + "loss_pixel": 0.2358, + "loss_text": 1.4913, + "ppl": 5.6238, + "step": 8450 + }, + { + "epoch": 0.05, + "global_step": 8451, + "learning_rate": 0.0004655634390651085, + "loss": 1.7123, + "loss_base2": 2.4703, + "loss_pixel": 0.2265, + "loss_text": 1.4858, + "ppl": 5.5417, + "step": 8451 + }, + { + "epoch": 0.05, + "global_step": 8452, + "learning_rate": 0.000465559265442404, + "loss": 1.7324, + "loss_base2": 2.4993, + "loss_pixel": 0.222, + "loss_text": 1.5104, + "ppl": 5.6542, + "step": 8452 + }, + { + "epoch": 0.05, + "global_step": 8453, + "learning_rate": 0.0004655550918196995, + "loss": 1.6967, + "loss_base2": 2.4478, + "loss_pixel": 0.222, + "loss_text": 1.4746, + "ppl": 5.4559, + "step": 8453 + }, + { + "epoch": 0.05, + "global_step": 8454, + "learning_rate": 0.000465550918196995, + "loss": 1.6991, + "loss_base2": 2.4513, + "loss_pixel": 0.226, + "loss_text": 1.4732, + "ppl": 5.469, + "step": 8454 + }, + { + "epoch": 0.05, + "global_step": 8455, + "learning_rate": 0.00046554674457429047, + "loss": 1.7182, + "loss_base2": 2.4788, + "loss_pixel": 0.2194, + "loss_text": 1.4988, + "ppl": 5.5745, + "step": 8455 + }, + { + "epoch": 0.05, + "global_step": 8456, + "learning_rate": 0.000465542570951586, + "loss": 1.7081, + "loss_base2": 2.4643, + "loss_pixel": 0.2176, + "loss_text": 1.4905, + "ppl": 5.5185, + "step": 8456 + }, + { + "epoch": 0.05, + "global_step": 8457, + "learning_rate": 0.0004655383973288815, + "loss": 1.7183, + "loss_base2": 2.479, + "loss_pixel": 0.2281, + "loss_text": 1.4902, + "ppl": 5.575, + "step": 8457 + }, + { + "epoch": 0.05, + "global_step": 8458, + "learning_rate": 0.000465534223706177, + "loss": 1.716, + "loss_base2": 2.4757, + "loss_pixel": 0.2138, + "loss_text": 1.5023, + "ppl": 5.5622, + "step": 8458 + }, + { + "epoch": 0.05, + "global_step": 8459, + "learning_rate": 0.0004655300500834725, + "loss": 1.7096, + "loss_base2": 2.4664, + "loss_pixel": 0.2106, + "loss_text": 1.499, + "ppl": 5.5268, + "step": 8459 + }, + { + "epoch": 0.05, + "global_step": 8460, + "learning_rate": 0.00046552587646076795, + "loss": 1.6884, + "loss_base2": 2.4358, + "loss_pixel": 0.2076, + "loss_text": 1.4808, + "ppl": 5.4108, + "step": 8460 + }, + { + "epoch": 0.05, + "global_step": 8461, + "learning_rate": 0.00046552170283806346, + "loss": 1.689, + "loss_base2": 2.4367, + "loss_pixel": 0.2037, + "loss_text": 1.4854, + "ppl": 5.4141, + "step": 8461 + }, + { + "epoch": 0.05, + "global_step": 8462, + "learning_rate": 0.00046551752921535896, + "loss": 1.6852, + "loss_base2": 2.4312, + "loss_pixel": 0.1989, + "loss_text": 1.4863, + "ppl": 5.3935, + "step": 8462 + }, + { + "epoch": 0.05, + "global_step": 8463, + "learning_rate": 0.00046551335559265447, + "loss": 1.6198, + "loss_base2": 2.3369, + "loss_pixel": 0.1975, + "loss_text": 1.4223, + "ppl": 5.0521, + "step": 8463 + }, + { + "epoch": 0.05, + "global_step": 8464, + "learning_rate": 0.0004655091819699499, + "loss": 1.6643, + "loss_base2": 2.4011, + "loss_pixel": 0.1976, + "loss_text": 1.4667, + "ppl": 5.282, + "step": 8464 + }, + { + "epoch": 0.05, + "global_step": 8465, + "learning_rate": 0.00046550500834724543, + "loss": 1.7115, + "loss_base2": 2.4692, + "loss_pixel": 0.1952, + "loss_text": 1.5163, + "ppl": 5.5373, + "step": 8465 + }, + { + "epoch": 0.05, + "global_step": 8466, + "learning_rate": 0.00046550083472454094, + "loss": 1.6791, + "loss_base2": 2.4224, + "loss_pixel": 0.1902, + "loss_text": 1.4889, + "ppl": 5.3607, + "step": 8466 + }, + { + "epoch": 0.05, + "global_step": 8467, + "learning_rate": 0.0004654966611018364, + "loss": 1.6805, + "loss_base2": 2.4244, + "loss_pixel": 0.1925, + "loss_text": 1.488, + "ppl": 5.3682, + "step": 8467 + }, + { + "epoch": 0.05, + "global_step": 8468, + "learning_rate": 0.0004654924874791319, + "loss": 1.6665, + "loss_base2": 2.4043, + "loss_pixel": 0.1903, + "loss_text": 1.4762, + "ppl": 5.2936, + "step": 8468 + }, + { + "epoch": 0.05, + "global_step": 8469, + "learning_rate": 0.00046548831385642735, + "loss": 1.6704, + "loss_base2": 2.4099, + "loss_pixel": 0.1879, + "loss_text": 1.4825, + "ppl": 5.3143, + "step": 8469 + }, + { + "epoch": 0.05, + "global_step": 8470, + "learning_rate": 0.00046548414023372286, + "loss": 1.6696, + "loss_base2": 2.4087, + "loss_pixel": 0.1873, + "loss_text": 1.4824, + "ppl": 5.31, + "step": 8470 + }, + { + "epoch": 0.05, + "global_step": 8471, + "learning_rate": 0.00046547996661101837, + "loss": 1.6738, + "loss_base2": 2.4148, + "loss_pixel": 0.1823, + "loss_text": 1.4915, + "ppl": 5.3324, + "step": 8471 + }, + { + "epoch": 0.05, + "global_step": 8472, + "learning_rate": 0.0004654757929883139, + "loss": 1.6719, + "loss_base2": 2.412, + "loss_pixel": 0.1837, + "loss_text": 1.4882, + "ppl": 5.3223, + "step": 8472 + }, + { + "epoch": 0.05, + "global_step": 8473, + "learning_rate": 0.0004654716193656093, + "loss": 1.6512, + "loss_base2": 2.3822, + "loss_pixel": 0.1828, + "loss_text": 1.4684, + "ppl": 5.2132, + "step": 8473 + }, + { + "epoch": 0.05, + "global_step": 8474, + "learning_rate": 0.00046546744574290483, + "loss": 1.6534, + "loss_base2": 2.3854, + "loss_pixel": 0.1793, + "loss_text": 1.4741, + "ppl": 5.2247, + "step": 8474 + }, + { + "epoch": 0.05, + "global_step": 8475, + "learning_rate": 0.00046546327212020034, + "loss": 1.6581, + "loss_base2": 2.3921, + "loss_pixel": 0.1827, + "loss_text": 1.4753, + "ppl": 5.2493, + "step": 8475 + }, + { + "epoch": 0.05, + "global_step": 8476, + "learning_rate": 0.00046545909849749585, + "loss": 1.6609, + "loss_base2": 2.3962, + "loss_pixel": 0.1793, + "loss_text": 1.4816, + "ppl": 5.264, + "step": 8476 + }, + { + "epoch": 0.05, + "global_step": 8477, + "learning_rate": 0.00046545492487479136, + "loss": 1.666, + "loss_base2": 2.4035, + "loss_pixel": 0.1778, + "loss_text": 1.4883, + "ppl": 5.291, + "step": 8477 + }, + { + "epoch": 0.05, + "global_step": 8478, + "learning_rate": 0.0004654507512520868, + "loss": 1.6573, + "loss_base2": 2.391, + "loss_pixel": 0.1779, + "loss_text": 1.4794, + "ppl": 5.2451, + "step": 8478 + }, + { + "epoch": 0.05, + "global_step": 8479, + "learning_rate": 0.0004654465776293823, + "loss": 1.6754, + "loss_base2": 2.4171, + "loss_pixel": 0.183, + "loss_text": 1.4923, + "ppl": 5.3409, + "step": 8479 + }, + { + "epoch": 0.05, + "global_step": 8480, + "learning_rate": 0.0004654424040066778, + "loss": 1.6852, + "loss_base2": 2.4312, + "loss_pixel": 0.1926, + "loss_text": 1.4926, + "ppl": 5.3935, + "step": 8480 + }, + { + "epoch": 0.05, + "global_step": 8481, + "learning_rate": 0.00046543823038397333, + "loss": 1.6837, + "loss_base2": 2.4291, + "loss_pixel": 0.1895, + "loss_text": 1.4942, + "ppl": 5.3854, + "step": 8481 + }, + { + "epoch": 0.05, + "global_step": 8482, + "learning_rate": 0.0004654340567612688, + "loss": 1.6841, + "loss_base2": 2.4296, + "loss_pixel": 0.1896, + "loss_text": 1.4945, + "ppl": 5.3876, + "step": 8482 + }, + { + "epoch": 0.05, + "global_step": 8483, + "learning_rate": 0.0004654298831385643, + "loss": 1.6619, + "loss_base2": 2.3976, + "loss_pixel": 0.1867, + "loss_text": 1.4752, + "ppl": 5.2693, + "step": 8483 + }, + { + "epoch": 0.05, + "global_step": 8484, + "learning_rate": 0.0004654257095158598, + "loss": 1.6616, + "loss_base2": 2.3972, + "loss_pixel": 0.186, + "loss_text": 1.4755, + "ppl": 5.2677, + "step": 8484 + }, + { + "epoch": 0.05, + "global_step": 8485, + "learning_rate": 0.0004654215358931553, + "loss": 1.6846, + "loss_base2": 2.4304, + "loss_pixel": 0.1885, + "loss_text": 1.4961, + "ppl": 5.3903, + "step": 8485 + }, + { + "epoch": 0.05, + "global_step": 8486, + "learning_rate": 0.00046541736227045076, + "loss": 1.6678, + "loss_base2": 2.4061, + "loss_pixel": 0.1853, + "loss_text": 1.4824, + "ppl": 5.3005, + "step": 8486 + }, + { + "epoch": 0.05, + "global_step": 8487, + "learning_rate": 0.0004654131886477462, + "loss": 1.6565, + "loss_base2": 2.3898, + "loss_pixel": 0.1859, + "loss_text": 1.4706, + "ppl": 5.2409, + "step": 8487 + }, + { + "epoch": 0.05, + "global_step": 8488, + "learning_rate": 0.0004654090150250417, + "loss": 1.6524, + "loss_base2": 2.3839, + "loss_pixel": 0.1837, + "loss_text": 1.4687, + "ppl": 5.2195, + "step": 8488 + }, + { + "epoch": 0.05, + "global_step": 8489, + "learning_rate": 0.0004654048414023372, + "loss": 1.691, + "loss_base2": 2.4396, + "loss_pixel": 0.1831, + "loss_text": 1.5079, + "ppl": 5.4249, + "step": 8489 + }, + { + "epoch": 0.05, + "global_step": 8490, + "learning_rate": 0.00046540066777963273, + "loss": 1.6527, + "loss_base2": 2.3843, + "loss_pixel": 0.1815, + "loss_text": 1.4712, + "ppl": 5.2211, + "step": 8490 + }, + { + "epoch": 0.05, + "global_step": 8491, + "learning_rate": 0.0004653964941569282, + "loss": 1.6774, + "loss_base2": 2.42, + "loss_pixel": 0.1824, + "loss_text": 1.495, + "ppl": 5.3516, + "step": 8491 + }, + { + "epoch": 0.05, + "global_step": 8492, + "learning_rate": 0.0004653923205342237, + "loss": 1.6737, + "loss_base2": 2.4146, + "loss_pixel": 0.1824, + "loss_text": 1.4913, + "ppl": 5.3319, + "step": 8492 + }, + { + "epoch": 0.05, + "global_step": 8493, + "learning_rate": 0.0004653881469115192, + "loss": 1.655, + "loss_base2": 2.3877, + "loss_pixel": 0.1804, + "loss_text": 1.4745, + "ppl": 5.2331, + "step": 8493 + }, + { + "epoch": 0.05, + "global_step": 8494, + "learning_rate": 0.0004653839732888147, + "loss": 1.6489, + "loss_base2": 2.3789, + "loss_pixel": 0.1787, + "loss_text": 1.4702, + "ppl": 5.2013, + "step": 8494 + }, + { + "epoch": 0.05, + "global_step": 8495, + "learning_rate": 0.0004653797996661102, + "loss": 1.6675, + "loss_base2": 2.4057, + "loss_pixel": 0.1801, + "loss_text": 1.4875, + "ppl": 5.2989, + "step": 8495 + }, + { + "epoch": 0.05, + "global_step": 8496, + "learning_rate": 0.00046537562604340567, + "loss": 1.6503, + "loss_base2": 2.3809, + "loss_pixel": 0.1779, + "loss_text": 1.4724, + "ppl": 5.2085, + "step": 8496 + }, + { + "epoch": 0.05, + "global_step": 8497, + "learning_rate": 0.0004653714524207012, + "loss": 1.6659, + "loss_base2": 2.4034, + "loss_pixel": 0.1792, + "loss_text": 1.4867, + "ppl": 5.2904, + "step": 8497 + }, + { + "epoch": 0.05, + "global_step": 8498, + "learning_rate": 0.0004653672787979967, + "loss": 1.6526, + "loss_base2": 2.3842, + "loss_pixel": 0.1786, + "loss_text": 1.474, + "ppl": 5.2205, + "step": 8498 + }, + { + "epoch": 0.05, + "global_step": 8499, + "learning_rate": 0.0004653631051752922, + "loss": 1.6565, + "loss_base2": 2.3898, + "loss_pixel": 0.1769, + "loss_text": 1.4795, + "ppl": 5.2409, + "step": 8499 + }, + { + "epoch": 0.05, + "global_step": 8500, + "learning_rate": 0.0004653589315525877, + "loss": 1.6556, + "loss_base2": 2.3885, + "loss_pixel": 0.1775, + "loss_text": 1.4781, + "ppl": 5.2362, + "step": 8500 + }, + { + "epoch": 0.05, + "global_step": 8501, + "learning_rate": 0.00046535475792988315, + "loss": 1.6128, + "loss_base2": 2.3268, + "loss_pixel": 0.1771, + "loss_text": 1.4357, + "ppl": 5.0168, + "step": 8501 + }, + { + "epoch": 0.05, + "global_step": 8502, + "learning_rate": 0.00046535058430717866, + "loss": 1.674, + "loss_base2": 2.4151, + "loss_pixel": 0.1775, + "loss_text": 1.4965, + "ppl": 5.3335, + "step": 8502 + }, + { + "epoch": 0.05, + "global_step": 8503, + "learning_rate": 0.00046534641068447417, + "loss": 1.6593, + "loss_base2": 2.3939, + "loss_pixel": 0.177, + "loss_text": 1.4822, + "ppl": 5.2556, + "step": 8503 + }, + { + "epoch": 0.05, + "global_step": 8504, + "learning_rate": 0.0004653422370617696, + "loss": 1.6562, + "loss_base2": 2.3894, + "loss_pixel": 0.1766, + "loss_text": 1.4796, + "ppl": 5.2394, + "step": 8504 + }, + { + "epoch": 0.05, + "global_step": 8505, + "learning_rate": 0.00046533806343906507, + "loss": 1.6494, + "loss_base2": 2.3796, + "loss_pixel": 0.1756, + "loss_text": 1.4738, + "ppl": 5.2039, + "step": 8505 + }, + { + "epoch": 0.05, + "global_step": 8506, + "learning_rate": 0.0004653338898163606, + "loss": 1.6456, + "loss_base2": 2.3741, + "loss_pixel": 0.1764, + "loss_text": 1.4692, + "ppl": 5.1841, + "step": 8506 + }, + { + "epoch": 0.05, + "global_step": 8507, + "learning_rate": 0.0004653297161936561, + "loss": 1.6627, + "loss_base2": 2.3988, + "loss_pixel": 0.176, + "loss_text": 1.4867, + "ppl": 5.2735, + "step": 8507 + }, + { + "epoch": 0.05, + "global_step": 8508, + "learning_rate": 0.0004653255425709516, + "loss": 1.653, + "loss_base2": 2.3848, + "loss_pixel": 0.1748, + "loss_text": 1.4782, + "ppl": 5.2226, + "step": 8508 + }, + { + "epoch": 0.05, + "global_step": 8509, + "learning_rate": 0.0004653213689482471, + "loss": 1.6468, + "loss_base2": 2.3758, + "loss_pixel": 0.1735, + "loss_text": 1.4733, + "ppl": 5.1903, + "step": 8509 + }, + { + "epoch": 0.05, + "global_step": 8510, + "learning_rate": 0.00046531719532554256, + "loss": 1.6488, + "loss_base2": 2.3787, + "loss_pixel": 0.1747, + "loss_text": 1.4741, + "ppl": 5.2007, + "step": 8510 + }, + { + "epoch": 0.05, + "global_step": 8511, + "learning_rate": 0.00046531302170283806, + "loss": 1.6422, + "loss_base2": 2.3692, + "loss_pixel": 0.1747, + "loss_text": 1.4676, + "ppl": 5.1665, + "step": 8511 + }, + { + "epoch": 0.05, + "global_step": 8512, + "learning_rate": 0.00046530884808013357, + "loss": 1.6469, + "loss_base2": 2.376, + "loss_pixel": 0.1752, + "loss_text": 1.4717, + "ppl": 5.1909, + "step": 8512 + }, + { + "epoch": 0.05, + "global_step": 8513, + "learning_rate": 0.0004653046744574291, + "loss": 1.6635, + "loss_base2": 2.3999, + "loss_pixel": 0.1747, + "loss_text": 1.4888, + "ppl": 5.2778, + "step": 8513 + }, + { + "epoch": 0.05, + "global_step": 8514, + "learning_rate": 0.00046530050083472453, + "loss": 1.656, + "loss_base2": 2.3891, + "loss_pixel": 0.1739, + "loss_text": 1.482, + "ppl": 5.2383, + "step": 8514 + }, + { + "epoch": 0.05, + "global_step": 8515, + "learning_rate": 0.00046529632721202004, + "loss": 1.6536, + "loss_base2": 2.3856, + "loss_pixel": 0.174, + "loss_text": 1.4796, + "ppl": 5.2258, + "step": 8515 + }, + { + "epoch": 0.05, + "global_step": 8516, + "learning_rate": 0.00046529215358931554, + "loss": 1.6636, + "loss_base2": 2.4001, + "loss_pixel": 0.1749, + "loss_text": 1.4887, + "ppl": 5.2783, + "step": 8516 + }, + { + "epoch": 0.05, + "global_step": 8517, + "learning_rate": 0.00046528797996661105, + "loss": 1.6432, + "loss_base2": 2.3706, + "loss_pixel": 0.1739, + "loss_text": 1.4693, + "ppl": 5.1717, + "step": 8517 + }, + { + "epoch": 0.05, + "global_step": 8518, + "learning_rate": 0.00046528380634390656, + "loss": 1.6618, + "loss_base2": 2.3975, + "loss_pixel": 0.1742, + "loss_text": 1.4875, + "ppl": 5.2688, + "step": 8518 + }, + { + "epoch": 0.05, + "global_step": 8519, + "learning_rate": 0.000465279632721202, + "loss": 1.6574, + "loss_base2": 2.3911, + "loss_pixel": 0.1729, + "loss_text": 1.4845, + "ppl": 5.2457, + "step": 8519 + }, + { + "epoch": 0.05, + "global_step": 8520, + "learning_rate": 0.0004652754590984975, + "loss": 1.6397, + "loss_base2": 2.3656, + "loss_pixel": 0.1743, + "loss_text": 1.4654, + "ppl": 5.1536, + "step": 8520 + }, + { + "epoch": 0.05, + "global_step": 8521, + "learning_rate": 0.000465271285475793, + "loss": 1.6448, + "loss_base2": 2.3729, + "loss_pixel": 0.1734, + "loss_text": 1.4714, + "ppl": 5.18, + "step": 8521 + }, + { + "epoch": 0.05, + "global_step": 8522, + "learning_rate": 0.00046526711185308853, + "loss": 1.6464, + "loss_base2": 2.3753, + "loss_pixel": 0.1732, + "loss_text": 1.4733, + "ppl": 5.1883, + "step": 8522 + }, + { + "epoch": 0.05, + "global_step": 8523, + "learning_rate": 0.00046526293823038393, + "loss": 1.6508, + "loss_base2": 2.3816, + "loss_pixel": 0.1727, + "loss_text": 1.4781, + "ppl": 5.2111, + "step": 8523 + }, + { + "epoch": 0.05, + "global_step": 8524, + "learning_rate": 0.00046525876460767944, + "loss": 1.6536, + "loss_base2": 2.3856, + "loss_pixel": 0.1738, + "loss_text": 1.4798, + "ppl": 5.2258, + "step": 8524 + }, + { + "epoch": 0.05, + "global_step": 8525, + "learning_rate": 0.00046525459098497495, + "loss": 1.6551, + "loss_base2": 2.3878, + "loss_pixel": 0.1732, + "loss_text": 1.4819, + "ppl": 5.2336, + "step": 8525 + }, + { + "epoch": 0.05, + "global_step": 8526, + "learning_rate": 0.00046525041736227046, + "loss": 1.6589, + "loss_base2": 2.3933, + "loss_pixel": 0.1731, + "loss_text": 1.4858, + "ppl": 5.2535, + "step": 8526 + }, + { + "epoch": 0.05, + "global_step": 8527, + "learning_rate": 0.00046524624373956596, + "loss": 1.6478, + "loss_base2": 2.3773, + "loss_pixel": 0.1724, + "loss_text": 1.4755, + "ppl": 5.1955, + "step": 8527 + }, + { + "epoch": 0.05, + "global_step": 8528, + "learning_rate": 0.0004652420701168614, + "loss": 1.6591, + "loss_base2": 2.3936, + "loss_pixel": 0.1733, + "loss_text": 1.4858, + "ppl": 5.2546, + "step": 8528 + }, + { + "epoch": 0.05, + "global_step": 8529, + "learning_rate": 0.0004652378964941569, + "loss": 1.6567, + "loss_base2": 2.3901, + "loss_pixel": 0.1728, + "loss_text": 1.4839, + "ppl": 5.242, + "step": 8529 + }, + { + "epoch": 0.05, + "global_step": 8530, + "learning_rate": 0.00046523372287145243, + "loss": 1.6557, + "loss_base2": 2.3887, + "loss_pixel": 0.173, + "loss_text": 1.4827, + "ppl": 5.2367, + "step": 8530 + }, + { + "epoch": 0.05, + "global_step": 8531, + "learning_rate": 0.00046522954924874794, + "loss": 1.6442, + "loss_base2": 2.3721, + "loss_pixel": 0.1725, + "loss_text": 1.4717, + "ppl": 5.1769, + "step": 8531 + }, + { + "epoch": 0.05, + "global_step": 8532, + "learning_rate": 0.0004652253756260434, + "loss": 1.6447, + "loss_base2": 2.3728, + "loss_pixel": 0.1731, + "loss_text": 1.4716, + "ppl": 5.1795, + "step": 8532 + }, + { + "epoch": 0.05, + "global_step": 8533, + "learning_rate": 0.0004652212020033389, + "loss": 1.6601, + "loss_base2": 2.395, + "loss_pixel": 0.1726, + "loss_text": 1.4875, + "ppl": 5.2598, + "step": 8533 + }, + { + "epoch": 0.05, + "global_step": 8534, + "learning_rate": 0.0004652170283806344, + "loss": 1.6414, + "loss_base2": 2.368, + "loss_pixel": 0.1719, + "loss_text": 1.4695, + "ppl": 5.1624, + "step": 8534 + }, + { + "epoch": 0.05, + "global_step": 8535, + "learning_rate": 0.0004652128547579299, + "loss": 1.6624, + "loss_base2": 2.3983, + "loss_pixel": 0.1725, + "loss_text": 1.4898, + "ppl": 5.2719, + "step": 8535 + }, + { + "epoch": 0.05, + "global_step": 8536, + "learning_rate": 0.0004652086811352254, + "loss": 1.6618, + "loss_base2": 2.3975, + "loss_pixel": 0.1716, + "loss_text": 1.4901, + "ppl": 5.2688, + "step": 8536 + }, + { + "epoch": 0.05, + "global_step": 8537, + "learning_rate": 0.0004652045075125209, + "loss": 1.6447, + "loss_base2": 2.3728, + "loss_pixel": 0.1746, + "loss_text": 1.4702, + "ppl": 5.1795, + "step": 8537 + }, + { + "epoch": 0.05, + "global_step": 8538, + "learning_rate": 0.0004652003338898164, + "loss": 1.6498, + "loss_base2": 2.3802, + "loss_pixel": 0.172, + "loss_text": 1.4778, + "ppl": 5.2059, + "step": 8538 + }, + { + "epoch": 0.05, + "global_step": 8539, + "learning_rate": 0.0004651961602671119, + "loss": 1.644, + "loss_base2": 2.3718, + "loss_pixel": 0.172, + "loss_text": 1.472, + "ppl": 5.1758, + "step": 8539 + }, + { + "epoch": 0.05, + "global_step": 8540, + "learning_rate": 0.0004651919866444074, + "loss": 1.6593, + "loss_base2": 2.3939, + "loss_pixel": 0.1727, + "loss_text": 1.4866, + "ppl": 5.2556, + "step": 8540 + }, + { + "epoch": 0.05, + "global_step": 8541, + "learning_rate": 0.00046518781302170285, + "loss": 1.654, + "loss_base2": 2.3862, + "loss_pixel": 0.1732, + "loss_text": 1.4807, + "ppl": 5.2278, + "step": 8541 + }, + { + "epoch": 0.05, + "global_step": 8542, + "learning_rate": 0.0004651836393989983, + "loss": 1.65, + "loss_base2": 2.3804, + "loss_pixel": 0.1723, + "loss_text": 1.4778, + "ppl": 5.207, + "step": 8542 + }, + { + "epoch": 0.05, + "global_step": 8543, + "learning_rate": 0.0004651794657762938, + "loss": 1.624, + "loss_base2": 2.3429, + "loss_pixel": 0.1723, + "loss_text": 1.4517, + "ppl": 5.0733, + "step": 8543 + }, + { + "epoch": 0.05, + "global_step": 8544, + "learning_rate": 0.0004651752921535893, + "loss": 1.6689, + "loss_base2": 2.4077, + "loss_pixel": 0.173, + "loss_text": 1.496, + "ppl": 5.3063, + "step": 8544 + }, + { + "epoch": 0.05, + "global_step": 8545, + "learning_rate": 0.0004651711185308848, + "loss": 1.6461, + "loss_base2": 2.3748, + "loss_pixel": 0.1717, + "loss_text": 1.4745, + "ppl": 5.1867, + "step": 8545 + }, + { + "epoch": 0.05, + "global_step": 8546, + "learning_rate": 0.0004651669449081803, + "loss": 1.6207, + "loss_base2": 2.3382, + "loss_pixel": 0.172, + "loss_text": 1.4487, + "ppl": 5.0566, + "step": 8546 + }, + { + "epoch": 0.05, + "global_step": 8547, + "learning_rate": 0.0004651627712854758, + "loss": 1.667, + "loss_base2": 2.405, + "loss_pixel": 0.1716, + "loss_text": 1.4954, + "ppl": 5.2963, + "step": 8547 + }, + { + "epoch": 0.05, + "global_step": 8548, + "learning_rate": 0.0004651585976627713, + "loss": 1.6457, + "loss_base2": 2.3742, + "loss_pixel": 0.1678, + "loss_text": 1.4779, + "ppl": 5.1846, + "step": 8548 + }, + { + "epoch": 0.05, + "global_step": 8549, + "learning_rate": 0.0004651544240400668, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.1685, + "loss_text": 1.4711, + "ppl": 5.1531, + "step": 8549 + }, + { + "epoch": 0.05, + "global_step": 8550, + "learning_rate": 0.00046515025041736225, + "loss": 1.6573, + "loss_base2": 2.391, + "loss_pixel": 0.1672, + "loss_text": 1.4901, + "ppl": 5.2451, + "step": 8550 + }, + { + "epoch": 0.05, + "global_step": 8551, + "learning_rate": 0.00046514607679465776, + "loss": 1.6494, + "loss_base2": 2.3796, + "loss_pixel": 0.1697, + "loss_text": 1.4798, + "ppl": 5.2039, + "step": 8551 + }, + { + "epoch": 0.05, + "global_step": 8552, + "learning_rate": 0.00046514190317195327, + "loss": 1.647, + "loss_base2": 2.3761, + "loss_pixel": 0.1699, + "loss_text": 1.4771, + "ppl": 5.1914, + "step": 8552 + }, + { + "epoch": 0.05, + "global_step": 8553, + "learning_rate": 0.0004651377295492488, + "loss": 1.6173, + "loss_base2": 2.3333, + "loss_pixel": 0.1664, + "loss_text": 1.4509, + "ppl": 5.0395, + "step": 8553 + }, + { + "epoch": 0.05, + "global_step": 8554, + "learning_rate": 0.0004651335559265443, + "loss": 1.4385, + "loss_base2": 2.0753, + "loss_pixel": 0.1657, + "loss_text": 1.2728, + "ppl": 4.2144, + "step": 8554 + }, + { + "epoch": 0.05, + "global_step": 8555, + "learning_rate": 0.00046512938230383973, + "loss": 1.4521, + "loss_base2": 2.0949, + "loss_pixel": 0.1668, + "loss_text": 1.2853, + "ppl": 4.2721, + "step": 8555 + }, + { + "epoch": 0.05, + "global_step": 8556, + "learning_rate": 0.00046512520868113524, + "loss": 1.4587, + "loss_base2": 2.1045, + "loss_pixel": 0.1658, + "loss_text": 1.2929, + "ppl": 4.3004, + "step": 8556 + }, + { + "epoch": 0.05, + "global_step": 8557, + "learning_rate": 0.00046512103505843075, + "loss": 1.4313, + "loss_base2": 2.0649, + "loss_pixel": 0.1653, + "loss_text": 1.266, + "ppl": 4.1841, + "step": 8557 + }, + { + "epoch": 0.05, + "global_step": 8558, + "learning_rate": 0.00046511686143572626, + "loss": 1.4281, + "loss_base2": 2.0603, + "loss_pixel": 0.1661, + "loss_text": 1.2621, + "ppl": 4.1708, + "step": 8558 + }, + { + "epoch": 0.05, + "global_step": 8559, + "learning_rate": 0.00046511268781302176, + "loss": 1.4485, + "loss_base2": 2.0897, + "loss_pixel": 0.1651, + "loss_text": 1.2834, + "ppl": 4.2567, + "step": 8559 + }, + { + "epoch": 0.05, + "global_step": 8560, + "learning_rate": 0.00046510851419031716, + "loss": 1.4294, + "loss_base2": 2.0622, + "loss_pixel": 0.1675, + "loss_text": 1.2618, + "ppl": 4.1762, + "step": 8560 + }, + { + "epoch": 0.05, + "global_step": 8561, + "learning_rate": 0.00046510434056761267, + "loss": 1.5196, + "loss_base2": 2.1923, + "loss_pixel": 0.1676, + "loss_text": 1.352, + "ppl": 4.5704, + "step": 8561 + }, + { + "epoch": 0.05, + "global_step": 8562, + "learning_rate": 0.0004651001669449082, + "loss": 1.6593, + "loss_base2": 2.3939, + "loss_pixel": 0.1642, + "loss_text": 1.4951, + "ppl": 5.2556, + "step": 8562 + }, + { + "epoch": 0.05, + "global_step": 8563, + "learning_rate": 0.0004650959933222037, + "loss": 1.6526, + "loss_base2": 2.3842, + "loss_pixel": 0.1622, + "loss_text": 1.4904, + "ppl": 5.2205, + "step": 8563 + }, + { + "epoch": 0.05, + "global_step": 8564, + "learning_rate": 0.00046509181969949914, + "loss": 1.639, + "loss_base2": 2.3646, + "loss_pixel": 0.1638, + "loss_text": 1.4752, + "ppl": 5.15, + "step": 8564 + }, + { + "epoch": 0.05, + "global_step": 8565, + "learning_rate": 0.00046508764607679464, + "loss": 1.6563, + "loss_base2": 2.3895, + "loss_pixel": 0.1648, + "loss_text": 1.4915, + "ppl": 5.2399, + "step": 8565 + }, + { + "epoch": 0.05, + "global_step": 8566, + "learning_rate": 0.00046508347245409015, + "loss": 1.661, + "loss_base2": 2.3963, + "loss_pixel": 0.1663, + "loss_text": 1.4946, + "ppl": 5.2646, + "step": 8566 + }, + { + "epoch": 0.05, + "global_step": 8567, + "learning_rate": 0.00046507929883138566, + "loss": 1.6504, + "loss_base2": 2.381, + "loss_pixel": 0.1662, + "loss_text": 1.4842, + "ppl": 5.2091, + "step": 8567 + }, + { + "epoch": 0.05, + "global_step": 8568, + "learning_rate": 0.00046507512520868117, + "loss": 1.6646, + "loss_base2": 2.4015, + "loss_pixel": 0.1681, + "loss_text": 1.4964, + "ppl": 5.2836, + "step": 8568 + }, + { + "epoch": 0.05, + "global_step": 8569, + "learning_rate": 0.0004650709515859766, + "loss": 1.6506, + "loss_base2": 2.3813, + "loss_pixel": 0.1647, + "loss_text": 1.4859, + "ppl": 5.2101, + "step": 8569 + }, + { + "epoch": 0.05, + "global_step": 8570, + "learning_rate": 0.0004650667779632721, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.1639, + "loss_text": 1.4756, + "ppl": 5.1531, + "step": 8570 + }, + { + "epoch": 0.05, + "global_step": 8571, + "learning_rate": 0.00046506260434056763, + "loss": 1.6545, + "loss_base2": 2.3869, + "loss_pixel": 0.1628, + "loss_text": 1.4917, + "ppl": 5.2305, + "step": 8571 + }, + { + "epoch": 0.05, + "global_step": 8572, + "learning_rate": 0.00046505843071786314, + "loss": 1.6559, + "loss_base2": 2.389, + "loss_pixel": 0.1646, + "loss_text": 1.4913, + "ppl": 5.2378, + "step": 8572 + }, + { + "epoch": 0.05, + "global_step": 8573, + "learning_rate": 0.0004650542570951586, + "loss": 1.6422, + "loss_base2": 2.3692, + "loss_pixel": 0.1621, + "loss_text": 1.4801, + "ppl": 5.1665, + "step": 8573 + }, + { + "epoch": 0.05, + "global_step": 8574, + "learning_rate": 0.0004650500834724541, + "loss": 1.622, + "loss_base2": 2.3401, + "loss_pixel": 0.162, + "loss_text": 1.46, + "ppl": 5.0632, + "step": 8574 + }, + { + "epoch": 0.05, + "global_step": 8575, + "learning_rate": 0.0004650459098497496, + "loss": 1.6577, + "loss_base2": 2.3916, + "loss_pixel": 0.1631, + "loss_text": 1.4946, + "ppl": 5.2472, + "step": 8575 + }, + { + "epoch": 0.05, + "global_step": 8576, + "learning_rate": 0.0004650417362270451, + "loss": 1.6522, + "loss_base2": 2.3836, + "loss_pixel": 0.1615, + "loss_text": 1.4907, + "ppl": 5.2184, + "step": 8576 + }, + { + "epoch": 0.05, + "global_step": 8577, + "learning_rate": 0.0004650375626043406, + "loss": 1.6559, + "loss_base2": 2.389, + "loss_pixel": 0.163, + "loss_text": 1.4929, + "ppl": 5.2378, + "step": 8577 + }, + { + "epoch": 0.05, + "global_step": 8578, + "learning_rate": 0.0004650333889816361, + "loss": 1.6389, + "loss_base2": 2.3644, + "loss_pixel": 0.164, + "loss_text": 1.4749, + "ppl": 5.1495, + "step": 8578 + }, + { + "epoch": 0.05, + "global_step": 8579, + "learning_rate": 0.00046502921535893153, + "loss": 1.6123, + "loss_base2": 2.3261, + "loss_pixel": 0.163, + "loss_text": 1.4493, + "ppl": 5.0143, + "step": 8579 + }, + { + "epoch": 0.05, + "global_step": 8580, + "learning_rate": 0.00046502504173622704, + "loss": 1.6582, + "loss_base2": 2.3923, + "loss_pixel": 0.1648, + "loss_text": 1.4934, + "ppl": 5.2499, + "step": 8580 + }, + { + "epoch": 0.05, + "global_step": 8581, + "learning_rate": 0.00046502086811352254, + "loss": 1.64, + "loss_base2": 2.366, + "loss_pixel": 0.1637, + "loss_text": 1.4763, + "ppl": 5.1552, + "step": 8581 + }, + { + "epoch": 0.05, + "global_step": 8582, + "learning_rate": 0.000465016694490818, + "loss": 1.6552, + "loss_base2": 2.3879, + "loss_pixel": 0.1655, + "loss_text": 1.4896, + "ppl": 5.2341, + "step": 8582 + }, + { + "epoch": 0.05, + "global_step": 8583, + "learning_rate": 0.0004650125208681135, + "loss": 1.6304, + "loss_base2": 2.3522, + "loss_pixel": 0.1612, + "loss_text": 1.4692, + "ppl": 5.1059, + "step": 8583 + }, + { + "epoch": 0.05, + "global_step": 8584, + "learning_rate": 0.000465008347245409, + "loss": 1.6129, + "loss_base2": 2.3269, + "loss_pixel": 0.1594, + "loss_text": 1.4535, + "ppl": 5.0173, + "step": 8584 + }, + { + "epoch": 0.05, + "global_step": 8585, + "learning_rate": 0.0004650041736227045, + "loss": 1.6401, + "loss_base2": 2.3662, + "loss_pixel": 0.161, + "loss_text": 1.4791, + "ppl": 5.1557, + "step": 8585 + }, + { + "epoch": 0.05, + "global_step": 8586, + "learning_rate": 0.000465, + "loss": 1.6445, + "loss_base2": 2.3725, + "loss_pixel": 0.1615, + "loss_text": 1.483, + "ppl": 5.1784, + "step": 8586 + }, + { + "epoch": 0.05, + "global_step": 8587, + "learning_rate": 0.0004649958263772955, + "loss": 1.6458, + "loss_base2": 2.3744, + "loss_pixel": 0.1618, + "loss_text": 1.484, + "ppl": 5.1852, + "step": 8587 + }, + { + "epoch": 0.05, + "global_step": 8588, + "learning_rate": 0.000464991652754591, + "loss": 1.6139, + "loss_base2": 2.3284, + "loss_pixel": 0.1609, + "loss_text": 1.4531, + "ppl": 5.0224, + "step": 8588 + }, + { + "epoch": 0.05, + "global_step": 8589, + "learning_rate": 0.0004649874791318865, + "loss": 1.6262, + "loss_base2": 2.3461, + "loss_pixel": 0.1618, + "loss_text": 1.4644, + "ppl": 5.0845, + "step": 8589 + }, + { + "epoch": 0.05, + "global_step": 8590, + "learning_rate": 0.000464983305509182, + "loss": 1.6409, + "loss_base2": 2.3673, + "loss_pixel": 0.159, + "loss_text": 1.4818, + "ppl": 5.1598, + "step": 8590 + }, + { + "epoch": 0.05, + "global_step": 8591, + "learning_rate": 0.00046497913188647746, + "loss": 1.6555, + "loss_base2": 2.3884, + "loss_pixel": 0.1612, + "loss_text": 1.4943, + "ppl": 5.2357, + "step": 8591 + }, + { + "epoch": 0.05, + "global_step": 8592, + "learning_rate": 0.00046497495826377296, + "loss": 1.6312, + "loss_base2": 2.3533, + "loss_pixel": 0.161, + "loss_text": 1.4702, + "ppl": 5.11, + "step": 8592 + }, + { + "epoch": 0.05, + "global_step": 8593, + "learning_rate": 0.00046497078464106847, + "loss": 1.6282, + "loss_base2": 2.349, + "loss_pixel": 0.1607, + "loss_text": 1.4675, + "ppl": 5.0947, + "step": 8593 + }, + { + "epoch": 0.05, + "global_step": 8594, + "learning_rate": 0.000464966611018364, + "loss": 1.64, + "loss_base2": 2.366, + "loss_pixel": 0.1632, + "loss_text": 1.4768, + "ppl": 5.1552, + "step": 8594 + }, + { + "epoch": 0.05, + "global_step": 8595, + "learning_rate": 0.0004649624373956595, + "loss": 1.6479, + "loss_base2": 2.3774, + "loss_pixel": 0.1601, + "loss_text": 1.4877, + "ppl": 5.1961, + "step": 8595 + }, + { + "epoch": 0.05, + "global_step": 8596, + "learning_rate": 0.00046495826377295494, + "loss": 1.6326, + "loss_base2": 2.3553, + "loss_pixel": 0.1592, + "loss_text": 1.4734, + "ppl": 5.1172, + "step": 8596 + }, + { + "epoch": 0.05, + "global_step": 8597, + "learning_rate": 0.00046495409015025044, + "loss": 1.6416, + "loss_base2": 2.3683, + "loss_pixel": 0.1603, + "loss_text": 1.4813, + "ppl": 5.1634, + "step": 8597 + }, + { + "epoch": 0.05, + "global_step": 8598, + "learning_rate": 0.0004649499165275459, + "loss": 1.6534, + "loss_base2": 2.3854, + "loss_pixel": 0.1704, + "loss_text": 1.483, + "ppl": 5.2247, + "step": 8598 + }, + { + "epoch": 0.05, + "global_step": 8599, + "learning_rate": 0.0004649457429048414, + "loss": 1.6454, + "loss_base2": 2.3738, + "loss_pixel": 0.1727, + "loss_text": 1.4727, + "ppl": 5.1831, + "step": 8599 + }, + { + "epoch": 0.05, + "global_step": 8600, + "learning_rate": 0.00046494156928213686, + "loss": 1.6529, + "loss_base2": 2.3846, + "loss_pixel": 0.1735, + "loss_text": 1.4795, + "ppl": 5.2221, + "step": 8600 + }, + { + "epoch": 0.05, + "global_step": 8601, + "learning_rate": 0.00046493739565943237, + "loss": 1.6581, + "loss_base2": 2.3921, + "loss_pixel": 0.1718, + "loss_text": 1.4863, + "ppl": 5.2493, + "step": 8601 + }, + { + "epoch": 0.05, + "global_step": 8602, + "learning_rate": 0.0004649332220367279, + "loss": 1.654, + "loss_base2": 2.3862, + "loss_pixel": 0.1728, + "loss_text": 1.4812, + "ppl": 5.2278, + "step": 8602 + }, + { + "epoch": 0.05, + "global_step": 8603, + "learning_rate": 0.0004649290484140234, + "loss": 1.6426, + "loss_base2": 2.3698, + "loss_pixel": 0.1715, + "loss_text": 1.4711, + "ppl": 5.1686, + "step": 8603 + }, + { + "epoch": 0.05, + "global_step": 8604, + "learning_rate": 0.0004649248747913189, + "loss": 1.6715, + "loss_base2": 2.4115, + "loss_pixel": 0.1714, + "loss_text": 1.5001, + "ppl": 5.3201, + "step": 8604 + }, + { + "epoch": 0.05, + "global_step": 8605, + "learning_rate": 0.00046492070116861434, + "loss": 1.6511, + "loss_base2": 2.382, + "loss_pixel": 0.1717, + "loss_text": 1.4794, + "ppl": 5.2127, + "step": 8605 + }, + { + "epoch": 0.05, + "global_step": 8606, + "learning_rate": 0.00046491652754590985, + "loss": 1.6532, + "loss_base2": 2.3851, + "loss_pixel": 0.1748, + "loss_text": 1.4785, + "ppl": 5.2237, + "step": 8606 + }, + { + "epoch": 0.05, + "global_step": 8607, + "learning_rate": 0.00046491235392320536, + "loss": 1.5039, + "loss_base2": 2.1697, + "loss_pixel": 0.1748, + "loss_text": 1.3291, + "ppl": 4.4992, + "step": 8607 + }, + { + "epoch": 0.05, + "global_step": 8608, + "learning_rate": 0.00046490818030050086, + "loss": 1.4485, + "loss_base2": 2.0897, + "loss_pixel": 0.1743, + "loss_text": 1.2742, + "ppl": 4.2567, + "step": 8608 + }, + { + "epoch": 0.05, + "global_step": 8609, + "learning_rate": 0.0004649040066777963, + "loss": 1.4515, + "loss_base2": 2.0941, + "loss_pixel": 0.1734, + "loss_text": 1.2782, + "ppl": 4.2695, + "step": 8609 + }, + { + "epoch": 0.05, + "global_step": 8610, + "learning_rate": 0.0004648998330550918, + "loss": 1.445, + "loss_base2": 2.0847, + "loss_pixel": 0.1729, + "loss_text": 1.2721, + "ppl": 4.2419, + "step": 8610 + }, + { + "epoch": 0.05, + "global_step": 8611, + "learning_rate": 0.00046489565943238733, + "loss": 1.4225, + "loss_base2": 2.0522, + "loss_pixel": 0.1722, + "loss_text": 1.2503, + "ppl": 4.1475, + "step": 8611 + }, + { + "epoch": 0.05, + "global_step": 8612, + "learning_rate": 0.00046489148580968284, + "loss": 1.458, + "loss_base2": 2.1034, + "loss_pixel": 0.1724, + "loss_text": 1.2855, + "ppl": 4.2974, + "step": 8612 + }, + { + "epoch": 0.05, + "global_step": 8613, + "learning_rate": 0.00046488731218697835, + "loss": 1.4564, + "loss_base2": 2.1011, + "loss_pixel": 0.1728, + "loss_text": 1.2837, + "ppl": 4.2905, + "step": 8613 + }, + { + "epoch": 0.05, + "global_step": 8614, + "learning_rate": 0.0004648831385642738, + "loss": 1.4394, + "loss_base2": 2.0766, + "loss_pixel": 0.1762, + "loss_text": 1.2632, + "ppl": 4.2182, + "step": 8614 + }, + { + "epoch": 0.05, + "global_step": 8615, + "learning_rate": 0.0004648789649415693, + "loss": 1.522, + "loss_base2": 2.1958, + "loss_pixel": 0.177, + "loss_text": 1.345, + "ppl": 4.5814, + "step": 8615 + }, + { + "epoch": 0.05, + "global_step": 8616, + "learning_rate": 0.0004648747913188648, + "loss": 1.6782, + "loss_base2": 2.4211, + "loss_pixel": 0.1748, + "loss_text": 1.5034, + "ppl": 5.3559, + "step": 8616 + }, + { + "epoch": 0.05, + "global_step": 8617, + "learning_rate": 0.00046487061769616027, + "loss": 1.6702, + "loss_base2": 2.4096, + "loss_pixel": 0.1733, + "loss_text": 1.4969, + "ppl": 5.3132, + "step": 8617 + }, + { + "epoch": 0.05, + "global_step": 8618, + "learning_rate": 0.0004648664440734558, + "loss": 1.646, + "loss_base2": 2.3747, + "loss_pixel": 0.1749, + "loss_text": 1.4711, + "ppl": 5.1862, + "step": 8618 + }, + { + "epoch": 0.05, + "global_step": 8619, + "learning_rate": 0.0004648622704507512, + "loss": 1.6705, + "loss_base2": 2.41, + "loss_pixel": 0.1748, + "loss_text": 1.4957, + "ppl": 5.3148, + "step": 8619 + }, + { + "epoch": 0.05, + "global_step": 8620, + "learning_rate": 0.00046485809682804673, + "loss": 1.6699, + "loss_base2": 2.4092, + "loss_pixel": 0.1722, + "loss_text": 1.4977, + "ppl": 5.3116, + "step": 8620 + }, + { + "epoch": 0.05, + "global_step": 8621, + "learning_rate": 0.00046485392320534224, + "loss": 1.6514, + "loss_base2": 2.3825, + "loss_pixel": 0.1743, + "loss_text": 1.4771, + "ppl": 5.2143, + "step": 8621 + }, + { + "epoch": 0.05, + "global_step": 8622, + "learning_rate": 0.00046484974958263775, + "loss": 1.6529, + "loss_base2": 2.3846, + "loss_pixel": 0.1726, + "loss_text": 1.4803, + "ppl": 5.2221, + "step": 8622 + }, + { + "epoch": 0.05, + "global_step": 8623, + "learning_rate": 0.0004648455759599332, + "loss": 1.6575, + "loss_base2": 2.3913, + "loss_pixel": 0.1722, + "loss_text": 1.4854, + "ppl": 5.2462, + "step": 8623 + }, + { + "epoch": 0.05, + "global_step": 8624, + "learning_rate": 0.0004648414023372287, + "loss": 1.6401, + "loss_base2": 2.3662, + "loss_pixel": 0.1715, + "loss_text": 1.4686, + "ppl": 5.1557, + "step": 8624 + }, + { + "epoch": 0.05, + "global_step": 8625, + "learning_rate": 0.0004648372287145242, + "loss": 1.6478, + "loss_base2": 2.3773, + "loss_pixel": 0.172, + "loss_text": 1.4757, + "ppl": 5.1955, + "step": 8625 + }, + { + "epoch": 0.05, + "global_step": 8626, + "learning_rate": 0.0004648330550918197, + "loss": 1.6586, + "loss_base2": 2.3929, + "loss_pixel": 0.1715, + "loss_text": 1.4871, + "ppl": 5.252, + "step": 8626 + }, + { + "epoch": 0.05, + "global_step": 8627, + "learning_rate": 0.00046482888146911523, + "loss": 1.6563, + "loss_base2": 2.3895, + "loss_pixel": 0.1708, + "loss_text": 1.4856, + "ppl": 5.2399, + "step": 8627 + }, + { + "epoch": 0.05, + "global_step": 8628, + "learning_rate": 0.0004648247078464107, + "loss": 1.6507, + "loss_base2": 2.3815, + "loss_pixel": 0.1714, + "loss_text": 1.4794, + "ppl": 5.2106, + "step": 8628 + }, + { + "epoch": 0.05, + "global_step": 8629, + "learning_rate": 0.0004648205342237062, + "loss": 1.6432, + "loss_base2": 2.3706, + "loss_pixel": 0.1725, + "loss_text": 1.4707, + "ppl": 5.1717, + "step": 8629 + }, + { + "epoch": 0.05, + "global_step": 8630, + "learning_rate": 0.0004648163606010017, + "loss": 1.6464, + "loss_base2": 2.3753, + "loss_pixel": 0.1725, + "loss_text": 1.4739, + "ppl": 5.1883, + "step": 8630 + }, + { + "epoch": 0.05, + "global_step": 8631, + "learning_rate": 0.0004648121869782972, + "loss": 1.6461, + "loss_base2": 2.3748, + "loss_pixel": 0.173, + "loss_text": 1.4732, + "ppl": 5.1867, + "step": 8631 + }, + { + "epoch": 0.05, + "global_step": 8632, + "learning_rate": 0.00046480801335559266, + "loss": 1.6386, + "loss_base2": 2.364, + "loss_pixel": 0.1714, + "loss_text": 1.4673, + "ppl": 5.148, + "step": 8632 + }, + { + "epoch": 0.05, + "global_step": 8633, + "learning_rate": 0.00046480383973288817, + "loss": 1.6412, + "loss_base2": 2.3678, + "loss_pixel": 0.1712, + "loss_text": 1.4699, + "ppl": 5.1614, + "step": 8633 + }, + { + "epoch": 0.05, + "global_step": 8634, + "learning_rate": 0.0004647996661101837, + "loss": 1.6459, + "loss_base2": 2.3745, + "loss_pixel": 0.1697, + "loss_text": 1.4762, + "ppl": 5.1857, + "step": 8634 + }, + { + "epoch": 0.05, + "global_step": 8635, + "learning_rate": 0.0004647954924874792, + "loss": 1.6524, + "loss_base2": 2.3839, + "loss_pixel": 0.1701, + "loss_text": 1.4823, + "ppl": 5.2195, + "step": 8635 + }, + { + "epoch": 0.05, + "global_step": 8636, + "learning_rate": 0.00046479131886477463, + "loss": 1.6575, + "loss_base2": 2.3913, + "loss_pixel": 0.1711, + "loss_text": 1.4864, + "ppl": 5.2462, + "step": 8636 + }, + { + "epoch": 0.05, + "global_step": 8637, + "learning_rate": 0.0004647871452420701, + "loss": 1.645, + "loss_base2": 2.3732, + "loss_pixel": 0.1717, + "loss_text": 1.4732, + "ppl": 5.181, + "step": 8637 + }, + { + "epoch": 0.05, + "global_step": 8638, + "learning_rate": 0.0004647829716193656, + "loss": 1.6415, + "loss_base2": 2.3682, + "loss_pixel": 0.1708, + "loss_text": 1.4707, + "ppl": 5.1629, + "step": 8638 + }, + { + "epoch": 0.05, + "global_step": 8639, + "learning_rate": 0.0004647787979966611, + "loss": 1.6423, + "loss_base2": 2.3693, + "loss_pixel": 0.1704, + "loss_text": 1.4718, + "ppl": 5.167, + "step": 8639 + }, + { + "epoch": 0.05, + "global_step": 8640, + "learning_rate": 0.0004647746243739566, + "loss": 1.5635, + "loss_base2": 2.2557, + "loss_pixel": 0.1703, + "loss_text": 1.3932, + "ppl": 4.7755, + "step": 8640 + }, + { + "epoch": 0.05, + "global_step": 8641, + "learning_rate": 0.00046477045075125206, + "loss": 1.4631, + "loss_base2": 2.1108, + "loss_pixel": 0.17, + "loss_text": 1.2932, + "ppl": 4.3193, + "step": 8641 + }, + { + "epoch": 0.05, + "global_step": 8642, + "learning_rate": 0.00046476627712854757, + "loss": 1.4448, + "loss_base2": 2.0844, + "loss_pixel": 0.1703, + "loss_text": 1.2745, + "ppl": 4.241, + "step": 8642 + }, + { + "epoch": 0.05, + "global_step": 8643, + "learning_rate": 0.0004647621035058431, + "loss": 1.4353, + "loss_base2": 2.0707, + "loss_pixel": 0.1712, + "loss_text": 1.2641, + "ppl": 4.2009, + "step": 8643 + }, + { + "epoch": 0.05, + "global_step": 8644, + "learning_rate": 0.0004647579298831386, + "loss": 1.4703, + "loss_base2": 2.1212, + "loss_pixel": 0.1707, + "loss_text": 1.2996, + "ppl": 4.3505, + "step": 8644 + }, + { + "epoch": 0.05, + "global_step": 8645, + "learning_rate": 0.0004647537562604341, + "loss": 1.4374, + "loss_base2": 2.0737, + "loss_pixel": 0.1699, + "loss_text": 1.2675, + "ppl": 4.2097, + "step": 8645 + }, + { + "epoch": 0.05, + "global_step": 8646, + "learning_rate": 0.00046474958263772954, + "loss": 1.4336, + "loss_base2": 2.0682, + "loss_pixel": 0.171, + "loss_text": 1.2626, + "ppl": 4.1938, + "step": 8646 + }, + { + "epoch": 0.05, + "global_step": 8647, + "learning_rate": 0.00046474540901502505, + "loss": 1.4561, + "loss_base2": 2.1007, + "loss_pixel": 0.1718, + "loss_text": 1.2843, + "ppl": 4.2892, + "step": 8647 + }, + { + "epoch": 0.05, + "global_step": 8648, + "learning_rate": 0.00046474123539232056, + "loss": 1.4152, + "loss_base2": 2.0417, + "loss_pixel": 0.1713, + "loss_text": 1.2438, + "ppl": 4.1173, + "step": 8648 + }, + { + "epoch": 0.05, + "global_step": 8649, + "learning_rate": 0.00046473706176961607, + "loss": 1.4205, + "loss_base2": 2.0493, + "loss_pixel": 0.1719, + "loss_text": 1.2486, + "ppl": 4.1392, + "step": 8649 + }, + { + "epoch": 0.05, + "global_step": 8650, + "learning_rate": 0.0004647328881469115, + "loss": 1.4296, + "loss_base2": 2.0625, + "loss_pixel": 0.1708, + "loss_text": 1.2588, + "ppl": 4.177, + "step": 8650 + }, + { + "epoch": 0.05, + "global_step": 8651, + "learning_rate": 0.000464728714524207, + "loss": 1.4204, + "loss_base2": 2.0492, + "loss_pixel": 0.1702, + "loss_text": 1.2501, + "ppl": 4.1388, + "step": 8651 + }, + { + "epoch": 0.05, + "global_step": 8652, + "learning_rate": 0.00046472454090150253, + "loss": 1.4496, + "loss_base2": 2.0913, + "loss_pixel": 0.1712, + "loss_text": 1.2784, + "ppl": 4.2614, + "step": 8652 + }, + { + "epoch": 0.05, + "global_step": 8653, + "learning_rate": 0.00046472036727879804, + "loss": 1.43, + "loss_base2": 2.0631, + "loss_pixel": 0.1711, + "loss_text": 1.2589, + "ppl": 4.1787, + "step": 8653 + }, + { + "epoch": 0.05, + "global_step": 8654, + "learning_rate": 0.00046471619365609355, + "loss": 1.4371, + "loss_base2": 2.0733, + "loss_pixel": 0.1702, + "loss_text": 1.2669, + "ppl": 4.2085, + "step": 8654 + }, + { + "epoch": 0.05, + "global_step": 8655, + "learning_rate": 0.00046471202003338895, + "loss": 1.421, + "loss_base2": 2.0501, + "loss_pixel": 0.1706, + "loss_text": 1.2504, + "ppl": 4.1413, + "step": 8655 + }, + { + "epoch": 0.05, + "global_step": 8656, + "learning_rate": 0.00046470784641068446, + "loss": 1.414, + "loss_base2": 2.04, + "loss_pixel": 0.1699, + "loss_text": 1.2441, + "ppl": 4.1124, + "step": 8656 + }, + { + "epoch": 0.05, + "global_step": 8657, + "learning_rate": 0.00046470367278797996, + "loss": 1.4352, + "loss_base2": 2.0706, + "loss_pixel": 0.1712, + "loss_text": 1.264, + "ppl": 4.2005, + "step": 8657 + }, + { + "epoch": 0.05, + "global_step": 8658, + "learning_rate": 0.00046469949916527547, + "loss": 1.4046, + "loss_base2": 2.0264, + "loss_pixel": 0.1705, + "loss_text": 1.234, + "ppl": 4.0739, + "step": 8658 + }, + { + "epoch": 0.05, + "global_step": 8659, + "learning_rate": 0.0004646953255425709, + "loss": 1.4183, + "loss_base2": 2.0462, + "loss_pixel": 0.1705, + "loss_text": 1.2478, + "ppl": 4.1301, + "step": 8659 + }, + { + "epoch": 0.05, + "global_step": 8660, + "learning_rate": 0.00046469115191986643, + "loss": 1.4454, + "loss_base2": 2.0853, + "loss_pixel": 0.1703, + "loss_text": 1.2751, + "ppl": 4.2435, + "step": 8660 + }, + { + "epoch": 0.05, + "global_step": 8661, + "learning_rate": 0.00046468697829716194, + "loss": 1.4268, + "loss_base2": 2.0584, + "loss_pixel": 0.1694, + "loss_text": 1.2573, + "ppl": 4.1653, + "step": 8661 + }, + { + "epoch": 0.05, + "global_step": 8662, + "learning_rate": 0.00046468280467445744, + "loss": 1.4381, + "loss_base2": 2.0747, + "loss_pixel": 0.1699, + "loss_text": 1.2682, + "ppl": 4.2127, + "step": 8662 + }, + { + "epoch": 0.05, + "global_step": 8663, + "learning_rate": 0.00046467863105175295, + "loss": 1.431, + "loss_base2": 2.0645, + "loss_pixel": 0.1713, + "loss_text": 1.2598, + "ppl": 4.1829, + "step": 8663 + }, + { + "epoch": 0.05, + "global_step": 8664, + "learning_rate": 0.0004646744574290484, + "loss": 1.4206, + "loss_base2": 2.0495, + "loss_pixel": 0.1687, + "loss_text": 1.2519, + "ppl": 4.1396, + "step": 8664 + }, + { + "epoch": 0.05, + "global_step": 8665, + "learning_rate": 0.0004646702838063439, + "loss": 1.409, + "loss_base2": 2.0328, + "loss_pixel": 0.169, + "loss_text": 1.24, + "ppl": 4.0919, + "step": 8665 + }, + { + "epoch": 0.05, + "global_step": 8666, + "learning_rate": 0.0004646661101836394, + "loss": 1.4336, + "loss_base2": 2.0682, + "loss_pixel": 0.1713, + "loss_text": 1.2624, + "ppl": 4.1938, + "step": 8666 + }, + { + "epoch": 0.05, + "global_step": 8667, + "learning_rate": 0.00046466193656093493, + "loss": 1.4381, + "loss_base2": 2.0747, + "loss_pixel": 0.1702, + "loss_text": 1.2679, + "ppl": 4.2127, + "step": 8667 + }, + { + "epoch": 0.05, + "global_step": 8668, + "learning_rate": 0.0004646577629382304, + "loss": 1.4147, + "loss_base2": 2.041, + "loss_pixel": 0.1693, + "loss_text": 1.2455, + "ppl": 4.1153, + "step": 8668 + }, + { + "epoch": 0.05, + "global_step": 8669, + "learning_rate": 0.0004646535893155259, + "loss": 1.4235, + "loss_base2": 2.0537, + "loss_pixel": 0.169, + "loss_text": 1.2544, + "ppl": 4.1516, + "step": 8669 + }, + { + "epoch": 0.05, + "global_step": 8670, + "learning_rate": 0.0004646494156928214, + "loss": 1.4297, + "loss_base2": 2.0626, + "loss_pixel": 0.1699, + "loss_text": 1.2598, + "ppl": 4.1774, + "step": 8670 + }, + { + "epoch": 0.05, + "global_step": 8671, + "learning_rate": 0.0004646452420701169, + "loss": 1.4339, + "loss_base2": 2.0687, + "loss_pixel": 0.1689, + "loss_text": 1.2651, + "ppl": 4.195, + "step": 8671 + }, + { + "epoch": 0.05, + "global_step": 8672, + "learning_rate": 0.0004646410684474124, + "loss": 1.4451, + "loss_base2": 2.0848, + "loss_pixel": 0.1699, + "loss_text": 1.2752, + "ppl": 4.2423, + "step": 8672 + }, + { + "epoch": 0.05, + "global_step": 8673, + "learning_rate": 0.0004646368948247078, + "loss": 1.4093, + "loss_base2": 2.0332, + "loss_pixel": 0.1694, + "loss_text": 1.2399, + "ppl": 4.0931, + "step": 8673 + }, + { + "epoch": 0.05, + "global_step": 8674, + "learning_rate": 0.0004646327212020033, + "loss": 1.43, + "loss_base2": 2.0631, + "loss_pixel": 0.1696, + "loss_text": 1.2604, + "ppl": 4.1787, + "step": 8674 + }, + { + "epoch": 0.05, + "global_step": 8675, + "learning_rate": 0.0004646285475792988, + "loss": 1.4353, + "loss_base2": 2.0707, + "loss_pixel": 0.1696, + "loss_text": 1.2657, + "ppl": 4.2009, + "step": 8675 + }, + { + "epoch": 0.05, + "global_step": 8676, + "learning_rate": 0.00046462437395659433, + "loss": 1.4315, + "loss_base2": 2.0652, + "loss_pixel": 0.1676, + "loss_text": 1.2638, + "ppl": 4.185, + "step": 8676 + }, + { + "epoch": 0.05, + "global_step": 8677, + "learning_rate": 0.00046462020033388984, + "loss": 1.4205, + "loss_base2": 2.0493, + "loss_pixel": 0.1713, + "loss_text": 1.2492, + "ppl": 4.1392, + "step": 8677 + }, + { + "epoch": 0.05, + "global_step": 8678, + "learning_rate": 0.0004646160267111853, + "loss": 1.4253, + "loss_base2": 2.0563, + "loss_pixel": 0.1682, + "loss_text": 1.2571, + "ppl": 4.1591, + "step": 8678 + }, + { + "epoch": 0.05, + "global_step": 8679, + "learning_rate": 0.0004646118530884808, + "loss": 1.4182, + "loss_base2": 2.046, + "loss_pixel": 0.1682, + "loss_text": 1.25, + "ppl": 4.1297, + "step": 8679 + }, + { + "epoch": 0.05, + "global_step": 8680, + "learning_rate": 0.0004646076794657763, + "loss": 1.5827, + "loss_base2": 2.2834, + "loss_pixel": 0.1675, + "loss_text": 1.4152, + "ppl": 4.8681, + "step": 8680 + }, + { + "epoch": 0.05, + "global_step": 8681, + "learning_rate": 0.0004646035058430718, + "loss": 1.6736, + "loss_base2": 2.4145, + "loss_pixel": 0.1699, + "loss_text": 1.5037, + "ppl": 5.3313, + "step": 8681 + }, + { + "epoch": 0.05, + "global_step": 8682, + "learning_rate": 0.00046459933222036727, + "loss": 1.6707, + "loss_base2": 2.4103, + "loss_pixel": 0.167, + "loss_text": 1.5036, + "ppl": 5.3159, + "step": 8682 + }, + { + "epoch": 0.05, + "global_step": 8683, + "learning_rate": 0.0004645951585976628, + "loss": 1.6585, + "loss_base2": 2.3927, + "loss_pixel": 0.1677, + "loss_text": 1.4908, + "ppl": 5.2514, + "step": 8683 + }, + { + "epoch": 0.05, + "global_step": 8684, + "learning_rate": 0.0004645909849749583, + "loss": 1.6486, + "loss_base2": 2.3784, + "loss_pixel": 0.1678, + "loss_text": 1.4808, + "ppl": 5.1997, + "step": 8684 + }, + { + "epoch": 0.05, + "global_step": 8685, + "learning_rate": 0.0004645868113522538, + "loss": 1.6665, + "loss_base2": 2.4043, + "loss_pixel": 0.1681, + "loss_text": 1.4984, + "ppl": 5.2936, + "step": 8685 + }, + { + "epoch": 0.05, + "global_step": 8686, + "learning_rate": 0.0004645826377295493, + "loss": 1.652, + "loss_base2": 2.3833, + "loss_pixel": 0.1694, + "loss_text": 1.4825, + "ppl": 5.2174, + "step": 8686 + }, + { + "epoch": 0.05, + "global_step": 8687, + "learning_rate": 0.00046457846410684475, + "loss": 1.6512, + "loss_base2": 2.3822, + "loss_pixel": 0.1693, + "loss_text": 1.4819, + "ppl": 5.2132, + "step": 8687 + }, + { + "epoch": 0.05, + "global_step": 8688, + "learning_rate": 0.00046457429048414026, + "loss": 1.6281, + "loss_base2": 2.3489, + "loss_pixel": 0.1701, + "loss_text": 1.4581, + "ppl": 5.0942, + "step": 8688 + }, + { + "epoch": 0.05, + "global_step": 8689, + "learning_rate": 0.00046457011686143576, + "loss": 1.656, + "loss_base2": 2.3891, + "loss_pixel": 0.1682, + "loss_text": 1.4878, + "ppl": 5.2383, + "step": 8689 + }, + { + "epoch": 0.05, + "global_step": 8690, + "learning_rate": 0.00046456594323873127, + "loss": 1.6472, + "loss_base2": 2.3764, + "loss_pixel": 0.1706, + "loss_text": 1.4766, + "ppl": 5.1924, + "step": 8690 + }, + { + "epoch": 0.05, + "global_step": 8691, + "learning_rate": 0.0004645617696160267, + "loss": 1.6512, + "loss_base2": 2.3822, + "loss_pixel": 0.1702, + "loss_text": 1.481, + "ppl": 5.2132, + "step": 8691 + }, + { + "epoch": 0.05, + "global_step": 8692, + "learning_rate": 0.0004645575959933222, + "loss": 1.6492, + "loss_base2": 2.3793, + "loss_pixel": 0.1694, + "loss_text": 1.4798, + "ppl": 5.2028, + "step": 8692 + }, + { + "epoch": 0.05, + "global_step": 8693, + "learning_rate": 0.0004645534223706177, + "loss": 1.6717, + "loss_base2": 2.4118, + "loss_pixel": 0.1684, + "loss_text": 1.5032, + "ppl": 5.3212, + "step": 8693 + }, + { + "epoch": 0.05, + "global_step": 8694, + "learning_rate": 0.0004645492487479132, + "loss": 1.6548, + "loss_base2": 2.3874, + "loss_pixel": 0.1693, + "loss_text": 1.4854, + "ppl": 5.232, + "step": 8694 + }, + { + "epoch": 0.05, + "global_step": 8695, + "learning_rate": 0.0004645450751252087, + "loss": 1.6522, + "loss_base2": 2.3836, + "loss_pixel": 0.1685, + "loss_text": 1.4837, + "ppl": 5.2184, + "step": 8695 + }, + { + "epoch": 0.05, + "global_step": 8696, + "learning_rate": 0.00046454090150250415, + "loss": 1.6557, + "loss_base2": 2.3887, + "loss_pixel": 0.1694, + "loss_text": 1.4864, + "ppl": 5.2367, + "step": 8696 + }, + { + "epoch": 0.05, + "global_step": 8697, + "learning_rate": 0.00046453672787979966, + "loss": 1.6446, + "loss_base2": 2.3727, + "loss_pixel": 0.1707, + "loss_text": 1.4739, + "ppl": 5.1789, + "step": 8697 + }, + { + "epoch": 0.05, + "global_step": 8698, + "learning_rate": 0.00046453255425709517, + "loss": 1.6507, + "loss_base2": 2.3815, + "loss_pixel": 0.1699, + "loss_text": 1.4808, + "ppl": 5.2106, + "step": 8698 + }, + { + "epoch": 0.05, + "global_step": 8699, + "learning_rate": 0.0004645283806343907, + "loss": 1.6559, + "loss_base2": 2.389, + "loss_pixel": 0.1692, + "loss_text": 1.4866, + "ppl": 5.2378, + "step": 8699 + }, + { + "epoch": 0.05, + "global_step": 8700, + "learning_rate": 0.0004645242070116861, + "loss": 1.6403, + "loss_base2": 2.3665, + "loss_pixel": 0.1695, + "loss_text": 1.4708, + "ppl": 5.1567, + "step": 8700 + }, + { + "epoch": 0.05, + "global_step": 8701, + "learning_rate": 0.00046452003338898163, + "loss": 1.6394, + "loss_base2": 2.3652, + "loss_pixel": 0.1685, + "loss_text": 1.4709, + "ppl": 5.1521, + "step": 8701 + }, + { + "epoch": 0.05, + "global_step": 8702, + "learning_rate": 0.00046451585976627714, + "loss": 1.6365, + "loss_base2": 2.361, + "loss_pixel": 0.1682, + "loss_text": 1.4682, + "ppl": 5.1372, + "step": 8702 + }, + { + "epoch": 0.05, + "global_step": 8703, + "learning_rate": 0.00046451168614357265, + "loss": 1.6623, + "loss_base2": 2.3982, + "loss_pixel": 0.1701, + "loss_text": 1.4922, + "ppl": 5.2714, + "step": 8703 + }, + { + "epoch": 0.05, + "global_step": 8704, + "learning_rate": 0.00046450751252086816, + "loss": 1.6463, + "loss_base2": 2.3751, + "loss_pixel": 0.1695, + "loss_text": 1.4768, + "ppl": 5.1877, + "step": 8704 + }, + { + "epoch": 0.05, + "global_step": 8705, + "learning_rate": 0.0004645033388981636, + "loss": 1.665, + "loss_base2": 2.4021, + "loss_pixel": 0.1689, + "loss_text": 1.4961, + "ppl": 5.2857, + "step": 8705 + }, + { + "epoch": 0.05, + "global_step": 8706, + "learning_rate": 0.0004644991652754591, + "loss": 1.6433, + "loss_base2": 2.3708, + "loss_pixel": 0.169, + "loss_text": 1.4743, + "ppl": 5.1722, + "step": 8706 + }, + { + "epoch": 0.05, + "global_step": 8707, + "learning_rate": 0.0004644949916527546, + "loss": 1.644, + "loss_base2": 2.3718, + "loss_pixel": 0.1688, + "loss_text": 1.4753, + "ppl": 5.1758, + "step": 8707 + }, + { + "epoch": 0.05, + "global_step": 8708, + "learning_rate": 0.00046449081803005013, + "loss": 1.641, + "loss_base2": 2.3675, + "loss_pixel": 0.1685, + "loss_text": 1.4724, + "ppl": 5.1603, + "step": 8708 + }, + { + "epoch": 0.05, + "global_step": 8709, + "learning_rate": 0.0004644866444073456, + "loss": 1.6444, + "loss_base2": 2.3724, + "loss_pixel": 0.1685, + "loss_text": 1.4759, + "ppl": 5.1779, + "step": 8709 + }, + { + "epoch": 0.05, + "global_step": 8710, + "learning_rate": 0.0004644824707846411, + "loss": 1.6488, + "loss_base2": 2.3787, + "loss_pixel": 0.1689, + "loss_text": 1.4799, + "ppl": 5.2007, + "step": 8710 + }, + { + "epoch": 0.05, + "global_step": 8711, + "learning_rate": 0.00046447829716193654, + "loss": 1.6296, + "loss_base2": 2.351, + "loss_pixel": 0.1682, + "loss_text": 1.4614, + "ppl": 5.1018, + "step": 8711 + }, + { + "epoch": 0.05, + "global_step": 8712, + "learning_rate": 0.00046447412353923205, + "loss": 1.6587, + "loss_base2": 2.393, + "loss_pixel": 0.1672, + "loss_text": 1.4915, + "ppl": 5.2525, + "step": 8712 + }, + { + "epoch": 0.05, + "global_step": 8713, + "learning_rate": 0.00046446994991652756, + "loss": 1.6307, + "loss_base2": 2.3526, + "loss_pixel": 0.1697, + "loss_text": 1.461, + "ppl": 5.1074, + "step": 8713 + }, + { + "epoch": 0.05, + "global_step": 8714, + "learning_rate": 0.000464465776293823, + "loss": 1.6334, + "loss_base2": 2.3565, + "loss_pixel": 0.1687, + "loss_text": 1.4648, + "ppl": 5.1213, + "step": 8714 + }, + { + "epoch": 0.05, + "global_step": 8715, + "learning_rate": 0.0004644616026711185, + "loss": 1.6381, + "loss_base2": 2.3633, + "loss_pixel": 0.1673, + "loss_text": 1.4707, + "ppl": 5.1454, + "step": 8715 + }, + { + "epoch": 0.05, + "global_step": 8716, + "learning_rate": 0.000464457429048414, + "loss": 1.6604, + "loss_base2": 2.3955, + "loss_pixel": 0.1682, + "loss_text": 1.4922, + "ppl": 5.2614, + "step": 8716 + }, + { + "epoch": 0.05, + "global_step": 8717, + "learning_rate": 0.00046445325542570953, + "loss": 1.6491, + "loss_base2": 2.3791, + "loss_pixel": 0.1689, + "loss_text": 1.4802, + "ppl": 5.2023, + "step": 8717 + }, + { + "epoch": 0.05, + "global_step": 8718, + "learning_rate": 0.000464449081803005, + "loss": 1.6522, + "loss_base2": 2.3836, + "loss_pixel": 0.1683, + "loss_text": 1.4839, + "ppl": 5.2184, + "step": 8718 + }, + { + "epoch": 0.05, + "global_step": 8719, + "learning_rate": 0.0004644449081803005, + "loss": 1.6451, + "loss_base2": 2.3734, + "loss_pixel": 0.1695, + "loss_text": 1.4756, + "ppl": 5.1815, + "step": 8719 + }, + { + "epoch": 0.05, + "global_step": 8720, + "learning_rate": 0.000464440734557596, + "loss": 1.643, + "loss_base2": 2.3703, + "loss_pixel": 0.1689, + "loss_text": 1.4741, + "ppl": 5.1707, + "step": 8720 + }, + { + "epoch": 0.05, + "global_step": 8721, + "learning_rate": 0.0004644365609348915, + "loss": 1.6456, + "loss_base2": 2.3741, + "loss_pixel": 0.1686, + "loss_text": 1.477, + "ppl": 5.1841, + "step": 8721 + }, + { + "epoch": 0.05, + "global_step": 8722, + "learning_rate": 0.000464432387312187, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.1671, + "loss_text": 1.4593, + "ppl": 5.0855, + "step": 8722 + }, + { + "epoch": 0.05, + "global_step": 8723, + "learning_rate": 0.00046442821368948247, + "loss": 1.6404, + "loss_base2": 2.3666, + "loss_pixel": 0.1668, + "loss_text": 1.4736, + "ppl": 5.1572, + "step": 8723 + }, + { + "epoch": 0.05, + "global_step": 8724, + "learning_rate": 0.000464424040066778, + "loss": 1.6222, + "loss_base2": 2.3403, + "loss_pixel": 0.1676, + "loss_text": 1.4547, + "ppl": 5.0642, + "step": 8724 + }, + { + "epoch": 0.05, + "global_step": 8725, + "learning_rate": 0.0004644198664440735, + "loss": 1.5826, + "loss_base2": 2.2832, + "loss_pixel": 0.1685, + "loss_text": 1.414, + "ppl": 4.8676, + "step": 8725 + }, + { + "epoch": 0.05, + "global_step": 8726, + "learning_rate": 0.000464415692821369, + "loss": 1.6607, + "loss_base2": 2.3959, + "loss_pixel": 0.1674, + "loss_text": 1.4933, + "ppl": 5.263, + "step": 8726 + }, + { + "epoch": 0.05, + "global_step": 8727, + "learning_rate": 0.00046441151919866444, + "loss": 1.6424, + "loss_base2": 2.3695, + "loss_pixel": 0.1696, + "loss_text": 1.4728, + "ppl": 5.1676, + "step": 8727 + }, + { + "epoch": 0.05, + "global_step": 8728, + "learning_rate": 0.00046440734557595995, + "loss": 1.6412, + "loss_base2": 2.3678, + "loss_pixel": 0.1669, + "loss_text": 1.4743, + "ppl": 5.1614, + "step": 8728 + }, + { + "epoch": 0.05, + "global_step": 8729, + "learning_rate": 0.0004644031719532554, + "loss": 1.6591, + "loss_base2": 2.3936, + "loss_pixel": 0.168, + "loss_text": 1.4911, + "ppl": 5.2546, + "step": 8729 + }, + { + "epoch": 0.05, + "global_step": 8730, + "learning_rate": 0.0004643989983305509, + "loss": 1.6489, + "loss_base2": 2.3789, + "loss_pixel": 0.1682, + "loss_text": 1.4806, + "ppl": 5.2013, + "step": 8730 + }, + { + "epoch": 0.05, + "global_step": 8731, + "learning_rate": 0.0004643948247078464, + "loss": 1.6532, + "loss_base2": 2.3851, + "loss_pixel": 0.1681, + "loss_text": 1.485, + "ppl": 5.2237, + "step": 8731 + }, + { + "epoch": 0.05, + "global_step": 8732, + "learning_rate": 0.0004643906510851419, + "loss": 1.6414, + "loss_base2": 2.368, + "loss_pixel": 0.1698, + "loss_text": 1.4716, + "ppl": 5.1624, + "step": 8732 + }, + { + "epoch": 0.05, + "global_step": 8733, + "learning_rate": 0.0004643864774624374, + "loss": 1.65, + "loss_base2": 2.3804, + "loss_pixel": 0.1675, + "loss_text": 1.4825, + "ppl": 5.207, + "step": 8733 + }, + { + "epoch": 0.05, + "global_step": 8734, + "learning_rate": 0.0004643823038397329, + "loss": 1.6416, + "loss_base2": 2.3683, + "loss_pixel": 0.1676, + "loss_text": 1.474, + "ppl": 5.1634, + "step": 8734 + }, + { + "epoch": 0.05, + "global_step": 8735, + "learning_rate": 0.0004643781302170284, + "loss": 1.6479, + "loss_base2": 2.3774, + "loss_pixel": 0.1675, + "loss_text": 1.4803, + "ppl": 5.1961, + "step": 8735 + }, + { + "epoch": 0.05, + "global_step": 8736, + "learning_rate": 0.0004643739565943239, + "loss": 1.6159, + "loss_base2": 2.3313, + "loss_pixel": 0.1676, + "loss_text": 1.4483, + "ppl": 5.0324, + "step": 8736 + }, + { + "epoch": 0.05, + "global_step": 8737, + "learning_rate": 0.00046436978297161936, + "loss": 1.648, + "loss_base2": 2.3776, + "loss_pixel": 0.1674, + "loss_text": 1.4806, + "ppl": 5.1966, + "step": 8737 + }, + { + "epoch": 0.05, + "global_step": 8738, + "learning_rate": 0.00046436560934891486, + "loss": 1.6486, + "loss_base2": 2.3784, + "loss_pixel": 0.1673, + "loss_text": 1.4813, + "ppl": 5.1997, + "step": 8738 + }, + { + "epoch": 0.05, + "global_step": 8739, + "learning_rate": 0.00046436143572621037, + "loss": 1.6343, + "loss_base2": 2.3578, + "loss_pixel": 0.1674, + "loss_text": 1.4669, + "ppl": 5.1259, + "step": 8739 + }, + { + "epoch": 0.05, + "global_step": 8740, + "learning_rate": 0.0004643572621035059, + "loss": 1.6481, + "loss_base2": 2.3777, + "loss_pixel": 0.1681, + "loss_text": 1.48, + "ppl": 5.1971, + "step": 8740 + }, + { + "epoch": 0.05, + "global_step": 8741, + "learning_rate": 0.00046435308848080133, + "loss": 1.6443, + "loss_base2": 2.3722, + "loss_pixel": 0.168, + "loss_text": 1.4764, + "ppl": 5.1774, + "step": 8741 + }, + { + "epoch": 0.05, + "global_step": 8742, + "learning_rate": 0.00046434891485809684, + "loss": 1.6265, + "loss_base2": 2.3465, + "loss_pixel": 0.1684, + "loss_text": 1.4581, + "ppl": 5.086, + "step": 8742 + }, + { + "epoch": 0.05, + "global_step": 8743, + "learning_rate": 0.00046434474123539235, + "loss": 1.6491, + "loss_base2": 2.3791, + "loss_pixel": 0.1676, + "loss_text": 1.4814, + "ppl": 5.2023, + "step": 8743 + }, + { + "epoch": 0.05, + "global_step": 8744, + "learning_rate": 0.00046434056761268785, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.1681, + "loss_text": 1.4648, + "ppl": 5.1187, + "step": 8744 + }, + { + "epoch": 0.05, + "global_step": 8745, + "learning_rate": 0.00046433639398998336, + "loss": 1.6544, + "loss_base2": 2.3868, + "loss_pixel": 0.1679, + "loss_text": 1.4864, + "ppl": 5.2299, + "step": 8745 + }, + { + "epoch": 0.05, + "global_step": 8746, + "learning_rate": 0.0004643322203672788, + "loss": 1.6543, + "loss_base2": 2.3867, + "loss_pixel": 0.1689, + "loss_text": 1.4854, + "ppl": 5.2294, + "step": 8746 + }, + { + "epoch": 0.05, + "global_step": 8747, + "learning_rate": 0.0004643280467445743, + "loss": 1.6328, + "loss_base2": 2.3556, + "loss_pixel": 0.1685, + "loss_text": 1.4643, + "ppl": 5.1182, + "step": 8747 + }, + { + "epoch": 0.05, + "global_step": 8748, + "learning_rate": 0.0004643238731218698, + "loss": 1.4283, + "loss_base2": 2.0606, + "loss_pixel": 0.1693, + "loss_text": 1.259, + "ppl": 4.1716, + "step": 8748 + }, + { + "epoch": 0.05, + "global_step": 8749, + "learning_rate": 0.0004643196994991653, + "loss": 1.4277, + "loss_base2": 2.0597, + "loss_pixel": 0.1689, + "loss_text": 1.2588, + "ppl": 4.1691, + "step": 8749 + }, + { + "epoch": 0.05, + "global_step": 8750, + "learning_rate": 0.00046431552587646073, + "loss": 1.4247, + "loss_base2": 2.0554, + "loss_pixel": 0.1672, + "loss_text": 1.2575, + "ppl": 4.1566, + "step": 8750 + }, + { + "epoch": 0.05, + "global_step": 8751, + "learning_rate": 0.00046431135225375624, + "loss": 1.4289, + "loss_base2": 2.0615, + "loss_pixel": 0.169, + "loss_text": 1.2599, + "ppl": 4.1741, + "step": 8751 + }, + { + "epoch": 0.05, + "global_step": 8752, + "learning_rate": 0.00046430717863105175, + "loss": 1.4468, + "loss_base2": 2.0873, + "loss_pixel": 0.1672, + "loss_text": 1.2795, + "ppl": 4.2495, + "step": 8752 + }, + { + "epoch": 0.05, + "global_step": 8753, + "learning_rate": 0.00046430300500834726, + "loss": 1.4326, + "loss_base2": 2.0668, + "loss_pixel": 0.1705, + "loss_text": 1.2621, + "ppl": 4.1896, + "step": 8753 + }, + { + "epoch": 0.05, + "global_step": 8754, + "learning_rate": 0.00046429883138564276, + "loss": 1.4309, + "loss_base2": 2.0644, + "loss_pixel": 0.1677, + "loss_text": 1.2632, + "ppl": 4.1825, + "step": 8754 + }, + { + "epoch": 0.05, + "global_step": 8755, + "learning_rate": 0.0004642946577629382, + "loss": 1.411, + "loss_base2": 2.0356, + "loss_pixel": 0.1668, + "loss_text": 1.2442, + "ppl": 4.1001, + "step": 8755 + }, + { + "epoch": 0.05, + "global_step": 8756, + "learning_rate": 0.0004642904841402337, + "loss": 1.5902, + "loss_base2": 2.2942, + "loss_pixel": 0.1678, + "loss_text": 1.4223, + "ppl": 4.9047, + "step": 8756 + }, + { + "epoch": 0.05, + "global_step": 8757, + "learning_rate": 0.00046428631051752923, + "loss": 1.6525, + "loss_base2": 2.3841, + "loss_pixel": 0.1674, + "loss_text": 1.4851, + "ppl": 5.22, + "step": 8757 + }, + { + "epoch": 0.05, + "global_step": 8758, + "learning_rate": 0.00046428213689482474, + "loss": 1.642, + "loss_base2": 2.3689, + "loss_pixel": 0.1675, + "loss_text": 1.4746, + "ppl": 5.1655, + "step": 8758 + }, + { + "epoch": 0.05, + "global_step": 8759, + "learning_rate": 0.0004642779632721202, + "loss": 1.6525, + "loss_base2": 2.3841, + "loss_pixel": 0.1668, + "loss_text": 1.4857, + "ppl": 5.22, + "step": 8759 + }, + { + "epoch": 0.05, + "global_step": 8760, + "learning_rate": 0.0004642737896494157, + "loss": 1.6474, + "loss_base2": 2.3767, + "loss_pixel": 0.1686, + "loss_text": 1.4789, + "ppl": 5.1935, + "step": 8760 + }, + { + "epoch": 0.05, + "global_step": 8761, + "learning_rate": 0.0004642696160267112, + "loss": 1.6602, + "loss_base2": 2.3952, + "loss_pixel": 0.1668, + "loss_text": 1.4934, + "ppl": 5.2604, + "step": 8761 + }, + { + "epoch": 0.05, + "global_step": 8762, + "learning_rate": 0.0004642654424040067, + "loss": 1.6325, + "loss_base2": 2.3552, + "loss_pixel": 0.1677, + "loss_text": 1.4648, + "ppl": 5.1167, + "step": 8762 + }, + { + "epoch": 0.05, + "global_step": 8763, + "learning_rate": 0.0004642612687813022, + "loss": 1.6288, + "loss_base2": 2.3499, + "loss_pixel": 0.1668, + "loss_text": 1.462, + "ppl": 5.0978, + "step": 8763 + }, + { + "epoch": 0.05, + "global_step": 8764, + "learning_rate": 0.0004642570951585977, + "loss": 1.6186, + "loss_base2": 2.3351, + "loss_pixel": 0.1673, + "loss_text": 1.4513, + "ppl": 5.046, + "step": 8764 + }, + { + "epoch": 0.05, + "global_step": 8765, + "learning_rate": 0.0004642529215358932, + "loss": 1.6492, + "loss_base2": 2.3793, + "loss_pixel": 0.1688, + "loss_text": 1.4804, + "ppl": 5.2028, + "step": 8765 + }, + { + "epoch": 0.05, + "global_step": 8766, + "learning_rate": 0.0004642487479131887, + "loss": 1.6533, + "loss_base2": 2.3852, + "loss_pixel": 0.1684, + "loss_text": 1.4849, + "ppl": 5.2242, + "step": 8766 + }, + { + "epoch": 0.05, + "global_step": 8767, + "learning_rate": 0.00046424457429048414, + "loss": 1.6595, + "loss_base2": 2.3942, + "loss_pixel": 0.1704, + "loss_text": 1.489, + "ppl": 5.2567, + "step": 8767 + }, + { + "epoch": 0.05, + "global_step": 8768, + "learning_rate": 0.0004642404006677796, + "loss": 1.6379, + "loss_base2": 2.363, + "loss_pixel": 0.1682, + "loss_text": 1.4697, + "ppl": 5.1444, + "step": 8768 + }, + { + "epoch": 0.05, + "global_step": 8769, + "learning_rate": 0.0004642362270450751, + "loss": 1.6551, + "loss_base2": 2.3878, + "loss_pixel": 0.1694, + "loss_text": 1.4856, + "ppl": 5.2336, + "step": 8769 + }, + { + "epoch": 0.05, + "global_step": 8770, + "learning_rate": 0.0004642320534223706, + "loss": 1.6488, + "loss_base2": 2.3787, + "loss_pixel": 0.1664, + "loss_text": 1.4823, + "ppl": 5.2007, + "step": 8770 + }, + { + "epoch": 0.05, + "global_step": 8771, + "learning_rate": 0.0004642278797996661, + "loss": 1.6469, + "loss_base2": 2.376, + "loss_pixel": 0.1679, + "loss_text": 1.479, + "ppl": 5.1909, + "step": 8771 + }, + { + "epoch": 0.05, + "global_step": 8772, + "learning_rate": 0.0004642237061769616, + "loss": 1.6393, + "loss_base2": 2.365, + "loss_pixel": 0.1674, + "loss_text": 1.472, + "ppl": 5.1516, + "step": 8772 + }, + { + "epoch": 0.05, + "global_step": 8773, + "learning_rate": 0.0004642195325542571, + "loss": 1.6578, + "loss_base2": 2.3917, + "loss_pixel": 0.1677, + "loss_text": 1.4901, + "ppl": 5.2478, + "step": 8773 + }, + { + "epoch": 0.05, + "global_step": 8774, + "learning_rate": 0.0004642153589315526, + "loss": 1.633, + "loss_base2": 2.3559, + "loss_pixel": 0.1672, + "loss_text": 1.4658, + "ppl": 5.1192, + "step": 8774 + }, + { + "epoch": 0.05, + "global_step": 8775, + "learning_rate": 0.0004642111853088481, + "loss": 1.6622, + "loss_base2": 2.398, + "loss_pixel": 0.1668, + "loss_text": 1.4954, + "ppl": 5.2709, + "step": 8775 + }, + { + "epoch": 0.05, + "global_step": 8776, + "learning_rate": 0.0004642070116861436, + "loss": 1.6451, + "loss_base2": 2.3734, + "loss_pixel": 0.1673, + "loss_text": 1.4778, + "ppl": 5.1815, + "step": 8776 + }, + { + "epoch": 0.05, + "global_step": 8777, + "learning_rate": 0.00046420283806343905, + "loss": 1.6483, + "loss_base2": 2.378, + "loss_pixel": 0.1677, + "loss_text": 1.4806, + "ppl": 5.1981, + "step": 8777 + }, + { + "epoch": 0.05, + "global_step": 8778, + "learning_rate": 0.00046419866444073456, + "loss": 1.639, + "loss_base2": 2.3646, + "loss_pixel": 0.1678, + "loss_text": 1.4712, + "ppl": 5.15, + "step": 8778 + }, + { + "epoch": 0.05, + "global_step": 8779, + "learning_rate": 0.00046419449081803007, + "loss": 1.6496, + "loss_base2": 2.3799, + "loss_pixel": 0.1674, + "loss_text": 1.4822, + "ppl": 5.2049, + "step": 8779 + }, + { + "epoch": 0.05, + "global_step": 8780, + "learning_rate": 0.0004641903171953256, + "loss": 1.601, + "loss_base2": 2.3098, + "loss_pixel": 0.1684, + "loss_text": 1.4327, + "ppl": 4.958, + "step": 8780 + }, + { + "epoch": 0.05, + "global_step": 8781, + "learning_rate": 0.0004641861435726211, + "loss": 1.6171, + "loss_base2": 2.333, + "loss_pixel": 0.1678, + "loss_text": 1.4494, + "ppl": 5.0385, + "step": 8781 + }, + { + "epoch": 0.05, + "global_step": 8782, + "learning_rate": 0.00046418196994991653, + "loss": 1.648, + "loss_base2": 2.3776, + "loss_pixel": 0.1665, + "loss_text": 1.4815, + "ppl": 5.1966, + "step": 8782 + }, + { + "epoch": 0.05, + "global_step": 8783, + "learning_rate": 0.00046417779632721204, + "loss": 1.6554, + "loss_base2": 2.3882, + "loss_pixel": 0.1679, + "loss_text": 1.4875, + "ppl": 5.2352, + "step": 8783 + }, + { + "epoch": 0.05, + "global_step": 8784, + "learning_rate": 0.00046417362270450755, + "loss": 1.6507, + "loss_base2": 2.3815, + "loss_pixel": 0.1671, + "loss_text": 1.4836, + "ppl": 5.2106, + "step": 8784 + }, + { + "epoch": 0.05, + "global_step": 8785, + "learning_rate": 0.00046416944908180306, + "loss": 1.6542, + "loss_base2": 2.3865, + "loss_pixel": 0.1671, + "loss_text": 1.4871, + "ppl": 5.2289, + "step": 8785 + }, + { + "epoch": 0.05, + "global_step": 8786, + "learning_rate": 0.00046416527545909846, + "loss": 1.6316, + "loss_base2": 2.3539, + "loss_pixel": 0.1667, + "loss_text": 1.4649, + "ppl": 5.112, + "step": 8786 + }, + { + "epoch": 0.05, + "global_step": 8787, + "learning_rate": 0.00046416110183639396, + "loss": 1.622, + "loss_base2": 2.3401, + "loss_pixel": 0.1689, + "loss_text": 1.4531, + "ppl": 5.0632, + "step": 8787 + }, + { + "epoch": 0.05, + "global_step": 8788, + "learning_rate": 0.00046415692821368947, + "loss": 1.6489, + "loss_base2": 2.3789, + "loss_pixel": 0.1669, + "loss_text": 1.482, + "ppl": 5.2013, + "step": 8788 + }, + { + "epoch": 0.05, + "global_step": 8789, + "learning_rate": 0.000464152754590985, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.1663, + "loss_text": 1.4733, + "ppl": 5.1531, + "step": 8789 + }, + { + "epoch": 0.05, + "global_step": 8790, + "learning_rate": 0.0004641485809682805, + "loss": 1.6483, + "loss_base2": 2.378, + "loss_pixel": 0.1675, + "loss_text": 1.4808, + "ppl": 5.1981, + "step": 8790 + }, + { + "epoch": 0.05, + "global_step": 8791, + "learning_rate": 0.00046414440734557594, + "loss": 1.6341, + "loss_base2": 2.3575, + "loss_pixel": 0.1674, + "loss_text": 1.4667, + "ppl": 5.1248, + "step": 8791 + }, + { + "epoch": 0.05, + "global_step": 8792, + "learning_rate": 0.00046414023372287144, + "loss": 1.6525, + "loss_base2": 2.3841, + "loss_pixel": 0.1671, + "loss_text": 1.4854, + "ppl": 5.22, + "step": 8792 + }, + { + "epoch": 0.05, + "global_step": 8793, + "learning_rate": 0.00046413606010016695, + "loss": 1.6372, + "loss_base2": 2.362, + "loss_pixel": 0.1676, + "loss_text": 1.4695, + "ppl": 5.1408, + "step": 8793 + }, + { + "epoch": 0.05, + "global_step": 8794, + "learning_rate": 0.00046413188647746246, + "loss": 1.6453, + "loss_base2": 2.3737, + "loss_pixel": 0.1664, + "loss_text": 1.4789, + "ppl": 5.1826, + "step": 8794 + }, + { + "epoch": 0.05, + "global_step": 8795, + "learning_rate": 0.00046412771285475797, + "loss": 1.6666, + "loss_base2": 2.4044, + "loss_pixel": 0.1672, + "loss_text": 1.4993, + "ppl": 5.2941, + "step": 8795 + }, + { + "epoch": 0.05, + "global_step": 8796, + "learning_rate": 0.0004641235392320534, + "loss": 1.6524, + "loss_base2": 2.3839, + "loss_pixel": 0.1676, + "loss_text": 1.4847, + "ppl": 5.2195, + "step": 8796 + }, + { + "epoch": 0.05, + "global_step": 8797, + "learning_rate": 0.0004641193656093489, + "loss": 1.6304, + "loss_base2": 2.3522, + "loss_pixel": 0.1649, + "loss_text": 1.4655, + "ppl": 5.1059, + "step": 8797 + }, + { + "epoch": 0.05, + "global_step": 8798, + "learning_rate": 0.00046411519198664443, + "loss": 1.648, + "loss_base2": 2.3776, + "loss_pixel": 0.1673, + "loss_text": 1.4807, + "ppl": 5.1966, + "step": 8798 + }, + { + "epoch": 0.05, + "global_step": 8799, + "learning_rate": 0.00046411101836393994, + "loss": 1.6644, + "loss_base2": 2.4012, + "loss_pixel": 0.1679, + "loss_text": 1.4965, + "ppl": 5.2825, + "step": 8799 + }, + { + "epoch": 0.05, + "global_step": 8800, + "learning_rate": 0.0004641068447412354, + "loss": 1.6402, + "loss_base2": 2.3663, + "loss_pixel": 0.1667, + "loss_text": 1.4735, + "ppl": 5.1562, + "step": 8800 + }, + { + "epoch": 0.05, + "global_step": 8801, + "learning_rate": 0.0004641026711185309, + "loss": 1.6343, + "loss_base2": 2.3578, + "loss_pixel": 0.1667, + "loss_text": 1.4676, + "ppl": 5.1259, + "step": 8801 + }, + { + "epoch": 0.05, + "global_step": 8802, + "learning_rate": 0.0004640984974958264, + "loss": 1.6229, + "loss_base2": 2.3413, + "loss_pixel": 0.167, + "loss_text": 1.4559, + "ppl": 5.0678, + "step": 8802 + }, + { + "epoch": 0.05, + "global_step": 8803, + "learning_rate": 0.0004640943238731219, + "loss": 1.4349, + "loss_base2": 2.0701, + "loss_pixel": 0.1682, + "loss_text": 1.2667, + "ppl": 4.1992, + "step": 8803 + }, + { + "epoch": 0.05, + "global_step": 8804, + "learning_rate": 0.0004640901502504174, + "loss": 1.4622, + "loss_base2": 2.1095, + "loss_pixel": 0.1669, + "loss_text": 1.2953, + "ppl": 4.3154, + "step": 8804 + }, + { + "epoch": 0.05, + "global_step": 8805, + "learning_rate": 0.0004640859766277128, + "loss": 1.4251, + "loss_base2": 2.056, + "loss_pixel": 0.1671, + "loss_text": 1.258, + "ppl": 4.1583, + "step": 8805 + }, + { + "epoch": 0.05, + "global_step": 8806, + "learning_rate": 0.00046408180300500833, + "loss": 1.4442, + "loss_base2": 2.0835, + "loss_pixel": 0.167, + "loss_text": 1.2772, + "ppl": 4.2385, + "step": 8806 + }, + { + "epoch": 0.05, + "global_step": 8807, + "learning_rate": 0.00046407762938230384, + "loss": 1.4066, + "loss_base2": 2.0293, + "loss_pixel": 0.1664, + "loss_text": 1.2402, + "ppl": 4.0821, + "step": 8807 + }, + { + "epoch": 0.05, + "global_step": 8808, + "learning_rate": 0.00046407345575959934, + "loss": 1.4369, + "loss_base2": 2.073, + "loss_pixel": 0.1661, + "loss_text": 1.2708, + "ppl": 4.2076, + "step": 8808 + }, + { + "epoch": 0.05, + "global_step": 8809, + "learning_rate": 0.0004640692821368948, + "loss": 1.4284, + "loss_base2": 2.0607, + "loss_pixel": 0.1668, + "loss_text": 1.2616, + "ppl": 4.172, + "step": 8809 + }, + { + "epoch": 0.05, + "global_step": 8810, + "learning_rate": 0.0004640651085141903, + "loss": 1.4263, + "loss_base2": 2.0577, + "loss_pixel": 0.1679, + "loss_text": 1.2584, + "ppl": 4.1633, + "step": 8810 + }, + { + "epoch": 0.05, + "global_step": 8811, + "learning_rate": 0.0004640609348914858, + "loss": 1.5038, + "loss_base2": 2.1695, + "loss_pixel": 0.1667, + "loss_text": 1.3371, + "ppl": 4.4988, + "step": 8811 + }, + { + "epoch": 0.05, + "global_step": 8812, + "learning_rate": 0.0004640567612687813, + "loss": 1.665, + "loss_base2": 2.4021, + "loss_pixel": 0.1668, + "loss_text": 1.4982, + "ppl": 5.2857, + "step": 8812 + }, + { + "epoch": 0.05, + "global_step": 8813, + "learning_rate": 0.00046405258764607683, + "loss": 1.6662, + "loss_base2": 2.4038, + "loss_pixel": 0.1668, + "loss_text": 1.4994, + "ppl": 5.292, + "step": 8813 + }, + { + "epoch": 0.05, + "global_step": 8814, + "learning_rate": 0.0004640484140233723, + "loss": 1.6834, + "loss_base2": 2.4286, + "loss_pixel": 0.1682, + "loss_text": 1.5152, + "ppl": 5.3838, + "step": 8814 + }, + { + "epoch": 0.05, + "global_step": 8815, + "learning_rate": 0.0004640442404006678, + "loss": 1.6562, + "loss_base2": 2.3894, + "loss_pixel": 0.1685, + "loss_text": 1.4877, + "ppl": 5.2394, + "step": 8815 + }, + { + "epoch": 0.05, + "global_step": 8816, + "learning_rate": 0.0004640400667779633, + "loss": 1.6559, + "loss_base2": 2.389, + "loss_pixel": 0.1685, + "loss_text": 1.4874, + "ppl": 5.2378, + "step": 8816 + }, + { + "epoch": 0.05, + "global_step": 8817, + "learning_rate": 0.0004640358931552588, + "loss": 1.6639, + "loss_base2": 2.4005, + "loss_pixel": 0.1676, + "loss_text": 1.4963, + "ppl": 5.2799, + "step": 8817 + }, + { + "epoch": 0.05, + "global_step": 8818, + "learning_rate": 0.00046403171953255426, + "loss": 1.6474, + "loss_base2": 2.3767, + "loss_pixel": 0.1666, + "loss_text": 1.4807, + "ppl": 5.1935, + "step": 8818 + }, + { + "epoch": 0.05, + "global_step": 8819, + "learning_rate": 0.00046402754590984976, + "loss": 1.6474, + "loss_base2": 2.3767, + "loss_pixel": 0.1666, + "loss_text": 1.4808, + "ppl": 5.1935, + "step": 8819 + }, + { + "epoch": 0.05, + "global_step": 8820, + "learning_rate": 0.00046402337228714527, + "loss": 1.656, + "loss_base2": 2.3891, + "loss_pixel": 0.1675, + "loss_text": 1.4885, + "ppl": 5.2383, + "step": 8820 + }, + { + "epoch": 0.05, + "global_step": 8821, + "learning_rate": 0.0004640191986644408, + "loss": 1.6614, + "loss_base2": 2.3969, + "loss_pixel": 0.1669, + "loss_text": 1.4944, + "ppl": 5.2667, + "step": 8821 + }, + { + "epoch": 0.05, + "global_step": 8822, + "learning_rate": 0.0004640150250417363, + "loss": 1.639, + "loss_base2": 2.3646, + "loss_pixel": 0.1678, + "loss_text": 1.4712, + "ppl": 5.15, + "step": 8822 + }, + { + "epoch": 0.05, + "global_step": 8823, + "learning_rate": 0.0004640108514190317, + "loss": 1.6377, + "loss_base2": 2.3627, + "loss_pixel": 0.168, + "loss_text": 1.4697, + "ppl": 5.1433, + "step": 8823 + }, + { + "epoch": 0.05, + "global_step": 8824, + "learning_rate": 0.0004640066777963272, + "loss": 1.6616, + "loss_base2": 2.3972, + "loss_pixel": 0.1677, + "loss_text": 1.4939, + "ppl": 5.2677, + "step": 8824 + }, + { + "epoch": 0.05, + "global_step": 8825, + "learning_rate": 0.0004640025041736227, + "loss": 1.6567, + "loss_base2": 2.3901, + "loss_pixel": 0.1679, + "loss_text": 1.4887, + "ppl": 5.242, + "step": 8825 + }, + { + "epoch": 0.05, + "global_step": 8826, + "learning_rate": 0.0004639983305509182, + "loss": 1.6436, + "loss_base2": 2.3712, + "loss_pixel": 0.1663, + "loss_text": 1.4773, + "ppl": 5.1738, + "step": 8826 + }, + { + "epoch": 0.05, + "global_step": 8827, + "learning_rate": 0.00046399415692821366, + "loss": 1.6579, + "loss_base2": 2.3918, + "loss_pixel": 0.1654, + "loss_text": 1.4925, + "ppl": 5.2483, + "step": 8827 + }, + { + "epoch": 0.05, + "global_step": 8828, + "learning_rate": 0.00046398998330550917, + "loss": 1.6374, + "loss_base2": 2.3623, + "loss_pixel": 0.1679, + "loss_text": 1.4695, + "ppl": 5.1418, + "step": 8828 + }, + { + "epoch": 0.05, + "global_step": 8829, + "learning_rate": 0.0004639858096828047, + "loss": 1.6182, + "loss_base2": 2.3346, + "loss_pixel": 0.1658, + "loss_text": 1.4524, + "ppl": 5.044, + "step": 8829 + }, + { + "epoch": 0.05, + "global_step": 8830, + "learning_rate": 0.0004639816360601002, + "loss": 1.6427, + "loss_base2": 2.3699, + "loss_pixel": 0.1657, + "loss_text": 1.477, + "ppl": 5.1691, + "step": 8830 + }, + { + "epoch": 0.05, + "global_step": 8831, + "learning_rate": 0.0004639774624373957, + "loss": 1.6627, + "loss_base2": 2.3988, + "loss_pixel": 0.1671, + "loss_text": 1.4956, + "ppl": 5.2735, + "step": 8831 + }, + { + "epoch": 0.05, + "global_step": 8832, + "learning_rate": 0.00046397328881469114, + "loss": 1.6458, + "loss_base2": 2.3744, + "loss_pixel": 0.1673, + "loss_text": 1.4785, + "ppl": 5.1852, + "step": 8832 + }, + { + "epoch": 0.05, + "global_step": 8833, + "learning_rate": 0.00046396911519198665, + "loss": 1.5605, + "loss_base2": 2.2513, + "loss_pixel": 0.1683, + "loss_text": 1.3922, + "ppl": 4.7612, + "step": 8833 + }, + { + "epoch": 0.05, + "global_step": 8834, + "learning_rate": 0.00046396494156928216, + "loss": 1.4467, + "loss_base2": 2.0871, + "loss_pixel": 0.166, + "loss_text": 1.2808, + "ppl": 4.2491, + "step": 8834 + }, + { + "epoch": 0.05, + "global_step": 8835, + "learning_rate": 0.00046396076794657766, + "loss": 1.4383, + "loss_base2": 2.075, + "loss_pixel": 0.1672, + "loss_text": 1.2711, + "ppl": 4.2135, + "step": 8835 + }, + { + "epoch": 0.05, + "global_step": 8836, + "learning_rate": 0.0004639565943238731, + "loss": 1.4467, + "loss_base2": 2.0871, + "loss_pixel": 0.1668, + "loss_text": 1.2799, + "ppl": 4.2491, + "step": 8836 + }, + { + "epoch": 0.05, + "global_step": 8837, + "learning_rate": 0.0004639524207011686, + "loss": 1.4266, + "loss_base2": 2.0581, + "loss_pixel": 0.1654, + "loss_text": 1.2612, + "ppl": 4.1645, + "step": 8837 + }, + { + "epoch": 0.05, + "global_step": 8838, + "learning_rate": 0.00046394824707846413, + "loss": 1.4249, + "loss_base2": 2.0557, + "loss_pixel": 0.1664, + "loss_text": 1.2585, + "ppl": 4.1574, + "step": 8838 + }, + { + "epoch": 0.05, + "global_step": 8839, + "learning_rate": 0.00046394407345575964, + "loss": 1.4331, + "loss_base2": 2.0675, + "loss_pixel": 0.1673, + "loss_text": 1.2657, + "ppl": 4.1917, + "step": 8839 + }, + { + "epoch": 0.05, + "global_step": 8840, + "learning_rate": 0.00046393989983305515, + "loss": 1.4242, + "loss_base2": 2.0547, + "loss_pixel": 0.1666, + "loss_text": 1.2576, + "ppl": 4.1545, + "step": 8840 + }, + { + "epoch": 0.05, + "global_step": 8841, + "learning_rate": 0.0004639357262103506, + "loss": 1.5561, + "loss_base2": 2.245, + "loss_pixel": 0.1666, + "loss_text": 1.3895, + "ppl": 4.7403, + "step": 8841 + }, + { + "epoch": 0.05, + "global_step": 8842, + "learning_rate": 0.00046393155258764605, + "loss": 1.6781, + "loss_base2": 2.421, + "loss_pixel": 0.1682, + "loss_text": 1.5099, + "ppl": 5.3554, + "step": 8842 + }, + { + "epoch": 0.05, + "global_step": 8843, + "learning_rate": 0.00046392737896494156, + "loss": 1.6701, + "loss_base2": 2.4094, + "loss_pixel": 0.1657, + "loss_text": 1.5043, + "ppl": 5.3127, + "step": 8843 + }, + { + "epoch": 0.05, + "global_step": 8844, + "learning_rate": 0.00046392320534223707, + "loss": 1.6458, + "loss_base2": 2.3744, + "loss_pixel": 0.1673, + "loss_text": 1.4785, + "ppl": 5.1852, + "step": 8844 + }, + { + "epoch": 0.05, + "global_step": 8845, + "learning_rate": 0.0004639190317195326, + "loss": 1.6439, + "loss_base2": 2.3716, + "loss_pixel": 0.1666, + "loss_text": 1.4773, + "ppl": 5.1753, + "step": 8845 + }, + { + "epoch": 0.05, + "global_step": 8846, + "learning_rate": 0.000463914858096828, + "loss": 1.6626, + "loss_base2": 2.3986, + "loss_pixel": 0.1666, + "loss_text": 1.4961, + "ppl": 5.273, + "step": 8846 + }, + { + "epoch": 0.05, + "global_step": 8847, + "learning_rate": 0.00046391068447412353, + "loss": 1.657, + "loss_base2": 2.3905, + "loss_pixel": 0.1633, + "loss_text": 1.4937, + "ppl": 5.2436, + "step": 8847 + }, + { + "epoch": 0.05, + "global_step": 8848, + "learning_rate": 0.00046390651085141904, + "loss": 1.6545, + "loss_base2": 2.3869, + "loss_pixel": 0.164, + "loss_text": 1.4905, + "ppl": 5.2305, + "step": 8848 + }, + { + "epoch": 0.05, + "global_step": 8849, + "learning_rate": 0.00046390233722871455, + "loss": 1.6455, + "loss_base2": 2.374, + "loss_pixel": 0.1643, + "loss_text": 1.4812, + "ppl": 5.1836, + "step": 8849 + }, + { + "epoch": 0.05, + "global_step": 8850, + "learning_rate": 0.00046389816360601, + "loss": 1.6577, + "loss_base2": 2.3916, + "loss_pixel": 0.1635, + "loss_text": 1.4943, + "ppl": 5.2472, + "step": 8850 + }, + { + "epoch": 0.05, + "global_step": 8851, + "learning_rate": 0.0004638939899833055, + "loss": 1.6428, + "loss_base2": 2.3701, + "loss_pixel": 0.1634, + "loss_text": 1.4794, + "ppl": 5.1696, + "step": 8851 + }, + { + "epoch": 0.05, + "global_step": 8852, + "learning_rate": 0.000463889816360601, + "loss": 1.6483, + "loss_base2": 2.378, + "loss_pixel": 0.1605, + "loss_text": 1.4878, + "ppl": 5.1981, + "step": 8852 + }, + { + "epoch": 0.05, + "global_step": 8853, + "learning_rate": 0.0004638856427378965, + "loss": 1.6418, + "loss_base2": 2.3686, + "loss_pixel": 0.1611, + "loss_text": 1.4807, + "ppl": 5.1645, + "step": 8853 + }, + { + "epoch": 0.05, + "global_step": 8854, + "learning_rate": 0.00046388146911519203, + "loss": 1.6296, + "loss_base2": 2.351, + "loss_pixel": 0.1582, + "loss_text": 1.4715, + "ppl": 5.1018, + "step": 8854 + }, + { + "epoch": 0.05, + "global_step": 8855, + "learning_rate": 0.0004638772954924875, + "loss": 1.6293, + "loss_base2": 2.3506, + "loss_pixel": 0.1611, + "loss_text": 1.4682, + "ppl": 5.1003, + "step": 8855 + }, + { + "epoch": 0.05, + "global_step": 8856, + "learning_rate": 0.000463873121869783, + "loss": 1.6365, + "loss_base2": 2.361, + "loss_pixel": 0.1603, + "loss_text": 1.4762, + "ppl": 5.1372, + "step": 8856 + }, + { + "epoch": 0.05, + "global_step": 8857, + "learning_rate": 0.0004638689482470785, + "loss": 1.6348, + "loss_base2": 2.3585, + "loss_pixel": 0.1605, + "loss_text": 1.4743, + "ppl": 5.1284, + "step": 8857 + }, + { + "epoch": 0.05, + "global_step": 8858, + "learning_rate": 0.000463864774624374, + "loss": 1.6467, + "loss_base2": 2.3757, + "loss_pixel": 0.1598, + "loss_text": 1.4869, + "ppl": 5.1898, + "step": 8858 + }, + { + "epoch": 0.05, + "global_step": 8859, + "learning_rate": 0.00046386060100166946, + "loss": 1.6434, + "loss_base2": 2.3709, + "loss_pixel": 0.1608, + "loss_text": 1.4827, + "ppl": 5.1727, + "step": 8859 + }, + { + "epoch": 0.05, + "global_step": 8860, + "learning_rate": 0.00046385642737896497, + "loss": 1.6314, + "loss_base2": 2.3536, + "loss_pixel": 0.1608, + "loss_text": 1.4706, + "ppl": 5.111, + "step": 8860 + }, + { + "epoch": 0.05, + "global_step": 8861, + "learning_rate": 0.0004638522537562604, + "loss": 1.6179, + "loss_base2": 2.3341, + "loss_pixel": 0.163, + "loss_text": 1.4549, + "ppl": 5.0425, + "step": 8861 + }, + { + "epoch": 0.05, + "global_step": 8862, + "learning_rate": 0.0004638480801335559, + "loss": 1.6456, + "loss_base2": 2.3741, + "loss_pixel": 0.1591, + "loss_text": 1.4865, + "ppl": 5.1841, + "step": 8862 + }, + { + "epoch": 0.05, + "global_step": 8863, + "learning_rate": 0.00046384390651085143, + "loss": 1.6354, + "loss_base2": 2.3594, + "loss_pixel": 0.1593, + "loss_text": 1.4761, + "ppl": 5.1315, + "step": 8863 + }, + { + "epoch": 0.05, + "global_step": 8864, + "learning_rate": 0.0004638397328881469, + "loss": 1.6378, + "loss_base2": 2.3628, + "loss_pixel": 0.1582, + "loss_text": 1.4796, + "ppl": 5.1438, + "step": 8864 + }, + { + "epoch": 0.05, + "global_step": 8865, + "learning_rate": 0.0004638355592654424, + "loss": 1.6301, + "loss_base2": 2.3517, + "loss_pixel": 0.1582, + "loss_text": 1.4719, + "ppl": 5.1044, + "step": 8865 + }, + { + "epoch": 0.05, + "global_step": 8866, + "learning_rate": 0.0004638313856427379, + "loss": 1.6315, + "loss_base2": 2.3538, + "loss_pixel": 0.1586, + "loss_text": 1.4729, + "ppl": 5.1115, + "step": 8866 + }, + { + "epoch": 0.05, + "global_step": 8867, + "learning_rate": 0.0004638272120200334, + "loss": 1.6231, + "loss_base2": 2.3416, + "loss_pixel": 0.1572, + "loss_text": 1.4658, + "ppl": 5.0688, + "step": 8867 + }, + { + "epoch": 0.05, + "global_step": 8868, + "learning_rate": 0.00046382303839732886, + "loss": 1.622, + "loss_base2": 2.3401, + "loss_pixel": 0.1599, + "loss_text": 1.4622, + "ppl": 5.0632, + "step": 8868 + }, + { + "epoch": 0.05, + "global_step": 8869, + "learning_rate": 0.00046381886477462437, + "loss": 1.6289, + "loss_base2": 2.35, + "loss_pixel": 0.1598, + "loss_text": 1.4692, + "ppl": 5.0983, + "step": 8869 + }, + { + "epoch": 0.05, + "global_step": 8870, + "learning_rate": 0.0004638146911519199, + "loss": 1.6502, + "loss_base2": 2.3807, + "loss_pixel": 0.1586, + "loss_text": 1.4916, + "ppl": 5.208, + "step": 8870 + }, + { + "epoch": 0.05, + "global_step": 8871, + "learning_rate": 0.0004638105175292154, + "loss": 1.6261, + "loss_base2": 2.346, + "loss_pixel": 0.1573, + "loss_text": 1.4688, + "ppl": 5.084, + "step": 8871 + }, + { + "epoch": 0.05, + "global_step": 8872, + "learning_rate": 0.0004638063439065109, + "loss": 1.6276, + "loss_base2": 2.3481, + "loss_pixel": 0.1576, + "loss_text": 1.47, + "ppl": 5.0916, + "step": 8872 + }, + { + "epoch": 0.05, + "global_step": 8873, + "learning_rate": 0.00046380217028380634, + "loss": 1.6522, + "loss_base2": 2.3836, + "loss_pixel": 0.1575, + "loss_text": 1.4947, + "ppl": 5.2184, + "step": 8873 + }, + { + "epoch": 0.05, + "global_step": 8874, + "learning_rate": 0.00046379799666110185, + "loss": 1.6077, + "loss_base2": 2.3194, + "loss_pixel": 0.1581, + "loss_text": 1.4496, + "ppl": 4.9913, + "step": 8874 + }, + { + "epoch": 0.05, + "global_step": 8875, + "learning_rate": 0.00046379382303839736, + "loss": 1.6253, + "loss_base2": 2.3448, + "loss_pixel": 0.1595, + "loss_text": 1.4659, + "ppl": 5.0799, + "step": 8875 + }, + { + "epoch": 0.05, + "global_step": 8876, + "learning_rate": 0.00046378964941569287, + "loss": 1.6282, + "loss_base2": 2.349, + "loss_pixel": 0.16, + "loss_text": 1.4682, + "ppl": 5.0947, + "step": 8876 + }, + { + "epoch": 0.05, + "global_step": 8877, + "learning_rate": 0.0004637854757929883, + "loss": 1.6386, + "loss_base2": 2.364, + "loss_pixel": 0.1579, + "loss_text": 1.4807, + "ppl": 5.148, + "step": 8877 + }, + { + "epoch": 0.05, + "global_step": 8878, + "learning_rate": 0.00046378130217028383, + "loss": 1.6497, + "loss_base2": 2.38, + "loss_pixel": 0.1601, + "loss_text": 1.4896, + "ppl": 5.2054, + "step": 8878 + }, + { + "epoch": 0.05, + "global_step": 8879, + "learning_rate": 0.00046377712854757933, + "loss": 1.63, + "loss_base2": 2.3516, + "loss_pixel": 0.1575, + "loss_text": 1.4724, + "ppl": 5.1039, + "step": 8879 + }, + { + "epoch": 0.05, + "global_step": 8880, + "learning_rate": 0.0004637729549248748, + "loss": 1.611, + "loss_base2": 2.3242, + "loss_pixel": 0.1557, + "loss_text": 1.4553, + "ppl": 5.0078, + "step": 8880 + }, + { + "epoch": 0.05, + "global_step": 8881, + "learning_rate": 0.0004637687813021703, + "loss": 1.6342, + "loss_base2": 2.3577, + "loss_pixel": 0.1565, + "loss_text": 1.4776, + "ppl": 5.1254, + "step": 8881 + }, + { + "epoch": 0.05, + "global_step": 8882, + "learning_rate": 0.00046376460767946575, + "loss": 1.6266, + "loss_base2": 2.3467, + "loss_pixel": 0.1578, + "loss_text": 1.4689, + "ppl": 5.0866, + "step": 8882 + }, + { + "epoch": 0.05, + "global_step": 8883, + "learning_rate": 0.00046376043405676126, + "loss": 1.6314, + "loss_base2": 2.3536, + "loss_pixel": 0.1597, + "loss_text": 1.4717, + "ppl": 5.111, + "step": 8883 + }, + { + "epoch": 0.05, + "global_step": 8884, + "learning_rate": 0.00046375626043405676, + "loss": 1.6137, + "loss_base2": 2.3281, + "loss_pixel": 0.1551, + "loss_text": 1.4586, + "ppl": 5.0214, + "step": 8884 + }, + { + "epoch": 0.05, + "global_step": 8885, + "learning_rate": 0.00046375208681135227, + "loss": 1.6447, + "loss_base2": 2.3728, + "loss_pixel": 0.1583, + "loss_text": 1.4864, + "ppl": 5.1795, + "step": 8885 + }, + { + "epoch": 0.05, + "global_step": 8886, + "learning_rate": 0.0004637479131886477, + "loss": 1.627, + "loss_base2": 2.3473, + "loss_pixel": 0.1581, + "loss_text": 1.4688, + "ppl": 5.0886, + "step": 8886 + }, + { + "epoch": 0.05, + "global_step": 8887, + "learning_rate": 0.00046374373956594323, + "loss": 1.6229, + "loss_base2": 2.3413, + "loss_pixel": 0.1579, + "loss_text": 1.465, + "ppl": 5.0678, + "step": 8887 + }, + { + "epoch": 0.05, + "global_step": 8888, + "learning_rate": 0.00046373956594323874, + "loss": 1.625, + "loss_base2": 2.3444, + "loss_pixel": 0.1586, + "loss_text": 1.4664, + "ppl": 5.0784, + "step": 8888 + }, + { + "epoch": 0.05, + "global_step": 8889, + "learning_rate": 0.00046373539232053425, + "loss": 1.6358, + "loss_base2": 2.36, + "loss_pixel": 0.1556, + "loss_text": 1.4802, + "ppl": 5.1336, + "step": 8889 + }, + { + "epoch": 0.05, + "global_step": 8890, + "learning_rate": 0.00046373121869782975, + "loss": 1.6499, + "loss_base2": 2.3803, + "loss_pixel": 0.1562, + "loss_text": 1.4936, + "ppl": 5.2065, + "step": 8890 + }, + { + "epoch": 0.05, + "global_step": 8891, + "learning_rate": 0.0004637270450751252, + "loss": 1.6378, + "loss_base2": 2.3628, + "loss_pixel": 0.1564, + "loss_text": 1.4815, + "ppl": 5.1438, + "step": 8891 + }, + { + "epoch": 0.05, + "global_step": 8892, + "learning_rate": 0.0004637228714524207, + "loss": 1.6219, + "loss_base2": 2.3399, + "loss_pixel": 0.1548, + "loss_text": 1.467, + "ppl": 5.0627, + "step": 8892 + }, + { + "epoch": 0.05, + "global_step": 8893, + "learning_rate": 0.0004637186978297162, + "loss": 1.6167, + "loss_base2": 2.3324, + "loss_pixel": 0.1569, + "loss_text": 1.4598, + "ppl": 5.0364, + "step": 8893 + }, + { + "epoch": 0.05, + "global_step": 8894, + "learning_rate": 0.00046371452420701173, + "loss": 1.6425, + "loss_base2": 2.3696, + "loss_pixel": 0.1565, + "loss_text": 1.486, + "ppl": 5.1681, + "step": 8894 + }, + { + "epoch": 0.05, + "global_step": 8895, + "learning_rate": 0.0004637103505843072, + "loss": 1.6411, + "loss_base2": 2.3676, + "loss_pixel": 0.155, + "loss_text": 1.4862, + "ppl": 5.1608, + "step": 8895 + }, + { + "epoch": 0.05, + "global_step": 8896, + "learning_rate": 0.0004637061769616027, + "loss": 1.6256, + "loss_base2": 2.3452, + "loss_pixel": 0.1564, + "loss_text": 1.4692, + "ppl": 5.0815, + "step": 8896 + }, + { + "epoch": 0.05, + "global_step": 8897, + "learning_rate": 0.0004637020033388982, + "loss": 1.6449, + "loss_base2": 2.3731, + "loss_pixel": 0.169, + "loss_text": 1.4758, + "ppl": 5.1805, + "step": 8897 + }, + { + "epoch": 0.05, + "global_step": 8898, + "learning_rate": 0.00046369782971619365, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.1756, + "loss_text": 1.4925, + "ppl": 5.3021, + "step": 8898 + }, + { + "epoch": 0.05, + "global_step": 8899, + "learning_rate": 0.00046369365609348916, + "loss": 1.6523, + "loss_base2": 2.3838, + "loss_pixel": 0.1737, + "loss_text": 1.4786, + "ppl": 5.219, + "step": 8899 + }, + { + "epoch": 0.05, + "global_step": 8900, + "learning_rate": 0.0004636894824707846, + "loss": 1.6211, + "loss_base2": 2.3388, + "loss_pixel": 0.1584, + "loss_text": 1.4627, + "ppl": 5.0587, + "step": 8900 + }, + { + "epoch": 0.05, + "global_step": 8901, + "learning_rate": 0.0004636853088480801, + "loss": 1.6397, + "loss_base2": 2.3656, + "loss_pixel": 0.1573, + "loss_text": 1.4825, + "ppl": 5.1536, + "step": 8901 + }, + { + "epoch": 0.05, + "global_step": 8902, + "learning_rate": 0.0004636811352253756, + "loss": 1.6432, + "loss_base2": 2.3706, + "loss_pixel": 0.1575, + "loss_text": 1.4857, + "ppl": 5.1717, + "step": 8902 + }, + { + "epoch": 0.05, + "global_step": 8903, + "learning_rate": 0.00046367696160267113, + "loss": 1.6265, + "loss_base2": 2.3465, + "loss_pixel": 0.1586, + "loss_text": 1.4679, + "ppl": 5.086, + "step": 8903 + }, + { + "epoch": 0.05, + "global_step": 8904, + "learning_rate": 0.00046367278797996664, + "loss": 1.6261, + "loss_base2": 2.346, + "loss_pixel": 0.1567, + "loss_text": 1.4694, + "ppl": 5.084, + "step": 8904 + }, + { + "epoch": 0.05, + "global_step": 8905, + "learning_rate": 0.0004636686143572621, + "loss": 1.6162, + "loss_base2": 2.3317, + "loss_pixel": 0.1552, + "loss_text": 1.461, + "ppl": 5.0339, + "step": 8905 + }, + { + "epoch": 0.05, + "global_step": 8906, + "learning_rate": 0.0004636644407345576, + "loss": 1.6111, + "loss_base2": 2.3243, + "loss_pixel": 0.1571, + "loss_text": 1.454, + "ppl": 5.0083, + "step": 8906 + }, + { + "epoch": 0.05, + "global_step": 8907, + "learning_rate": 0.0004636602671118531, + "loss": 1.6235, + "loss_base2": 2.3422, + "loss_pixel": 0.1563, + "loss_text": 1.4672, + "ppl": 5.0708, + "step": 8907 + }, + { + "epoch": 0.05, + "global_step": 8908, + "learning_rate": 0.0004636560934891486, + "loss": 1.6489, + "loss_base2": 2.3789, + "loss_pixel": 0.1558, + "loss_text": 1.493, + "ppl": 5.2013, + "step": 8908 + }, + { + "epoch": 0.05, + "global_step": 8909, + "learning_rate": 0.00046365191986644407, + "loss": 1.6446, + "loss_base2": 2.3727, + "loss_pixel": 0.157, + "loss_text": 1.4875, + "ppl": 5.1789, + "step": 8909 + }, + { + "epoch": 0.05, + "global_step": 8910, + "learning_rate": 0.0004636477462437396, + "loss": 1.6219, + "loss_base2": 2.3399, + "loss_pixel": 0.159, + "loss_text": 1.4629, + "ppl": 5.0627, + "step": 8910 + }, + { + "epoch": 0.05, + "global_step": 8911, + "learning_rate": 0.0004636435726210351, + "loss": 1.6474, + "loss_base2": 2.3767, + "loss_pixel": 0.1554, + "loss_text": 1.492, + "ppl": 5.1935, + "step": 8911 + }, + { + "epoch": 0.05, + "global_step": 8912, + "learning_rate": 0.0004636393989983306, + "loss": 1.6175, + "loss_base2": 2.3336, + "loss_pixel": 0.156, + "loss_text": 1.4614, + "ppl": 5.0405, + "step": 8912 + }, + { + "epoch": 0.05, + "global_step": 8913, + "learning_rate": 0.0004636352253756261, + "loss": 1.6262, + "loss_base2": 2.3461, + "loss_pixel": 0.1564, + "loss_text": 1.4699, + "ppl": 5.0845, + "step": 8913 + }, + { + "epoch": 0.05, + "global_step": 8914, + "learning_rate": 0.00046363105175292155, + "loss": 1.6454, + "loss_base2": 2.3738, + "loss_pixel": 0.1538, + "loss_text": 1.4916, + "ppl": 5.1831, + "step": 8914 + }, + { + "epoch": 0.05, + "global_step": 8915, + "learning_rate": 0.00046362687813021706, + "loss": 1.6168, + "loss_base2": 2.3325, + "loss_pixel": 0.1567, + "loss_text": 1.4601, + "ppl": 5.0369, + "step": 8915 + }, + { + "epoch": 0.05, + "global_step": 8916, + "learning_rate": 0.00046362270450751256, + "loss": 1.6322, + "loss_base2": 2.3548, + "loss_pixel": 0.1556, + "loss_text": 1.4766, + "ppl": 5.1151, + "step": 8916 + }, + { + "epoch": 0.05, + "global_step": 8917, + "learning_rate": 0.000463618530884808, + "loss": 1.6285, + "loss_base2": 2.3494, + "loss_pixel": 0.1634, + "loss_text": 1.4651, + "ppl": 5.0962, + "step": 8917 + }, + { + "epoch": 0.05, + "global_step": 8918, + "learning_rate": 0.00046361435726210347, + "loss": 1.6501, + "loss_base2": 2.3806, + "loss_pixel": 0.1743, + "loss_text": 1.4757, + "ppl": 5.2075, + "step": 8918 + }, + { + "epoch": 0.05, + "global_step": 8919, + "learning_rate": 0.000463610183639399, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1746, + "loss_text": 1.4491, + "ppl": 5.0718, + "step": 8919 + }, + { + "epoch": 0.05, + "global_step": 8920, + "learning_rate": 0.0004636060100166945, + "loss": 1.6357, + "loss_base2": 2.3598, + "loss_pixel": 0.1633, + "loss_text": 1.4724, + "ppl": 5.133, + "step": 8920 + }, + { + "epoch": 0.05, + "global_step": 8921, + "learning_rate": 0.00046360183639399, + "loss": 1.6382, + "loss_base2": 2.3634, + "loss_pixel": 0.1567, + "loss_text": 1.4815, + "ppl": 5.1459, + "step": 8921 + }, + { + "epoch": 0.05, + "global_step": 8922, + "learning_rate": 0.0004635976627712855, + "loss": 1.6405, + "loss_base2": 2.3667, + "loss_pixel": 0.1583, + "loss_text": 1.4822, + "ppl": 5.1577, + "step": 8922 + }, + { + "epoch": 0.05, + "global_step": 8923, + "learning_rate": 0.00046359348914858095, + "loss": 1.6539, + "loss_base2": 2.3861, + "loss_pixel": 0.1572, + "loss_text": 1.4967, + "ppl": 5.2273, + "step": 8923 + }, + { + "epoch": 0.05, + "global_step": 8924, + "learning_rate": 0.00046358931552587646, + "loss": 1.6369, + "loss_base2": 2.3615, + "loss_pixel": 0.1583, + "loss_text": 1.4786, + "ppl": 5.1392, + "step": 8924 + }, + { + "epoch": 0.05, + "global_step": 8925, + "learning_rate": 0.00046358514190317197, + "loss": 1.6292, + "loss_base2": 2.3504, + "loss_pixel": 0.1576, + "loss_text": 1.4715, + "ppl": 5.0998, + "step": 8925 + }, + { + "epoch": 0.05, + "global_step": 8926, + "learning_rate": 0.0004635809682804675, + "loss": 1.6205, + "loss_base2": 2.3379, + "loss_pixel": 0.1576, + "loss_text": 1.4629, + "ppl": 5.0556, + "step": 8926 + }, + { + "epoch": 0.05, + "global_step": 8927, + "learning_rate": 0.0004635767946577629, + "loss": 1.6303, + "loss_base2": 2.352, + "loss_pixel": 0.1582, + "loss_text": 1.4721, + "ppl": 5.1054, + "step": 8927 + }, + { + "epoch": 0.05, + "global_step": 8928, + "learning_rate": 0.00046357262103505843, + "loss": 1.6219, + "loss_base2": 2.3399, + "loss_pixel": 0.1552, + "loss_text": 1.4668, + "ppl": 5.0627, + "step": 8928 + }, + { + "epoch": 0.05, + "global_step": 8929, + "learning_rate": 0.00046356844741235394, + "loss": 1.6262, + "loss_base2": 2.3461, + "loss_pixel": 0.1585, + "loss_text": 1.4677, + "ppl": 5.0845, + "step": 8929 + }, + { + "epoch": 0.05, + "global_step": 8930, + "learning_rate": 0.00046356427378964945, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.1581, + "loss_text": 1.4815, + "ppl": 5.1531, + "step": 8930 + }, + { + "epoch": 0.05, + "global_step": 8931, + "learning_rate": 0.00046356010016694496, + "loss": 1.6376, + "loss_base2": 2.3626, + "loss_pixel": 0.1541, + "loss_text": 1.4835, + "ppl": 5.1428, + "step": 8931 + }, + { + "epoch": 0.05, + "global_step": 8932, + "learning_rate": 0.0004635559265442404, + "loss": 1.6289, + "loss_base2": 2.35, + "loss_pixel": 0.1556, + "loss_text": 1.4733, + "ppl": 5.0983, + "step": 8932 + }, + { + "epoch": 0.05, + "global_step": 8933, + "learning_rate": 0.0004635517529215359, + "loss": 1.6233, + "loss_base2": 2.3419, + "loss_pixel": 0.1552, + "loss_text": 1.4681, + "ppl": 5.0698, + "step": 8933 + }, + { + "epoch": 0.05, + "global_step": 8934, + "learning_rate": 0.0004635475792988314, + "loss": 1.5947, + "loss_base2": 2.3007, + "loss_pixel": 0.1552, + "loss_text": 1.4395, + "ppl": 4.9269, + "step": 8934 + }, + { + "epoch": 0.05, + "global_step": 8935, + "learning_rate": 0.00046354340567612693, + "loss": 1.5653, + "loss_base2": 2.2583, + "loss_pixel": 0.1527, + "loss_text": 1.4126, + "ppl": 4.7841, + "step": 8935 + }, + { + "epoch": 0.05, + "global_step": 8936, + "learning_rate": 0.00046353923205342233, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.1548, + "loss_text": 1.4754, + "ppl": 5.1049, + "step": 8936 + }, + { + "epoch": 0.05, + "global_step": 8937, + "learning_rate": 0.00046353505843071784, + "loss": 1.6385, + "loss_base2": 2.3639, + "loss_pixel": 0.163, + "loss_text": 1.4755, + "ppl": 5.1474, + "step": 8937 + }, + { + "epoch": 0.05, + "global_step": 8938, + "learning_rate": 0.00046353088480801334, + "loss": 1.6295, + "loss_base2": 2.3509, + "loss_pixel": 0.1682, + "loss_text": 1.4613, + "ppl": 5.1013, + "step": 8938 + }, + { + "epoch": 0.05, + "global_step": 8939, + "learning_rate": 0.00046352671118530885, + "loss": 1.6473, + "loss_base2": 2.3766, + "loss_pixel": 0.1696, + "loss_text": 1.4778, + "ppl": 5.1929, + "step": 8939 + }, + { + "epoch": 0.05, + "global_step": 8940, + "learning_rate": 0.00046352253756260436, + "loss": 1.6196, + "loss_base2": 2.3366, + "loss_pixel": 0.1673, + "loss_text": 1.4522, + "ppl": 5.0511, + "step": 8940 + }, + { + "epoch": 0.05, + "global_step": 8941, + "learning_rate": 0.0004635183639398998, + "loss": 1.6347, + "loss_base2": 2.3584, + "loss_pixel": 0.1688, + "loss_text": 1.4658, + "ppl": 5.1279, + "step": 8941 + }, + { + "epoch": 0.05, + "global_step": 8942, + "learning_rate": 0.0004635141903171953, + "loss": 1.6216, + "loss_base2": 2.3395, + "loss_pixel": 0.169, + "loss_text": 1.4526, + "ppl": 5.0612, + "step": 8942 + }, + { + "epoch": 0.05, + "global_step": 8943, + "learning_rate": 0.00046351001669449083, + "loss": 1.6494, + "loss_base2": 2.3796, + "loss_pixel": 0.1677, + "loss_text": 1.4817, + "ppl": 5.2039, + "step": 8943 + }, + { + "epoch": 0.05, + "global_step": 8944, + "learning_rate": 0.00046350584307178633, + "loss": 1.6463, + "loss_base2": 2.3751, + "loss_pixel": 0.1688, + "loss_text": 1.4775, + "ppl": 5.1877, + "step": 8944 + }, + { + "epoch": 0.05, + "global_step": 8945, + "learning_rate": 0.0004635016694490818, + "loss": 1.6542, + "loss_base2": 2.3865, + "loss_pixel": 0.1684, + "loss_text": 1.4859, + "ppl": 5.2289, + "step": 8945 + }, + { + "epoch": 0.05, + "global_step": 8946, + "learning_rate": 0.0004634974958263773, + "loss": 1.6272, + "loss_base2": 2.3476, + "loss_pixel": 0.168, + "loss_text": 1.4591, + "ppl": 5.0896, + "step": 8946 + }, + { + "epoch": 0.05, + "global_step": 8947, + "learning_rate": 0.0004634933222036728, + "loss": 1.6262, + "loss_base2": 2.3461, + "loss_pixel": 0.1682, + "loss_text": 1.458, + "ppl": 5.0845, + "step": 8947 + }, + { + "epoch": 0.05, + "global_step": 8948, + "learning_rate": 0.0004634891485809683, + "loss": 1.6466, + "loss_base2": 2.3755, + "loss_pixel": 0.1681, + "loss_text": 1.4785, + "ppl": 5.1893, + "step": 8948 + }, + { + "epoch": 0.05, + "global_step": 8949, + "learning_rate": 0.0004634849749582638, + "loss": 1.6439, + "loss_base2": 2.3716, + "loss_pixel": 0.1679, + "loss_text": 1.476, + "ppl": 5.1753, + "step": 8949 + }, + { + "epoch": 0.05, + "global_step": 8950, + "learning_rate": 0.00046348080133555927, + "loss": 1.6241, + "loss_base2": 2.3431, + "loss_pixel": 0.1657, + "loss_text": 1.4584, + "ppl": 5.0739, + "step": 8950 + }, + { + "epoch": 0.05, + "global_step": 8951, + "learning_rate": 0.0004634766277128548, + "loss": 1.6321, + "loss_base2": 2.3546, + "loss_pixel": 0.1677, + "loss_text": 1.4644, + "ppl": 5.1146, + "step": 8951 + }, + { + "epoch": 0.05, + "global_step": 8952, + "learning_rate": 0.0004634724540901503, + "loss": 1.6491, + "loss_base2": 2.3791, + "loss_pixel": 0.1683, + "loss_text": 1.4808, + "ppl": 5.2023, + "step": 8952 + }, + { + "epoch": 0.05, + "global_step": 8953, + "learning_rate": 0.0004634682804674458, + "loss": 1.6472, + "loss_base2": 2.3764, + "loss_pixel": 0.1665, + "loss_text": 1.4807, + "ppl": 5.1924, + "step": 8953 + }, + { + "epoch": 0.05, + "global_step": 8954, + "learning_rate": 0.0004634641068447412, + "loss": 1.6312, + "loss_base2": 2.3533, + "loss_pixel": 0.167, + "loss_text": 1.4642, + "ppl": 5.11, + "step": 8954 + }, + { + "epoch": 0.05, + "global_step": 8955, + "learning_rate": 0.0004634599332220367, + "loss": 1.6385, + "loss_base2": 2.3639, + "loss_pixel": 0.1671, + "loss_text": 1.4714, + "ppl": 5.1474, + "step": 8955 + }, + { + "epoch": 0.05, + "global_step": 8956, + "learning_rate": 0.0004634557595993322, + "loss": 1.5742, + "loss_base2": 2.2711, + "loss_pixel": 0.1686, + "loss_text": 1.4056, + "ppl": 4.8269, + "step": 8956 + }, + { + "epoch": 0.05, + "global_step": 8957, + "learning_rate": 0.0004634515859766277, + "loss": 1.4378, + "loss_base2": 2.0743, + "loss_pixel": 0.1683, + "loss_text": 1.2695, + "ppl": 4.2114, + "step": 8957 + }, + { + "epoch": 0.05, + "global_step": 8958, + "learning_rate": 0.0004634474123539232, + "loss": 1.4398, + "loss_base2": 2.0772, + "loss_pixel": 0.1676, + "loss_text": 1.2722, + "ppl": 4.2199, + "step": 8958 + }, + { + "epoch": 0.05, + "global_step": 8959, + "learning_rate": 0.0004634432387312187, + "loss": 1.4092, + "loss_base2": 2.033, + "loss_pixel": 0.167, + "loss_text": 1.2422, + "ppl": 4.0927, + "step": 8959 + }, + { + "epoch": 0.05, + "global_step": 8960, + "learning_rate": 0.0004634390651085142, + "loss": 1.4049, + "loss_base2": 2.0268, + "loss_pixel": 0.1656, + "loss_text": 1.2393, + "ppl": 4.0751, + "step": 8960 + }, + { + "epoch": 0.05, + "global_step": 8961, + "learning_rate": 0.0004634348914858097, + "loss": 1.3992, + "loss_base2": 2.0186, + "loss_pixel": 0.1676, + "loss_text": 1.2316, + "ppl": 4.052, + "step": 8961 + }, + { + "epoch": 0.05, + "global_step": 8962, + "learning_rate": 0.0004634307178631052, + "loss": 1.4404, + "loss_base2": 2.0781, + "loss_pixel": 0.1685, + "loss_text": 1.2719, + "ppl": 4.2224, + "step": 8962 + }, + { + "epoch": 0.05, + "global_step": 8963, + "learning_rate": 0.0004634265442404007, + "loss": 1.4392, + "loss_base2": 2.0763, + "loss_pixel": 0.167, + "loss_text": 1.2723, + "ppl": 4.2173, + "step": 8963 + }, + { + "epoch": 0.05, + "global_step": 8964, + "learning_rate": 0.00046342237061769616, + "loss": 1.4367, + "loss_base2": 2.0727, + "loss_pixel": 0.1671, + "loss_text": 1.2697, + "ppl": 4.2068, + "step": 8964 + }, + { + "epoch": 0.05, + "global_step": 8965, + "learning_rate": 0.00046341819699499166, + "loss": 1.4241, + "loss_base2": 2.0545, + "loss_pixel": 0.1678, + "loss_text": 1.2563, + "ppl": 4.1541, + "step": 8965 + }, + { + "epoch": 0.05, + "global_step": 8966, + "learning_rate": 0.00046341402337228717, + "loss": 1.4413, + "loss_base2": 2.0794, + "loss_pixel": 0.1695, + "loss_text": 1.2719, + "ppl": 4.2262, + "step": 8966 + }, + { + "epoch": 0.05, + "global_step": 8967, + "learning_rate": 0.0004634098497495827, + "loss": 1.4186, + "loss_base2": 2.0466, + "loss_pixel": 0.1657, + "loss_text": 1.2529, + "ppl": 4.1313, + "step": 8967 + }, + { + "epoch": 0.05, + "global_step": 8968, + "learning_rate": 0.00046340567612687813, + "loss": 1.4366, + "loss_base2": 2.0726, + "loss_pixel": 0.1666, + "loss_text": 1.27, + "ppl": 4.2064, + "step": 8968 + }, + { + "epoch": 0.05, + "global_step": 8969, + "learning_rate": 0.00046340150250417364, + "loss": 1.4191, + "loss_base2": 2.0473, + "loss_pixel": 0.1664, + "loss_text": 1.2527, + "ppl": 4.1334, + "step": 8969 + }, + { + "epoch": 0.05, + "global_step": 8970, + "learning_rate": 0.00046339732888146915, + "loss": 1.4295, + "loss_base2": 2.0623, + "loss_pixel": 0.1659, + "loss_text": 1.2636, + "ppl": 4.1766, + "step": 8970 + }, + { + "epoch": 0.05, + "global_step": 8971, + "learning_rate": 0.00046339315525876465, + "loss": 1.4142, + "loss_base2": 2.0403, + "loss_pixel": 0.1665, + "loss_text": 1.2477, + "ppl": 4.1132, + "step": 8971 + }, + { + "epoch": 0.05, + "global_step": 8972, + "learning_rate": 0.00046338898163606016, + "loss": 1.5503, + "loss_base2": 2.2366, + "loss_pixel": 0.1674, + "loss_text": 1.3829, + "ppl": 4.7129, + "step": 8972 + }, + { + "epoch": 0.05, + "global_step": 8973, + "learning_rate": 0.00046338480801335556, + "loss": 1.639, + "loss_base2": 2.3646, + "loss_pixel": 0.1667, + "loss_text": 1.4723, + "ppl": 5.15, + "step": 8973 + }, + { + "epoch": 0.05, + "global_step": 8974, + "learning_rate": 0.00046338063439065107, + "loss": 1.6347, + "loss_base2": 2.3584, + "loss_pixel": 0.1676, + "loss_text": 1.4671, + "ppl": 5.1279, + "step": 8974 + }, + { + "epoch": 0.05, + "global_step": 8975, + "learning_rate": 0.0004633764607679466, + "loss": 1.6718, + "loss_base2": 2.4119, + "loss_pixel": 0.1655, + "loss_text": 1.5063, + "ppl": 5.3217, + "step": 8975 + }, + { + "epoch": 0.05, + "global_step": 8976, + "learning_rate": 0.0004633722871452421, + "loss": 1.6581, + "loss_base2": 2.3921, + "loss_pixel": 0.1662, + "loss_text": 1.4919, + "ppl": 5.2493, + "step": 8976 + }, + { + "epoch": 0.05, + "global_step": 8977, + "learning_rate": 0.00046336811352253753, + "loss": 1.6327, + "loss_base2": 2.3555, + "loss_pixel": 0.1652, + "loss_text": 1.4675, + "ppl": 5.1177, + "step": 8977 + }, + { + "epoch": 0.05, + "global_step": 8978, + "learning_rate": 0.00046336393989983304, + "loss": 1.6575, + "loss_base2": 2.3913, + "loss_pixel": 0.1672, + "loss_text": 1.4903, + "ppl": 5.2462, + "step": 8978 + }, + { + "epoch": 0.05, + "global_step": 8979, + "learning_rate": 0.00046335976627712855, + "loss": 1.6515, + "loss_base2": 2.3826, + "loss_pixel": 0.166, + "loss_text": 1.4854, + "ppl": 5.2148, + "step": 8979 + }, + { + "epoch": 0.05, + "global_step": 8980, + "learning_rate": 0.00046335559265442406, + "loss": 1.646, + "loss_base2": 2.3747, + "loss_pixel": 0.1665, + "loss_text": 1.4795, + "ppl": 5.1862, + "step": 8980 + }, + { + "epoch": 0.05, + "global_step": 8981, + "learning_rate": 0.00046335141903171956, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.1666, + "loss_text": 1.4636, + "ppl": 5.1049, + "step": 8981 + }, + { + "epoch": 0.05, + "global_step": 8982, + "learning_rate": 0.000463347245409015, + "loss": 1.6317, + "loss_base2": 2.354, + "loss_pixel": 0.1662, + "loss_text": 1.4655, + "ppl": 5.1126, + "step": 8982 + }, + { + "epoch": 0.05, + "global_step": 8983, + "learning_rate": 0.0004633430717863105, + "loss": 1.6555, + "loss_base2": 2.3884, + "loss_pixel": 0.1659, + "loss_text": 1.4896, + "ppl": 5.2357, + "step": 8983 + }, + { + "epoch": 0.05, + "global_step": 8984, + "learning_rate": 0.00046333889816360603, + "loss": 1.637, + "loss_base2": 2.3617, + "loss_pixel": 0.1645, + "loss_text": 1.4724, + "ppl": 5.1397, + "step": 8984 + }, + { + "epoch": 0.05, + "global_step": 8985, + "learning_rate": 0.00046333472454090154, + "loss": 1.6448, + "loss_base2": 2.3729, + "loss_pixel": 0.1663, + "loss_text": 1.4785, + "ppl": 5.18, + "step": 8985 + }, + { + "epoch": 0.05, + "global_step": 8986, + "learning_rate": 0.000463330550918197, + "loss": 1.6521, + "loss_base2": 2.3835, + "loss_pixel": 0.1658, + "loss_text": 1.4863, + "ppl": 5.2179, + "step": 8986 + }, + { + "epoch": 0.05, + "global_step": 8987, + "learning_rate": 0.0004633263772954925, + "loss": 1.6348, + "loss_base2": 2.3585, + "loss_pixel": 0.1667, + "loss_text": 1.4682, + "ppl": 5.1284, + "step": 8987 + }, + { + "epoch": 0.05, + "global_step": 8988, + "learning_rate": 0.000463322203672788, + "loss": 1.6279, + "loss_base2": 2.3486, + "loss_pixel": 0.1666, + "loss_text": 1.4613, + "ppl": 5.0932, + "step": 8988 + }, + { + "epoch": 0.05, + "global_step": 8989, + "learning_rate": 0.0004633180300500835, + "loss": 1.6368, + "loss_base2": 2.3614, + "loss_pixel": 0.1664, + "loss_text": 1.4704, + "ppl": 5.1387, + "step": 8989 + }, + { + "epoch": 0.05, + "global_step": 8990, + "learning_rate": 0.000463313856427379, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.1682, + "loss_text": 1.4647, + "ppl": 5.1187, + "step": 8990 + }, + { + "epoch": 0.05, + "global_step": 8991, + "learning_rate": 0.0004633096828046745, + "loss": 1.6451, + "loss_base2": 2.3734, + "loss_pixel": 0.1654, + "loss_text": 1.4796, + "ppl": 5.1815, + "step": 8991 + }, + { + "epoch": 0.05, + "global_step": 8992, + "learning_rate": 0.0004633055091819699, + "loss": 1.6458, + "loss_base2": 2.3744, + "loss_pixel": 0.1658, + "loss_text": 1.48, + "ppl": 5.1852, + "step": 8992 + }, + { + "epoch": 0.05, + "global_step": 8993, + "learning_rate": 0.00046330133555926543, + "loss": 1.6527, + "loss_base2": 2.3843, + "loss_pixel": 0.166, + "loss_text": 1.4867, + "ppl": 5.2211, + "step": 8993 + }, + { + "epoch": 0.05, + "global_step": 8994, + "learning_rate": 0.00046329716193656094, + "loss": 1.5627, + "loss_base2": 2.2545, + "loss_pixel": 0.1656, + "loss_text": 1.3971, + "ppl": 4.7717, + "step": 8994 + }, + { + "epoch": 0.05, + "global_step": 8995, + "learning_rate": 0.0004632929883138564, + "loss": 1.429, + "loss_base2": 2.0616, + "loss_pixel": 0.1669, + "loss_text": 1.2621, + "ppl": 4.1745, + "step": 8995 + }, + { + "epoch": 0.05, + "global_step": 8996, + "learning_rate": 0.0004632888146911519, + "loss": 1.4505, + "loss_base2": 2.0926, + "loss_pixel": 0.1693, + "loss_text": 1.2812, + "ppl": 4.2652, + "step": 8996 + }, + { + "epoch": 0.05, + "global_step": 8997, + "learning_rate": 0.0004632846410684474, + "loss": 1.4346, + "loss_base2": 2.0697, + "loss_pixel": 0.1655, + "loss_text": 1.2691, + "ppl": 4.198, + "step": 8997 + }, + { + "epoch": 0.05, + "global_step": 8998, + "learning_rate": 0.0004632804674457429, + "loss": 1.4423, + "loss_base2": 2.0808, + "loss_pixel": 0.1677, + "loss_text": 1.2747, + "ppl": 4.2304, + "step": 8998 + }, + { + "epoch": 0.05, + "global_step": 8999, + "learning_rate": 0.0004632762938230384, + "loss": 1.4179, + "loss_base2": 2.0456, + "loss_pixel": 0.1668, + "loss_text": 1.2511, + "ppl": 4.1284, + "step": 8999 + }, + { + "epoch": 0.05, + "global_step": 9000, + "learning_rate": 0.0004632721202003339, + "loss": 1.4029, + "loss_base2": 2.024, + "loss_pixel": 0.1665, + "loss_text": 1.2364, + "ppl": 4.067, + "step": 9000 + }, + { + "epoch": 0.05, + "global_step": 9001, + "learning_rate": 0.0004632679465776294, + "loss": 1.4297, + "loss_base2": 2.0626, + "loss_pixel": 0.1663, + "loss_text": 1.2634, + "ppl": 4.1774, + "step": 9001 + }, + { + "epoch": 0.05, + "global_step": 9002, + "learning_rate": 0.0004632637729549249, + "loss": 1.4071, + "loss_base2": 2.03, + "loss_pixel": 0.1643, + "loss_text": 1.2428, + "ppl": 4.0841, + "step": 9002 + }, + { + "epoch": 0.05, + "global_step": 9003, + "learning_rate": 0.0004632595993322204, + "loss": 1.4425, + "loss_base2": 2.0811, + "loss_pixel": 0.1657, + "loss_text": 1.2768, + "ppl": 4.2313, + "step": 9003 + }, + { + "epoch": 0.05, + "global_step": 9004, + "learning_rate": 0.00046325542570951585, + "loss": 1.413, + "loss_base2": 2.0385, + "loss_pixel": 0.1656, + "loss_text": 1.2474, + "ppl": 4.1083, + "step": 9004 + }, + { + "epoch": 0.05, + "global_step": 9005, + "learning_rate": 0.00046325125208681136, + "loss": 1.4275, + "loss_base2": 2.0594, + "loss_pixel": 0.1665, + "loss_text": 1.261, + "ppl": 4.1683, + "step": 9005 + }, + { + "epoch": 0.05, + "global_step": 9006, + "learning_rate": 0.00046324707846410687, + "loss": 1.4094, + "loss_base2": 2.0333, + "loss_pixel": 0.1656, + "loss_text": 1.2438, + "ppl": 4.0935, + "step": 9006 + }, + { + "epoch": 0.05, + "global_step": 9007, + "learning_rate": 0.0004632429048414024, + "loss": 1.4175, + "loss_base2": 2.045, + "loss_pixel": 0.1648, + "loss_text": 1.2528, + "ppl": 4.1268, + "step": 9007 + }, + { + "epoch": 0.05, + "global_step": 9008, + "learning_rate": 0.0004632387312186979, + "loss": 1.4215, + "loss_base2": 2.0508, + "loss_pixel": 0.1653, + "loss_text": 1.2562, + "ppl": 4.1433, + "step": 9008 + }, + { + "epoch": 0.05, + "global_step": 9009, + "learning_rate": 0.00046323455759599333, + "loss": 1.4165, + "loss_base2": 2.0436, + "loss_pixel": 0.1648, + "loss_text": 1.2518, + "ppl": 4.1227, + "step": 9009 + }, + { + "epoch": 0.05, + "global_step": 9010, + "learning_rate": 0.00046323038397328884, + "loss": 1.4117, + "loss_base2": 2.0367, + "loss_pixel": 0.1652, + "loss_text": 1.2466, + "ppl": 4.1029, + "step": 9010 + }, + { + "epoch": 0.05, + "global_step": 9011, + "learning_rate": 0.0004632262103505843, + "loss": 1.4193, + "loss_base2": 2.0476, + "loss_pixel": 0.1662, + "loss_text": 1.2531, + "ppl": 4.1342, + "step": 9011 + }, + { + "epoch": 0.05, + "global_step": 9012, + "learning_rate": 0.0004632220367278798, + "loss": 1.6351, + "loss_base2": 2.359, + "loss_pixel": 0.1659, + "loss_text": 1.4692, + "ppl": 5.13, + "step": 9012 + }, + { + "epoch": 0.05, + "global_step": 9013, + "learning_rate": 0.00046321786310517526, + "loss": 1.6535, + "loss_base2": 2.3855, + "loss_pixel": 0.1655, + "loss_text": 1.488, + "ppl": 5.2252, + "step": 9013 + }, + { + "epoch": 0.05, + "global_step": 9014, + "learning_rate": 0.00046321368948247076, + "loss": 1.656, + "loss_base2": 2.3891, + "loss_pixel": 0.1647, + "loss_text": 1.4914, + "ppl": 5.2383, + "step": 9014 + }, + { + "epoch": 0.05, + "global_step": 9015, + "learning_rate": 0.00046320951585976627, + "loss": 1.6295, + "loss_base2": 2.3509, + "loss_pixel": 0.1646, + "loss_text": 1.4649, + "ppl": 5.1013, + "step": 9015 + }, + { + "epoch": 0.05, + "global_step": 9016, + "learning_rate": 0.0004632053422370618, + "loss": 1.6476, + "loss_base2": 2.377, + "loss_pixel": 0.166, + "loss_text": 1.4816, + "ppl": 5.1945, + "step": 9016 + }, + { + "epoch": 0.05, + "global_step": 9017, + "learning_rate": 0.0004632011686143573, + "loss": 1.6382, + "loss_base2": 2.3634, + "loss_pixel": 0.1666, + "loss_text": 1.4715, + "ppl": 5.1459, + "step": 9017 + }, + { + "epoch": 0.05, + "global_step": 9018, + "learning_rate": 0.00046319699499165274, + "loss": 1.6482, + "loss_base2": 2.3778, + "loss_pixel": 0.1657, + "loss_text": 1.4825, + "ppl": 5.1976, + "step": 9018 + }, + { + "epoch": 0.05, + "global_step": 9019, + "learning_rate": 0.00046319282136894825, + "loss": 1.643, + "loss_base2": 2.3703, + "loss_pixel": 0.1656, + "loss_text": 1.4774, + "ppl": 5.1707, + "step": 9019 + }, + { + "epoch": 0.05, + "global_step": 9020, + "learning_rate": 0.00046318864774624375, + "loss": 1.644, + "loss_base2": 2.3718, + "loss_pixel": 0.165, + "loss_text": 1.479, + "ppl": 5.1758, + "step": 9020 + }, + { + "epoch": 0.05, + "global_step": 9021, + "learning_rate": 0.00046318447412353926, + "loss": 1.6477, + "loss_base2": 2.3771, + "loss_pixel": 0.1647, + "loss_text": 1.483, + "ppl": 5.195, + "step": 9021 + }, + { + "epoch": 0.05, + "global_step": 9022, + "learning_rate": 0.00046318030050083477, + "loss": 1.6447, + "loss_base2": 2.3728, + "loss_pixel": 0.1657, + "loss_text": 1.4789, + "ppl": 5.1795, + "step": 9022 + }, + { + "epoch": 0.05, + "global_step": 9023, + "learning_rate": 0.0004631761268781302, + "loss": 1.6468, + "loss_base2": 2.3758, + "loss_pixel": 0.1652, + "loss_text": 1.4816, + "ppl": 5.1903, + "step": 9023 + }, + { + "epoch": 0.05, + "global_step": 9024, + "learning_rate": 0.00046317195325542573, + "loss": 1.6398, + "loss_base2": 2.3657, + "loss_pixel": 0.1655, + "loss_text": 1.4744, + "ppl": 5.1541, + "step": 9024 + }, + { + "epoch": 0.05, + "global_step": 9025, + "learning_rate": 0.00046316777963272123, + "loss": 1.6468, + "loss_base2": 2.3758, + "loss_pixel": 0.1657, + "loss_text": 1.4811, + "ppl": 5.1903, + "step": 9025 + }, + { + "epoch": 0.05, + "global_step": 9026, + "learning_rate": 0.00046316360601001674, + "loss": 1.6355, + "loss_base2": 2.3595, + "loss_pixel": 0.1661, + "loss_text": 1.4693, + "ppl": 5.132, + "step": 9026 + }, + { + "epoch": 0.05, + "global_step": 9027, + "learning_rate": 0.0004631594323873122, + "loss": 1.6412, + "loss_base2": 2.3678, + "loss_pixel": 0.1649, + "loss_text": 1.4764, + "ppl": 5.1614, + "step": 9027 + }, + { + "epoch": 0.05, + "global_step": 9028, + "learning_rate": 0.0004631552587646077, + "loss": 1.6316, + "loss_base2": 2.3539, + "loss_pixel": 0.1661, + "loss_text": 1.4655, + "ppl": 5.112, + "step": 9028 + }, + { + "epoch": 0.05, + "global_step": 9029, + "learning_rate": 0.0004631510851419032, + "loss": 1.6343, + "loss_base2": 2.3578, + "loss_pixel": 0.1654, + "loss_text": 1.4689, + "ppl": 5.1259, + "step": 9029 + }, + { + "epoch": 0.05, + "global_step": 9030, + "learning_rate": 0.00046314691151919866, + "loss": 1.6318, + "loss_base2": 2.3542, + "loss_pixel": 0.1656, + "loss_text": 1.4662, + "ppl": 5.1131, + "step": 9030 + }, + { + "epoch": 0.05, + "global_step": 9031, + "learning_rate": 0.00046314273789649417, + "loss": 1.6284, + "loss_base2": 2.3493, + "loss_pixel": 0.1655, + "loss_text": 1.4629, + "ppl": 5.0957, + "step": 9031 + }, + { + "epoch": 0.05, + "global_step": 9032, + "learning_rate": 0.0004631385642737896, + "loss": 1.6564, + "loss_base2": 2.3897, + "loss_pixel": 0.1663, + "loss_text": 1.4901, + "ppl": 5.2404, + "step": 9032 + }, + { + "epoch": 0.05, + "global_step": 9033, + "learning_rate": 0.00046313439065108513, + "loss": 1.6279, + "loss_base2": 2.3486, + "loss_pixel": 0.1644, + "loss_text": 1.4635, + "ppl": 5.0932, + "step": 9033 + }, + { + "epoch": 0.05, + "global_step": 9034, + "learning_rate": 0.00046313021702838064, + "loss": 1.6292, + "loss_base2": 2.3504, + "loss_pixel": 0.1656, + "loss_text": 1.4637, + "ppl": 5.0998, + "step": 9034 + }, + { + "epoch": 0.05, + "global_step": 9035, + "learning_rate": 0.00046312604340567615, + "loss": 1.6334, + "loss_base2": 2.3565, + "loss_pixel": 0.165, + "loss_text": 1.4684, + "ppl": 5.1213, + "step": 9035 + }, + { + "epoch": 0.05, + "global_step": 9036, + "learning_rate": 0.0004631218697829716, + "loss": 1.628, + "loss_base2": 2.3487, + "loss_pixel": 0.1644, + "loss_text": 1.4635, + "ppl": 5.0937, + "step": 9036 + }, + { + "epoch": 0.05, + "global_step": 9037, + "learning_rate": 0.0004631176961602671, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.165, + "loss_text": 1.4746, + "ppl": 5.1531, + "step": 9037 + }, + { + "epoch": 0.05, + "global_step": 9038, + "learning_rate": 0.0004631135225375626, + "loss": 1.642, + "loss_base2": 2.3689, + "loss_pixel": 0.166, + "loss_text": 1.476, + "ppl": 5.1655, + "step": 9038 + }, + { + "epoch": 0.05, + "global_step": 9039, + "learning_rate": 0.0004631093489148581, + "loss": 1.6339, + "loss_base2": 2.3572, + "loss_pixel": 0.1654, + "loss_text": 1.4685, + "ppl": 5.1238, + "step": 9039 + }, + { + "epoch": 0.05, + "global_step": 9040, + "learning_rate": 0.00046310517529215363, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.1658, + "loss_text": 1.4671, + "ppl": 5.1187, + "step": 9040 + }, + { + "epoch": 0.05, + "global_step": 9041, + "learning_rate": 0.0004631010016694491, + "loss": 1.6477, + "loss_base2": 2.3771, + "loss_pixel": 0.1671, + "loss_text": 1.4807, + "ppl": 5.195, + "step": 9041 + }, + { + "epoch": 0.05, + "global_step": 9042, + "learning_rate": 0.0004630968280467446, + "loss": 1.6651, + "loss_base2": 2.4022, + "loss_pixel": 0.1778, + "loss_text": 1.4873, + "ppl": 5.2862, + "step": 9042 + }, + { + "epoch": 0.05, + "global_step": 9043, + "learning_rate": 0.0004630926544240401, + "loss": 1.6566, + "loss_base2": 2.39, + "loss_pixel": 0.1856, + "loss_text": 1.471, + "ppl": 5.2415, + "step": 9043 + }, + { + "epoch": 0.05, + "global_step": 9044, + "learning_rate": 0.0004630884808013356, + "loss": 1.7014, + "loss_base2": 2.4546, + "loss_pixel": 0.2076, + "loss_text": 1.4938, + "ppl": 5.4816, + "step": 9044 + }, + { + "epoch": 0.05, + "global_step": 9045, + "learning_rate": 0.00046308430717863106, + "loss": 1.6522, + "loss_base2": 2.3836, + "loss_pixel": 0.2036, + "loss_text": 1.4485, + "ppl": 5.2184, + "step": 9045 + }, + { + "epoch": 0.05, + "global_step": 9046, + "learning_rate": 0.00046308013355592656, + "loss": 1.6956, + "loss_base2": 2.4462, + "loss_pixel": 0.1983, + "loss_text": 1.4973, + "ppl": 5.4499, + "step": 9046 + }, + { + "epoch": 0.05, + "global_step": 9047, + "learning_rate": 0.00046307595993322207, + "loss": 1.6755, + "loss_base2": 2.4172, + "loss_pixel": 0.1929, + "loss_text": 1.4826, + "ppl": 5.3415, + "step": 9047 + }, + { + "epoch": 0.05, + "global_step": 9048, + "learning_rate": 0.0004630717863105176, + "loss": 1.6525, + "loss_base2": 2.3841, + "loss_pixel": 0.1885, + "loss_text": 1.4639, + "ppl": 5.22, + "step": 9048 + }, + { + "epoch": 0.05, + "global_step": 9049, + "learning_rate": 0.00046306761268781303, + "loss": 1.6643, + "loss_base2": 2.4011, + "loss_pixel": 0.1903, + "loss_text": 1.474, + "ppl": 5.282, + "step": 9049 + }, + { + "epoch": 0.05, + "global_step": 9050, + "learning_rate": 0.0004630634390651085, + "loss": 1.6606, + "loss_base2": 2.3957, + "loss_pixel": 0.1874, + "loss_text": 1.4732, + "ppl": 5.2625, + "step": 9050 + }, + { + "epoch": 0.05, + "global_step": 9051, + "learning_rate": 0.000463059265442404, + "loss": 1.644, + "loss_base2": 2.3718, + "loss_pixel": 0.187, + "loss_text": 1.457, + "ppl": 5.1758, + "step": 9051 + }, + { + "epoch": 0.05, + "global_step": 9052, + "learning_rate": 0.0004630550918196995, + "loss": 1.6617, + "loss_base2": 2.3973, + "loss_pixel": 0.1869, + "loss_text": 1.4748, + "ppl": 5.2683, + "step": 9052 + }, + { + "epoch": 0.05, + "global_step": 9053, + "learning_rate": 0.000463050918196995, + "loss": 1.6692, + "loss_base2": 2.4081, + "loss_pixel": 0.1819, + "loss_text": 1.4873, + "ppl": 5.3079, + "step": 9053 + }, + { + "epoch": 0.05, + "global_step": 9054, + "learning_rate": 0.00046304674457429046, + "loss": 1.6556, + "loss_base2": 2.3885, + "loss_pixel": 0.1831, + "loss_text": 1.4725, + "ppl": 5.2362, + "step": 9054 + }, + { + "epoch": 0.05, + "global_step": 9055, + "learning_rate": 0.00046304257095158597, + "loss": 1.6467, + "loss_base2": 2.3757, + "loss_pixel": 0.1785, + "loss_text": 1.4682, + "ppl": 5.1898, + "step": 9055 + }, + { + "epoch": 0.05, + "global_step": 9056, + "learning_rate": 0.0004630383973288815, + "loss": 1.6477, + "loss_base2": 2.3771, + "loss_pixel": 0.1783, + "loss_text": 1.4695, + "ppl": 5.195, + "step": 9056 + }, + { + "epoch": 0.05, + "global_step": 9057, + "learning_rate": 0.000463034223706177, + "loss": 1.6516, + "loss_base2": 2.3828, + "loss_pixel": 0.1759, + "loss_text": 1.4756, + "ppl": 5.2153, + "step": 9057 + }, + { + "epoch": 0.05, + "global_step": 9058, + "learning_rate": 0.0004630300500834725, + "loss": 1.645, + "loss_base2": 2.3732, + "loss_pixel": 0.1761, + "loss_text": 1.4689, + "ppl": 5.181, + "step": 9058 + }, + { + "epoch": 0.05, + "global_step": 9059, + "learning_rate": 0.00046302587646076794, + "loss": 1.6416, + "loss_base2": 2.3683, + "loss_pixel": 0.1764, + "loss_text": 1.4652, + "ppl": 5.1634, + "step": 9059 + }, + { + "epoch": 0.05, + "global_step": 9060, + "learning_rate": 0.00046302170283806345, + "loss": 1.646, + "loss_base2": 2.3747, + "loss_pixel": 0.1746, + "loss_text": 1.4714, + "ppl": 5.1862, + "step": 9060 + }, + { + "epoch": 0.05, + "global_step": 9061, + "learning_rate": 0.00046301752921535896, + "loss": 1.6461, + "loss_base2": 2.3748, + "loss_pixel": 0.1737, + "loss_text": 1.4724, + "ppl": 5.1867, + "step": 9061 + }, + { + "epoch": 0.05, + "global_step": 9062, + "learning_rate": 0.00046301335559265446, + "loss": 1.6433, + "loss_base2": 2.3708, + "loss_pixel": 0.174, + "loss_text": 1.4693, + "ppl": 5.1722, + "step": 9062 + }, + { + "epoch": 0.05, + "global_step": 9063, + "learning_rate": 0.0004630091819699499, + "loss": 1.6327, + "loss_base2": 2.3555, + "loss_pixel": 0.173, + "loss_text": 1.4596, + "ppl": 5.1177, + "step": 9063 + }, + { + "epoch": 0.05, + "global_step": 9064, + "learning_rate": 0.0004630050083472454, + "loss": 1.6482, + "loss_base2": 2.3778, + "loss_pixel": 0.167, + "loss_text": 1.4812, + "ppl": 5.1976, + "step": 9064 + }, + { + "epoch": 0.05, + "global_step": 9065, + "learning_rate": 0.00046300083472454093, + "loss": 1.6358, + "loss_base2": 2.36, + "loss_pixel": 0.1651, + "loss_text": 1.4707, + "ppl": 5.1336, + "step": 9065 + }, + { + "epoch": 0.05, + "global_step": 9066, + "learning_rate": 0.00046299666110183644, + "loss": 1.6221, + "loss_base2": 2.3402, + "loss_pixel": 0.1649, + "loss_text": 1.4572, + "ppl": 5.0637, + "step": 9066 + }, + { + "epoch": 0.05, + "global_step": 9067, + "learning_rate": 0.0004629924874791319, + "loss": 1.6402, + "loss_base2": 2.3663, + "loss_pixel": 0.1652, + "loss_text": 1.4749, + "ppl": 5.1562, + "step": 9067 + }, + { + "epoch": 0.05, + "global_step": 9068, + "learning_rate": 0.00046298831385642734, + "loss": 1.629, + "loss_base2": 2.3502, + "loss_pixel": 0.1613, + "loss_text": 1.4677, + "ppl": 5.0988, + "step": 9068 + }, + { + "epoch": 0.05, + "global_step": 9069, + "learning_rate": 0.00046298414023372285, + "loss": 1.628, + "loss_base2": 2.3487, + "loss_pixel": 0.1606, + "loss_text": 1.4674, + "ppl": 5.0937, + "step": 9069 + }, + { + "epoch": 0.05, + "global_step": 9070, + "learning_rate": 0.00046297996661101836, + "loss": 1.6009, + "loss_base2": 2.3096, + "loss_pixel": 0.1616, + "loss_text": 1.4393, + "ppl": 4.9575, + "step": 9070 + }, + { + "epoch": 0.05, + "global_step": 9071, + "learning_rate": 0.00046297579298831387, + "loss": 1.6317, + "loss_base2": 2.354, + "loss_pixel": 0.1612, + "loss_text": 1.4705, + "ppl": 5.1126, + "step": 9071 + }, + { + "epoch": 0.05, + "global_step": 9072, + "learning_rate": 0.0004629716193656093, + "loss": 1.6259, + "loss_base2": 2.3457, + "loss_pixel": 0.1618, + "loss_text": 1.4641, + "ppl": 5.083, + "step": 9072 + }, + { + "epoch": 0.05, + "global_step": 9073, + "learning_rate": 0.0004629674457429048, + "loss": 1.6225, + "loss_base2": 2.3408, + "loss_pixel": 0.16, + "loss_text": 1.4626, + "ppl": 5.0657, + "step": 9073 + }, + { + "epoch": 0.05, + "global_step": 9074, + "learning_rate": 0.00046296327212020033, + "loss": 1.6344, + "loss_base2": 2.3579, + "loss_pixel": 0.1628, + "loss_text": 1.4716, + "ppl": 5.1264, + "step": 9074 + }, + { + "epoch": 0.05, + "global_step": 9075, + "learning_rate": 0.00046295909849749584, + "loss": 1.647, + "loss_base2": 2.3761, + "loss_pixel": 0.1594, + "loss_text": 1.4876, + "ppl": 5.1914, + "step": 9075 + }, + { + "epoch": 0.05, + "global_step": 9076, + "learning_rate": 0.00046295492487479135, + "loss": 1.6277, + "loss_base2": 2.3483, + "loss_pixel": 0.1587, + "loss_text": 1.469, + "ppl": 5.0921, + "step": 9076 + }, + { + "epoch": 0.05, + "global_step": 9077, + "learning_rate": 0.0004629507512520868, + "loss": 1.61, + "loss_base2": 2.3227, + "loss_pixel": 0.1567, + "loss_text": 1.4533, + "ppl": 5.0028, + "step": 9077 + }, + { + "epoch": 0.05, + "global_step": 9078, + "learning_rate": 0.0004629465776293823, + "loss": 1.6294, + "loss_base2": 2.3507, + "loss_pixel": 0.1606, + "loss_text": 1.4688, + "ppl": 5.1008, + "step": 9078 + }, + { + "epoch": 0.05, + "global_step": 9079, + "learning_rate": 0.0004629424040066778, + "loss": 1.6438, + "loss_base2": 2.3715, + "loss_pixel": 0.1685, + "loss_text": 1.4754, + "ppl": 5.1748, + "step": 9079 + }, + { + "epoch": 0.05, + "global_step": 9080, + "learning_rate": 0.0004629382303839733, + "loss": 1.6516, + "loss_base2": 2.3828, + "loss_pixel": 0.171, + "loss_text": 1.4805, + "ppl": 5.2153, + "step": 9080 + }, + { + "epoch": 0.05, + "global_step": 9081, + "learning_rate": 0.00046293405676126883, + "loss": 1.6435, + "loss_base2": 2.3711, + "loss_pixel": 0.1699, + "loss_text": 1.4736, + "ppl": 5.1732, + "step": 9081 + }, + { + "epoch": 0.05, + "global_step": 9082, + "learning_rate": 0.0004629298831385643, + "loss": 1.6616, + "loss_base2": 2.3972, + "loss_pixel": 0.1705, + "loss_text": 1.4911, + "ppl": 5.2677, + "step": 9082 + }, + { + "epoch": 0.05, + "global_step": 9083, + "learning_rate": 0.0004629257095158598, + "loss": 1.6413, + "loss_base2": 2.3679, + "loss_pixel": 0.1698, + "loss_text": 1.4716, + "ppl": 5.1619, + "step": 9083 + }, + { + "epoch": 0.05, + "global_step": 9084, + "learning_rate": 0.0004629215358931553, + "loss": 1.6523, + "loss_base2": 2.3838, + "loss_pixel": 0.1684, + "loss_text": 1.4838, + "ppl": 5.219, + "step": 9084 + }, + { + "epoch": 0.05, + "global_step": 9085, + "learning_rate": 0.0004629173622704508, + "loss": 1.6439, + "loss_base2": 2.3716, + "loss_pixel": 0.1668, + "loss_text": 1.4771, + "ppl": 5.1753, + "step": 9085 + }, + { + "epoch": 0.05, + "global_step": 9086, + "learning_rate": 0.0004629131886477462, + "loss": 1.6503, + "loss_base2": 2.3809, + "loss_pixel": 0.1679, + "loss_text": 1.4824, + "ppl": 5.2085, + "step": 9086 + }, + { + "epoch": 0.05, + "global_step": 9087, + "learning_rate": 0.0004629090150250417, + "loss": 1.6401, + "loss_base2": 2.3662, + "loss_pixel": 0.1689, + "loss_text": 1.4711, + "ppl": 5.1557, + "step": 9087 + }, + { + "epoch": 0.05, + "global_step": 9088, + "learning_rate": 0.0004629048414023372, + "loss": 1.6412, + "loss_base2": 2.3678, + "loss_pixel": 0.1689, + "loss_text": 1.4722, + "ppl": 5.1614, + "step": 9088 + }, + { + "epoch": 0.05, + "global_step": 9089, + "learning_rate": 0.00046290066777963273, + "loss": 1.6332, + "loss_base2": 2.3562, + "loss_pixel": 0.167, + "loss_text": 1.4662, + "ppl": 5.1202, + "step": 9089 + }, + { + "epoch": 0.05, + "global_step": 9090, + "learning_rate": 0.00046289649415692823, + "loss": 1.6322, + "loss_base2": 2.3548, + "loss_pixel": 0.1686, + "loss_text": 1.4636, + "ppl": 5.1151, + "step": 9090 + }, + { + "epoch": 0.05, + "global_step": 9091, + "learning_rate": 0.0004628923205342237, + "loss": 1.6307, + "loss_base2": 2.3526, + "loss_pixel": 0.1687, + "loss_text": 1.462, + "ppl": 5.1074, + "step": 9091 + }, + { + "epoch": 0.05, + "global_step": 9092, + "learning_rate": 0.0004628881469115192, + "loss": 1.6363, + "loss_base2": 2.3607, + "loss_pixel": 0.1664, + "loss_text": 1.47, + "ppl": 5.1361, + "step": 9092 + }, + { + "epoch": 0.05, + "global_step": 9093, + "learning_rate": 0.0004628839732888147, + "loss": 1.6458, + "loss_base2": 2.3744, + "loss_pixel": 0.1664, + "loss_text": 1.4795, + "ppl": 5.1852, + "step": 9093 + }, + { + "epoch": 0.05, + "global_step": 9094, + "learning_rate": 0.0004628797996661102, + "loss": 1.617, + "loss_base2": 2.3328, + "loss_pixel": 0.167, + "loss_text": 1.45, + "ppl": 5.038, + "step": 9094 + }, + { + "epoch": 0.05, + "global_step": 9095, + "learning_rate": 0.00046287562604340566, + "loss": 1.6364, + "loss_base2": 2.3608, + "loss_pixel": 0.1677, + "loss_text": 1.4687, + "ppl": 5.1366, + "step": 9095 + }, + { + "epoch": 0.05, + "global_step": 9096, + "learning_rate": 0.00046287145242070117, + "loss": 1.6277, + "loss_base2": 2.3483, + "loss_pixel": 0.1678, + "loss_text": 1.4599, + "ppl": 5.0921, + "step": 9096 + }, + { + "epoch": 0.05, + "global_step": 9097, + "learning_rate": 0.0004628672787979967, + "loss": 1.619, + "loss_base2": 2.3357, + "loss_pixel": 0.1674, + "loss_text": 1.4516, + "ppl": 5.048, + "step": 9097 + }, + { + "epoch": 0.05, + "global_step": 9098, + "learning_rate": 0.0004628631051752922, + "loss": 1.6367, + "loss_base2": 2.3613, + "loss_pixel": 0.1686, + "loss_text": 1.4681, + "ppl": 5.1382, + "step": 9098 + }, + { + "epoch": 0.05, + "global_step": 9099, + "learning_rate": 0.0004628589315525877, + "loss": 1.6363, + "loss_base2": 2.3607, + "loss_pixel": 0.167, + "loss_text": 1.4693, + "ppl": 5.1361, + "step": 9099 + }, + { + "epoch": 0.05, + "global_step": 9100, + "learning_rate": 0.00046285475792988315, + "loss": 1.5851, + "loss_base2": 2.2868, + "loss_pixel": 0.1665, + "loss_text": 1.4187, + "ppl": 4.8798, + "step": 9100 + }, + { + "epoch": 0.05, + "global_step": 9101, + "learning_rate": 0.00046285058430717865, + "loss": 1.4331, + "loss_base2": 2.0675, + "loss_pixel": 0.1658, + "loss_text": 1.2674, + "ppl": 4.1917, + "step": 9101 + }, + { + "epoch": 0.05, + "global_step": 9102, + "learning_rate": 0.00046284641068447416, + "loss": 1.4216, + "loss_base2": 2.0509, + "loss_pixel": 0.1679, + "loss_text": 1.2537, + "ppl": 4.1437, + "step": 9102 + }, + { + "epoch": 0.05, + "global_step": 9103, + "learning_rate": 0.00046284223706176967, + "loss": 1.4348, + "loss_base2": 2.07, + "loss_pixel": 0.1663, + "loss_text": 1.2685, + "ppl": 4.1988, + "step": 9103 + }, + { + "epoch": 0.05, + "global_step": 9104, + "learning_rate": 0.0004628380634390651, + "loss": 1.4173, + "loss_base2": 2.0447, + "loss_pixel": 0.1651, + "loss_text": 1.2522, + "ppl": 4.126, + "step": 9104 + }, + { + "epoch": 0.05, + "global_step": 9105, + "learning_rate": 0.0004628338898163606, + "loss": 1.4138, + "loss_base2": 2.0397, + "loss_pixel": 0.1664, + "loss_text": 1.2474, + "ppl": 4.1115, + "step": 9105 + }, + { + "epoch": 0.05, + "global_step": 9106, + "learning_rate": 0.0004628297161936561, + "loss": 1.4109, + "loss_base2": 2.0355, + "loss_pixel": 0.1679, + "loss_text": 1.2431, + "ppl": 4.0996, + "step": 9106 + }, + { + "epoch": 0.05, + "global_step": 9107, + "learning_rate": 0.0004628255425709516, + "loss": 1.4105, + "loss_base2": 2.0349, + "loss_pixel": 0.1663, + "loss_text": 1.2442, + "ppl": 4.098, + "step": 9107 + }, + { + "epoch": 0.05, + "global_step": 9108, + "learning_rate": 0.0004628213689482471, + "loss": 1.4203, + "loss_base2": 2.0491, + "loss_pixel": 0.1654, + "loss_text": 1.2549, + "ppl": 4.1384, + "step": 9108 + }, + { + "epoch": 0.05, + "global_step": 9109, + "learning_rate": 0.00046281719532554255, + "loss": 1.508, + "loss_base2": 2.1756, + "loss_pixel": 0.1674, + "loss_text": 1.3406, + "ppl": 4.5177, + "step": 9109 + }, + { + "epoch": 0.05, + "global_step": 9110, + "learning_rate": 0.00046281302170283806, + "loss": 1.4758, + "loss_base2": 2.1291, + "loss_pixel": 0.1671, + "loss_text": 1.3087, + "ppl": 4.3745, + "step": 9110 + }, + { + "epoch": 0.05, + "global_step": 9111, + "learning_rate": 0.00046280884808013356, + "loss": 1.4095, + "loss_base2": 2.0335, + "loss_pixel": 0.1666, + "loss_text": 1.2429, + "ppl": 4.0939, + "step": 9111 + }, + { + "epoch": 0.05, + "global_step": 9112, + "learning_rate": 0.00046280467445742907, + "loss": 1.4629, + "loss_base2": 2.1105, + "loss_pixel": 0.1662, + "loss_text": 1.2967, + "ppl": 4.3185, + "step": 9112 + }, + { + "epoch": 0.05, + "global_step": 9113, + "learning_rate": 0.0004628005008347245, + "loss": 1.4159, + "loss_base2": 2.0427, + "loss_pixel": 0.1655, + "loss_text": 1.2504, + "ppl": 4.1202, + "step": 9113 + }, + { + "epoch": 0.05, + "global_step": 9114, + "learning_rate": 0.00046279632721202003, + "loss": 1.4126, + "loss_base2": 2.038, + "loss_pixel": 0.1652, + "loss_text": 1.2474, + "ppl": 4.1066, + "step": 9114 + }, + { + "epoch": 0.05, + "global_step": 9115, + "learning_rate": 0.00046279215358931554, + "loss": 1.4233, + "loss_base2": 2.0534, + "loss_pixel": 0.1656, + "loss_text": 1.2577, + "ppl": 4.1508, + "step": 9115 + }, + { + "epoch": 0.05, + "global_step": 9116, + "learning_rate": 0.00046278797996661105, + "loss": 1.4166, + "loss_base2": 2.0437, + "loss_pixel": 0.164, + "loss_text": 1.2526, + "ppl": 4.1231, + "step": 9116 + }, + { + "epoch": 0.05, + "global_step": 9117, + "learning_rate": 0.00046278380634390655, + "loss": 1.4018, + "loss_base2": 2.0224, + "loss_pixel": 0.1666, + "loss_text": 1.2353, + "ppl": 4.0625, + "step": 9117 + }, + { + "epoch": 0.05, + "global_step": 9118, + "learning_rate": 0.000462779632721202, + "loss": 1.4743, + "loss_base2": 2.127, + "loss_pixel": 0.1655, + "loss_text": 1.3088, + "ppl": 4.368, + "step": 9118 + }, + { + "epoch": 0.05, + "global_step": 9119, + "learning_rate": 0.0004627754590984975, + "loss": 1.6047, + "loss_base2": 2.3151, + "loss_pixel": 0.1645, + "loss_text": 1.4403, + "ppl": 4.9764, + "step": 9119 + }, + { + "epoch": 0.05, + "global_step": 9120, + "learning_rate": 0.000462771285475793, + "loss": 1.6506, + "loss_base2": 2.3813, + "loss_pixel": 0.1655, + "loss_text": 1.485, + "ppl": 5.2101, + "step": 9120 + }, + { + "epoch": 0.05, + "global_step": 9121, + "learning_rate": 0.00046276711185308853, + "loss": 1.6395, + "loss_base2": 2.3653, + "loss_pixel": 0.1654, + "loss_text": 1.4742, + "ppl": 5.1526, + "step": 9121 + }, + { + "epoch": 0.05, + "global_step": 9122, + "learning_rate": 0.000462762938230384, + "loss": 1.6442, + "loss_base2": 2.3721, + "loss_pixel": 0.1642, + "loss_text": 1.48, + "ppl": 5.1769, + "step": 9122 + }, + { + "epoch": 0.05, + "global_step": 9123, + "learning_rate": 0.00046275876460767943, + "loss": 1.6394, + "loss_base2": 2.3652, + "loss_pixel": 0.1647, + "loss_text": 1.4747, + "ppl": 5.1521, + "step": 9123 + }, + { + "epoch": 0.05, + "global_step": 9124, + "learning_rate": 0.00046275459098497494, + "loss": 1.6394, + "loss_base2": 2.3652, + "loss_pixel": 0.1656, + "loss_text": 1.4738, + "ppl": 5.1521, + "step": 9124 + }, + { + "epoch": 0.05, + "global_step": 9125, + "learning_rate": 0.00046275041736227045, + "loss": 1.6646, + "loss_base2": 2.4015, + "loss_pixel": 0.1662, + "loss_text": 1.4984, + "ppl": 5.2836, + "step": 9125 + }, + { + "epoch": 0.05, + "global_step": 9126, + "learning_rate": 0.00046274624373956596, + "loss": 1.6194, + "loss_base2": 2.3363, + "loss_pixel": 0.166, + "loss_text": 1.4534, + "ppl": 5.0501, + "step": 9126 + }, + { + "epoch": 0.05, + "global_step": 9127, + "learning_rate": 0.0004627420701168614, + "loss": 1.659, + "loss_base2": 2.3934, + "loss_pixel": 0.1676, + "loss_text": 1.4914, + "ppl": 5.2541, + "step": 9127 + }, + { + "epoch": 0.05, + "global_step": 9128, + "learning_rate": 0.0004627378964941569, + "loss": 1.636, + "loss_base2": 2.3602, + "loss_pixel": 0.1655, + "loss_text": 1.4705, + "ppl": 5.1346, + "step": 9128 + }, + { + "epoch": 0.05, + "global_step": 9129, + "learning_rate": 0.0004627337228714524, + "loss": 1.647, + "loss_base2": 2.3761, + "loss_pixel": 0.1651, + "loss_text": 1.4819, + "ppl": 5.1914, + "step": 9129 + }, + { + "epoch": 0.05, + "global_step": 9130, + "learning_rate": 0.00046272954924874793, + "loss": 1.6286, + "loss_base2": 2.3496, + "loss_pixel": 0.1656, + "loss_text": 1.4631, + "ppl": 5.0967, + "step": 9130 + }, + { + "epoch": 0.05, + "global_step": 9131, + "learning_rate": 0.0004627253756260434, + "loss": 1.6411, + "loss_base2": 2.3676, + "loss_pixel": 0.1658, + "loss_text": 1.4752, + "ppl": 5.1608, + "step": 9131 + }, + { + "epoch": 0.05, + "global_step": 9132, + "learning_rate": 0.0004627212020033389, + "loss": 1.6376, + "loss_base2": 2.3626, + "loss_pixel": 0.1665, + "loss_text": 1.4711, + "ppl": 5.1428, + "step": 9132 + }, + { + "epoch": 0.05, + "global_step": 9133, + "learning_rate": 0.0004627170283806344, + "loss": 1.6448, + "loss_base2": 2.3729, + "loss_pixel": 0.1676, + "loss_text": 1.4772, + "ppl": 5.18, + "step": 9133 + }, + { + "epoch": 0.05, + "global_step": 9134, + "learning_rate": 0.0004627128547579299, + "loss": 1.6387, + "loss_base2": 2.3641, + "loss_pixel": 0.1667, + "loss_text": 1.472, + "ppl": 5.1485, + "step": 9134 + }, + { + "epoch": 0.05, + "global_step": 9135, + "learning_rate": 0.0004627086811352254, + "loss": 1.6057, + "loss_base2": 2.3165, + "loss_pixel": 0.168, + "loss_text": 1.4376, + "ppl": 4.9813, + "step": 9135 + }, + { + "epoch": 0.05, + "global_step": 9136, + "learning_rate": 0.00046270450751252087, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.1704, + "loss_text": 1.4599, + "ppl": 5.1049, + "step": 9136 + }, + { + "epoch": 0.05, + "global_step": 9137, + "learning_rate": 0.0004627003338898164, + "loss": 1.6441, + "loss_base2": 2.3719, + "loss_pixel": 0.1696, + "loss_text": 1.4745, + "ppl": 5.1763, + "step": 9137 + }, + { + "epoch": 0.05, + "global_step": 9138, + "learning_rate": 0.0004626961602671119, + "loss": 1.6357, + "loss_base2": 2.3598, + "loss_pixel": 0.1683, + "loss_text": 1.4674, + "ppl": 5.133, + "step": 9138 + }, + { + "epoch": 0.05, + "global_step": 9139, + "learning_rate": 0.0004626919866444074, + "loss": 1.6447, + "loss_base2": 2.3728, + "loss_pixel": 0.1676, + "loss_text": 1.4771, + "ppl": 5.1795, + "step": 9139 + }, + { + "epoch": 0.05, + "global_step": 9140, + "learning_rate": 0.0004626878130217029, + "loss": 1.6102, + "loss_base2": 2.323, + "loss_pixel": 0.1682, + "loss_text": 1.442, + "ppl": 5.0038, + "step": 9140 + }, + { + "epoch": 0.05, + "global_step": 9141, + "learning_rate": 0.00046268363939899835, + "loss": 1.5804, + "loss_base2": 2.28, + "loss_pixel": 0.1675, + "loss_text": 1.4129, + "ppl": 4.8569, + "step": 9141 + }, + { + "epoch": 0.05, + "global_step": 9142, + "learning_rate": 0.0004626794657762938, + "loss": 1.6557, + "loss_base2": 2.3887, + "loss_pixel": 0.167, + "loss_text": 1.4887, + "ppl": 5.2367, + "step": 9142 + }, + { + "epoch": 0.05, + "global_step": 9143, + "learning_rate": 0.0004626752921535893, + "loss": 1.6408, + "loss_base2": 2.3672, + "loss_pixel": 0.1672, + "loss_text": 1.4736, + "ppl": 5.1593, + "step": 9143 + }, + { + "epoch": 0.05, + "global_step": 9144, + "learning_rate": 0.0004626711185308848, + "loss": 1.6425, + "loss_base2": 2.3696, + "loss_pixel": 0.168, + "loss_text": 1.4744, + "ppl": 5.1681, + "step": 9144 + }, + { + "epoch": 0.05, + "global_step": 9145, + "learning_rate": 0.00046266694490818027, + "loss": 1.6413, + "loss_base2": 2.3679, + "loss_pixel": 0.1677, + "loss_text": 1.4736, + "ppl": 5.1619, + "step": 9145 + }, + { + "epoch": 0.05, + "global_step": 9146, + "learning_rate": 0.0004626627712854758, + "loss": 1.6466, + "loss_base2": 2.3755, + "loss_pixel": 0.1663, + "loss_text": 1.4804, + "ppl": 5.1893, + "step": 9146 + }, + { + "epoch": 0.05, + "global_step": 9147, + "learning_rate": 0.0004626585976627713, + "loss": 1.6431, + "loss_base2": 2.3705, + "loss_pixel": 0.1651, + "loss_text": 1.478, + "ppl": 5.1712, + "step": 9147 + }, + { + "epoch": 0.05, + "global_step": 9148, + "learning_rate": 0.0004626544240400668, + "loss": 1.6309, + "loss_base2": 2.3529, + "loss_pixel": 0.1608, + "loss_text": 1.4701, + "ppl": 5.1085, + "step": 9148 + }, + { + "epoch": 0.05, + "global_step": 9149, + "learning_rate": 0.0004626502504173623, + "loss": 1.641, + "loss_base2": 2.3675, + "loss_pixel": 0.1589, + "loss_text": 1.4821, + "ppl": 5.1603, + "step": 9149 + }, + { + "epoch": 0.05, + "global_step": 9150, + "learning_rate": 0.00046264607679465775, + "loss": 1.6234, + "loss_base2": 2.3421, + "loss_pixel": 0.1584, + "loss_text": 1.465, + "ppl": 5.0703, + "step": 9150 + }, + { + "epoch": 0.05, + "global_step": 9151, + "learning_rate": 0.00046264190317195326, + "loss": 1.6224, + "loss_base2": 2.3406, + "loss_pixel": 0.1604, + "loss_text": 1.462, + "ppl": 5.0652, + "step": 9151 + }, + { + "epoch": 0.05, + "global_step": 9152, + "learning_rate": 0.00046263772954924877, + "loss": 1.6464, + "loss_base2": 2.3753, + "loss_pixel": 0.1594, + "loss_text": 1.487, + "ppl": 5.1883, + "step": 9152 + }, + { + "epoch": 0.05, + "global_step": 9153, + "learning_rate": 0.0004626335559265443, + "loss": 1.6176, + "loss_base2": 2.3337, + "loss_pixel": 0.157, + "loss_text": 1.4605, + "ppl": 5.041, + "step": 9153 + }, + { + "epoch": 0.05, + "global_step": 9154, + "learning_rate": 0.00046262938230383973, + "loss": 1.6221, + "loss_base2": 2.3402, + "loss_pixel": 0.1574, + "loss_text": 1.4646, + "ppl": 5.0637, + "step": 9154 + }, + { + "epoch": 0.05, + "global_step": 9155, + "learning_rate": 0.00046262520868113523, + "loss": 1.6236, + "loss_base2": 2.3424, + "loss_pixel": 0.1592, + "loss_text": 1.4645, + "ppl": 5.0713, + "step": 9155 + }, + { + "epoch": 0.05, + "global_step": 9156, + "learning_rate": 0.00046262103505843074, + "loss": 1.6224, + "loss_base2": 2.3406, + "loss_pixel": 0.1591, + "loss_text": 1.4633, + "ppl": 5.0652, + "step": 9156 + }, + { + "epoch": 0.05, + "global_step": 9157, + "learning_rate": 0.00046261686143572625, + "loss": 1.6182, + "loss_base2": 2.3346, + "loss_pixel": 0.157, + "loss_text": 1.4611, + "ppl": 5.044, + "step": 9157 + }, + { + "epoch": 0.05, + "global_step": 9158, + "learning_rate": 0.00046261268781302176, + "loss": 1.6344, + "loss_base2": 2.3579, + "loss_pixel": 0.1555, + "loss_text": 1.4789, + "ppl": 5.1264, + "step": 9158 + }, + { + "epoch": 0.05, + "global_step": 9159, + "learning_rate": 0.0004626085141903172, + "loss": 1.617, + "loss_base2": 2.3328, + "loss_pixel": 0.1578, + "loss_text": 1.4592, + "ppl": 5.038, + "step": 9159 + }, + { + "epoch": 0.05, + "global_step": 9160, + "learning_rate": 0.0004626043405676127, + "loss": 1.6192, + "loss_base2": 2.336, + "loss_pixel": 0.1569, + "loss_text": 1.4623, + "ppl": 5.049, + "step": 9160 + }, + { + "epoch": 0.05, + "global_step": 9161, + "learning_rate": 0.00046260016694490817, + "loss": 1.6327, + "loss_base2": 2.3555, + "loss_pixel": 0.1585, + "loss_text": 1.4741, + "ppl": 5.1177, + "step": 9161 + }, + { + "epoch": 0.05, + "global_step": 9162, + "learning_rate": 0.0004625959933222037, + "loss": 1.6333, + "loss_base2": 2.3564, + "loss_pixel": 0.1561, + "loss_text": 1.4772, + "ppl": 5.1207, + "step": 9162 + }, + { + "epoch": 0.05, + "global_step": 9163, + "learning_rate": 0.00046259181969949913, + "loss": 1.6541, + "loss_base2": 2.3864, + "loss_pixel": 0.1694, + "loss_text": 1.4847, + "ppl": 5.2284, + "step": 9163 + }, + { + "epoch": 0.05, + "global_step": 9164, + "learning_rate": 0.00046258764607679464, + "loss": 1.6519, + "loss_base2": 2.3832, + "loss_pixel": 0.1669, + "loss_text": 1.485, + "ppl": 5.2169, + "step": 9164 + }, + { + "epoch": 0.05, + "global_step": 9165, + "learning_rate": 0.00046258347245409015, + "loss": 1.6307, + "loss_base2": 2.3526, + "loss_pixel": 0.1667, + "loss_text": 1.464, + "ppl": 5.1074, + "step": 9165 + }, + { + "epoch": 0.05, + "global_step": 9166, + "learning_rate": 0.00046257929883138565, + "loss": 1.6067, + "loss_base2": 2.318, + "loss_pixel": 0.1686, + "loss_text": 1.4381, + "ppl": 4.9863, + "step": 9166 + }, + { + "epoch": 0.05, + "global_step": 9167, + "learning_rate": 0.00046257512520868116, + "loss": 1.6385, + "loss_base2": 2.3639, + "loss_pixel": 0.1676, + "loss_text": 1.4709, + "ppl": 5.1474, + "step": 9167 + }, + { + "epoch": 0.05, + "global_step": 9168, + "learning_rate": 0.0004625709515859766, + "loss": 1.6324, + "loss_base2": 2.3551, + "loss_pixel": 0.1657, + "loss_text": 1.4667, + "ppl": 5.1161, + "step": 9168 + }, + { + "epoch": 0.05, + "global_step": 9169, + "learning_rate": 0.0004625667779632721, + "loss": 1.63, + "loss_base2": 2.3516, + "loss_pixel": 0.1655, + "loss_text": 1.4645, + "ppl": 5.1039, + "step": 9169 + }, + { + "epoch": 0.05, + "global_step": 9170, + "learning_rate": 0.00046256260434056763, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.1653, + "loss_text": 1.4611, + "ppl": 5.0855, + "step": 9170 + }, + { + "epoch": 0.05, + "global_step": 9171, + "learning_rate": 0.00046255843071786313, + "loss": 1.638, + "loss_base2": 2.3631, + "loss_pixel": 0.1666, + "loss_text": 1.4714, + "ppl": 5.1449, + "step": 9171 + }, + { + "epoch": 0.05, + "global_step": 9172, + "learning_rate": 0.0004625542570951586, + "loss": 1.632, + "loss_base2": 2.3545, + "loss_pixel": 0.1654, + "loss_text": 1.4665, + "ppl": 5.1141, + "step": 9172 + }, + { + "epoch": 0.05, + "global_step": 9173, + "learning_rate": 0.0004625500834724541, + "loss": 1.6432, + "loss_base2": 2.3706, + "loss_pixel": 0.1669, + "loss_text": 1.4763, + "ppl": 5.1717, + "step": 9173 + }, + { + "epoch": 0.05, + "global_step": 9174, + "learning_rate": 0.0004625459098497496, + "loss": 1.6294, + "loss_base2": 2.3507, + "loss_pixel": 0.1656, + "loss_text": 1.4639, + "ppl": 5.1008, + "step": 9174 + }, + { + "epoch": 0.05, + "global_step": 9175, + "learning_rate": 0.0004625417362270451, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1661, + "loss_text": 1.4599, + "ppl": 5.0835, + "step": 9175 + }, + { + "epoch": 0.05, + "global_step": 9176, + "learning_rate": 0.0004625375626043406, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.1667, + "loss_text": 1.4616, + "ppl": 5.0952, + "step": 9176 + }, + { + "epoch": 0.05, + "global_step": 9177, + "learning_rate": 0.00046253338898163607, + "loss": 1.6346, + "loss_base2": 2.3582, + "loss_pixel": 0.1666, + "loss_text": 1.4679, + "ppl": 5.1274, + "step": 9177 + }, + { + "epoch": 0.05, + "global_step": 9178, + "learning_rate": 0.0004625292153589316, + "loss": 1.6472, + "loss_base2": 2.3764, + "loss_pixel": 0.1671, + "loss_text": 1.4801, + "ppl": 5.1924, + "step": 9178 + }, + { + "epoch": 0.05, + "global_step": 9179, + "learning_rate": 0.0004625250417362271, + "loss": 1.6514, + "loss_base2": 2.3825, + "loss_pixel": 0.1675, + "loss_text": 1.484, + "ppl": 5.2143, + "step": 9179 + }, + { + "epoch": 0.05, + "global_step": 9180, + "learning_rate": 0.00046252086811352254, + "loss": 1.6448, + "loss_base2": 2.3729, + "loss_pixel": 0.1676, + "loss_text": 1.4772, + "ppl": 5.18, + "step": 9180 + }, + { + "epoch": 0.05, + "global_step": 9181, + "learning_rate": 0.000462516694490818, + "loss": 1.6291, + "loss_base2": 2.3503, + "loss_pixel": 0.1672, + "loss_text": 1.4619, + "ppl": 5.0993, + "step": 9181 + }, + { + "epoch": 0.05, + "global_step": 9182, + "learning_rate": 0.0004625125208681135, + "loss": 1.6519, + "loss_base2": 2.3832, + "loss_pixel": 0.1675, + "loss_text": 1.4844, + "ppl": 5.2169, + "step": 9182 + }, + { + "epoch": 0.05, + "global_step": 9183, + "learning_rate": 0.000462508347245409, + "loss": 1.6255, + "loss_base2": 2.3451, + "loss_pixel": 0.1665, + "loss_text": 1.459, + "ppl": 5.081, + "step": 9183 + }, + { + "epoch": 0.05, + "global_step": 9184, + "learning_rate": 0.0004625041736227045, + "loss": 1.64, + "loss_base2": 2.366, + "loss_pixel": 0.1663, + "loss_text": 1.4737, + "ppl": 5.1552, + "step": 9184 + }, + { + "epoch": 0.05, + "global_step": 9185, + "learning_rate": 0.0004625, + "loss": 1.6412, + "loss_base2": 2.3678, + "loss_pixel": 0.1675, + "loss_text": 1.4737, + "ppl": 5.1614, + "step": 9185 + }, + { + "epoch": 0.05, + "global_step": 9186, + "learning_rate": 0.0004624958263772955, + "loss": 1.6418, + "loss_base2": 2.3686, + "loss_pixel": 0.166, + "loss_text": 1.4758, + "ppl": 5.1645, + "step": 9186 + }, + { + "epoch": 0.05, + "global_step": 9187, + "learning_rate": 0.000462491652754591, + "loss": 1.4616, + "loss_base2": 2.1086, + "loss_pixel": 0.1669, + "loss_text": 1.2948, + "ppl": 4.3129, + "step": 9187 + }, + { + "epoch": 0.05, + "global_step": 9188, + "learning_rate": 0.0004624874791318865, + "loss": 1.4258, + "loss_base2": 2.057, + "loss_pixel": 0.165, + "loss_text": 1.2608, + "ppl": 4.1612, + "step": 9188 + }, + { + "epoch": 0.05, + "global_step": 9189, + "learning_rate": 0.000462483305509182, + "loss": 1.4452, + "loss_base2": 2.085, + "loss_pixel": 0.1662, + "loss_text": 1.279, + "ppl": 4.2427, + "step": 9189 + }, + { + "epoch": 0.05, + "global_step": 9190, + "learning_rate": 0.00046247913188647745, + "loss": 1.432, + "loss_base2": 2.0659, + "loss_pixel": 0.1662, + "loss_text": 1.2658, + "ppl": 4.1871, + "step": 9190 + }, + { + "epoch": 0.05, + "global_step": 9191, + "learning_rate": 0.00046247495826377296, + "loss": 1.4114, + "loss_base2": 2.0362, + "loss_pixel": 0.1642, + "loss_text": 1.2472, + "ppl": 4.1017, + "step": 9191 + }, + { + "epoch": 0.05, + "global_step": 9192, + "learning_rate": 0.00046247078464106846, + "loss": 1.4246, + "loss_base2": 2.0553, + "loss_pixel": 0.1655, + "loss_text": 1.2591, + "ppl": 4.1562, + "step": 9192 + }, + { + "epoch": 0.05, + "global_step": 9193, + "learning_rate": 0.00046246661101836397, + "loss": 1.428, + "loss_base2": 2.0602, + "loss_pixel": 0.1677, + "loss_text": 1.2603, + "ppl": 4.1704, + "step": 9193 + }, + { + "epoch": 0.05, + "global_step": 9194, + "learning_rate": 0.0004624624373956595, + "loss": 1.6444, + "loss_base2": 2.3724, + "loss_pixel": 0.1645, + "loss_text": 1.4799, + "ppl": 5.1779, + "step": 9194 + }, + { + "epoch": 0.05, + "global_step": 9195, + "learning_rate": 0.00046245826377295493, + "loss": 1.6313, + "loss_base2": 2.3535, + "loss_pixel": 0.1652, + "loss_text": 1.4661, + "ppl": 5.1105, + "step": 9195 + }, + { + "epoch": 0.05, + "global_step": 9196, + "learning_rate": 0.00046245409015025044, + "loss": 1.6433, + "loss_base2": 2.3708, + "loss_pixel": 0.1655, + "loss_text": 1.4778, + "ppl": 5.1722, + "step": 9196 + }, + { + "epoch": 0.05, + "global_step": 9197, + "learning_rate": 0.00046244991652754595, + "loss": 1.6505, + "loss_base2": 2.3812, + "loss_pixel": 0.1651, + "loss_text": 1.4854, + "ppl": 5.2096, + "step": 9197 + }, + { + "epoch": 0.05, + "global_step": 9198, + "learning_rate": 0.00046244574290484145, + "loss": 1.6677, + "loss_base2": 2.406, + "loss_pixel": 0.1653, + "loss_text": 1.5025, + "ppl": 5.3, + "step": 9198 + }, + { + "epoch": 0.05, + "global_step": 9199, + "learning_rate": 0.0004624415692821369, + "loss": 1.6389, + "loss_base2": 2.3644, + "loss_pixel": 0.1648, + "loss_text": 1.4741, + "ppl": 5.1495, + "step": 9199 + }, + { + "epoch": 0.05, + "global_step": 9200, + "learning_rate": 0.00046243739565943236, + "loss": 1.6588, + "loss_base2": 2.3931, + "loss_pixel": 0.1645, + "loss_text": 1.4943, + "ppl": 5.253, + "step": 9200 + }, + { + "epoch": 0.05, + "global_step": 9201, + "learning_rate": 0.00046243322203672787, + "loss": 1.6468, + "loss_base2": 2.3758, + "loss_pixel": 0.1653, + "loss_text": 1.4815, + "ppl": 5.1903, + "step": 9201 + }, + { + "epoch": 0.05, + "global_step": 9202, + "learning_rate": 0.0004624290484140234, + "loss": 1.6345, + "loss_base2": 2.3581, + "loss_pixel": 0.1655, + "loss_text": 1.469, + "ppl": 5.1269, + "step": 9202 + }, + { + "epoch": 0.05, + "global_step": 9203, + "learning_rate": 0.0004624248747913189, + "loss": 1.6589, + "loss_base2": 2.3933, + "loss_pixel": 0.1649, + "loss_text": 1.494, + "ppl": 5.2535, + "step": 9203 + }, + { + "epoch": 0.05, + "global_step": 9204, + "learning_rate": 0.00046242070116861433, + "loss": 1.6429, + "loss_base2": 2.3702, + "loss_pixel": 0.165, + "loss_text": 1.4779, + "ppl": 5.1701, + "step": 9204 + }, + { + "epoch": 0.05, + "global_step": 9205, + "learning_rate": 0.00046241652754590984, + "loss": 1.6171, + "loss_base2": 2.333, + "loss_pixel": 0.1628, + "loss_text": 1.4543, + "ppl": 5.0385, + "step": 9205 + }, + { + "epoch": 0.05, + "global_step": 9206, + "learning_rate": 0.00046241235392320535, + "loss": 1.6316, + "loss_base2": 2.3539, + "loss_pixel": 0.1634, + "loss_text": 1.4682, + "ppl": 5.112, + "step": 9206 + }, + { + "epoch": 0.05, + "global_step": 9207, + "learning_rate": 0.00046240818030050086, + "loss": 1.6218, + "loss_base2": 2.3398, + "loss_pixel": 0.1636, + "loss_text": 1.4583, + "ppl": 5.0622, + "step": 9207 + }, + { + "epoch": 0.05, + "global_step": 9208, + "learning_rate": 0.00046240400667779636, + "loss": 1.6455, + "loss_base2": 2.374, + "loss_pixel": 0.1655, + "loss_text": 1.4801, + "ppl": 5.1836, + "step": 9208 + }, + { + "epoch": 0.05, + "global_step": 9209, + "learning_rate": 0.0004623998330550918, + "loss": 1.6511, + "loss_base2": 2.382, + "loss_pixel": 0.1649, + "loss_text": 1.4862, + "ppl": 5.2127, + "step": 9209 + }, + { + "epoch": 0.05, + "global_step": 9210, + "learning_rate": 0.0004623956594323873, + "loss": 1.6374, + "loss_base2": 2.3623, + "loss_pixel": 0.1632, + "loss_text": 1.4743, + "ppl": 5.1418, + "step": 9210 + }, + { + "epoch": 0.05, + "global_step": 9211, + "learning_rate": 0.00046239148580968283, + "loss": 1.6469, + "loss_base2": 2.376, + "loss_pixel": 0.1645, + "loss_text": 1.4824, + "ppl": 5.1909, + "step": 9211 + }, + { + "epoch": 0.05, + "global_step": 9212, + "learning_rate": 0.00046238731218697834, + "loss": 1.6339, + "loss_base2": 2.3572, + "loss_pixel": 0.1645, + "loss_text": 1.4694, + "ppl": 5.1238, + "step": 9212 + }, + { + "epoch": 0.05, + "global_step": 9213, + "learning_rate": 0.0004623831385642738, + "loss": 1.6405, + "loss_base2": 2.3667, + "loss_pixel": 0.1651, + "loss_text": 1.4754, + "ppl": 5.1577, + "step": 9213 + }, + { + "epoch": 0.05, + "global_step": 9214, + "learning_rate": 0.0004623789649415693, + "loss": 1.6296, + "loss_base2": 2.351, + "loss_pixel": 0.1651, + "loss_text": 1.4645, + "ppl": 5.1018, + "step": 9214 + }, + { + "epoch": 0.05, + "global_step": 9215, + "learning_rate": 0.0004623747913188648, + "loss": 1.6505, + "loss_base2": 2.3812, + "loss_pixel": 0.1658, + "loss_text": 1.4847, + "ppl": 5.2096, + "step": 9215 + }, + { + "epoch": 0.05, + "global_step": 9216, + "learning_rate": 0.0004623706176961603, + "loss": 1.6415, + "loss_base2": 2.3682, + "loss_pixel": 0.1652, + "loss_text": 1.4763, + "ppl": 5.1629, + "step": 9216 + }, + { + "epoch": 0.05, + "global_step": 9217, + "learning_rate": 0.0004623664440734558, + "loss": 1.4509, + "loss_base2": 2.0932, + "loss_pixel": 0.1638, + "loss_text": 1.2871, + "ppl": 4.267, + "step": 9217 + }, + { + "epoch": 0.05, + "global_step": 9218, + "learning_rate": 0.0004623622704507512, + "loss": 1.4225, + "loss_base2": 2.0522, + "loss_pixel": 0.1649, + "loss_text": 1.2577, + "ppl": 4.1475, + "step": 9218 + }, + { + "epoch": 0.05, + "global_step": 9219, + "learning_rate": 0.00046235809682804673, + "loss": 1.4258, + "loss_base2": 2.057, + "loss_pixel": 0.1647, + "loss_text": 1.2612, + "ppl": 4.1612, + "step": 9219 + }, + { + "epoch": 0.05, + "global_step": 9220, + "learning_rate": 0.00046235392320534223, + "loss": 1.4574, + "loss_base2": 2.1026, + "loss_pixel": 0.1663, + "loss_text": 1.291, + "ppl": 4.2948, + "step": 9220 + }, + { + "epoch": 0.05, + "global_step": 9221, + "learning_rate": 0.00046234974958263774, + "loss": 1.4233, + "loss_base2": 2.0534, + "loss_pixel": 0.1642, + "loss_text": 1.2591, + "ppl": 4.1508, + "step": 9221 + }, + { + "epoch": 0.05, + "global_step": 9222, + "learning_rate": 0.0004623455759599332, + "loss": 1.436, + "loss_base2": 2.0717, + "loss_pixel": 0.1638, + "loss_text": 1.2723, + "ppl": 4.2038, + "step": 9222 + }, + { + "epoch": 0.05, + "global_step": 9223, + "learning_rate": 0.0004623414023372287, + "loss": 1.4013, + "loss_base2": 2.0216, + "loss_pixel": 0.1595, + "loss_text": 1.2418, + "ppl": 4.0605, + "step": 9223 + }, + { + "epoch": 0.05, + "global_step": 9224, + "learning_rate": 0.0004623372287145242, + "loss": 1.4141, + "loss_base2": 2.0401, + "loss_pixel": 0.1573, + "loss_text": 1.2568, + "ppl": 4.1128, + "step": 9224 + }, + { + "epoch": 0.05, + "global_step": 9225, + "learning_rate": 0.0004623330550918197, + "loss": 1.422, + "loss_base2": 2.0515, + "loss_pixel": 0.1586, + "loss_text": 1.2634, + "ppl": 4.1454, + "step": 9225 + }, + { + "epoch": 0.05, + "global_step": 9226, + "learning_rate": 0.0004623288814691152, + "loss": 1.4035, + "loss_base2": 2.0248, + "loss_pixel": 0.1595, + "loss_text": 1.2439, + "ppl": 4.0694, + "step": 9226 + }, + { + "epoch": 0.05, + "global_step": 9227, + "learning_rate": 0.0004623247078464107, + "loss": 1.3948, + "loss_base2": 2.0123, + "loss_pixel": 0.1544, + "loss_text": 1.2404, + "ppl": 4.0342, + "step": 9227 + }, + { + "epoch": 0.05, + "global_step": 9228, + "learning_rate": 0.0004623205342237062, + "loss": 1.4149, + "loss_base2": 2.0413, + "loss_pixel": 0.1574, + "loss_text": 1.2575, + "ppl": 4.1161, + "step": 9228 + }, + { + "epoch": 0.05, + "global_step": 9229, + "learning_rate": 0.0004623163606010017, + "loss": 1.415, + "loss_base2": 2.0414, + "loss_pixel": 0.1565, + "loss_text": 1.2585, + "ppl": 4.1165, + "step": 9229 + }, + { + "epoch": 0.05, + "global_step": 9230, + "learning_rate": 0.0004623121869782972, + "loss": 1.405, + "loss_base2": 2.027, + "loss_pixel": 0.1545, + "loss_text": 1.2505, + "ppl": 4.0755, + "step": 9230 + }, + { + "epoch": 0.05, + "global_step": 9231, + "learning_rate": 0.00046230801335559265, + "loss": 1.4309, + "loss_base2": 2.0644, + "loss_pixel": 0.156, + "loss_text": 1.2749, + "ppl": 4.1825, + "step": 9231 + }, + { + "epoch": 0.05, + "global_step": 9232, + "learning_rate": 0.00046230383973288816, + "loss": 1.4208, + "loss_base2": 2.0498, + "loss_pixel": 0.1553, + "loss_text": 1.2655, + "ppl": 4.1404, + "step": 9232 + }, + { + "epoch": 0.05, + "global_step": 9233, + "learning_rate": 0.00046229966611018367, + "loss": 1.3943, + "loss_base2": 2.0115, + "loss_pixel": 0.156, + "loss_text": 1.2382, + "ppl": 4.0322, + "step": 9233 + }, + { + "epoch": 0.05, + "global_step": 9234, + "learning_rate": 0.0004622954924874792, + "loss": 1.4212, + "loss_base2": 2.0504, + "loss_pixel": 0.156, + "loss_text": 1.2652, + "ppl": 4.1421, + "step": 9234 + }, + { + "epoch": 0.05, + "global_step": 9235, + "learning_rate": 0.0004622913188647747, + "loss": 1.4014, + "loss_base2": 2.0218, + "loss_pixel": 0.1541, + "loss_text": 1.2473, + "ppl": 4.0609, + "step": 9235 + }, + { + "epoch": 0.05, + "global_step": 9236, + "learning_rate": 0.0004622871452420701, + "loss": 1.4167, + "loss_base2": 2.0439, + "loss_pixel": 0.1568, + "loss_text": 1.2599, + "ppl": 4.1235, + "step": 9236 + }, + { + "epoch": 0.05, + "global_step": 9237, + "learning_rate": 0.0004622829716193656, + "loss": 1.4092, + "loss_base2": 2.033, + "loss_pixel": 0.1569, + "loss_text": 1.2523, + "ppl": 4.0927, + "step": 9237 + }, + { + "epoch": 0.05, + "global_step": 9238, + "learning_rate": 0.0004622787979966611, + "loss": 1.4157, + "loss_base2": 2.0424, + "loss_pixel": 0.1539, + "loss_text": 1.2618, + "ppl": 4.1194, + "step": 9238 + }, + { + "epoch": 0.05, + "global_step": 9239, + "learning_rate": 0.0004622746243739566, + "loss": 1.432, + "loss_base2": 2.0659, + "loss_pixel": 0.1641, + "loss_text": 1.2679, + "ppl": 4.1871, + "step": 9239 + }, + { + "epoch": 0.05, + "global_step": 9240, + "learning_rate": 0.00046227045075125206, + "loss": 1.4258, + "loss_base2": 2.057, + "loss_pixel": 0.166, + "loss_text": 1.2598, + "ppl": 4.1612, + "step": 9240 + }, + { + "epoch": 0.05, + "global_step": 9241, + "learning_rate": 0.00046226627712854756, + "loss": 1.4168, + "loss_base2": 2.044, + "loss_pixel": 0.1679, + "loss_text": 1.2489, + "ppl": 4.1239, + "step": 9241 + }, + { + "epoch": 0.05, + "global_step": 9242, + "learning_rate": 0.00046226210350584307, + "loss": 1.4222, + "loss_base2": 2.0518, + "loss_pixel": 0.1657, + "loss_text": 1.2564, + "ppl": 4.1462, + "step": 9242 + }, + { + "epoch": 0.05, + "global_step": 9243, + "learning_rate": 0.0004622579298831386, + "loss": 1.4092, + "loss_base2": 2.033, + "loss_pixel": 0.1657, + "loss_text": 1.2436, + "ppl": 4.0927, + "step": 9243 + }, + { + "epoch": 0.05, + "global_step": 9244, + "learning_rate": 0.0004622537562604341, + "loss": 1.4138, + "loss_base2": 2.0397, + "loss_pixel": 0.1665, + "loss_text": 1.2473, + "ppl": 4.1115, + "step": 9244 + }, + { + "epoch": 0.05, + "global_step": 9245, + "learning_rate": 0.00046224958263772954, + "loss": 1.4204, + "loss_base2": 2.0492, + "loss_pixel": 0.1649, + "loss_text": 1.2555, + "ppl": 4.1388, + "step": 9245 + }, + { + "epoch": 0.05, + "global_step": 9246, + "learning_rate": 0.00046224540901502505, + "loss": 1.4196, + "loss_base2": 2.048, + "loss_pixel": 0.1658, + "loss_text": 1.2538, + "ppl": 4.1355, + "step": 9246 + }, + { + "epoch": 0.05, + "global_step": 9247, + "learning_rate": 0.00046224123539232055, + "loss": 1.4101, + "loss_base2": 2.0343, + "loss_pixel": 0.1646, + "loss_text": 1.2455, + "ppl": 4.0964, + "step": 9247 + }, + { + "epoch": 0.05, + "global_step": 9248, + "learning_rate": 0.00046223706176961606, + "loss": 1.4088, + "loss_base2": 2.0325, + "loss_pixel": 0.1646, + "loss_text": 1.2441, + "ppl": 4.091, + "step": 9248 + }, + { + "epoch": 0.05, + "global_step": 9249, + "learning_rate": 0.00046223288814691157, + "loss": 1.5921, + "loss_base2": 2.2969, + "loss_pixel": 0.165, + "loss_text": 1.427, + "ppl": 4.9141, + "step": 9249 + }, + { + "epoch": 0.05, + "global_step": 9250, + "learning_rate": 0.000462228714524207, + "loss": 1.6706, + "loss_base2": 2.4102, + "loss_pixel": 0.1684, + "loss_text": 1.5022, + "ppl": 5.3154, + "step": 9250 + }, + { + "epoch": 0.05, + "global_step": 9251, + "learning_rate": 0.00046222454090150253, + "loss": 1.6619, + "loss_base2": 2.3976, + "loss_pixel": 0.1665, + "loss_text": 1.4954, + "ppl": 5.2693, + "step": 9251 + }, + { + "epoch": 0.05, + "global_step": 9252, + "learning_rate": 0.00046222036727879804, + "loss": 1.6491, + "loss_base2": 2.3791, + "loss_pixel": 0.166, + "loss_text": 1.4832, + "ppl": 5.2023, + "step": 9252 + }, + { + "epoch": 0.05, + "global_step": 9253, + "learning_rate": 0.00046221619365609354, + "loss": 1.6646, + "loss_base2": 2.4015, + "loss_pixel": 0.1649, + "loss_text": 1.4997, + "ppl": 5.2836, + "step": 9253 + }, + { + "epoch": 0.05, + "global_step": 9254, + "learning_rate": 0.000462212020033389, + "loss": 1.6537, + "loss_base2": 2.3858, + "loss_pixel": 0.1673, + "loss_text": 1.4864, + "ppl": 5.2263, + "step": 9254 + }, + { + "epoch": 0.05, + "global_step": 9255, + "learning_rate": 0.00046220784641068445, + "loss": 1.6527, + "loss_base2": 2.3843, + "loss_pixel": 0.1658, + "loss_text": 1.4869, + "ppl": 5.2211, + "step": 9255 + }, + { + "epoch": 0.05, + "global_step": 9256, + "learning_rate": 0.00046220367278797996, + "loss": 1.6383, + "loss_base2": 2.3636, + "loss_pixel": 0.1652, + "loss_text": 1.4731, + "ppl": 5.1464, + "step": 9256 + }, + { + "epoch": 0.05, + "global_step": 9257, + "learning_rate": 0.00046219949916527546, + "loss": 1.636, + "loss_base2": 2.3602, + "loss_pixel": 0.1658, + "loss_text": 1.4702, + "ppl": 5.1346, + "step": 9257 + }, + { + "epoch": 0.05, + "global_step": 9258, + "learning_rate": 0.00046219532554257097, + "loss": 1.6279, + "loss_base2": 2.3486, + "loss_pixel": 0.1659, + "loss_text": 1.4621, + "ppl": 5.0932, + "step": 9258 + }, + { + "epoch": 0.05, + "global_step": 9259, + "learning_rate": 0.0004621911519198664, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.1671, + "loss_text": 1.4631, + "ppl": 5.1049, + "step": 9259 + }, + { + "epoch": 0.05, + "global_step": 9260, + "learning_rate": 0.00046218697829716193, + "loss": 1.6404, + "loss_base2": 2.3666, + "loss_pixel": 0.166, + "loss_text": 1.4744, + "ppl": 5.1572, + "step": 9260 + }, + { + "epoch": 0.05, + "global_step": 9261, + "learning_rate": 0.00046218280467445744, + "loss": 1.6376, + "loss_base2": 2.3626, + "loss_pixel": 0.1649, + "loss_text": 1.4727, + "ppl": 5.1428, + "step": 9261 + }, + { + "epoch": 0.05, + "global_step": 9262, + "learning_rate": 0.00046217863105175295, + "loss": 1.6417, + "loss_base2": 2.3685, + "loss_pixel": 0.1663, + "loss_text": 1.4754, + "ppl": 5.1639, + "step": 9262 + }, + { + "epoch": 0.05, + "global_step": 9263, + "learning_rate": 0.0004621744574290484, + "loss": 1.6496, + "loss_base2": 2.3799, + "loss_pixel": 0.1645, + "loss_text": 1.4852, + "ppl": 5.2049, + "step": 9263 + }, + { + "epoch": 0.05, + "global_step": 9264, + "learning_rate": 0.0004621702838063439, + "loss": 1.6282, + "loss_base2": 2.349, + "loss_pixel": 0.1652, + "loss_text": 1.463, + "ppl": 5.0947, + "step": 9264 + }, + { + "epoch": 0.05, + "global_step": 9265, + "learning_rate": 0.0004621661101836394, + "loss": 1.6155, + "loss_base2": 2.3307, + "loss_pixel": 0.1649, + "loss_text": 1.4505, + "ppl": 5.0304, + "step": 9265 + }, + { + "epoch": 0.05, + "global_step": 9266, + "learning_rate": 0.0004621619365609349, + "loss": 1.638, + "loss_base2": 2.3631, + "loss_pixel": 0.1661, + "loss_text": 1.4719, + "ppl": 5.1449, + "step": 9266 + }, + { + "epoch": 0.05, + "global_step": 9267, + "learning_rate": 0.00046215776293823043, + "loss": 1.6473, + "loss_base2": 2.3766, + "loss_pixel": 0.1637, + "loss_text": 1.4836, + "ppl": 5.1929, + "step": 9267 + }, + { + "epoch": 0.05, + "global_step": 9268, + "learning_rate": 0.0004621535893155259, + "loss": 1.6361, + "loss_base2": 2.3604, + "loss_pixel": 0.165, + "loss_text": 1.4711, + "ppl": 5.1351, + "step": 9268 + }, + { + "epoch": 0.05, + "global_step": 9269, + "learning_rate": 0.0004621494156928214, + "loss": 1.6078, + "loss_base2": 2.3196, + "loss_pixel": 0.1642, + "loss_text": 1.4436, + "ppl": 4.9918, + "step": 9269 + }, + { + "epoch": 0.05, + "global_step": 9270, + "learning_rate": 0.0004621452420701169, + "loss": 1.6357, + "loss_base2": 2.3598, + "loss_pixel": 0.1657, + "loss_text": 1.47, + "ppl": 5.133, + "step": 9270 + }, + { + "epoch": 0.05, + "global_step": 9271, + "learning_rate": 0.0004621410684474124, + "loss": 1.6232, + "loss_base2": 2.3418, + "loss_pixel": 0.1639, + "loss_text": 1.4593, + "ppl": 5.0693, + "step": 9271 + }, + { + "epoch": 0.05, + "global_step": 9272, + "learning_rate": 0.00046213689482470786, + "loss": 1.6494, + "loss_base2": 2.3796, + "loss_pixel": 0.164, + "loss_text": 1.4853, + "ppl": 5.2039, + "step": 9272 + }, + { + "epoch": 0.05, + "global_step": 9273, + "learning_rate": 0.00046213272120200336, + "loss": 1.6431, + "loss_base2": 2.3705, + "loss_pixel": 0.1633, + "loss_text": 1.4798, + "ppl": 5.1712, + "step": 9273 + }, + { + "epoch": 0.05, + "global_step": 9274, + "learning_rate": 0.0004621285475792988, + "loss": 1.653, + "loss_base2": 2.3848, + "loss_pixel": 0.1643, + "loss_text": 1.4888, + "ppl": 5.2226, + "step": 9274 + }, + { + "epoch": 0.05, + "global_step": 9275, + "learning_rate": 0.0004621243739565943, + "loss": 1.6421, + "loss_base2": 2.369, + "loss_pixel": 0.165, + "loss_text": 1.4771, + "ppl": 5.166, + "step": 9275 + }, + { + "epoch": 0.05, + "global_step": 9276, + "learning_rate": 0.00046212020033388983, + "loss": 1.6359, + "loss_base2": 2.3601, + "loss_pixel": 0.1631, + "loss_text": 1.4727, + "ppl": 5.1341, + "step": 9276 + }, + { + "epoch": 0.05, + "global_step": 9277, + "learning_rate": 0.0004621160267111853, + "loss": 1.6364, + "loss_base2": 2.3608, + "loss_pixel": 0.1644, + "loss_text": 1.4719, + "ppl": 5.1366, + "step": 9277 + }, + { + "epoch": 0.05, + "global_step": 9278, + "learning_rate": 0.0004621118530884808, + "loss": 1.6206, + "loss_base2": 2.338, + "loss_pixel": 0.1644, + "loss_text": 1.4562, + "ppl": 5.0561, + "step": 9278 + }, + { + "epoch": 0.05, + "global_step": 9279, + "learning_rate": 0.0004621076794657763, + "loss": 1.6367, + "loss_base2": 2.3613, + "loss_pixel": 0.1653, + "loss_text": 1.4715, + "ppl": 5.1382, + "step": 9279 + }, + { + "epoch": 0.05, + "global_step": 9280, + "learning_rate": 0.0004621035058430718, + "loss": 1.6483, + "loss_base2": 2.378, + "loss_pixel": 0.1662, + "loss_text": 1.482, + "ppl": 5.1981, + "step": 9280 + }, + { + "epoch": 0.05, + "global_step": 9281, + "learning_rate": 0.00046209933222036726, + "loss": 1.636, + "loss_base2": 2.3602, + "loss_pixel": 0.1652, + "loss_text": 1.4708, + "ppl": 5.1346, + "step": 9281 + }, + { + "epoch": 0.05, + "global_step": 9282, + "learning_rate": 0.00046209515859766277, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.1642, + "loss_text": 1.466, + "ppl": 5.1049, + "step": 9282 + }, + { + "epoch": 0.05, + "global_step": 9283, + "learning_rate": 0.0004620909849749583, + "loss": 1.6419, + "loss_base2": 2.3688, + "loss_pixel": 0.1638, + "loss_text": 1.478, + "ppl": 5.165, + "step": 9283 + }, + { + "epoch": 0.05, + "global_step": 9284, + "learning_rate": 0.0004620868113522538, + "loss": 1.6311, + "loss_base2": 2.3532, + "loss_pixel": 0.1651, + "loss_text": 1.466, + "ppl": 5.1095, + "step": 9284 + }, + { + "epoch": 0.05, + "global_step": 9285, + "learning_rate": 0.0004620826377295493, + "loss": 1.6412, + "loss_base2": 2.3678, + "loss_pixel": 0.1648, + "loss_text": 1.4765, + "ppl": 5.1614, + "step": 9285 + }, + { + "epoch": 0.05, + "global_step": 9286, + "learning_rate": 0.00046207846410684474, + "loss": 1.6379, + "loss_base2": 2.363, + "loss_pixel": 0.1637, + "loss_text": 1.4742, + "ppl": 5.1444, + "step": 9286 + }, + { + "epoch": 0.05, + "global_step": 9287, + "learning_rate": 0.00046207429048414025, + "loss": 1.6376, + "loss_base2": 2.3626, + "loss_pixel": 0.1638, + "loss_text": 1.4738, + "ppl": 5.1428, + "step": 9287 + }, + { + "epoch": 0.05, + "global_step": 9288, + "learning_rate": 0.00046207011686143576, + "loss": 1.6221, + "loss_base2": 2.3402, + "loss_pixel": 0.1647, + "loss_text": 1.4574, + "ppl": 5.0637, + "step": 9288 + }, + { + "epoch": 0.05, + "global_step": 9289, + "learning_rate": 0.00046206594323873126, + "loss": 1.6341, + "loss_base2": 2.3575, + "loss_pixel": 0.1642, + "loss_text": 1.4699, + "ppl": 5.1248, + "step": 9289 + }, + { + "epoch": 0.05, + "global_step": 9290, + "learning_rate": 0.0004620617696160267, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.1643, + "loss_text": 1.4659, + "ppl": 5.1049, + "step": 9290 + }, + { + "epoch": 0.05, + "global_step": 9291, + "learning_rate": 0.0004620575959933222, + "loss": 1.6443, + "loss_base2": 2.3722, + "loss_pixel": 0.1639, + "loss_text": 1.4804, + "ppl": 5.1774, + "step": 9291 + }, + { + "epoch": 0.05, + "global_step": 9292, + "learning_rate": 0.0004620534223706177, + "loss": 1.6306, + "loss_base2": 2.3525, + "loss_pixel": 0.1632, + "loss_text": 1.4674, + "ppl": 5.1069, + "step": 9292 + }, + { + "epoch": 0.05, + "global_step": 9293, + "learning_rate": 0.0004620492487479132, + "loss": 1.6219, + "loss_base2": 2.3399, + "loss_pixel": 0.1658, + "loss_text": 1.456, + "ppl": 5.0627, + "step": 9293 + }, + { + "epoch": 0.05, + "global_step": 9294, + "learning_rate": 0.0004620450751252087, + "loss": 1.636, + "loss_base2": 2.3602, + "loss_pixel": 0.1644, + "loss_text": 1.4716, + "ppl": 5.1346, + "step": 9294 + }, + { + "epoch": 0.05, + "global_step": 9295, + "learning_rate": 0.00046204090150250415, + "loss": 1.6362, + "loss_base2": 2.3605, + "loss_pixel": 0.1641, + "loss_text": 1.4722, + "ppl": 5.1356, + "step": 9295 + }, + { + "epoch": 0.05, + "global_step": 9296, + "learning_rate": 0.00046203672787979965, + "loss": 1.6409, + "loss_base2": 2.3673, + "loss_pixel": 0.1645, + "loss_text": 1.4764, + "ppl": 5.1598, + "step": 9296 + }, + { + "epoch": 0.05, + "global_step": 9297, + "learning_rate": 0.00046203255425709516, + "loss": 1.6276, + "loss_base2": 2.3481, + "loss_pixel": 0.1634, + "loss_text": 1.4642, + "ppl": 5.0916, + "step": 9297 + }, + { + "epoch": 0.05, + "global_step": 9298, + "learning_rate": 0.00046202838063439067, + "loss": 1.6249, + "loss_base2": 2.3442, + "loss_pixel": 0.1653, + "loss_text": 1.4597, + "ppl": 5.0779, + "step": 9298 + }, + { + "epoch": 0.05, + "global_step": 9299, + "learning_rate": 0.0004620242070116861, + "loss": 1.6341, + "loss_base2": 2.3575, + "loss_pixel": 0.1641, + "loss_text": 1.47, + "ppl": 5.1248, + "step": 9299 + }, + { + "epoch": 0.05, + "global_step": 9300, + "learning_rate": 0.00046202003338898163, + "loss": 1.4212, + "loss_base2": 2.0504, + "loss_pixel": 0.1642, + "loss_text": 1.257, + "ppl": 4.1421, + "step": 9300 + }, + { + "epoch": 0.05, + "global_step": 9301, + "learning_rate": 0.00046201585976627713, + "loss": 1.4087, + "loss_base2": 2.0323, + "loss_pixel": 0.1633, + "loss_text": 1.2454, + "ppl": 4.0906, + "step": 9301 + }, + { + "epoch": 0.05, + "global_step": 9302, + "learning_rate": 0.00046201168614357264, + "loss": 1.4116, + "loss_base2": 2.0365, + "loss_pixel": 0.1641, + "loss_text": 1.2475, + "ppl": 4.1025, + "step": 9302 + }, + { + "epoch": 0.05, + "global_step": 9303, + "learning_rate": 0.00046200751252086815, + "loss": 1.438, + "loss_base2": 2.0746, + "loss_pixel": 0.1634, + "loss_text": 1.2746, + "ppl": 4.2123, + "step": 9303 + }, + { + "epoch": 0.05, + "global_step": 9304, + "learning_rate": 0.0004620033388981636, + "loss": 1.4125, + "loss_base2": 2.0378, + "loss_pixel": 0.1599, + "loss_text": 1.2526, + "ppl": 4.1062, + "step": 9304 + }, + { + "epoch": 0.05, + "global_step": 9305, + "learning_rate": 0.0004619991652754591, + "loss": 1.4074, + "loss_base2": 2.0304, + "loss_pixel": 0.1563, + "loss_text": 1.2511, + "ppl": 4.0853, + "step": 9305 + }, + { + "epoch": 0.05, + "global_step": 9306, + "learning_rate": 0.0004619949916527546, + "loss": 1.393, + "loss_base2": 2.0097, + "loss_pixel": 0.1544, + "loss_text": 1.2386, + "ppl": 4.0269, + "step": 9306 + }, + { + "epoch": 0.05, + "global_step": 9307, + "learning_rate": 0.0004619908180300501, + "loss": 1.4064, + "loss_base2": 2.029, + "loss_pixel": 0.1563, + "loss_text": 1.2501, + "ppl": 4.0812, + "step": 9307 + }, + { + "epoch": 0.05, + "global_step": 9308, + "learning_rate": 0.00046198664440734563, + "loss": 1.4138, + "loss_base2": 2.0397, + "loss_pixel": 0.1587, + "loss_text": 1.2551, + "ppl": 4.1115, + "step": 9308 + }, + { + "epoch": 0.05, + "global_step": 9309, + "learning_rate": 0.0004619824707846411, + "loss": 1.4086, + "loss_base2": 2.0322, + "loss_pixel": 0.1564, + "loss_text": 1.2522, + "ppl": 4.0902, + "step": 9309 + }, + { + "epoch": 0.05, + "global_step": 9310, + "learning_rate": 0.0004619782971619366, + "loss": 1.3931, + "loss_base2": 2.0098, + "loss_pixel": 0.1549, + "loss_text": 1.2382, + "ppl": 4.0273, + "step": 9310 + }, + { + "epoch": 0.05, + "global_step": 9311, + "learning_rate": 0.00046197412353923205, + "loss": 1.3872, + "loss_base2": 2.0013, + "loss_pixel": 0.156, + "loss_text": 1.2312, + "ppl": 4.0036, + "step": 9311 + }, + { + "epoch": 0.05, + "global_step": 9312, + "learning_rate": 0.00046196994991652755, + "loss": 1.4069, + "loss_base2": 2.0297, + "loss_pixel": 0.1552, + "loss_text": 1.2517, + "ppl": 4.0833, + "step": 9312 + }, + { + "epoch": 0.05, + "global_step": 9313, + "learning_rate": 0.000461965776293823, + "loss": 1.3917, + "loss_base2": 2.0078, + "loss_pixel": 0.155, + "loss_text": 1.2367, + "ppl": 4.0217, + "step": 9313 + }, + { + "epoch": 0.05, + "global_step": 9314, + "learning_rate": 0.0004619616026711185, + "loss": 1.3933, + "loss_base2": 2.0101, + "loss_pixel": 0.1538, + "loss_text": 1.2394, + "ppl": 4.0281, + "step": 9314 + }, + { + "epoch": 0.05, + "global_step": 9315, + "learning_rate": 0.000461957429048414, + "loss": 1.4089, + "loss_base2": 2.0326, + "loss_pixel": 0.1564, + "loss_text": 1.2526, + "ppl": 4.0915, + "step": 9315 + }, + { + "epoch": 0.05, + "global_step": 9316, + "learning_rate": 0.00046195325542570953, + "loss": 1.5637, + "loss_base2": 2.2559, + "loss_pixel": 0.1552, + "loss_text": 1.4085, + "ppl": 4.7765, + "step": 9316 + }, + { + "epoch": 0.05, + "global_step": 9317, + "learning_rate": 0.00046194908180300503, + "loss": 1.6446, + "loss_base2": 2.3727, + "loss_pixel": 0.1538, + "loss_text": 1.4908, + "ppl": 5.1789, + "step": 9317 + }, + { + "epoch": 0.05, + "global_step": 9318, + "learning_rate": 0.0004619449081803005, + "loss": 1.6284, + "loss_base2": 2.3493, + "loss_pixel": 0.1528, + "loss_text": 1.4756, + "ppl": 5.0957, + "step": 9318 + }, + { + "epoch": 0.05, + "global_step": 9319, + "learning_rate": 0.000461940734557596, + "loss": 1.6532, + "loss_base2": 2.3851, + "loss_pixel": 0.1575, + "loss_text": 1.4957, + "ppl": 5.2237, + "step": 9319 + }, + { + "epoch": 0.05, + "global_step": 9320, + "learning_rate": 0.0004619365609348915, + "loss": 1.6294, + "loss_base2": 2.3507, + "loss_pixel": 0.1561, + "loss_text": 1.4733, + "ppl": 5.1008, + "step": 9320 + }, + { + "epoch": 0.05, + "global_step": 9321, + "learning_rate": 0.000461932387312187, + "loss": 1.6456, + "loss_base2": 2.3741, + "loss_pixel": 0.172, + "loss_text": 1.4736, + "ppl": 5.1841, + "step": 9321 + }, + { + "epoch": 0.05, + "global_step": 9322, + "learning_rate": 0.00046192821368948246, + "loss": 1.6313, + "loss_base2": 2.3535, + "loss_pixel": 0.1706, + "loss_text": 1.4607, + "ppl": 5.1105, + "step": 9322 + }, + { + "epoch": 0.05, + "global_step": 9323, + "learning_rate": 0.00046192404006677797, + "loss": 1.6448, + "loss_base2": 2.3729, + "loss_pixel": 0.1688, + "loss_text": 1.476, + "ppl": 5.18, + "step": 9323 + }, + { + "epoch": 0.05, + "global_step": 9324, + "learning_rate": 0.0004619198664440735, + "loss": 1.6543, + "loss_base2": 2.3867, + "loss_pixel": 0.1669, + "loss_text": 1.4874, + "ppl": 5.2294, + "step": 9324 + }, + { + "epoch": 0.05, + "global_step": 9325, + "learning_rate": 0.000461915692821369, + "loss": 1.635, + "loss_base2": 2.3588, + "loss_pixel": 0.1649, + "loss_text": 1.4701, + "ppl": 5.1295, + "step": 9325 + }, + { + "epoch": 0.05, + "global_step": 9326, + "learning_rate": 0.0004619115191986645, + "loss": 1.6336, + "loss_base2": 2.3568, + "loss_pixel": 0.1648, + "loss_text": 1.4688, + "ppl": 5.1223, + "step": 9326 + }, + { + "epoch": 0.05, + "global_step": 9327, + "learning_rate": 0.00046190734557595995, + "loss": 1.6382, + "loss_base2": 2.3634, + "loss_pixel": 0.1647, + "loss_text": 1.4735, + "ppl": 5.1459, + "step": 9327 + }, + { + "epoch": 0.05, + "global_step": 9328, + "learning_rate": 0.00046190317195325545, + "loss": 1.6554, + "loss_base2": 2.3882, + "loss_pixel": 0.165, + "loss_text": 1.4904, + "ppl": 5.2352, + "step": 9328 + }, + { + "epoch": 0.05, + "global_step": 9329, + "learning_rate": 0.00046189899833055096, + "loss": 1.6408, + "loss_base2": 2.3672, + "loss_pixel": 0.1643, + "loss_text": 1.4765, + "ppl": 5.1593, + "step": 9329 + }, + { + "epoch": 0.05, + "global_step": 9330, + "learning_rate": 0.0004618948247078464, + "loss": 1.6446, + "loss_base2": 2.3727, + "loss_pixel": 0.1642, + "loss_text": 1.4804, + "ppl": 5.1789, + "step": 9330 + }, + { + "epoch": 0.05, + "global_step": 9331, + "learning_rate": 0.00046189065108514187, + "loss": 1.6359, + "loss_base2": 2.3601, + "loss_pixel": 0.1644, + "loss_text": 1.4715, + "ppl": 5.1341, + "step": 9331 + }, + { + "epoch": 0.05, + "global_step": 9332, + "learning_rate": 0.0004618864774624374, + "loss": 1.6441, + "loss_base2": 2.3719, + "loss_pixel": 0.1632, + "loss_text": 1.4809, + "ppl": 5.1763, + "step": 9332 + }, + { + "epoch": 0.05, + "global_step": 9333, + "learning_rate": 0.0004618823038397329, + "loss": 1.6381, + "loss_base2": 2.3633, + "loss_pixel": 0.1653, + "loss_text": 1.4727, + "ppl": 5.1454, + "step": 9333 + }, + { + "epoch": 0.05, + "global_step": 9334, + "learning_rate": 0.0004618781302170284, + "loss": 1.6498, + "loss_base2": 2.3802, + "loss_pixel": 0.165, + "loss_text": 1.4848, + "ppl": 5.2059, + "step": 9334 + }, + { + "epoch": 0.05, + "global_step": 9335, + "learning_rate": 0.0004618739565943239, + "loss": 1.6356, + "loss_base2": 2.3597, + "loss_pixel": 0.1639, + "loss_text": 1.4717, + "ppl": 5.1325, + "step": 9335 + }, + { + "epoch": 0.05, + "global_step": 9336, + "learning_rate": 0.00046186978297161935, + "loss": 1.6383, + "loss_base2": 2.3636, + "loss_pixel": 0.1653, + "loss_text": 1.473, + "ppl": 5.1464, + "step": 9336 + }, + { + "epoch": 0.05, + "global_step": 9337, + "learning_rate": 0.00046186560934891486, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.1646, + "loss_text": 1.4656, + "ppl": 5.1049, + "step": 9337 + }, + { + "epoch": 0.05, + "global_step": 9338, + "learning_rate": 0.00046186143572621036, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1636, + "loss_text": 1.4601, + "ppl": 5.0718, + "step": 9338 + }, + { + "epoch": 0.05, + "global_step": 9339, + "learning_rate": 0.00046185726210350587, + "loss": 1.6202, + "loss_base2": 2.3375, + "loss_pixel": 0.1641, + "loss_text": 1.4561, + "ppl": 5.0541, + "step": 9339 + }, + { + "epoch": 0.05, + "global_step": 9340, + "learning_rate": 0.0004618530884808013, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1641, + "loss_text": 1.4509, + "ppl": 5.0284, + "step": 9340 + }, + { + "epoch": 0.05, + "global_step": 9341, + "learning_rate": 0.00046184891485809683, + "loss": 1.6422, + "loss_base2": 2.3692, + "loss_pixel": 0.1638, + "loss_text": 1.4784, + "ppl": 5.1665, + "step": 9341 + }, + { + "epoch": 0.05, + "global_step": 9342, + "learning_rate": 0.00046184474123539234, + "loss": 1.636, + "loss_base2": 2.3602, + "loss_pixel": 0.1634, + "loss_text": 1.4726, + "ppl": 5.1346, + "step": 9342 + }, + { + "epoch": 0.05, + "global_step": 9343, + "learning_rate": 0.00046184056761268785, + "loss": 1.6375, + "loss_base2": 2.3624, + "loss_pixel": 0.1631, + "loss_text": 1.4744, + "ppl": 5.1423, + "step": 9343 + }, + { + "epoch": 0.05, + "global_step": 9344, + "learning_rate": 0.00046183639398998335, + "loss": 1.6551, + "loss_base2": 2.3878, + "loss_pixel": 0.1649, + "loss_text": 1.4902, + "ppl": 5.2336, + "step": 9344 + }, + { + "epoch": 0.05, + "global_step": 9345, + "learning_rate": 0.0004618322203672788, + "loss": 1.6294, + "loss_base2": 2.3507, + "loss_pixel": 0.1628, + "loss_text": 1.4666, + "ppl": 5.1008, + "step": 9345 + }, + { + "epoch": 0.05, + "global_step": 9346, + "learning_rate": 0.0004618280467445743, + "loss": 1.6332, + "loss_base2": 2.3562, + "loss_pixel": 0.1648, + "loss_text": 1.4685, + "ppl": 5.1202, + "step": 9346 + }, + { + "epoch": 0.05, + "global_step": 9347, + "learning_rate": 0.0004618238731218698, + "loss": 1.6457, + "loss_base2": 2.3742, + "loss_pixel": 0.1642, + "loss_text": 1.4814, + "ppl": 5.1846, + "step": 9347 + }, + { + "epoch": 0.05, + "global_step": 9348, + "learning_rate": 0.00046181969949916533, + "loss": 1.6316, + "loss_base2": 2.3539, + "loss_pixel": 0.1649, + "loss_text": 1.4667, + "ppl": 5.112, + "step": 9348 + }, + { + "epoch": 0.05, + "global_step": 9349, + "learning_rate": 0.0004618155258764607, + "loss": 1.5981, + "loss_base2": 2.3056, + "loss_pixel": 0.1633, + "loss_text": 1.4349, + "ppl": 4.9436, + "step": 9349 + }, + { + "epoch": 0.05, + "global_step": 9350, + "learning_rate": 0.00046181135225375623, + "loss": 1.6362, + "loss_base2": 2.3605, + "loss_pixel": 0.1638, + "loss_text": 1.4724, + "ppl": 5.1356, + "step": 9350 + }, + { + "epoch": 0.05, + "global_step": 9351, + "learning_rate": 0.00046180717863105174, + "loss": 1.6443, + "loss_base2": 2.3722, + "loss_pixel": 0.1644, + "loss_text": 1.4798, + "ppl": 5.1774, + "step": 9351 + }, + { + "epoch": 0.05, + "global_step": 9352, + "learning_rate": 0.00046180300500834725, + "loss": 1.6565, + "loss_base2": 2.3898, + "loss_pixel": 0.165, + "loss_text": 1.4915, + "ppl": 5.2409, + "step": 9352 + }, + { + "epoch": 0.05, + "global_step": 9353, + "learning_rate": 0.00046179883138564276, + "loss": 1.6242, + "loss_base2": 2.3432, + "loss_pixel": 0.1649, + "loss_text": 1.4593, + "ppl": 5.0744, + "step": 9353 + }, + { + "epoch": 0.05, + "global_step": 9354, + "learning_rate": 0.0004617946577629382, + "loss": 1.6434, + "loss_base2": 2.3709, + "loss_pixel": 0.1663, + "loss_text": 1.4772, + "ppl": 5.1727, + "step": 9354 + }, + { + "epoch": 0.05, + "global_step": 9355, + "learning_rate": 0.0004617904841402337, + "loss": 1.6382, + "loss_base2": 2.3634, + "loss_pixel": 0.1642, + "loss_text": 1.4739, + "ppl": 5.1459, + "step": 9355 + }, + { + "epoch": 0.05, + "global_step": 9356, + "learning_rate": 0.0004617863105175292, + "loss": 1.63, + "loss_base2": 2.3516, + "loss_pixel": 0.1656, + "loss_text": 1.4644, + "ppl": 5.1039, + "step": 9356 + }, + { + "epoch": 0.05, + "global_step": 9357, + "learning_rate": 0.00046178213689482473, + "loss": 1.6345, + "loss_base2": 2.3581, + "loss_pixel": 0.1625, + "loss_text": 1.472, + "ppl": 5.1269, + "step": 9357 + }, + { + "epoch": 0.05, + "global_step": 9358, + "learning_rate": 0.0004617779632721202, + "loss": 1.6215, + "loss_base2": 2.3393, + "loss_pixel": 0.163, + "loss_text": 1.4584, + "ppl": 5.0607, + "step": 9358 + }, + { + "epoch": 0.05, + "global_step": 9359, + "learning_rate": 0.0004617737896494157, + "loss": 1.6253, + "loss_base2": 2.3448, + "loss_pixel": 0.1638, + "loss_text": 1.4615, + "ppl": 5.0799, + "step": 9359 + }, + { + "epoch": 0.05, + "global_step": 9360, + "learning_rate": 0.0004617696160267112, + "loss": 1.6552, + "loss_base2": 2.3879, + "loss_pixel": 0.1654, + "loss_text": 1.4899, + "ppl": 5.2341, + "step": 9360 + }, + { + "epoch": 0.05, + "global_step": 9361, + "learning_rate": 0.0004617654424040067, + "loss": 1.6315, + "loss_base2": 2.3538, + "loss_pixel": 0.1658, + "loss_text": 1.4657, + "ppl": 5.1115, + "step": 9361 + }, + { + "epoch": 0.05, + "global_step": 9362, + "learning_rate": 0.0004617612687813022, + "loss": 1.6337, + "loss_base2": 2.3569, + "loss_pixel": 0.1638, + "loss_text": 1.4699, + "ppl": 5.1228, + "step": 9362 + }, + { + "epoch": 0.05, + "global_step": 9363, + "learning_rate": 0.00046175709515859767, + "loss": 1.6352, + "loss_base2": 2.3591, + "loss_pixel": 0.1646, + "loss_text": 1.4706, + "ppl": 5.1305, + "step": 9363 + }, + { + "epoch": 0.05, + "global_step": 9364, + "learning_rate": 0.0004617529215358932, + "loss": 1.6275, + "loss_base2": 2.348, + "loss_pixel": 0.164, + "loss_text": 1.4634, + "ppl": 5.0911, + "step": 9364 + }, + { + "epoch": 0.05, + "global_step": 9365, + "learning_rate": 0.0004617487479131887, + "loss": 1.6502, + "loss_base2": 2.3807, + "loss_pixel": 0.163, + "loss_text": 1.4872, + "ppl": 5.208, + "step": 9365 + }, + { + "epoch": 0.05, + "global_step": 9366, + "learning_rate": 0.0004617445742904842, + "loss": 1.6315, + "loss_base2": 2.3538, + "loss_pixel": 0.1643, + "loss_text": 1.4672, + "ppl": 5.1115, + "step": 9366 + }, + { + "epoch": 0.05, + "global_step": 9367, + "learning_rate": 0.0004617404006677797, + "loss": 1.6167, + "loss_base2": 2.3324, + "loss_pixel": 0.1635, + "loss_text": 1.4532, + "ppl": 5.0364, + "step": 9367 + }, + { + "epoch": 0.05, + "global_step": 9368, + "learning_rate": 0.0004617362270450751, + "loss": 1.6248, + "loss_base2": 2.3441, + "loss_pixel": 0.1631, + "loss_text": 1.4617, + "ppl": 5.0774, + "step": 9368 + }, + { + "epoch": 0.05, + "global_step": 9369, + "learning_rate": 0.0004617320534223706, + "loss": 1.6287, + "loss_base2": 2.3497, + "loss_pixel": 0.1644, + "loss_text": 1.4643, + "ppl": 5.0972, + "step": 9369 + }, + { + "epoch": 0.05, + "global_step": 9370, + "learning_rate": 0.0004617278797996661, + "loss": 1.6224, + "loss_base2": 2.3406, + "loss_pixel": 0.164, + "loss_text": 1.4584, + "ppl": 5.0652, + "step": 9370 + }, + { + "epoch": 0.05, + "global_step": 9371, + "learning_rate": 0.0004617237061769616, + "loss": 1.6286, + "loss_base2": 2.3496, + "loss_pixel": 0.1607, + "loss_text": 1.4679, + "ppl": 5.0967, + "step": 9371 + }, + { + "epoch": 0.05, + "global_step": 9372, + "learning_rate": 0.00046171953255425707, + "loss": 1.6414, + "loss_base2": 2.368, + "loss_pixel": 0.1646, + "loss_text": 1.4768, + "ppl": 5.1624, + "step": 9372 + }, + { + "epoch": 0.05, + "global_step": 9373, + "learning_rate": 0.0004617153589315526, + "loss": 1.6298, + "loss_base2": 2.3513, + "loss_pixel": 0.1636, + "loss_text": 1.4661, + "ppl": 5.1029, + "step": 9373 + }, + { + "epoch": 0.05, + "global_step": 9374, + "learning_rate": 0.0004617111853088481, + "loss": 1.6287, + "loss_base2": 2.3497, + "loss_pixel": 0.1634, + "loss_text": 1.4654, + "ppl": 5.0972, + "step": 9374 + }, + { + "epoch": 0.05, + "global_step": 9375, + "learning_rate": 0.0004617070116861436, + "loss": 1.6276, + "loss_base2": 2.3481, + "loss_pixel": 0.1637, + "loss_text": 1.4638, + "ppl": 5.0916, + "step": 9375 + }, + { + "epoch": 0.05, + "global_step": 9376, + "learning_rate": 0.0004617028380634391, + "loss": 1.6448, + "loss_base2": 2.3729, + "loss_pixel": 0.1631, + "loss_text": 1.4817, + "ppl": 5.18, + "step": 9376 + }, + { + "epoch": 0.05, + "global_step": 9377, + "learning_rate": 0.00046169866444073455, + "loss": 1.6305, + "loss_base2": 2.3523, + "loss_pixel": 0.1634, + "loss_text": 1.4671, + "ppl": 5.1064, + "step": 9377 + }, + { + "epoch": 0.05, + "global_step": 9378, + "learning_rate": 0.00046169449081803006, + "loss": 1.6262, + "loss_base2": 2.3461, + "loss_pixel": 0.1624, + "loss_text": 1.4638, + "ppl": 5.0845, + "step": 9378 + }, + { + "epoch": 0.05, + "global_step": 9379, + "learning_rate": 0.00046169031719532557, + "loss": 1.624, + "loss_base2": 2.3429, + "loss_pixel": 0.1638, + "loss_text": 1.4602, + "ppl": 5.0733, + "step": 9379 + }, + { + "epoch": 0.05, + "global_step": 9380, + "learning_rate": 0.0004616861435726211, + "loss": 1.6238, + "loss_base2": 2.3426, + "loss_pixel": 0.1643, + "loss_text": 1.4595, + "ppl": 5.0723, + "step": 9380 + }, + { + "epoch": 0.05, + "global_step": 9381, + "learning_rate": 0.00046168196994991653, + "loss": 1.6275, + "loss_base2": 2.348, + "loss_pixel": 0.1628, + "loss_text": 1.4647, + "ppl": 5.0911, + "step": 9381 + }, + { + "epoch": 0.05, + "global_step": 9382, + "learning_rate": 0.00046167779632721203, + "loss": 1.6258, + "loss_base2": 2.3455, + "loss_pixel": 0.1632, + "loss_text": 1.4627, + "ppl": 5.0825, + "step": 9382 + }, + { + "epoch": 0.05, + "global_step": 9383, + "learning_rate": 0.00046167362270450754, + "loss": 1.6326, + "loss_base2": 2.3553, + "loss_pixel": 0.1635, + "loss_text": 1.4691, + "ppl": 5.1172, + "step": 9383 + }, + { + "epoch": 0.05, + "global_step": 9384, + "learning_rate": 0.00046166944908180305, + "loss": 1.6242, + "loss_base2": 2.3432, + "loss_pixel": 0.1629, + "loss_text": 1.4613, + "ppl": 5.0744, + "step": 9384 + }, + { + "epoch": 0.05, + "global_step": 9385, + "learning_rate": 0.00046166527545909856, + "loss": 1.6316, + "loss_base2": 2.3539, + "loss_pixel": 0.1637, + "loss_text": 1.4678, + "ppl": 5.112, + "step": 9385 + }, + { + "epoch": 0.05, + "global_step": 9386, + "learning_rate": 0.00046166110183639396, + "loss": 1.634, + "loss_base2": 2.3574, + "loss_pixel": 0.1638, + "loss_text": 1.4702, + "ppl": 5.1243, + "step": 9386 + }, + { + "epoch": 0.05, + "global_step": 9387, + "learning_rate": 0.00046165692821368946, + "loss": 1.6201, + "loss_base2": 2.3373, + "loss_pixel": 0.1632, + "loss_text": 1.4569, + "ppl": 5.0536, + "step": 9387 + }, + { + "epoch": 0.05, + "global_step": 9388, + "learning_rate": 0.00046165275459098497, + "loss": 1.6411, + "loss_base2": 2.3676, + "loss_pixel": 0.1629, + "loss_text": 1.4781, + "ppl": 5.1608, + "step": 9388 + }, + { + "epoch": 0.05, + "global_step": 9389, + "learning_rate": 0.0004616485809682805, + "loss": 1.6221, + "loss_base2": 2.3402, + "loss_pixel": 0.1633, + "loss_text": 1.4587, + "ppl": 5.0637, + "step": 9389 + }, + { + "epoch": 0.05, + "global_step": 9390, + "learning_rate": 0.00046164440734557593, + "loss": 1.6331, + "loss_base2": 2.3561, + "loss_pixel": 0.1623, + "loss_text": 1.4708, + "ppl": 5.1197, + "step": 9390 + }, + { + "epoch": 0.05, + "global_step": 9391, + "learning_rate": 0.00046164023372287144, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.1635, + "loss_text": 1.4648, + "ppl": 5.0952, + "step": 9391 + }, + { + "epoch": 0.05, + "global_step": 9392, + "learning_rate": 0.00046163606010016695, + "loss": 1.6326, + "loss_base2": 2.3553, + "loss_pixel": 0.1647, + "loss_text": 1.4679, + "ppl": 5.1172, + "step": 9392 + }, + { + "epoch": 0.05, + "global_step": 9393, + "learning_rate": 0.00046163188647746245, + "loss": 1.6257, + "loss_base2": 2.3454, + "loss_pixel": 0.1623, + "loss_text": 1.4634, + "ppl": 5.082, + "step": 9393 + }, + { + "epoch": 0.05, + "global_step": 9394, + "learning_rate": 0.00046162771285475796, + "loss": 1.6305, + "loss_base2": 2.3523, + "loss_pixel": 0.1634, + "loss_text": 1.4671, + "ppl": 5.1064, + "step": 9394 + }, + { + "epoch": 0.05, + "global_step": 9395, + "learning_rate": 0.0004616235392320534, + "loss": 1.6129, + "loss_base2": 2.3269, + "loss_pixel": 0.1634, + "loss_text": 1.4495, + "ppl": 5.0173, + "step": 9395 + }, + { + "epoch": 0.05, + "global_step": 9396, + "learning_rate": 0.0004616193656093489, + "loss": 1.6211, + "loss_base2": 2.3388, + "loss_pixel": 0.1628, + "loss_text": 1.4583, + "ppl": 5.0587, + "step": 9396 + }, + { + "epoch": 0.05, + "global_step": 9397, + "learning_rate": 0.00046161519198664443, + "loss": 1.6455, + "loss_base2": 2.374, + "loss_pixel": 0.1634, + "loss_text": 1.4821, + "ppl": 5.1836, + "step": 9397 + }, + { + "epoch": 0.05, + "global_step": 9398, + "learning_rate": 0.00046161101836393994, + "loss": 1.6115, + "loss_base2": 2.3249, + "loss_pixel": 0.1618, + "loss_text": 1.4497, + "ppl": 5.0103, + "step": 9398 + }, + { + "epoch": 0.05, + "global_step": 9399, + "learning_rate": 0.0004616068447412354, + "loss": 1.6399, + "loss_base2": 2.3659, + "loss_pixel": 0.164, + "loss_text": 1.4759, + "ppl": 5.1547, + "step": 9399 + }, + { + "epoch": 0.05, + "global_step": 9400, + "learning_rate": 0.0004616026711185309, + "loss": 1.6258, + "loss_base2": 2.3455, + "loss_pixel": 0.1631, + "loss_text": 1.4627, + "ppl": 5.0825, + "step": 9400 + }, + { + "epoch": 0.05, + "global_step": 9401, + "learning_rate": 0.0004615984974958264, + "loss": 1.6113, + "loss_base2": 2.3246, + "loss_pixel": 0.1623, + "loss_text": 1.449, + "ppl": 5.0093, + "step": 9401 + }, + { + "epoch": 0.05, + "global_step": 9402, + "learning_rate": 0.0004615943238731219, + "loss": 1.6348, + "loss_base2": 2.3585, + "loss_pixel": 0.1632, + "loss_text": 1.4716, + "ppl": 5.1284, + "step": 9402 + }, + { + "epoch": 0.05, + "global_step": 9403, + "learning_rate": 0.0004615901502504174, + "loss": 1.5987, + "loss_base2": 2.3064, + "loss_pixel": 0.1642, + "loss_text": 1.4346, + "ppl": 4.9466, + "step": 9403 + }, + { + "epoch": 0.05, + "global_step": 9404, + "learning_rate": 0.00046158597662771287, + "loss": 1.6351, + "loss_base2": 2.359, + "loss_pixel": 0.1655, + "loss_text": 1.4696, + "ppl": 5.13, + "step": 9404 + }, + { + "epoch": 0.05, + "global_step": 9405, + "learning_rate": 0.0004615818030050083, + "loss": 1.6427, + "loss_base2": 2.3699, + "loss_pixel": 0.1642, + "loss_text": 1.4785, + "ppl": 5.1691, + "step": 9405 + }, + { + "epoch": 0.05, + "global_step": 9406, + "learning_rate": 0.00046157762938230383, + "loss": 1.5957, + "loss_base2": 2.3021, + "loss_pixel": 0.1638, + "loss_text": 1.4318, + "ppl": 4.9318, + "step": 9406 + }, + { + "epoch": 0.05, + "global_step": 9407, + "learning_rate": 0.00046157345575959934, + "loss": 1.4598, + "loss_base2": 2.106, + "loss_pixel": 0.1634, + "loss_text": 1.2965, + "ppl": 4.3051, + "step": 9407 + }, + { + "epoch": 0.05, + "global_step": 9408, + "learning_rate": 0.0004615692821368948, + "loss": 1.4179, + "loss_base2": 2.0456, + "loss_pixel": 0.1626, + "loss_text": 1.2553, + "ppl": 4.1284, + "step": 9408 + }, + { + "epoch": 0.05, + "global_step": 9409, + "learning_rate": 0.0004615651085141903, + "loss": 1.4101, + "loss_base2": 2.0343, + "loss_pixel": 0.1633, + "loss_text": 1.2468, + "ppl": 4.0964, + "step": 9409 + }, + { + "epoch": 0.05, + "global_step": 9410, + "learning_rate": 0.0004615609348914858, + "loss": 1.4165, + "loss_base2": 2.0436, + "loss_pixel": 0.1636, + "loss_text": 1.2529, + "ppl": 4.1227, + "step": 9410 + }, + { + "epoch": 0.05, + "global_step": 9411, + "learning_rate": 0.0004615567612687813, + "loss": 1.4137, + "loss_base2": 2.0395, + "loss_pixel": 0.1637, + "loss_text": 1.25, + "ppl": 4.1111, + "step": 9411 + }, + { + "epoch": 0.05, + "global_step": 9412, + "learning_rate": 0.0004615525876460768, + "loss": 1.434, + "loss_base2": 2.0688, + "loss_pixel": 0.1643, + "loss_text": 1.2697, + "ppl": 4.1954, + "step": 9412 + }, + { + "epoch": 0.05, + "global_step": 9413, + "learning_rate": 0.0004615484140233723, + "loss": 1.4177, + "loss_base2": 2.0453, + "loss_pixel": 0.1644, + "loss_text": 1.2532, + "ppl": 4.1276, + "step": 9413 + }, + { + "epoch": 0.05, + "global_step": 9414, + "learning_rate": 0.0004615442404006678, + "loss": 1.5458, + "loss_base2": 2.2301, + "loss_pixel": 0.1652, + "loss_text": 1.3806, + "ppl": 4.6917, + "step": 9414 + }, + { + "epoch": 0.05, + "global_step": 9415, + "learning_rate": 0.0004615400667779633, + "loss": 1.6566, + "loss_base2": 2.39, + "loss_pixel": 0.1631, + "loss_text": 1.4935, + "ppl": 5.2415, + "step": 9415 + }, + { + "epoch": 0.05, + "global_step": 9416, + "learning_rate": 0.0004615358931552588, + "loss": 1.646, + "loss_base2": 2.3747, + "loss_pixel": 0.1621, + "loss_text": 1.4839, + "ppl": 5.1862, + "step": 9416 + }, + { + "epoch": 0.05, + "global_step": 9417, + "learning_rate": 0.00046153171953255425, + "loss": 1.6415, + "loss_base2": 2.3682, + "loss_pixel": 0.1639, + "loss_text": 1.4776, + "ppl": 5.1629, + "step": 9417 + }, + { + "epoch": 0.05, + "global_step": 9418, + "learning_rate": 0.00046152754590984976, + "loss": 1.6173, + "loss_base2": 2.3333, + "loss_pixel": 0.1632, + "loss_text": 1.4541, + "ppl": 5.0395, + "step": 9418 + }, + { + "epoch": 0.05, + "global_step": 9419, + "learning_rate": 0.00046152337228714526, + "loss": 1.6468, + "loss_base2": 2.3758, + "loss_pixel": 0.1635, + "loss_text": 1.4833, + "ppl": 5.1903, + "step": 9419 + }, + { + "epoch": 0.05, + "global_step": 9420, + "learning_rate": 0.00046151919866444077, + "loss": 1.6423, + "loss_base2": 2.3693, + "loss_pixel": 0.1621, + "loss_text": 1.4803, + "ppl": 5.167, + "step": 9420 + }, + { + "epoch": 0.05, + "global_step": 9421, + "learning_rate": 0.0004615150250417363, + "loss": 1.6292, + "loss_base2": 2.3504, + "loss_pixel": 0.1636, + "loss_text": 1.4656, + "ppl": 5.0998, + "step": 9421 + }, + { + "epoch": 0.05, + "global_step": 9422, + "learning_rate": 0.00046151085141903173, + "loss": 1.6437, + "loss_base2": 2.3714, + "loss_pixel": 0.1641, + "loss_text": 1.4796, + "ppl": 5.1743, + "step": 9422 + }, + { + "epoch": 0.05, + "global_step": 9423, + "learning_rate": 0.00046150667779632724, + "loss": 1.6352, + "loss_base2": 2.3591, + "loss_pixel": 0.162, + "loss_text": 1.4732, + "ppl": 5.1305, + "step": 9423 + }, + { + "epoch": 0.05, + "global_step": 9424, + "learning_rate": 0.0004615025041736227, + "loss": 1.6157, + "loss_base2": 2.331, + "loss_pixel": 0.1639, + "loss_text": 1.4518, + "ppl": 5.0314, + "step": 9424 + }, + { + "epoch": 0.05, + "global_step": 9425, + "learning_rate": 0.0004614983305509182, + "loss": 1.6403, + "loss_base2": 2.3665, + "loss_pixel": 0.1633, + "loss_text": 1.477, + "ppl": 5.1567, + "step": 9425 + }, + { + "epoch": 0.05, + "global_step": 9426, + "learning_rate": 0.0004614941569282137, + "loss": 1.6364, + "loss_base2": 2.3608, + "loss_pixel": 0.1626, + "loss_text": 1.4738, + "ppl": 5.1366, + "step": 9426 + }, + { + "epoch": 0.05, + "global_step": 9427, + "learning_rate": 0.00046148998330550916, + "loss": 1.6445, + "loss_base2": 2.3725, + "loss_pixel": 0.1646, + "loss_text": 1.4798, + "ppl": 5.1784, + "step": 9427 + }, + { + "epoch": 0.05, + "global_step": 9428, + "learning_rate": 0.00046148580968280467, + "loss": 1.6324, + "loss_base2": 2.3551, + "loss_pixel": 0.1643, + "loss_text": 1.4681, + "ppl": 5.1161, + "step": 9428 + }, + { + "epoch": 0.05, + "global_step": 9429, + "learning_rate": 0.0004614816360601002, + "loss": 1.6205, + "loss_base2": 2.3379, + "loss_pixel": 0.1616, + "loss_text": 1.4589, + "ppl": 5.0556, + "step": 9429 + }, + { + "epoch": 0.05, + "global_step": 9430, + "learning_rate": 0.0004614774624373957, + "loss": 1.6197, + "loss_base2": 2.3367, + "loss_pixel": 0.1621, + "loss_text": 1.4576, + "ppl": 5.0516, + "step": 9430 + }, + { + "epoch": 0.05, + "global_step": 9431, + "learning_rate": 0.00046147328881469113, + "loss": 1.6308, + "loss_base2": 2.3527, + "loss_pixel": 0.1621, + "loss_text": 1.4687, + "ppl": 5.108, + "step": 9431 + }, + { + "epoch": 0.05, + "global_step": 9432, + "learning_rate": 0.00046146911519198664, + "loss": 1.643, + "loss_base2": 2.3703, + "loss_pixel": 0.1632, + "loss_text": 1.4798, + "ppl": 5.1707, + "step": 9432 + }, + { + "epoch": 0.05, + "global_step": 9433, + "learning_rate": 0.00046146494156928215, + "loss": 1.6282, + "loss_base2": 2.349, + "loss_pixel": 0.1611, + "loss_text": 1.4671, + "ppl": 5.0947, + "step": 9433 + }, + { + "epoch": 0.05, + "global_step": 9434, + "learning_rate": 0.00046146076794657766, + "loss": 1.6315, + "loss_base2": 2.3538, + "loss_pixel": 0.1635, + "loss_text": 1.468, + "ppl": 5.1115, + "step": 9434 + }, + { + "epoch": 0.05, + "global_step": 9435, + "learning_rate": 0.00046145659432387316, + "loss": 1.6215, + "loss_base2": 2.3393, + "loss_pixel": 0.1629, + "loss_text": 1.4585, + "ppl": 5.0607, + "step": 9435 + }, + { + "epoch": 0.05, + "global_step": 9436, + "learning_rate": 0.0004614524207011686, + "loss": 1.5592, + "loss_base2": 2.2495, + "loss_pixel": 0.1621, + "loss_text": 1.3971, + "ppl": 4.755, + "step": 9436 + }, + { + "epoch": 0.05, + "global_step": 9437, + "learning_rate": 0.0004614482470784641, + "loss": 1.4481, + "loss_base2": 2.0892, + "loss_pixel": 0.1626, + "loss_text": 1.2855, + "ppl": 4.255, + "step": 9437 + }, + { + "epoch": 0.05, + "global_step": 9438, + "learning_rate": 0.00046144407345575963, + "loss": 1.4366, + "loss_base2": 2.0726, + "loss_pixel": 0.163, + "loss_text": 1.2736, + "ppl": 4.2064, + "step": 9438 + }, + { + "epoch": 0.05, + "global_step": 9439, + "learning_rate": 0.00046143989983305514, + "loss": 1.4113, + "loss_base2": 2.0361, + "loss_pixel": 0.1622, + "loss_text": 1.2491, + "ppl": 4.1013, + "step": 9439 + }, + { + "epoch": 0.05, + "global_step": 9440, + "learning_rate": 0.0004614357262103506, + "loss": 1.4206, + "loss_base2": 2.0495, + "loss_pixel": 0.1627, + "loss_text": 1.2579, + "ppl": 4.1396, + "step": 9440 + }, + { + "epoch": 0.05, + "global_step": 9441, + "learning_rate": 0.0004614315525876461, + "loss": 1.4399, + "loss_base2": 2.0773, + "loss_pixel": 0.1631, + "loss_text": 1.2768, + "ppl": 4.2203, + "step": 9441 + }, + { + "epoch": 0.05, + "global_step": 9442, + "learning_rate": 0.0004614273789649416, + "loss": 1.3983, + "loss_base2": 2.0173, + "loss_pixel": 0.1628, + "loss_text": 1.2355, + "ppl": 4.0483, + "step": 9442 + }, + { + "epoch": 0.05, + "global_step": 9443, + "learning_rate": 0.00046142320534223706, + "loss": 1.4151, + "loss_base2": 2.0416, + "loss_pixel": 0.1623, + "loss_text": 1.2528, + "ppl": 4.1169, + "step": 9443 + }, + { + "epoch": 0.05, + "global_step": 9444, + "learning_rate": 0.00046141903171953257, + "loss": 1.4069, + "loss_base2": 2.0297, + "loss_pixel": 0.1628, + "loss_text": 1.2441, + "ppl": 4.0833, + "step": 9444 + }, + { + "epoch": 0.05, + "global_step": 9445, + "learning_rate": 0.000461414858096828, + "loss": 1.4039, + "loss_base2": 2.0254, + "loss_pixel": 0.1629, + "loss_text": 1.241, + "ppl": 4.071, + "step": 9445 + }, + { + "epoch": 0.05, + "global_step": 9446, + "learning_rate": 0.00046141068447412353, + "loss": 1.4093, + "loss_base2": 2.0332, + "loss_pixel": 0.1632, + "loss_text": 1.2461, + "ppl": 4.0931, + "step": 9446 + }, + { + "epoch": 0.05, + "global_step": 9447, + "learning_rate": 0.00046140651085141903, + "loss": 1.419, + "loss_base2": 2.0472, + "loss_pixel": 0.1632, + "loss_text": 1.2559, + "ppl": 4.133, + "step": 9447 + }, + { + "epoch": 0.05, + "global_step": 9448, + "learning_rate": 0.00046140233722871454, + "loss": 1.4053, + "loss_base2": 2.0274, + "loss_pixel": 0.1648, + "loss_text": 1.2406, + "ppl": 4.0767, + "step": 9448 + }, + { + "epoch": 0.05, + "global_step": 9449, + "learning_rate": 0.00046139816360601, + "loss": 1.4224, + "loss_base2": 2.0521, + "loss_pixel": 0.1631, + "loss_text": 1.2594, + "ppl": 4.1471, + "step": 9449 + }, + { + "epoch": 0.05, + "global_step": 9450, + "learning_rate": 0.0004613939899833055, + "loss": 1.3986, + "loss_base2": 2.0178, + "loss_pixel": 0.1627, + "loss_text": 1.2359, + "ppl": 4.0495, + "step": 9450 + }, + { + "epoch": 0.05, + "global_step": 9451, + "learning_rate": 0.000461389816360601, + "loss": 1.431, + "loss_base2": 2.0645, + "loss_pixel": 0.1636, + "loss_text": 1.2674, + "ppl": 4.1829, + "step": 9451 + }, + { + "epoch": 0.05, + "global_step": 9452, + "learning_rate": 0.0004613856427378965, + "loss": 1.4224, + "loss_base2": 2.0521, + "loss_pixel": 0.163, + "loss_text": 1.2594, + "ppl": 4.1471, + "step": 9452 + }, + { + "epoch": 0.05, + "global_step": 9453, + "learning_rate": 0.000461381469115192, + "loss": 1.4185, + "loss_base2": 2.0465, + "loss_pixel": 0.164, + "loss_text": 1.2545, + "ppl": 4.1309, + "step": 9453 + }, + { + "epoch": 0.05, + "global_step": 9454, + "learning_rate": 0.0004613772954924875, + "loss": 1.4058, + "loss_base2": 2.0281, + "loss_pixel": 0.1632, + "loss_text": 1.2426, + "ppl": 4.0788, + "step": 9454 + }, + { + "epoch": 0.05, + "global_step": 9455, + "learning_rate": 0.000461373121869783, + "loss": 1.4143, + "loss_base2": 2.0404, + "loss_pixel": 0.1633, + "loss_text": 1.251, + "ppl": 4.1136, + "step": 9455 + }, + { + "epoch": 0.05, + "global_step": 9456, + "learning_rate": 0.0004613689482470785, + "loss": 1.4053, + "loss_base2": 2.0274, + "loss_pixel": 0.162, + "loss_text": 1.2433, + "ppl": 4.0767, + "step": 9456 + }, + { + "epoch": 0.05, + "global_step": 9457, + "learning_rate": 0.000461364774624374, + "loss": 1.4116, + "loss_base2": 2.0365, + "loss_pixel": 0.1582, + "loss_text": 1.2534, + "ppl": 4.1025, + "step": 9457 + }, + { + "epoch": 0.05, + "global_step": 9458, + "learning_rate": 0.00046136060100166945, + "loss": 1.407, + "loss_base2": 2.0299, + "loss_pixel": 0.1593, + "loss_text": 1.2477, + "ppl": 4.0837, + "step": 9458 + }, + { + "epoch": 0.05, + "global_step": 9459, + "learning_rate": 0.00046135642737896496, + "loss": 1.4228, + "loss_base2": 2.0527, + "loss_pixel": 0.1623, + "loss_text": 1.2606, + "ppl": 4.1487, + "step": 9459 + }, + { + "epoch": 0.05, + "global_step": 9460, + "learning_rate": 0.00046135225375626047, + "loss": 1.4712, + "loss_base2": 2.1225, + "loss_pixel": 0.1612, + "loss_text": 1.31, + "ppl": 4.3545, + "step": 9460 + }, + { + "epoch": 0.05, + "global_step": 9461, + "learning_rate": 0.0004613480801335559, + "loss": 1.542, + "loss_base2": 2.2246, + "loss_pixel": 0.1667, + "loss_text": 1.3753, + "ppl": 4.6739, + "step": 9461 + }, + { + "epoch": 0.05, + "global_step": 9462, + "learning_rate": 0.00046134390651085143, + "loss": 1.4047, + "loss_base2": 2.0266, + "loss_pixel": 0.1648, + "loss_text": 1.24, + "ppl": 4.0743, + "step": 9462 + }, + { + "epoch": 0.05, + "global_step": 9463, + "learning_rate": 0.0004613397328881469, + "loss": 1.429, + "loss_base2": 2.0616, + "loss_pixel": 0.1645, + "loss_text": 1.2645, + "ppl": 4.1745, + "step": 9463 + }, + { + "epoch": 0.05, + "global_step": 9464, + "learning_rate": 0.0004613355592654424, + "loss": 1.4247, + "loss_base2": 2.0554, + "loss_pixel": 0.1712, + "loss_text": 1.2535, + "ppl": 4.1566, + "step": 9464 + }, + { + "epoch": 0.05, + "global_step": 9465, + "learning_rate": 0.0004613313856427379, + "loss": 1.4284, + "loss_base2": 2.0607, + "loss_pixel": 0.167, + "loss_text": 1.2615, + "ppl": 4.172, + "step": 9465 + }, + { + "epoch": 0.05, + "global_step": 9466, + "learning_rate": 0.0004613272120200334, + "loss": 1.4068, + "loss_base2": 2.0296, + "loss_pixel": 0.1676, + "loss_text": 1.2393, + "ppl": 4.0829, + "step": 9466 + }, + { + "epoch": 0.05, + "global_step": 9467, + "learning_rate": 0.00046132303839732886, + "loss": 1.4189, + "loss_base2": 2.047, + "loss_pixel": 0.1644, + "loss_text": 1.2544, + "ppl": 4.1326, + "step": 9467 + }, + { + "epoch": 0.05, + "global_step": 9468, + "learning_rate": 0.00046131886477462436, + "loss": 1.396, + "loss_base2": 2.014, + "loss_pixel": 0.1622, + "loss_text": 1.2339, + "ppl": 4.039, + "step": 9468 + }, + { + "epoch": 0.05, + "global_step": 9469, + "learning_rate": 0.00046131469115191987, + "loss": 1.6191, + "loss_base2": 2.3359, + "loss_pixel": 0.1621, + "loss_text": 1.457, + "ppl": 5.0485, + "step": 9469 + }, + { + "epoch": 0.05, + "global_step": 9470, + "learning_rate": 0.0004613105175292154, + "loss": 1.6644, + "loss_base2": 2.4012, + "loss_pixel": 0.1636, + "loss_text": 1.5008, + "ppl": 5.2825, + "step": 9470 + }, + { + "epoch": 0.05, + "global_step": 9471, + "learning_rate": 0.0004613063439065109, + "loss": 1.6614, + "loss_base2": 2.3969, + "loss_pixel": 0.1724, + "loss_text": 1.4889, + "ppl": 5.2667, + "step": 9471 + }, + { + "epoch": 0.05, + "global_step": 9472, + "learning_rate": 0.00046130217028380634, + "loss": 1.6591, + "loss_base2": 2.3936, + "loss_pixel": 0.1763, + "loss_text": 1.4829, + "ppl": 5.2546, + "step": 9472 + }, + { + "epoch": 0.05, + "global_step": 9473, + "learning_rate": 0.00046129799666110185, + "loss": 1.6491, + "loss_base2": 2.3791, + "loss_pixel": 0.1715, + "loss_text": 1.4776, + "ppl": 5.2023, + "step": 9473 + }, + { + "epoch": 0.05, + "global_step": 9474, + "learning_rate": 0.00046129382303839735, + "loss": 1.6479, + "loss_base2": 2.3774, + "loss_pixel": 0.1624, + "loss_text": 1.4855, + "ppl": 5.1961, + "step": 9474 + }, + { + "epoch": 0.05, + "global_step": 9475, + "learning_rate": 0.00046128964941569286, + "loss": 1.656, + "loss_base2": 2.3891, + "loss_pixel": 0.1605, + "loss_text": 1.4955, + "ppl": 5.2383, + "step": 9475 + }, + { + "epoch": 0.05, + "global_step": 9476, + "learning_rate": 0.0004612854757929883, + "loss": 1.6444, + "loss_base2": 2.3724, + "loss_pixel": 0.16, + "loss_text": 1.4845, + "ppl": 5.1779, + "step": 9476 + }, + { + "epoch": 0.05, + "global_step": 9477, + "learning_rate": 0.0004612813021702838, + "loss": 1.6005, + "loss_base2": 2.309, + "loss_pixel": 0.1597, + "loss_text": 1.4409, + "ppl": 4.9555, + "step": 9477 + }, + { + "epoch": 0.05, + "global_step": 9478, + "learning_rate": 0.00046127712854757933, + "loss": 1.629, + "loss_base2": 2.3502, + "loss_pixel": 0.1575, + "loss_text": 1.4715, + "ppl": 5.0988, + "step": 9478 + }, + { + "epoch": 0.05, + "global_step": 9479, + "learning_rate": 0.00046127295492487484, + "loss": 1.6307, + "loss_base2": 2.3526, + "loss_pixel": 0.1582, + "loss_text": 1.4726, + "ppl": 5.1074, + "step": 9479 + }, + { + "epoch": 0.05, + "global_step": 9480, + "learning_rate": 0.0004612687813021703, + "loss": 1.6307, + "loss_base2": 2.3526, + "loss_pixel": 0.1578, + "loss_text": 1.4729, + "ppl": 5.1074, + "step": 9480 + }, + { + "epoch": 0.05, + "global_step": 9481, + "learning_rate": 0.00046126460767946574, + "loss": 1.6436, + "loss_base2": 2.3712, + "loss_pixel": 0.1595, + "loss_text": 1.4841, + "ppl": 5.1738, + "step": 9481 + }, + { + "epoch": 0.05, + "global_step": 9482, + "learning_rate": 0.00046126043405676125, + "loss": 1.6358, + "loss_base2": 2.36, + "loss_pixel": 0.1555, + "loss_text": 1.4803, + "ppl": 5.1336, + "step": 9482 + }, + { + "epoch": 0.05, + "global_step": 9483, + "learning_rate": 0.00046125626043405676, + "loss": 1.6466, + "loss_base2": 2.3755, + "loss_pixel": 0.1557, + "loss_text": 1.4908, + "ppl": 5.1893, + "step": 9483 + }, + { + "epoch": 0.05, + "global_step": 9484, + "learning_rate": 0.00046125208681135226, + "loss": 1.6056, + "loss_base2": 2.3164, + "loss_pixel": 0.1567, + "loss_text": 1.4489, + "ppl": 4.9808, + "step": 9484 + }, + { + "epoch": 0.05, + "global_step": 9485, + "learning_rate": 0.00046124791318864777, + "loss": 1.6374, + "loss_base2": 2.3623, + "loss_pixel": 0.1558, + "loss_text": 1.4816, + "ppl": 5.1418, + "step": 9485 + }, + { + "epoch": 0.05, + "global_step": 9486, + "learning_rate": 0.0004612437395659432, + "loss": 1.6392, + "loss_base2": 2.3649, + "loss_pixel": 0.1569, + "loss_text": 1.4823, + "ppl": 5.151, + "step": 9486 + }, + { + "epoch": 0.05, + "global_step": 9487, + "learning_rate": 0.00046123956594323873, + "loss": 1.6174, + "loss_base2": 2.3334, + "loss_pixel": 0.1559, + "loss_text": 1.4615, + "ppl": 5.04, + "step": 9487 + }, + { + "epoch": 0.05, + "global_step": 9488, + "learning_rate": 0.00046123539232053424, + "loss": 1.6102, + "loss_base2": 2.323, + "loss_pixel": 0.1542, + "loss_text": 1.4559, + "ppl": 5.0038, + "step": 9488 + }, + { + "epoch": 0.05, + "global_step": 9489, + "learning_rate": 0.00046123121869782975, + "loss": 1.6073, + "loss_base2": 2.3188, + "loss_pixel": 0.1567, + "loss_text": 1.4506, + "ppl": 4.9893, + "step": 9489 + }, + { + "epoch": 0.05, + "global_step": 9490, + "learning_rate": 0.0004612270450751252, + "loss": 1.639, + "loss_base2": 2.3646, + "loss_pixel": 0.1653, + "loss_text": 1.4737, + "ppl": 5.15, + "step": 9490 + }, + { + "epoch": 0.05, + "global_step": 9491, + "learning_rate": 0.0004612228714524207, + "loss": 1.4942, + "loss_base2": 2.1557, + "loss_pixel": 0.1675, + "loss_text": 1.3267, + "ppl": 4.4558, + "step": 9491 + }, + { + "epoch": 0.05, + "global_step": 9492, + "learning_rate": 0.0004612186978297162, + "loss": 1.4496, + "loss_base2": 2.0913, + "loss_pixel": 0.168, + "loss_text": 1.2816, + "ppl": 4.2614, + "step": 9492 + }, + { + "epoch": 0.05, + "global_step": 9493, + "learning_rate": 0.0004612145242070117, + "loss": 1.4396, + "loss_base2": 2.0769, + "loss_pixel": 0.1739, + "loss_text": 1.2657, + "ppl": 4.219, + "step": 9493 + }, + { + "epoch": 0.05, + "global_step": 9494, + "learning_rate": 0.00046121035058430723, + "loss": 1.4263, + "loss_base2": 2.0577, + "loss_pixel": 0.1721, + "loss_text": 1.2543, + "ppl": 4.1633, + "step": 9494 + }, + { + "epoch": 0.05, + "global_step": 9495, + "learning_rate": 0.0004612061769616027, + "loss": 1.4096, + "loss_base2": 2.0336, + "loss_pixel": 0.1703, + "loss_text": 1.2392, + "ppl": 4.0943, + "step": 9495 + }, + { + "epoch": 0.05, + "global_step": 9496, + "learning_rate": 0.0004612020033388982, + "loss": 1.4267, + "loss_base2": 2.0583, + "loss_pixel": 0.1697, + "loss_text": 1.257, + "ppl": 4.1649, + "step": 9496 + }, + { + "epoch": 0.05, + "global_step": 9497, + "learning_rate": 0.0004611978297161937, + "loss": 1.4006, + "loss_base2": 2.0206, + "loss_pixel": 0.1692, + "loss_text": 1.2314, + "ppl": 4.0576, + "step": 9497 + }, + { + "epoch": 0.05, + "global_step": 9498, + "learning_rate": 0.0004611936560934892, + "loss": 1.4174, + "loss_base2": 2.0449, + "loss_pixel": 0.169, + "loss_text": 1.2484, + "ppl": 4.1264, + "step": 9498 + }, + { + "epoch": 0.05, + "global_step": 9499, + "learning_rate": 0.0004611894824707846, + "loss": 1.3964, + "loss_base2": 2.0146, + "loss_pixel": 0.1672, + "loss_text": 1.2292, + "ppl": 4.0406, + "step": 9499 + }, + { + "epoch": 0.05, + "global_step": 9500, + "learning_rate": 0.0004611853088480801, + "loss": 1.4159, + "loss_base2": 2.0427, + "loss_pixel": 0.1665, + "loss_text": 1.2494, + "ppl": 4.1202, + "step": 9500 + }, + { + "epoch": 0.05, + "global_step": 9501, + "learning_rate": 0.0004611811352253756, + "loss": 1.4254, + "loss_base2": 2.0564, + "loss_pixel": 0.1674, + "loss_text": 1.258, + "ppl": 4.1595, + "step": 9501 + }, + { + "epoch": 0.05, + "global_step": 9502, + "learning_rate": 0.0004611769616026711, + "loss": 1.4177, + "loss_base2": 2.0453, + "loss_pixel": 0.1666, + "loss_text": 1.2511, + "ppl": 4.1276, + "step": 9502 + }, + { + "epoch": 0.05, + "global_step": 9503, + "learning_rate": 0.00046117278797996663, + "loss": 1.4292, + "loss_base2": 2.0619, + "loss_pixel": 0.1685, + "loss_text": 1.2608, + "ppl": 4.1754, + "step": 9503 + }, + { + "epoch": 0.05, + "global_step": 9504, + "learning_rate": 0.0004611686143572621, + "loss": 1.4099, + "loss_base2": 2.0341, + "loss_pixel": 0.1667, + "loss_text": 1.2432, + "ppl": 4.0955, + "step": 9504 + }, + { + "epoch": 0.05, + "global_step": 9505, + "learning_rate": 0.0004611644407345576, + "loss": 1.4258, + "loss_base2": 2.057, + "loss_pixel": 0.1668, + "loss_text": 1.2591, + "ppl": 4.1612, + "step": 9505 + }, + { + "epoch": 0.05, + "global_step": 9506, + "learning_rate": 0.0004611602671118531, + "loss": 1.4163, + "loss_base2": 2.0433, + "loss_pixel": 0.166, + "loss_text": 1.2502, + "ppl": 4.1218, + "step": 9506 + }, + { + "epoch": 0.05, + "global_step": 9507, + "learning_rate": 0.0004611560934891486, + "loss": 1.3986, + "loss_base2": 2.0178, + "loss_pixel": 0.1655, + "loss_text": 1.2331, + "ppl": 4.0495, + "step": 9507 + }, + { + "epoch": 0.05, + "global_step": 9508, + "learning_rate": 0.00046115191986644406, + "loss": 1.4075, + "loss_base2": 2.0306, + "loss_pixel": 0.1643, + "loss_text": 1.2432, + "ppl": 4.0857, + "step": 9508 + }, + { + "epoch": 0.05, + "global_step": 9509, + "learning_rate": 0.00046114774624373957, + "loss": 1.4252, + "loss_base2": 2.0561, + "loss_pixel": 0.1649, + "loss_text": 1.2603, + "ppl": 4.1587, + "step": 9509 + }, + { + "epoch": 0.05, + "global_step": 9510, + "learning_rate": 0.0004611435726210351, + "loss": 1.41, + "loss_base2": 2.0342, + "loss_pixel": 0.1667, + "loss_text": 1.2433, + "ppl": 4.096, + "step": 9510 + }, + { + "epoch": 0.05, + "global_step": 9511, + "learning_rate": 0.0004611393989983306, + "loss": 1.3865, + "loss_base2": 2.0003, + "loss_pixel": 0.1643, + "loss_text": 1.2222, + "ppl": 4.0008, + "step": 9511 + }, + { + "epoch": 0.05, + "global_step": 9512, + "learning_rate": 0.0004611352253756261, + "loss": 1.4015, + "loss_base2": 2.0219, + "loss_pixel": 0.1647, + "loss_text": 1.2368, + "ppl": 4.0613, + "step": 9512 + }, + { + "epoch": 0.05, + "global_step": 9513, + "learning_rate": 0.00046113105175292154, + "loss": 1.4074, + "loss_base2": 2.0304, + "loss_pixel": 0.1641, + "loss_text": 1.2433, + "ppl": 4.0853, + "step": 9513 + }, + { + "epoch": 0.05, + "global_step": 9514, + "learning_rate": 0.00046112687813021705, + "loss": 1.5845, + "loss_base2": 2.286, + "loss_pixel": 0.1642, + "loss_text": 1.4203, + "ppl": 4.8769, + "step": 9514 + }, + { + "epoch": 0.05, + "global_step": 9515, + "learning_rate": 0.00046112270450751256, + "loss": 1.6461, + "loss_base2": 2.3748, + "loss_pixel": 0.1644, + "loss_text": 1.4816, + "ppl": 5.1867, + "step": 9515 + }, + { + "epoch": 0.05, + "global_step": 9516, + "learning_rate": 0.00046111853088480806, + "loss": 1.6547, + "loss_base2": 2.3872, + "loss_pixel": 0.1642, + "loss_text": 1.4905, + "ppl": 5.2315, + "step": 9516 + }, + { + "epoch": 0.05, + "global_step": 9517, + "learning_rate": 0.00046111435726210346, + "loss": 1.6512, + "loss_base2": 2.3822, + "loss_pixel": 0.1659, + "loss_text": 1.4853, + "ppl": 5.2132, + "step": 9517 + }, + { + "epoch": 0.05, + "global_step": 9518, + "learning_rate": 0.00046111018363939897, + "loss": 1.6222, + "loss_base2": 2.3403, + "loss_pixel": 0.1647, + "loss_text": 1.4575, + "ppl": 5.0642, + "step": 9518 + }, + { + "epoch": 0.05, + "global_step": 9519, + "learning_rate": 0.0004611060100166945, + "loss": 1.6609, + "loss_base2": 2.3962, + "loss_pixel": 0.1637, + "loss_text": 1.4972, + "ppl": 5.264, + "step": 9519 + }, + { + "epoch": 0.05, + "global_step": 9520, + "learning_rate": 0.00046110183639399, + "loss": 1.6279, + "loss_base2": 2.3486, + "loss_pixel": 0.1644, + "loss_text": 1.4635, + "ppl": 5.0932, + "step": 9520 + }, + { + "epoch": 0.05, + "global_step": 9521, + "learning_rate": 0.0004610976627712855, + "loss": 1.6245, + "loss_base2": 2.3437, + "loss_pixel": 0.1627, + "loss_text": 1.4617, + "ppl": 5.0759, + "step": 9521 + }, + { + "epoch": 0.05, + "global_step": 9522, + "learning_rate": 0.00046109348914858095, + "loss": 1.6455, + "loss_base2": 2.374, + "loss_pixel": 0.1633, + "loss_text": 1.4822, + "ppl": 5.1836, + "step": 9522 + }, + { + "epoch": 0.05, + "global_step": 9523, + "learning_rate": 0.00046108931552587645, + "loss": 1.628, + "loss_base2": 2.3487, + "loss_pixel": 0.1642, + "loss_text": 1.4638, + "ppl": 5.0937, + "step": 9523 + }, + { + "epoch": 0.05, + "global_step": 9524, + "learning_rate": 0.00046108514190317196, + "loss": 1.634, + "loss_base2": 2.3574, + "loss_pixel": 0.1629, + "loss_text": 1.4712, + "ppl": 5.1243, + "step": 9524 + }, + { + "epoch": 0.05, + "global_step": 9525, + "learning_rate": 0.00046108096828046747, + "loss": 1.6316, + "loss_base2": 2.3539, + "loss_pixel": 0.1639, + "loss_text": 1.4677, + "ppl": 5.112, + "step": 9525 + }, + { + "epoch": 0.05, + "global_step": 9526, + "learning_rate": 0.0004610767946577629, + "loss": 1.6345, + "loss_base2": 2.3581, + "loss_pixel": 0.1624, + "loss_text": 1.4722, + "ppl": 5.1269, + "step": 9526 + }, + { + "epoch": 0.05, + "global_step": 9527, + "learning_rate": 0.00046107262103505843, + "loss": 1.6557, + "loss_base2": 2.3887, + "loss_pixel": 0.1631, + "loss_text": 1.4927, + "ppl": 5.2367, + "step": 9527 + }, + { + "epoch": 0.05, + "global_step": 9528, + "learning_rate": 0.00046106844741235394, + "loss": 1.644, + "loss_base2": 2.3718, + "loss_pixel": 0.1633, + "loss_text": 1.4807, + "ppl": 5.1758, + "step": 9528 + }, + { + "epoch": 0.05, + "global_step": 9529, + "learning_rate": 0.00046106427378964944, + "loss": 1.6258, + "loss_base2": 2.3455, + "loss_pixel": 0.1625, + "loss_text": 1.4633, + "ppl": 5.0825, + "step": 9529 + }, + { + "epoch": 0.05, + "global_step": 9530, + "learning_rate": 0.00046106010016694495, + "loss": 1.6274, + "loss_base2": 2.3478, + "loss_pixel": 0.1624, + "loss_text": 1.465, + "ppl": 5.0906, + "step": 9530 + }, + { + "epoch": 0.05, + "global_step": 9531, + "learning_rate": 0.0004610559265442404, + "loss": 1.6384, + "loss_base2": 2.3637, + "loss_pixel": 0.1638, + "loss_text": 1.4746, + "ppl": 5.1469, + "step": 9531 + }, + { + "epoch": 0.05, + "global_step": 9532, + "learning_rate": 0.0004610517529215359, + "loss": 1.6296, + "loss_base2": 2.351, + "loss_pixel": 0.1629, + "loss_text": 1.4667, + "ppl": 5.1018, + "step": 9532 + }, + { + "epoch": 0.05, + "global_step": 9533, + "learning_rate": 0.0004610475792988314, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1629, + "loss_text": 1.454, + "ppl": 5.0374, + "step": 9533 + }, + { + "epoch": 0.05, + "global_step": 9534, + "learning_rate": 0.0004610434056761269, + "loss": 1.6547, + "loss_base2": 2.3872, + "loss_pixel": 0.1625, + "loss_text": 1.4922, + "ppl": 5.2315, + "step": 9534 + }, + { + "epoch": 0.05, + "global_step": 9535, + "learning_rate": 0.0004610392320534224, + "loss": 1.6418, + "loss_base2": 2.3686, + "loss_pixel": 0.1635, + "loss_text": 1.4783, + "ppl": 5.1645, + "step": 9535 + }, + { + "epoch": 0.05, + "global_step": 9536, + "learning_rate": 0.00046103505843071783, + "loss": 1.6028, + "loss_base2": 2.3124, + "loss_pixel": 0.1633, + "loss_text": 1.4395, + "ppl": 4.9669, + "step": 9536 + }, + { + "epoch": 0.05, + "global_step": 9537, + "learning_rate": 0.00046103088480801334, + "loss": 1.596, + "loss_base2": 2.3025, + "loss_pixel": 0.1622, + "loss_text": 1.4338, + "ppl": 4.9333, + "step": 9537 + }, + { + "epoch": 0.05, + "global_step": 9538, + "learning_rate": 0.00046102671118530885, + "loss": 1.6435, + "loss_base2": 2.3711, + "loss_pixel": 0.163, + "loss_text": 1.4805, + "ppl": 5.1732, + "step": 9538 + }, + { + "epoch": 0.05, + "global_step": 9539, + "learning_rate": 0.00046102253756260435, + "loss": 1.6529, + "loss_base2": 2.3846, + "loss_pixel": 0.1628, + "loss_text": 1.49, + "ppl": 5.2221, + "step": 9539 + }, + { + "epoch": 0.05, + "global_step": 9540, + "learning_rate": 0.0004610183639398998, + "loss": 1.6252, + "loss_base2": 2.3447, + "loss_pixel": 0.163, + "loss_text": 1.4622, + "ppl": 5.0794, + "step": 9540 + }, + { + "epoch": 0.05, + "global_step": 9541, + "learning_rate": 0.0004610141903171953, + "loss": 1.6381, + "loss_base2": 2.3633, + "loss_pixel": 0.1634, + "loss_text": 1.4747, + "ppl": 5.1454, + "step": 9541 + }, + { + "epoch": 0.05, + "global_step": 9542, + "learning_rate": 0.0004610100166944908, + "loss": 1.6318, + "loss_base2": 2.3542, + "loss_pixel": 0.1637, + "loss_text": 1.4681, + "ppl": 5.1131, + "step": 9542 + }, + { + "epoch": 0.05, + "global_step": 9543, + "learning_rate": 0.00046100584307178633, + "loss": 1.6222, + "loss_base2": 2.3403, + "loss_pixel": 0.1628, + "loss_text": 1.4594, + "ppl": 5.0642, + "step": 9543 + }, + { + "epoch": 0.05, + "global_step": 9544, + "learning_rate": 0.00046100166944908184, + "loss": 1.6249, + "loss_base2": 2.3442, + "loss_pixel": 0.1645, + "loss_text": 1.4604, + "ppl": 5.0779, + "step": 9544 + }, + { + "epoch": 0.05, + "global_step": 9545, + "learning_rate": 0.0004609974958263773, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1641, + "loss_text": 1.4596, + "ppl": 5.0718, + "step": 9545 + }, + { + "epoch": 0.05, + "global_step": 9546, + "learning_rate": 0.0004609933222036728, + "loss": 1.621, + "loss_base2": 2.3386, + "loss_pixel": 0.1627, + "loss_text": 1.4583, + "ppl": 5.0581, + "step": 9546 + }, + { + "epoch": 0.05, + "global_step": 9547, + "learning_rate": 0.0004609891485809683, + "loss": 1.6224, + "loss_base2": 2.3406, + "loss_pixel": 0.1634, + "loss_text": 1.459, + "ppl": 5.0652, + "step": 9547 + }, + { + "epoch": 0.05, + "global_step": 9548, + "learning_rate": 0.0004609849749582638, + "loss": 1.6251, + "loss_base2": 2.3445, + "loss_pixel": 0.1621, + "loss_text": 1.463, + "ppl": 5.0789, + "step": 9548 + }, + { + "epoch": 0.05, + "global_step": 9549, + "learning_rate": 0.00046098080133555926, + "loss": 1.6346, + "loss_base2": 2.3582, + "loss_pixel": 0.1628, + "loss_text": 1.4719, + "ppl": 5.1274, + "step": 9549 + }, + { + "epoch": 0.05, + "global_step": 9550, + "learning_rate": 0.00046097662771285477, + "loss": 1.6217, + "loss_base2": 2.3396, + "loss_pixel": 0.1638, + "loss_text": 1.4578, + "ppl": 5.0617, + "step": 9550 + }, + { + "epoch": 0.05, + "global_step": 9551, + "learning_rate": 0.0004609724540901503, + "loss": 1.6217, + "loss_base2": 2.3396, + "loss_pixel": 0.1628, + "loss_text": 1.459, + "ppl": 5.0617, + "step": 9551 + }, + { + "epoch": 0.05, + "global_step": 9552, + "learning_rate": 0.0004609682804674458, + "loss": 1.6191, + "loss_base2": 2.3359, + "loss_pixel": 0.1619, + "loss_text": 1.4573, + "ppl": 5.0485, + "step": 9552 + }, + { + "epoch": 0.05, + "global_step": 9553, + "learning_rate": 0.0004609641068447413, + "loss": 1.6245, + "loss_base2": 2.3437, + "loss_pixel": 0.1624, + "loss_text": 1.4621, + "ppl": 5.0759, + "step": 9553 + }, + { + "epoch": 0.05, + "global_step": 9554, + "learning_rate": 0.00046095993322203675, + "loss": 1.6333, + "loss_base2": 2.3564, + "loss_pixel": 0.1623, + "loss_text": 1.4711, + "ppl": 5.1207, + "step": 9554 + }, + { + "epoch": 0.05, + "global_step": 9555, + "learning_rate": 0.0004609557595993322, + "loss": 1.6361, + "loss_base2": 2.3604, + "loss_pixel": 0.1631, + "loss_text": 1.473, + "ppl": 5.1351, + "step": 9555 + }, + { + "epoch": 0.05, + "global_step": 9556, + "learning_rate": 0.0004609515859766277, + "loss": 1.6427, + "loss_base2": 2.3699, + "loss_pixel": 0.1635, + "loss_text": 1.4792, + "ppl": 5.1691, + "step": 9556 + }, + { + "epoch": 0.05, + "global_step": 9557, + "learning_rate": 0.0004609474123539232, + "loss": 1.6266, + "loss_base2": 2.3467, + "loss_pixel": 0.1629, + "loss_text": 1.4637, + "ppl": 5.0866, + "step": 9557 + }, + { + "epoch": 0.05, + "global_step": 9558, + "learning_rate": 0.00046094323873121867, + "loss": 1.4597, + "loss_base2": 2.1059, + "loss_pixel": 0.1622, + "loss_text": 1.2975, + "ppl": 4.3047, + "step": 9558 + }, + { + "epoch": 0.05, + "global_step": 9559, + "learning_rate": 0.0004609390651085142, + "loss": 1.425, + "loss_base2": 2.0558, + "loss_pixel": 0.1631, + "loss_text": 1.2619, + "ppl": 4.1579, + "step": 9559 + }, + { + "epoch": 0.05, + "global_step": 9560, + "learning_rate": 0.0004609348914858097, + "loss": 1.3974, + "loss_base2": 2.016, + "loss_pixel": 0.1612, + "loss_text": 1.2362, + "ppl": 4.0447, + "step": 9560 + }, + { + "epoch": 0.05, + "global_step": 9561, + "learning_rate": 0.0004609307178631052, + "loss": 1.4231, + "loss_base2": 2.0531, + "loss_pixel": 0.1632, + "loss_text": 1.2599, + "ppl": 4.15, + "step": 9561 + }, + { + "epoch": 0.05, + "global_step": 9562, + "learning_rate": 0.0004609265442404007, + "loss": 1.385, + "loss_base2": 1.9981, + "loss_pixel": 0.1637, + "loss_text": 1.2214, + "ppl": 3.9948, + "step": 9562 + }, + { + "epoch": 0.05, + "global_step": 9563, + "learning_rate": 0.00046092237061769615, + "loss": 1.4228, + "loss_base2": 2.0527, + "loss_pixel": 0.1625, + "loss_text": 1.2603, + "ppl": 4.1487, + "step": 9563 + }, + { + "epoch": 0.05, + "global_step": 9564, + "learning_rate": 0.00046091819699499166, + "loss": 1.3921, + "loss_base2": 2.0084, + "loss_pixel": 0.1633, + "loss_text": 1.2288, + "ppl": 4.0233, + "step": 9564 + }, + { + "epoch": 0.05, + "global_step": 9565, + "learning_rate": 0.00046091402337228716, + "loss": 1.4203, + "loss_base2": 2.0491, + "loss_pixel": 0.1616, + "loss_text": 1.2587, + "ppl": 4.1384, + "step": 9565 + }, + { + "epoch": 0.05, + "global_step": 9566, + "learning_rate": 0.00046090984974958267, + "loss": 1.5782, + "loss_base2": 2.2769, + "loss_pixel": 0.1622, + "loss_text": 1.416, + "ppl": 4.8462, + "step": 9566 + }, + { + "epoch": 0.05, + "global_step": 9567, + "learning_rate": 0.0004609056761268781, + "loss": 1.6419, + "loss_base2": 2.3688, + "loss_pixel": 0.1637, + "loss_text": 1.4782, + "ppl": 5.165, + "step": 9567 + }, + { + "epoch": 0.05, + "global_step": 9568, + "learning_rate": 0.00046090150250417363, + "loss": 1.6415, + "loss_base2": 2.3682, + "loss_pixel": 0.1657, + "loss_text": 1.4759, + "ppl": 5.1629, + "step": 9568 + }, + { + "epoch": 0.05, + "global_step": 9569, + "learning_rate": 0.00046089732888146914, + "loss": 1.638, + "loss_base2": 2.3631, + "loss_pixel": 0.1629, + "loss_text": 1.4751, + "ppl": 5.1449, + "step": 9569 + }, + { + "epoch": 0.05, + "global_step": 9570, + "learning_rate": 0.00046089315525876465, + "loss": 1.6461, + "loss_base2": 2.3748, + "loss_pixel": 0.1626, + "loss_text": 1.4835, + "ppl": 5.1867, + "step": 9570 + }, + { + "epoch": 0.05, + "global_step": 9571, + "learning_rate": 0.00046088898163606015, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.1635, + "loss_text": 1.4761, + "ppl": 5.1531, + "step": 9571 + }, + { + "epoch": 0.05, + "global_step": 9572, + "learning_rate": 0.0004608848080133556, + "loss": 1.6269, + "loss_base2": 2.3471, + "loss_pixel": 0.1637, + "loss_text": 1.4633, + "ppl": 5.0881, + "step": 9572 + }, + { + "epoch": 0.05, + "global_step": 9573, + "learning_rate": 0.0004608806343906511, + "loss": 1.6314, + "loss_base2": 2.3536, + "loss_pixel": 0.1628, + "loss_text": 1.4686, + "ppl": 5.111, + "step": 9573 + }, + { + "epoch": 0.05, + "global_step": 9574, + "learning_rate": 0.00046087646076794657, + "loss": 1.6291, + "loss_base2": 2.3503, + "loss_pixel": 0.1621, + "loss_text": 1.4669, + "ppl": 5.0993, + "step": 9574 + }, + { + "epoch": 0.05, + "global_step": 9575, + "learning_rate": 0.0004608722871452421, + "loss": 1.6355, + "loss_base2": 2.3595, + "loss_pixel": 0.1625, + "loss_text": 1.473, + "ppl": 5.132, + "step": 9575 + }, + { + "epoch": 0.05, + "global_step": 9576, + "learning_rate": 0.00046086811352253753, + "loss": 1.633, + "loss_base2": 2.3559, + "loss_pixel": 0.1625, + "loss_text": 1.4705, + "ppl": 5.1192, + "step": 9576 + }, + { + "epoch": 0.05, + "global_step": 9577, + "learning_rate": 0.00046086393989983303, + "loss": 1.6129, + "loss_base2": 2.3269, + "loss_pixel": 0.1634, + "loss_text": 1.4496, + "ppl": 5.0173, + "step": 9577 + }, + { + "epoch": 0.05, + "global_step": 9578, + "learning_rate": 0.00046085976627712854, + "loss": 1.61, + "loss_base2": 2.3227, + "loss_pixel": 0.1615, + "loss_text": 1.4485, + "ppl": 5.0028, + "step": 9578 + }, + { + "epoch": 0.05, + "global_step": 9579, + "learning_rate": 0.00046085559265442405, + "loss": 1.6454, + "loss_base2": 2.3738, + "loss_pixel": 0.1617, + "loss_text": 1.4836, + "ppl": 5.1831, + "step": 9579 + }, + { + "epoch": 0.05, + "global_step": 9580, + "learning_rate": 0.00046085141903171956, + "loss": 1.623, + "loss_base2": 2.3415, + "loss_pixel": 0.163, + "loss_text": 1.46, + "ppl": 5.0683, + "step": 9580 + }, + { + "epoch": 0.05, + "global_step": 9581, + "learning_rate": 0.000460847245409015, + "loss": 1.6331, + "loss_base2": 2.3561, + "loss_pixel": 0.1621, + "loss_text": 1.471, + "ppl": 5.1197, + "step": 9581 + }, + { + "epoch": 0.05, + "global_step": 9582, + "learning_rate": 0.0004608430717863105, + "loss": 1.6259, + "loss_base2": 2.3457, + "loss_pixel": 0.1627, + "loss_text": 1.4631, + "ppl": 5.083, + "step": 9582 + }, + { + "epoch": 0.05, + "global_step": 9583, + "learning_rate": 0.000460838898163606, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.1622, + "loss_text": 1.468, + "ppl": 5.1049, + "step": 9583 + }, + { + "epoch": 0.05, + "global_step": 9584, + "learning_rate": 0.00046083472454090153, + "loss": 1.5799, + "loss_base2": 2.2793, + "loss_pixel": 0.1617, + "loss_text": 1.4182, + "ppl": 4.8545, + "step": 9584 + }, + { + "epoch": 0.05, + "global_step": 9585, + "learning_rate": 0.000460830550918197, + "loss": 1.6236, + "loss_base2": 2.3424, + "loss_pixel": 0.1619, + "loss_text": 1.4616, + "ppl": 5.0713, + "step": 9585 + }, + { + "epoch": 0.05, + "global_step": 9586, + "learning_rate": 0.0004608263772954925, + "loss": 1.6262, + "loss_base2": 2.3461, + "loss_pixel": 0.1611, + "loss_text": 1.4651, + "ppl": 5.0845, + "step": 9586 + }, + { + "epoch": 0.05, + "global_step": 9587, + "learning_rate": 0.000460822203672788, + "loss": 1.6269, + "loss_base2": 2.3471, + "loss_pixel": 0.1631, + "loss_text": 1.4639, + "ppl": 5.0881, + "step": 9587 + }, + { + "epoch": 0.05, + "global_step": 9588, + "learning_rate": 0.0004608180300500835, + "loss": 1.6092, + "loss_base2": 2.3216, + "loss_pixel": 0.1626, + "loss_text": 1.4466, + "ppl": 4.9988, + "step": 9588 + }, + { + "epoch": 0.05, + "global_step": 9589, + "learning_rate": 0.000460813856427379, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.1611, + "loss_text": 1.4718, + "ppl": 5.1187, + "step": 9589 + }, + { + "epoch": 0.05, + "global_step": 9590, + "learning_rate": 0.00046080968280467447, + "loss": 1.6354, + "loss_base2": 2.3594, + "loss_pixel": 0.1628, + "loss_text": 1.4726, + "ppl": 5.1315, + "step": 9590 + }, + { + "epoch": 0.05, + "global_step": 9591, + "learning_rate": 0.00046080550918197, + "loss": 1.628, + "loss_base2": 2.3487, + "loss_pixel": 0.1622, + "loss_text": 1.4658, + "ppl": 5.0937, + "step": 9591 + }, + { + "epoch": 0.05, + "global_step": 9592, + "learning_rate": 0.0004608013355592655, + "loss": 1.6188, + "loss_base2": 2.3354, + "loss_pixel": 0.1615, + "loss_text": 1.4574, + "ppl": 5.047, + "step": 9592 + }, + { + "epoch": 0.05, + "global_step": 9593, + "learning_rate": 0.00046079716193656093, + "loss": 1.6423, + "loss_base2": 2.3693, + "loss_pixel": 0.1611, + "loss_text": 1.4811, + "ppl": 5.167, + "step": 9593 + }, + { + "epoch": 0.05, + "global_step": 9594, + "learning_rate": 0.0004607929883138564, + "loss": 1.6389, + "loss_base2": 2.3644, + "loss_pixel": 0.1613, + "loss_text": 1.4776, + "ppl": 5.1495, + "step": 9594 + }, + { + "epoch": 0.05, + "global_step": 9595, + "learning_rate": 0.0004607888146911519, + "loss": 1.6207, + "loss_base2": 2.3382, + "loss_pixel": 0.1616, + "loss_text": 1.4591, + "ppl": 5.0566, + "step": 9595 + }, + { + "epoch": 0.05, + "global_step": 9596, + "learning_rate": 0.0004607846410684474, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.1621, + "loss_text": 1.4662, + "ppl": 5.0952, + "step": 9596 + }, + { + "epoch": 0.05, + "global_step": 9597, + "learning_rate": 0.0004607804674457429, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1616, + "loss_text": 1.4534, + "ppl": 5.0284, + "step": 9597 + }, + { + "epoch": 0.05, + "global_step": 9598, + "learning_rate": 0.0004607762938230384, + "loss": 1.6297, + "loss_base2": 2.3512, + "loss_pixel": 0.1621, + "loss_text": 1.4676, + "ppl": 5.1023, + "step": 9598 + }, + { + "epoch": 0.05, + "global_step": 9599, + "learning_rate": 0.00046077212020033387, + "loss": 1.6341, + "loss_base2": 2.3575, + "loss_pixel": 0.1629, + "loss_text": 1.4712, + "ppl": 5.1248, + "step": 9599 + }, + { + "epoch": 0.05, + "global_step": 9600, + "learning_rate": 0.0004607679465776294, + "loss": 1.6325, + "loss_base2": 2.3552, + "loss_pixel": 0.1627, + "loss_text": 1.4698, + "ppl": 5.1167, + "step": 9600 + }, + { + "epoch": 0.05, + "global_step": 9601, + "learning_rate": 0.0004607637729549249, + "loss": 1.6188, + "loss_base2": 2.3354, + "loss_pixel": 0.1624, + "loss_text": 1.4564, + "ppl": 5.047, + "step": 9601 + }, + { + "epoch": 0.05, + "global_step": 9602, + "learning_rate": 0.0004607595993322204, + "loss": 1.6401, + "loss_base2": 2.3662, + "loss_pixel": 0.1634, + "loss_text": 1.4767, + "ppl": 5.1557, + "step": 9602 + }, + { + "epoch": 0.05, + "global_step": 9603, + "learning_rate": 0.0004607554257095159, + "loss": 1.611, + "loss_base2": 2.3242, + "loss_pixel": 0.1624, + "loss_text": 1.4486, + "ppl": 5.0078, + "step": 9603 + }, + { + "epoch": 0.05, + "global_step": 9604, + "learning_rate": 0.00046075125208681135, + "loss": 1.6082, + "loss_base2": 2.3201, + "loss_pixel": 0.1628, + "loss_text": 1.4453, + "ppl": 4.9938, + "step": 9604 + }, + { + "epoch": 0.05, + "global_step": 9605, + "learning_rate": 0.00046074707846410686, + "loss": 1.6243, + "loss_base2": 2.3434, + "loss_pixel": 0.1626, + "loss_text": 1.4617, + "ppl": 5.0749, + "step": 9605 + }, + { + "epoch": 0.05, + "global_step": 9606, + "learning_rate": 0.00046074290484140237, + "loss": 1.6273, + "loss_base2": 2.3477, + "loss_pixel": 0.1631, + "loss_text": 1.4642, + "ppl": 5.0901, + "step": 9606 + }, + { + "epoch": 0.05, + "global_step": 9607, + "learning_rate": 0.0004607387312186979, + "loss": 1.6275, + "loss_base2": 2.348, + "loss_pixel": 0.1641, + "loss_text": 1.4634, + "ppl": 5.0911, + "step": 9607 + }, + { + "epoch": 0.05, + "global_step": 9608, + "learning_rate": 0.00046073455759599333, + "loss": 1.6406, + "loss_base2": 2.3669, + "loss_pixel": 0.1647, + "loss_text": 1.4759, + "ppl": 5.1583, + "step": 9608 + }, + { + "epoch": 0.05, + "global_step": 9609, + "learning_rate": 0.00046073038397328884, + "loss": 1.6177, + "loss_base2": 2.3338, + "loss_pixel": 0.1625, + "loss_text": 1.4551, + "ppl": 5.0415, + "step": 9609 + }, + { + "epoch": 0.05, + "global_step": 9610, + "learning_rate": 0.00046072621035058434, + "loss": 1.6298, + "loss_base2": 2.3513, + "loss_pixel": 0.1645, + "loss_text": 1.4653, + "ppl": 5.1029, + "step": 9610 + }, + { + "epoch": 0.05, + "global_step": 9611, + "learning_rate": 0.00046072203672787985, + "loss": 1.6142, + "loss_base2": 2.3288, + "loss_pixel": 0.1629, + "loss_text": 1.4513, + "ppl": 5.0239, + "step": 9611 + }, + { + "epoch": 0.05, + "global_step": 9612, + "learning_rate": 0.0004607178631051753, + "loss": 1.6175, + "loss_base2": 2.3336, + "loss_pixel": 0.1569, + "loss_text": 1.4605, + "ppl": 5.0405, + "step": 9612 + }, + { + "epoch": 0.05, + "global_step": 9613, + "learning_rate": 0.00046071368948247076, + "loss": 1.6202, + "loss_base2": 2.3375, + "loss_pixel": 0.1564, + "loss_text": 1.4638, + "ppl": 5.0541, + "step": 9613 + }, + { + "epoch": 0.05, + "global_step": 9614, + "learning_rate": 0.00046070951585976626, + "loss": 1.6118, + "loss_base2": 2.3253, + "loss_pixel": 0.1537, + "loss_text": 1.4582, + "ppl": 5.0118, + "step": 9614 + }, + { + "epoch": 0.05, + "global_step": 9615, + "learning_rate": 0.00046070534223706177, + "loss": 1.6003, + "loss_base2": 2.3087, + "loss_pixel": 0.156, + "loss_text": 1.4443, + "ppl": 4.9545, + "step": 9615 + }, + { + "epoch": 0.05, + "global_step": 9616, + "learning_rate": 0.0004607011686143573, + "loss": 1.5928, + "loss_base2": 2.2979, + "loss_pixel": 0.1534, + "loss_text": 1.4394, + "ppl": 4.9175, + "step": 9616 + }, + { + "epoch": 0.05, + "global_step": 9617, + "learning_rate": 0.00046069699499165273, + "loss": 1.6273, + "loss_base2": 2.3477, + "loss_pixel": 0.1564, + "loss_text": 1.4709, + "ppl": 5.0901, + "step": 9617 + }, + { + "epoch": 0.05, + "global_step": 9618, + "learning_rate": 0.00046069282136894824, + "loss": 1.6305, + "loss_base2": 2.3523, + "loss_pixel": 0.1545, + "loss_text": 1.476, + "ppl": 5.1064, + "step": 9618 + }, + { + "epoch": 0.05, + "global_step": 9619, + "learning_rate": 0.00046068864774624375, + "loss": 1.6261, + "loss_base2": 2.346, + "loss_pixel": 0.1546, + "loss_text": 1.4715, + "ppl": 5.084, + "step": 9619 + }, + { + "epoch": 0.05, + "global_step": 9620, + "learning_rate": 0.00046068447412353925, + "loss": 1.6017, + "loss_base2": 2.3108, + "loss_pixel": 0.1543, + "loss_text": 1.4475, + "ppl": 4.9615, + "step": 9620 + }, + { + "epoch": 0.05, + "global_step": 9621, + "learning_rate": 0.00046068030050083476, + "loss": 1.6214, + "loss_base2": 2.3392, + "loss_pixel": 0.1536, + "loss_text": 1.4678, + "ppl": 5.0602, + "step": 9621 + }, + { + "epoch": 0.05, + "global_step": 9622, + "learning_rate": 0.0004606761268781302, + "loss": 1.6231, + "loss_base2": 2.3416, + "loss_pixel": 0.1534, + "loss_text": 1.4698, + "ppl": 5.0688, + "step": 9622 + }, + { + "epoch": 0.05, + "global_step": 9623, + "learning_rate": 0.0004606719532554257, + "loss": 1.6109, + "loss_base2": 2.324, + "loss_pixel": 0.1545, + "loss_text": 1.4564, + "ppl": 5.0073, + "step": 9623 + }, + { + "epoch": 0.05, + "global_step": 9624, + "learning_rate": 0.00046066777963272123, + "loss": 1.6055, + "loss_base2": 2.3162, + "loss_pixel": 0.153, + "loss_text": 1.4524, + "ppl": 4.9803, + "step": 9624 + }, + { + "epoch": 0.05, + "global_step": 9625, + "learning_rate": 0.00046066360601001674, + "loss": 1.6147, + "loss_base2": 2.3295, + "loss_pixel": 0.1544, + "loss_text": 1.4603, + "ppl": 5.0264, + "step": 9625 + }, + { + "epoch": 0.05, + "global_step": 9626, + "learning_rate": 0.0004606594323873122, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1521, + "loss_text": 1.4649, + "ppl": 5.0374, + "step": 9626 + }, + { + "epoch": 0.05, + "global_step": 9627, + "learning_rate": 0.0004606552587646077, + "loss": 1.6268, + "loss_base2": 2.347, + "loss_pixel": 0.1531, + "loss_text": 1.4737, + "ppl": 5.0876, + "step": 9627 + }, + { + "epoch": 0.05, + "global_step": 9628, + "learning_rate": 0.0004606510851419032, + "loss": 1.6139, + "loss_base2": 2.3284, + "loss_pixel": 0.1627, + "loss_text": 1.4512, + "ppl": 5.0224, + "step": 9628 + }, + { + "epoch": 0.05, + "global_step": 9629, + "learning_rate": 0.0004606469115191987, + "loss": 1.6359, + "loss_base2": 2.3601, + "loss_pixel": 0.168, + "loss_text": 1.468, + "ppl": 5.1341, + "step": 9629 + }, + { + "epoch": 0.05, + "global_step": 9630, + "learning_rate": 0.00046064273789649416, + "loss": 1.6424, + "loss_base2": 2.3695, + "loss_pixel": 0.1676, + "loss_text": 1.4748, + "ppl": 5.1676, + "step": 9630 + }, + { + "epoch": 0.05, + "global_step": 9631, + "learning_rate": 0.0004606385642737896, + "loss": 1.6165, + "loss_base2": 2.3321, + "loss_pixel": 0.1535, + "loss_text": 1.463, + "ppl": 5.0354, + "step": 9631 + }, + { + "epoch": 0.05, + "global_step": 9632, + "learning_rate": 0.0004606343906510851, + "loss": 1.6113, + "loss_base2": 2.3246, + "loss_pixel": 0.1547, + "loss_text": 1.4565, + "ppl": 5.0093, + "step": 9632 + }, + { + "epoch": 0.05, + "global_step": 9633, + "learning_rate": 0.00046063021702838063, + "loss": 1.6193, + "loss_base2": 2.3362, + "loss_pixel": 0.1567, + "loss_text": 1.4627, + "ppl": 5.0496, + "step": 9633 + }, + { + "epoch": 0.05, + "global_step": 9634, + "learning_rate": 0.00046062604340567614, + "loss": 1.6166, + "loss_base2": 2.3323, + "loss_pixel": 0.1543, + "loss_text": 1.4623, + "ppl": 5.0359, + "step": 9634 + }, + { + "epoch": 0.05, + "global_step": 9635, + "learning_rate": 0.0004606218697829716, + "loss": 1.6009, + "loss_base2": 2.3096, + "loss_pixel": 0.1526, + "loss_text": 1.4482, + "ppl": 4.9575, + "step": 9635 + }, + { + "epoch": 0.05, + "global_step": 9636, + "learning_rate": 0.0004606176961602671, + "loss": 1.6245, + "loss_base2": 2.3437, + "loss_pixel": 0.1529, + "loss_text": 1.4717, + "ppl": 5.0759, + "step": 9636 + }, + { + "epoch": 0.05, + "global_step": 9637, + "learning_rate": 0.0004606135225375626, + "loss": 1.6069, + "loss_base2": 2.3183, + "loss_pixel": 0.1546, + "loss_text": 1.4523, + "ppl": 4.9873, + "step": 9637 + }, + { + "epoch": 0.05, + "global_step": 9638, + "learning_rate": 0.0004606093489148581, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1521, + "loss_text": 1.4739, + "ppl": 5.0835, + "step": 9638 + }, + { + "epoch": 0.05, + "global_step": 9639, + "learning_rate": 0.0004606051752921536, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.153, + "loss_text": 1.4529, + "ppl": 4.9823, + "step": 9639 + }, + { + "epoch": 0.05, + "global_step": 9640, + "learning_rate": 0.0004606010016694491, + "loss": 1.6234, + "loss_base2": 2.3421, + "loss_pixel": 0.1535, + "loss_text": 1.4698, + "ppl": 5.0703, + "step": 9640 + }, + { + "epoch": 0.05, + "global_step": 9641, + "learning_rate": 0.0004605968280467446, + "loss": 1.6157, + "loss_base2": 2.331, + "loss_pixel": 0.1521, + "loss_text": 1.4636, + "ppl": 5.0314, + "step": 9641 + }, + { + "epoch": 0.05, + "global_step": 9642, + "learning_rate": 0.0004605926544240401, + "loss": 1.6049, + "loss_base2": 2.3154, + "loss_pixel": 0.1547, + "loss_text": 1.4501, + "ppl": 4.9774, + "step": 9642 + }, + { + "epoch": 0.05, + "global_step": 9643, + "learning_rate": 0.0004605884808013356, + "loss": 1.622, + "loss_base2": 2.3401, + "loss_pixel": 0.1518, + "loss_text": 1.4703, + "ppl": 5.0632, + "step": 9643 + }, + { + "epoch": 0.05, + "global_step": 9644, + "learning_rate": 0.00046058430717863105, + "loss": 1.6234, + "loss_base2": 2.3421, + "loss_pixel": 0.1515, + "loss_text": 1.4719, + "ppl": 5.0703, + "step": 9644 + }, + { + "epoch": 0.05, + "global_step": 9645, + "learning_rate": 0.00046058013355592656, + "loss": 1.6029, + "loss_base2": 2.3125, + "loss_pixel": 0.1544, + "loss_text": 1.4485, + "ppl": 4.9674, + "step": 9645 + }, + { + "epoch": 0.05, + "global_step": 9646, + "learning_rate": 0.00046057595993322206, + "loss": 1.6048, + "loss_base2": 2.3152, + "loss_pixel": 0.1502, + "loss_text": 1.4547, + "ppl": 4.9769, + "step": 9646 + }, + { + "epoch": 0.05, + "global_step": 9647, + "learning_rate": 0.00046057178631051757, + "loss": 1.5867, + "loss_base2": 2.2891, + "loss_pixel": 0.156, + "loss_text": 1.4307, + "ppl": 4.8876, + "step": 9647 + }, + { + "epoch": 0.05, + "global_step": 9648, + "learning_rate": 0.0004605676126878131, + "loss": 1.6295, + "loss_base2": 2.3509, + "loss_pixel": 0.1637, + "loss_text": 1.4658, + "ppl": 5.1013, + "step": 9648 + }, + { + "epoch": 0.05, + "global_step": 9649, + "learning_rate": 0.0004605634390651085, + "loss": 1.6357, + "loss_base2": 2.3598, + "loss_pixel": 0.1637, + "loss_text": 1.472, + "ppl": 5.133, + "step": 9649 + }, + { + "epoch": 0.05, + "global_step": 9650, + "learning_rate": 0.000460559265442404, + "loss": 1.6032, + "loss_base2": 2.3129, + "loss_pixel": 0.1638, + "loss_text": 1.4395, + "ppl": 4.9689, + "step": 9650 + }, + { + "epoch": 0.05, + "global_step": 9651, + "learning_rate": 0.0004605550918196995, + "loss": 1.6282, + "loss_base2": 2.349, + "loss_pixel": 0.1631, + "loss_text": 1.4651, + "ppl": 5.0947, + "step": 9651 + }, + { + "epoch": 0.05, + "global_step": 9652, + "learning_rate": 0.000460550918196995, + "loss": 1.6165, + "loss_base2": 2.3321, + "loss_pixel": 0.1625, + "loss_text": 1.4541, + "ppl": 5.0354, + "step": 9652 + }, + { + "epoch": 0.05, + "global_step": 9653, + "learning_rate": 0.00046054674457429045, + "loss": 1.6321, + "loss_base2": 2.3546, + "loss_pixel": 0.1646, + "loss_text": 1.4675, + "ppl": 5.1146, + "step": 9653 + }, + { + "epoch": 0.05, + "global_step": 9654, + "learning_rate": 0.00046054257095158596, + "loss": 1.6514, + "loss_base2": 2.3825, + "loss_pixel": 0.1627, + "loss_text": 1.4887, + "ppl": 5.2143, + "step": 9654 + }, + { + "epoch": 0.05, + "global_step": 9655, + "learning_rate": 0.00046053839732888147, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.162, + "loss_text": 1.4775, + "ppl": 5.1531, + "step": 9655 + }, + { + "epoch": 0.05, + "global_step": 9656, + "learning_rate": 0.000460534223706177, + "loss": 1.6373, + "loss_base2": 2.3621, + "loss_pixel": 0.1623, + "loss_text": 1.475, + "ppl": 5.1413, + "step": 9656 + }, + { + "epoch": 0.05, + "global_step": 9657, + "learning_rate": 0.0004605300500834725, + "loss": 1.6119, + "loss_base2": 2.3255, + "loss_pixel": 0.1617, + "loss_text": 1.4502, + "ppl": 5.0123, + "step": 9657 + }, + { + "epoch": 0.05, + "global_step": 9658, + "learning_rate": 0.00046052587646076793, + "loss": 1.63, + "loss_base2": 2.3516, + "loss_pixel": 0.1621, + "loss_text": 1.468, + "ppl": 5.1039, + "step": 9658 + }, + { + "epoch": 0.05, + "global_step": 9659, + "learning_rate": 0.00046052170283806344, + "loss": 1.6252, + "loss_base2": 2.3447, + "loss_pixel": 0.1626, + "loss_text": 1.4626, + "ppl": 5.0794, + "step": 9659 + }, + { + "epoch": 0.05, + "global_step": 9660, + "learning_rate": 0.00046051752921535895, + "loss": 1.6387, + "loss_base2": 2.3641, + "loss_pixel": 0.1629, + "loss_text": 1.4759, + "ppl": 5.1485, + "step": 9660 + }, + { + "epoch": 0.05, + "global_step": 9661, + "learning_rate": 0.00046051335559265446, + "loss": 1.6251, + "loss_base2": 2.3445, + "loss_pixel": 0.1628, + "loss_text": 1.4623, + "ppl": 5.0789, + "step": 9661 + }, + { + "epoch": 0.05, + "global_step": 9662, + "learning_rate": 0.00046050918196994996, + "loss": 1.6268, + "loss_base2": 2.347, + "loss_pixel": 0.1627, + "loss_text": 1.4641, + "ppl": 5.0876, + "step": 9662 + }, + { + "epoch": 0.05, + "global_step": 9663, + "learning_rate": 0.0004605050083472454, + "loss": 1.6167, + "loss_base2": 2.3324, + "loss_pixel": 0.1618, + "loss_text": 1.4549, + "ppl": 5.0364, + "step": 9663 + }, + { + "epoch": 0.05, + "global_step": 9664, + "learning_rate": 0.0004605008347245409, + "loss": 1.6335, + "loss_base2": 2.3566, + "loss_pixel": 0.1618, + "loss_text": 1.4718, + "ppl": 5.1218, + "step": 9664 + }, + { + "epoch": 0.05, + "global_step": 9665, + "learning_rate": 0.00046049666110183643, + "loss": 1.5985, + "loss_base2": 2.3061, + "loss_pixel": 0.1629, + "loss_text": 1.4356, + "ppl": 4.9456, + "step": 9665 + }, + { + "epoch": 0.05, + "global_step": 9666, + "learning_rate": 0.00046049248747913194, + "loss": 1.6183, + "loss_base2": 2.3347, + "loss_pixel": 0.1609, + "loss_text": 1.4574, + "ppl": 5.0445, + "step": 9666 + }, + { + "epoch": 0.05, + "global_step": 9667, + "learning_rate": 0.0004604883138564274, + "loss": 1.623, + "loss_base2": 2.3415, + "loss_pixel": 0.1633, + "loss_text": 1.4597, + "ppl": 5.0683, + "step": 9667 + }, + { + "epoch": 0.05, + "global_step": 9668, + "learning_rate": 0.00046048414023372285, + "loss": 1.6089, + "loss_base2": 2.3212, + "loss_pixel": 0.1613, + "loss_text": 1.4477, + "ppl": 4.9973, + "step": 9668 + }, + { + "epoch": 0.05, + "global_step": 9669, + "learning_rate": 0.00046047996661101835, + "loss": 1.5991, + "loss_base2": 2.307, + "loss_pixel": 0.1615, + "loss_text": 1.4376, + "ppl": 4.9486, + "step": 9669 + }, + { + "epoch": 0.05, + "global_step": 9670, + "learning_rate": 0.00046047579298831386, + "loss": 1.5952, + "loss_base2": 2.3014, + "loss_pixel": 0.1623, + "loss_text": 1.4329, + "ppl": 4.9293, + "step": 9670 + }, + { + "epoch": 0.05, + "global_step": 9671, + "learning_rate": 0.00046047161936560937, + "loss": 1.6301, + "loss_base2": 2.3517, + "loss_pixel": 0.1625, + "loss_text": 1.4676, + "ppl": 5.1044, + "step": 9671 + }, + { + "epoch": 0.05, + "global_step": 9672, + "learning_rate": 0.0004604674457429048, + "loss": 1.6239, + "loss_base2": 2.3428, + "loss_pixel": 0.1607, + "loss_text": 1.4633, + "ppl": 5.0728, + "step": 9672 + }, + { + "epoch": 0.05, + "global_step": 9673, + "learning_rate": 0.00046046327212020033, + "loss": 1.6293, + "loss_base2": 2.3506, + "loss_pixel": 0.1614, + "loss_text": 1.4679, + "ppl": 5.1003, + "step": 9673 + }, + { + "epoch": 0.05, + "global_step": 9674, + "learning_rate": 0.00046045909849749584, + "loss": 1.6141, + "loss_base2": 2.3287, + "loss_pixel": 0.1623, + "loss_text": 1.4519, + "ppl": 5.0234, + "step": 9674 + }, + { + "epoch": 0.05, + "global_step": 9675, + "learning_rate": 0.00046045492487479134, + "loss": 1.6389, + "loss_base2": 2.3644, + "loss_pixel": 0.1634, + "loss_text": 1.4755, + "ppl": 5.1495, + "step": 9675 + }, + { + "epoch": 0.05, + "global_step": 9676, + "learning_rate": 0.0004604507512520868, + "loss": 1.6318, + "loss_base2": 2.3542, + "loss_pixel": 0.161, + "loss_text": 1.4708, + "ppl": 5.1131, + "step": 9676 + }, + { + "epoch": 0.05, + "global_step": 9677, + "learning_rate": 0.0004604465776293823, + "loss": 1.6129, + "loss_base2": 2.3269, + "loss_pixel": 0.1618, + "loss_text": 1.4511, + "ppl": 5.0173, + "step": 9677 + }, + { + "epoch": 0.05, + "global_step": 9678, + "learning_rate": 0.0004604424040066778, + "loss": 1.6215, + "loss_base2": 2.3393, + "loss_pixel": 0.1603, + "loss_text": 1.4612, + "ppl": 5.0607, + "step": 9678 + }, + { + "epoch": 0.05, + "global_step": 9679, + "learning_rate": 0.0004604382303839733, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.1612, + "loss_text": 1.4447, + "ppl": 4.9823, + "step": 9679 + }, + { + "epoch": 0.05, + "global_step": 9680, + "learning_rate": 0.0004604340567612688, + "loss": 1.6098, + "loss_base2": 2.3225, + "loss_pixel": 0.1614, + "loss_text": 1.4485, + "ppl": 5.0018, + "step": 9680 + }, + { + "epoch": 0.05, + "global_step": 9681, + "learning_rate": 0.0004604298831385643, + "loss": 1.5905, + "loss_base2": 2.2946, + "loss_pixel": 0.1617, + "loss_text": 1.4288, + "ppl": 4.9062, + "step": 9681 + }, + { + "epoch": 0.05, + "global_step": 9682, + "learning_rate": 0.0004604257095158598, + "loss": 1.6231, + "loss_base2": 2.3416, + "loss_pixel": 0.1608, + "loss_text": 1.4623, + "ppl": 5.0688, + "step": 9682 + }, + { + "epoch": 0.05, + "global_step": 9683, + "learning_rate": 0.0004604215358931553, + "loss": 1.6339, + "loss_base2": 2.3572, + "loss_pixel": 0.1624, + "loss_text": 1.4716, + "ppl": 5.1238, + "step": 9683 + }, + { + "epoch": 0.05, + "global_step": 9684, + "learning_rate": 0.0004604173622704508, + "loss": 1.6143, + "loss_base2": 2.3289, + "loss_pixel": 0.162, + "loss_text": 1.4523, + "ppl": 5.0244, + "step": 9684 + }, + { + "epoch": 0.05, + "global_step": 9685, + "learning_rate": 0.00046041318864774625, + "loss": 1.6249, + "loss_base2": 2.3442, + "loss_pixel": 0.1621, + "loss_text": 1.4628, + "ppl": 5.0779, + "step": 9685 + }, + { + "epoch": 0.05, + "global_step": 9686, + "learning_rate": 0.0004604090150250417, + "loss": 1.6404, + "loss_base2": 2.3666, + "loss_pixel": 0.1604, + "loss_text": 1.48, + "ppl": 5.1572, + "step": 9686 + }, + { + "epoch": 0.05, + "global_step": 9687, + "learning_rate": 0.0004604048414023372, + "loss": 1.6257, + "loss_base2": 2.3454, + "loss_pixel": 0.1619, + "loss_text": 1.4639, + "ppl": 5.082, + "step": 9687 + }, + { + "epoch": 0.05, + "global_step": 9688, + "learning_rate": 0.0004604006677796327, + "loss": 1.6227, + "loss_base2": 2.3411, + "loss_pixel": 0.1601, + "loss_text": 1.4626, + "ppl": 5.0668, + "step": 9688 + }, + { + "epoch": 0.05, + "global_step": 9689, + "learning_rate": 0.00046039649415692823, + "loss": 1.6196, + "loss_base2": 2.3366, + "loss_pixel": 0.1604, + "loss_text": 1.4592, + "ppl": 5.0511, + "step": 9689 + }, + { + "epoch": 0.05, + "global_step": 9690, + "learning_rate": 0.0004603923205342237, + "loss": 1.6251, + "loss_base2": 2.3445, + "loss_pixel": 0.1612, + "loss_text": 1.4638, + "ppl": 5.0789, + "step": 9690 + }, + { + "epoch": 0.05, + "global_step": 9691, + "learning_rate": 0.0004603881469115192, + "loss": 1.6171, + "loss_base2": 2.333, + "loss_pixel": 0.1612, + "loss_text": 1.456, + "ppl": 5.0385, + "step": 9691 + }, + { + "epoch": 0.05, + "global_step": 9692, + "learning_rate": 0.0004603839732888147, + "loss": 1.6126, + "loss_base2": 2.3265, + "loss_pixel": 0.163, + "loss_text": 1.4496, + "ppl": 5.0158, + "step": 9692 + }, + { + "epoch": 0.05, + "global_step": 9693, + "learning_rate": 0.0004603797996661102, + "loss": 1.6108, + "loss_base2": 2.3239, + "loss_pixel": 0.1637, + "loss_text": 1.4471, + "ppl": 5.0068, + "step": 9693 + }, + { + "epoch": 0.05, + "global_step": 9694, + "learning_rate": 0.00046037562604340566, + "loss": 1.6247, + "loss_base2": 2.3439, + "loss_pixel": 0.1615, + "loss_text": 1.4632, + "ppl": 5.0769, + "step": 9694 + }, + { + "epoch": 0.05, + "global_step": 9695, + "learning_rate": 0.00046037145242070116, + "loss": 1.6247, + "loss_base2": 2.3439, + "loss_pixel": 0.1611, + "loss_text": 1.4636, + "ppl": 5.0769, + "step": 9695 + }, + { + "epoch": 0.05, + "global_step": 9696, + "learning_rate": 0.00046036727879799667, + "loss": 1.6152, + "loss_base2": 2.3302, + "loss_pixel": 0.1609, + "loss_text": 1.4543, + "ppl": 5.0289, + "step": 9696 + }, + { + "epoch": 0.05, + "global_step": 9697, + "learning_rate": 0.0004603631051752922, + "loss": 1.6265, + "loss_base2": 2.3465, + "loss_pixel": 0.1606, + "loss_text": 1.466, + "ppl": 5.086, + "step": 9697 + }, + { + "epoch": 0.05, + "global_step": 9698, + "learning_rate": 0.0004603589315525877, + "loss": 1.6213, + "loss_base2": 2.339, + "loss_pixel": 0.1616, + "loss_text": 1.4598, + "ppl": 5.0597, + "step": 9698 + }, + { + "epoch": 0.05, + "global_step": 9699, + "learning_rate": 0.00046035475792988314, + "loss": 1.6376, + "loss_base2": 2.3626, + "loss_pixel": 0.1637, + "loss_text": 1.4739, + "ppl": 5.1428, + "step": 9699 + }, + { + "epoch": 0.05, + "global_step": 9700, + "learning_rate": 0.00046035058430717865, + "loss": 1.6307, + "loss_base2": 2.3526, + "loss_pixel": 0.1607, + "loss_text": 1.47, + "ppl": 5.1074, + "step": 9700 + }, + { + "epoch": 0.05, + "global_step": 9701, + "learning_rate": 0.00046034641068447415, + "loss": 1.6183, + "loss_base2": 2.3347, + "loss_pixel": 0.1623, + "loss_text": 1.456, + "ppl": 5.0445, + "step": 9701 + }, + { + "epoch": 0.05, + "global_step": 9702, + "learning_rate": 0.00046034223706176966, + "loss": 1.6271, + "loss_base2": 2.3474, + "loss_pixel": 0.1625, + "loss_text": 1.4646, + "ppl": 5.0891, + "step": 9702 + }, + { + "epoch": 0.05, + "global_step": 9703, + "learning_rate": 0.0004603380634390651, + "loss": 1.6089, + "loss_base2": 2.3212, + "loss_pixel": 0.1622, + "loss_text": 1.4466, + "ppl": 4.9973, + "step": 9703 + }, + { + "epoch": 0.05, + "global_step": 9704, + "learning_rate": 0.0004603338898163606, + "loss": 1.4563, + "loss_base2": 2.101, + "loss_pixel": 0.1612, + "loss_text": 1.2951, + "ppl": 4.2901, + "step": 9704 + }, + { + "epoch": 0.05, + "global_step": 9705, + "learning_rate": 0.0004603297161936561, + "loss": 1.4194, + "loss_base2": 2.0478, + "loss_pixel": 0.1628, + "loss_text": 1.2566, + "ppl": 4.1346, + "step": 9705 + }, + { + "epoch": 0.05, + "global_step": 9706, + "learning_rate": 0.0004603255425709516, + "loss": 1.4172, + "loss_base2": 2.0446, + "loss_pixel": 0.1588, + "loss_text": 1.2584, + "ppl": 4.1256, + "step": 9706 + }, + { + "epoch": 0.05, + "global_step": 9707, + "learning_rate": 0.0004603213689482471, + "loss": 1.3974, + "loss_base2": 2.016, + "loss_pixel": 0.154, + "loss_text": 1.2435, + "ppl": 4.0447, + "step": 9707 + }, + { + "epoch": 0.05, + "global_step": 9708, + "learning_rate": 0.00046031719532554254, + "loss": 1.3827, + "loss_base2": 1.9948, + "loss_pixel": 0.1514, + "loss_text": 1.2313, + "ppl": 3.9856, + "step": 9708 + }, + { + "epoch": 0.05, + "global_step": 9709, + "learning_rate": 0.00046031302170283805, + "loss": 1.4, + "loss_base2": 2.0198, + "loss_pixel": 0.155, + "loss_text": 1.245, + "ppl": 4.0552, + "step": 9709 + }, + { + "epoch": 0.05, + "global_step": 9710, + "learning_rate": 0.00046030884808013356, + "loss": 1.3993, + "loss_base2": 2.0188, + "loss_pixel": 0.1526, + "loss_text": 1.2466, + "ppl": 4.0524, + "step": 9710 + }, + { + "epoch": 0.05, + "global_step": 9711, + "learning_rate": 0.00046030467445742906, + "loss": 1.3884, + "loss_base2": 2.003, + "loss_pixel": 0.1539, + "loss_text": 1.2345, + "ppl": 4.0084, + "step": 9711 + }, + { + "epoch": 0.05, + "global_step": 9712, + "learning_rate": 0.00046030050083472457, + "loss": 1.3943, + "loss_base2": 2.0115, + "loss_pixel": 0.1514, + "loss_text": 1.2429, + "ppl": 4.0322, + "step": 9712 + }, + { + "epoch": 0.05, + "global_step": 9713, + "learning_rate": 0.00046029632721202, + "loss": 1.4, + "loss_base2": 2.0198, + "loss_pixel": 0.151, + "loss_text": 1.2491, + "ppl": 4.0552, + "step": 9713 + }, + { + "epoch": 0.05, + "global_step": 9714, + "learning_rate": 0.00046029215358931553, + "loss": 1.3997, + "loss_base2": 2.0193, + "loss_pixel": 0.1538, + "loss_text": 1.2459, + "ppl": 4.054, + "step": 9714 + }, + { + "epoch": 0.05, + "global_step": 9715, + "learning_rate": 0.00046028797996661104, + "loss": 1.4082, + "loss_base2": 2.0316, + "loss_pixel": 0.1543, + "loss_text": 1.2539, + "ppl": 4.0886, + "step": 9715 + }, + { + "epoch": 0.05, + "global_step": 9716, + "learning_rate": 0.00046028380634390655, + "loss": 1.3924, + "loss_base2": 2.0088, + "loss_pixel": 0.1529, + "loss_text": 1.2395, + "ppl": 4.0245, + "step": 9716 + }, + { + "epoch": 0.05, + "global_step": 9717, + "learning_rate": 0.000460279632721202, + "loss": 1.4099, + "loss_base2": 2.0341, + "loss_pixel": 0.1552, + "loss_text": 1.2546, + "ppl": 4.0955, + "step": 9717 + }, + { + "epoch": 0.05, + "global_step": 9718, + "learning_rate": 0.0004602754590984975, + "loss": 1.3861, + "loss_base2": 1.9997, + "loss_pixel": 0.154, + "loss_text": 1.2321, + "ppl": 3.9992, + "step": 9718 + }, + { + "epoch": 0.05, + "global_step": 9719, + "learning_rate": 0.000460271285475793, + "loss": 1.413, + "loss_base2": 2.0385, + "loss_pixel": 0.1502, + "loss_text": 1.2628, + "ppl": 4.1083, + "step": 9719 + }, + { + "epoch": 0.05, + "global_step": 9720, + "learning_rate": 0.0004602671118530885, + "loss": 1.3891, + "loss_base2": 2.004, + "loss_pixel": 0.1503, + "loss_text": 1.2388, + "ppl": 4.0112, + "step": 9720 + }, + { + "epoch": 0.05, + "global_step": 9721, + "learning_rate": 0.00046026293823038403, + "loss": 1.4008, + "loss_base2": 2.0209, + "loss_pixel": 0.1504, + "loss_text": 1.2504, + "ppl": 4.0584, + "step": 9721 + }, + { + "epoch": 0.05, + "global_step": 9722, + "learning_rate": 0.0004602587646076795, + "loss": 1.3882, + "loss_base2": 2.0027, + "loss_pixel": 0.1526, + "loss_text": 1.2356, + "ppl": 4.0076, + "step": 9722 + }, + { + "epoch": 0.05, + "global_step": 9723, + "learning_rate": 0.000460254590984975, + "loss": 1.4035, + "loss_base2": 2.0248, + "loss_pixel": 0.1609, + "loss_text": 1.2426, + "ppl": 4.0694, + "step": 9723 + }, + { + "epoch": 0.05, + "global_step": 9724, + "learning_rate": 0.00046025041736227044, + "loss": 1.4019, + "loss_base2": 2.0225, + "loss_pixel": 0.166, + "loss_text": 1.236, + "ppl": 4.0629, + "step": 9724 + }, + { + "epoch": 0.05, + "global_step": 9725, + "learning_rate": 0.00046024624373956595, + "loss": 1.3939, + "loss_base2": 2.011, + "loss_pixel": 0.1669, + "loss_text": 1.2269, + "ppl": 4.0305, + "step": 9725 + }, + { + "epoch": 0.05, + "global_step": 9726, + "learning_rate": 0.0004602420701168614, + "loss": 1.3993, + "loss_base2": 2.0188, + "loss_pixel": 0.1648, + "loss_text": 1.2346, + "ppl": 4.0524, + "step": 9726 + }, + { + "epoch": 0.05, + "global_step": 9727, + "learning_rate": 0.0004602378964941569, + "loss": 1.4091, + "loss_base2": 2.0329, + "loss_pixel": 0.1658, + "loss_text": 1.2433, + "ppl": 4.0923, + "step": 9727 + }, + { + "epoch": 0.05, + "global_step": 9728, + "learning_rate": 0.0004602337228714524, + "loss": 1.4175, + "loss_base2": 2.045, + "loss_pixel": 0.1646, + "loss_text": 1.2529, + "ppl": 4.1268, + "step": 9728 + }, + { + "epoch": 0.05, + "global_step": 9729, + "learning_rate": 0.0004602295492487479, + "loss": 1.4099, + "loss_base2": 2.0341, + "loss_pixel": 0.1635, + "loss_text": 1.2464, + "ppl": 4.0955, + "step": 9729 + }, + { + "epoch": 0.05, + "global_step": 9730, + "learning_rate": 0.00046022537562604343, + "loss": 1.4153, + "loss_base2": 2.0418, + "loss_pixel": 0.1634, + "loss_text": 1.252, + "ppl": 4.1177, + "step": 9730 + }, + { + "epoch": 0.05, + "global_step": 9731, + "learning_rate": 0.0004602212020033389, + "loss": 1.4018, + "loss_base2": 2.0224, + "loss_pixel": 0.1625, + "loss_text": 1.2393, + "ppl": 4.0625, + "step": 9731 + }, + { + "epoch": 0.05, + "global_step": 9732, + "learning_rate": 0.0004602170283806344, + "loss": 1.3983, + "loss_base2": 2.0173, + "loss_pixel": 0.1631, + "loss_text": 1.2352, + "ppl": 4.0483, + "step": 9732 + }, + { + "epoch": 0.05, + "global_step": 9733, + "learning_rate": 0.0004602128547579299, + "loss": 1.3992, + "loss_base2": 2.0186, + "loss_pixel": 0.1651, + "loss_text": 1.2341, + "ppl": 4.052, + "step": 9733 + }, + { + "epoch": 0.05, + "global_step": 9734, + "learning_rate": 0.0004602086811352254, + "loss": 1.4326, + "loss_base2": 2.0668, + "loss_pixel": 0.1631, + "loss_text": 1.2695, + "ppl": 4.1896, + "step": 9734 + }, + { + "epoch": 0.05, + "global_step": 9735, + "learning_rate": 0.00046020450751252086, + "loss": 1.3961, + "loss_base2": 2.0141, + "loss_pixel": 0.1626, + "loss_text": 1.2335, + "ppl": 4.0394, + "step": 9735 + }, + { + "epoch": 0.05, + "global_step": 9736, + "learning_rate": 0.00046020033388981637, + "loss": 1.412, + "loss_base2": 2.0371, + "loss_pixel": 0.1627, + "loss_text": 1.2493, + "ppl": 4.1042, + "step": 9736 + }, + { + "epoch": 0.05, + "global_step": 9737, + "learning_rate": 0.0004601961602671119, + "loss": 1.4033, + "loss_base2": 2.0245, + "loss_pixel": 0.1629, + "loss_text": 1.2404, + "ppl": 4.0686, + "step": 9737 + }, + { + "epoch": 0.05, + "global_step": 9738, + "learning_rate": 0.0004601919866444074, + "loss": 1.3857, + "loss_base2": 1.9991, + "loss_pixel": 0.1627, + "loss_text": 1.223, + "ppl": 3.9976, + "step": 9738 + }, + { + "epoch": 0.05, + "global_step": 9739, + "learning_rate": 0.0004601878130217029, + "loss": 1.4159, + "loss_base2": 2.0427, + "loss_pixel": 0.1621, + "loss_text": 1.2538, + "ppl": 4.1202, + "step": 9739 + }, + { + "epoch": 0.05, + "global_step": 9740, + "learning_rate": 0.00046018363939899834, + "loss": 1.3938, + "loss_base2": 2.0108, + "loss_pixel": 0.1639, + "loss_text": 1.2299, + "ppl": 4.0301, + "step": 9740 + }, + { + "epoch": 0.05, + "global_step": 9741, + "learning_rate": 0.00046017946577629385, + "loss": 1.4143, + "loss_base2": 2.0404, + "loss_pixel": 0.1621, + "loss_text": 1.2522, + "ppl": 4.1136, + "step": 9741 + }, + { + "epoch": 0.05, + "global_step": 9742, + "learning_rate": 0.00046017529215358936, + "loss": 1.397, + "loss_base2": 2.0154, + "loss_pixel": 0.1632, + "loss_text": 1.2338, + "ppl": 4.0431, + "step": 9742 + }, + { + "epoch": 0.05, + "global_step": 9743, + "learning_rate": 0.0004601711185308848, + "loss": 1.4054, + "loss_base2": 2.0276, + "loss_pixel": 0.1618, + "loss_text": 1.2436, + "ppl": 4.0772, + "step": 9743 + }, + { + "epoch": 0.05, + "global_step": 9744, + "learning_rate": 0.00046016694490818026, + "loss": 1.4136, + "loss_base2": 2.0394, + "loss_pixel": 0.1628, + "loss_text": 1.2508, + "ppl": 4.1107, + "step": 9744 + }, + { + "epoch": 0.05, + "global_step": 9745, + "learning_rate": 0.00046016277128547577, + "loss": 1.4164, + "loss_base2": 2.0434, + "loss_pixel": 0.1622, + "loss_text": 1.2543, + "ppl": 4.1223, + "step": 9745 + }, + { + "epoch": 0.05, + "global_step": 9746, + "learning_rate": 0.0004601585976627713, + "loss": 1.4083, + "loss_base2": 2.0317, + "loss_pixel": 0.161, + "loss_text": 1.2473, + "ppl": 4.089, + "step": 9746 + }, + { + "epoch": 0.05, + "global_step": 9747, + "learning_rate": 0.0004601544240400668, + "loss": 1.3886, + "loss_base2": 2.0033, + "loss_pixel": 0.1619, + "loss_text": 1.2267, + "ppl": 4.0092, + "step": 9747 + }, + { + "epoch": 0.05, + "global_step": 9748, + "learning_rate": 0.0004601502504173623, + "loss": 1.4023, + "loss_base2": 2.0231, + "loss_pixel": 0.1625, + "loss_text": 1.2398, + "ppl": 4.0645, + "step": 9748 + }, + { + "epoch": 0.05, + "global_step": 9749, + "learning_rate": 0.00046014607679465775, + "loss": 1.4167, + "loss_base2": 2.0439, + "loss_pixel": 0.1614, + "loss_text": 1.2553, + "ppl": 4.1235, + "step": 9749 + }, + { + "epoch": 0.05, + "global_step": 9750, + "learning_rate": 0.00046014190317195325, + "loss": 1.3857, + "loss_base2": 1.9991, + "loss_pixel": 0.1623, + "loss_text": 1.2233, + "ppl": 3.9976, + "step": 9750 + }, + { + "epoch": 0.05, + "global_step": 9751, + "learning_rate": 0.00046013772954924876, + "loss": 1.4129, + "loss_base2": 2.0384, + "loss_pixel": 0.1619, + "loss_text": 1.251, + "ppl": 4.1079, + "step": 9751 + }, + { + "epoch": 0.05, + "global_step": 9752, + "learning_rate": 0.00046013355592654427, + "loss": 1.4286, + "loss_base2": 2.061, + "loss_pixel": 0.1624, + "loss_text": 1.2662, + "ppl": 4.1729, + "step": 9752 + }, + { + "epoch": 0.05, + "global_step": 9753, + "learning_rate": 0.0004601293823038397, + "loss": 1.411, + "loss_base2": 2.0356, + "loss_pixel": 0.1619, + "loss_text": 1.2491, + "ppl": 4.1001, + "step": 9753 + }, + { + "epoch": 0.05, + "global_step": 9754, + "learning_rate": 0.00046012520868113523, + "loss": 1.3841, + "loss_base2": 1.9968, + "loss_pixel": 0.1612, + "loss_text": 1.2229, + "ppl": 3.9912, + "step": 9754 + }, + { + "epoch": 0.05, + "global_step": 9755, + "learning_rate": 0.00046012103505843074, + "loss": 1.4171, + "loss_base2": 2.0444, + "loss_pixel": 0.1626, + "loss_text": 1.2545, + "ppl": 4.1251, + "step": 9755 + }, + { + "epoch": 0.05, + "global_step": 9756, + "learning_rate": 0.00046011686143572624, + "loss": 1.4082, + "loss_base2": 2.0316, + "loss_pixel": 0.162, + "loss_text": 1.2461, + "ppl": 4.0886, + "step": 9756 + }, + { + "epoch": 0.05, + "global_step": 9757, + "learning_rate": 0.00046011268781302175, + "loss": 1.412, + "loss_base2": 2.0371, + "loss_pixel": 0.1599, + "loss_text": 1.2521, + "ppl": 4.1042, + "step": 9757 + }, + { + "epoch": 0.05, + "global_step": 9758, + "learning_rate": 0.0004601085141903172, + "loss": 1.3814, + "loss_base2": 1.9929, + "loss_pixel": 0.1625, + "loss_text": 1.2188, + "ppl": 3.9805, + "step": 9758 + }, + { + "epoch": 0.05, + "global_step": 9759, + "learning_rate": 0.0004601043405676127, + "loss": 1.4532, + "loss_base2": 2.0965, + "loss_pixel": 0.162, + "loss_text": 1.2912, + "ppl": 4.2768, + "step": 9759 + }, + { + "epoch": 0.05, + "global_step": 9760, + "learning_rate": 0.0004601001669449082, + "loss": 1.6496, + "loss_base2": 2.3799, + "loss_pixel": 0.1605, + "loss_text": 1.4891, + "ppl": 5.2049, + "step": 9760 + }, + { + "epoch": 0.05, + "global_step": 9761, + "learning_rate": 0.0004600959933222037, + "loss": 1.6509, + "loss_base2": 2.3817, + "loss_pixel": 0.1612, + "loss_text": 1.4896, + "ppl": 5.2117, + "step": 9761 + }, + { + "epoch": 0.05, + "global_step": 9762, + "learning_rate": 0.0004600918196994991, + "loss": 1.649, + "loss_base2": 2.379, + "loss_pixel": 0.162, + "loss_text": 1.4869, + "ppl": 5.2018, + "step": 9762 + }, + { + "epoch": 0.05, + "global_step": 9763, + "learning_rate": 0.00046008764607679463, + "loss": 1.6316, + "loss_base2": 2.3539, + "loss_pixel": 0.1617, + "loss_text": 1.4698, + "ppl": 5.112, + "step": 9763 + }, + { + "epoch": 0.05, + "global_step": 9764, + "learning_rate": 0.00046008347245409014, + "loss": 1.6309, + "loss_base2": 2.3529, + "loss_pixel": 0.1622, + "loss_text": 1.4687, + "ppl": 5.1085, + "step": 9764 + }, + { + "epoch": 0.05, + "global_step": 9765, + "learning_rate": 0.00046007929883138565, + "loss": 1.6359, + "loss_base2": 2.3601, + "loss_pixel": 0.1622, + "loss_text": 1.4737, + "ppl": 5.1341, + "step": 9765 + }, + { + "epoch": 0.05, + "global_step": 9766, + "learning_rate": 0.00046007512520868115, + "loss": 1.6324, + "loss_base2": 2.3551, + "loss_pixel": 0.1625, + "loss_text": 1.47, + "ppl": 5.1161, + "step": 9766 + }, + { + "epoch": 0.05, + "global_step": 9767, + "learning_rate": 0.0004600709515859766, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.1612, + "loss_text": 1.4568, + "ppl": 5.043, + "step": 9767 + }, + { + "epoch": 0.05, + "global_step": 9768, + "learning_rate": 0.0004600667779632721, + "loss": 1.6365, + "loss_base2": 2.361, + "loss_pixel": 0.1616, + "loss_text": 1.475, + "ppl": 5.1372, + "step": 9768 + }, + { + "epoch": 0.05, + "global_step": 9769, + "learning_rate": 0.0004600626043405676, + "loss": 1.6303, + "loss_base2": 2.352, + "loss_pixel": 0.1625, + "loss_text": 1.4678, + "ppl": 5.1054, + "step": 9769 + }, + { + "epoch": 0.05, + "global_step": 9770, + "learning_rate": 0.00046005843071786313, + "loss": 1.6316, + "loss_base2": 2.3539, + "loss_pixel": 0.1612, + "loss_text": 1.4704, + "ppl": 5.112, + "step": 9770 + }, + { + "epoch": 0.05, + "global_step": 9771, + "learning_rate": 0.00046005425709515864, + "loss": 1.6061, + "loss_base2": 2.3171, + "loss_pixel": 0.1628, + "loss_text": 1.4433, + "ppl": 4.9833, + "step": 9771 + }, + { + "epoch": 0.05, + "global_step": 9772, + "learning_rate": 0.0004600500834724541, + "loss": 1.6407, + "loss_base2": 2.367, + "loss_pixel": 0.1619, + "loss_text": 1.4788, + "ppl": 5.1588, + "step": 9772 + }, + { + "epoch": 0.05, + "global_step": 9773, + "learning_rate": 0.0004600459098497496, + "loss": 1.6249, + "loss_base2": 2.3442, + "loss_pixel": 0.1614, + "loss_text": 1.4635, + "ppl": 5.0779, + "step": 9773 + }, + { + "epoch": 0.05, + "global_step": 9774, + "learning_rate": 0.0004600417362270451, + "loss": 1.633, + "loss_base2": 2.3559, + "loss_pixel": 0.1621, + "loss_text": 1.4709, + "ppl": 5.1192, + "step": 9774 + }, + { + "epoch": 0.05, + "global_step": 9775, + "learning_rate": 0.0004600375626043406, + "loss": 1.6458, + "loss_base2": 2.3744, + "loss_pixel": 0.1633, + "loss_text": 1.4825, + "ppl": 5.1852, + "step": 9775 + }, + { + "epoch": 0.05, + "global_step": 9776, + "learning_rate": 0.00046003338898163606, + "loss": 1.6344, + "loss_base2": 2.3579, + "loss_pixel": 0.1624, + "loss_text": 1.4721, + "ppl": 5.1264, + "step": 9776 + }, + { + "epoch": 0.05, + "global_step": 9777, + "learning_rate": 0.00046002921535893157, + "loss": 1.6087, + "loss_base2": 2.3209, + "loss_pixel": 0.1615, + "loss_text": 1.4471, + "ppl": 4.9963, + "step": 9777 + }, + { + "epoch": 0.05, + "global_step": 9778, + "learning_rate": 0.0004600250417362271, + "loss": 1.6183, + "loss_base2": 2.3347, + "loss_pixel": 0.1622, + "loss_text": 1.4562, + "ppl": 5.0445, + "step": 9778 + }, + { + "epoch": 0.05, + "global_step": 9779, + "learning_rate": 0.0004600208681135226, + "loss": 1.6126, + "loss_base2": 2.3265, + "loss_pixel": 0.1608, + "loss_text": 1.4518, + "ppl": 5.0158, + "step": 9779 + }, + { + "epoch": 0.05, + "global_step": 9780, + "learning_rate": 0.0004600166944908181, + "loss": 1.6312, + "loss_base2": 2.3533, + "loss_pixel": 0.1616, + "loss_text": 1.4696, + "ppl": 5.11, + "step": 9780 + }, + { + "epoch": 0.05, + "global_step": 9781, + "learning_rate": 0.0004600125208681135, + "loss": 1.6322, + "loss_base2": 2.3548, + "loss_pixel": 0.1614, + "loss_text": 1.4708, + "ppl": 5.1151, + "step": 9781 + }, + { + "epoch": 0.05, + "global_step": 9782, + "learning_rate": 0.000460008347245409, + "loss": 1.6407, + "loss_base2": 2.367, + "loss_pixel": 0.1626, + "loss_text": 1.478, + "ppl": 5.1588, + "step": 9782 + }, + { + "epoch": 0.05, + "global_step": 9783, + "learning_rate": 0.0004600041736227045, + "loss": 1.6119, + "loss_base2": 2.3255, + "loss_pixel": 0.1612, + "loss_text": 1.4507, + "ppl": 5.0123, + "step": 9783 + }, + { + "epoch": 0.05, + "global_step": 9784, + "learning_rate": 0.00046, + "loss": 1.6217, + "loss_base2": 2.3396, + "loss_pixel": 0.1579, + "loss_text": 1.4638, + "ppl": 5.0617, + "step": 9784 + }, + { + "epoch": 0.05, + "global_step": 9785, + "learning_rate": 0.00045999582637729547, + "loss": 1.627, + "loss_base2": 2.3473, + "loss_pixel": 0.1532, + "loss_text": 1.4739, + "ppl": 5.0886, + "step": 9785 + }, + { + "epoch": 0.05, + "global_step": 9786, + "learning_rate": 0.000459991652754591, + "loss": 1.6124, + "loss_base2": 2.3262, + "loss_pixel": 0.1519, + "loss_text": 1.4604, + "ppl": 5.0148, + "step": 9786 + }, + { + "epoch": 0.05, + "global_step": 9787, + "learning_rate": 0.0004599874791318865, + "loss": 1.6104, + "loss_base2": 2.3233, + "loss_pixel": 0.1527, + "loss_text": 1.4577, + "ppl": 5.0048, + "step": 9787 + }, + { + "epoch": 0.05, + "global_step": 9788, + "learning_rate": 0.000459983305509182, + "loss": 1.6241, + "loss_base2": 2.3431, + "loss_pixel": 0.153, + "loss_text": 1.4712, + "ppl": 5.0739, + "step": 9788 + }, + { + "epoch": 0.05, + "global_step": 9789, + "learning_rate": 0.0004599791318864775, + "loss": 1.6232, + "loss_base2": 2.3418, + "loss_pixel": 0.15, + "loss_text": 1.4732, + "ppl": 5.0693, + "step": 9789 + }, + { + "epoch": 0.05, + "global_step": 9790, + "learning_rate": 0.00045997495826377295, + "loss": 1.6131, + "loss_base2": 2.3272, + "loss_pixel": 0.1506, + "loss_text": 1.4625, + "ppl": 5.0183, + "step": 9790 + }, + { + "epoch": 0.05, + "global_step": 9791, + "learning_rate": 0.00045997078464106846, + "loss": 1.6203, + "loss_base2": 2.3376, + "loss_pixel": 0.1508, + "loss_text": 1.4695, + "ppl": 5.0546, + "step": 9791 + }, + { + "epoch": 0.05, + "global_step": 9792, + "learning_rate": 0.00045996661101836396, + "loss": 1.6126, + "loss_base2": 2.3265, + "loss_pixel": 0.1502, + "loss_text": 1.4624, + "ppl": 5.0158, + "step": 9792 + }, + { + "epoch": 0.05, + "global_step": 9793, + "learning_rate": 0.00045996243739565947, + "loss": 1.6077, + "loss_base2": 2.3194, + "loss_pixel": 0.1519, + "loss_text": 1.4558, + "ppl": 4.9913, + "step": 9793 + }, + { + "epoch": 0.05, + "global_step": 9794, + "learning_rate": 0.0004599582637729549, + "loss": 1.6273, + "loss_base2": 2.3477, + "loss_pixel": 0.1517, + "loss_text": 1.4755, + "ppl": 5.0901, + "step": 9794 + }, + { + "epoch": 0.05, + "global_step": 9795, + "learning_rate": 0.00045995409015025043, + "loss": 1.6166, + "loss_base2": 2.3323, + "loss_pixel": 0.1491, + "loss_text": 1.4675, + "ppl": 5.0359, + "step": 9795 + }, + { + "epoch": 0.05, + "global_step": 9796, + "learning_rate": 0.00045994991652754594, + "loss": 1.6099, + "loss_base2": 2.3226, + "loss_pixel": 0.1503, + "loss_text": 1.4596, + "ppl": 5.0023, + "step": 9796 + }, + { + "epoch": 0.05, + "global_step": 9797, + "learning_rate": 0.00045994574290484145, + "loss": 1.6093, + "loss_base2": 2.3217, + "loss_pixel": 0.15, + "loss_text": 1.4593, + "ppl": 4.9993, + "step": 9797 + }, + { + "epoch": 0.05, + "global_step": 9798, + "learning_rate": 0.00045994156928213695, + "loss": 1.6173, + "loss_base2": 2.3333, + "loss_pixel": 0.1513, + "loss_text": 1.466, + "ppl": 5.0395, + "step": 9798 + }, + { + "epoch": 0.05, + "global_step": 9799, + "learning_rate": 0.00045993739565943235, + "loss": 1.6126, + "loss_base2": 2.3265, + "loss_pixel": 0.1518, + "loss_text": 1.4609, + "ppl": 5.0158, + "step": 9799 + }, + { + "epoch": 0.05, + "global_step": 9800, + "learning_rate": 0.00045993322203672786, + "loss": 1.6139, + "loss_base2": 2.3284, + "loss_pixel": 0.1517, + "loss_text": 1.4622, + "ppl": 5.0224, + "step": 9800 + }, + { + "epoch": 0.05, + "global_step": 9801, + "learning_rate": 0.00045992904841402337, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1527, + "loss_text": 1.4641, + "ppl": 5.0374, + "step": 9801 + }, + { + "epoch": 0.05, + "global_step": 9802, + "learning_rate": 0.0004599248747913189, + "loss": 1.6012, + "loss_base2": 2.31, + "loss_pixel": 0.1492, + "loss_text": 1.452, + "ppl": 4.959, + "step": 9802 + }, + { + "epoch": 0.05, + "global_step": 9803, + "learning_rate": 0.00045992070116861433, + "loss": 1.6123, + "loss_base2": 2.3261, + "loss_pixel": 0.1516, + "loss_text": 1.4607, + "ppl": 5.0143, + "step": 9803 + }, + { + "epoch": 0.05, + "global_step": 9804, + "learning_rate": 0.00045991652754590984, + "loss": 1.6181, + "loss_base2": 2.3344, + "loss_pixel": 0.1527, + "loss_text": 1.4654, + "ppl": 5.0435, + "step": 9804 + }, + { + "epoch": 0.05, + "global_step": 9805, + "learning_rate": 0.00045991235392320534, + "loss": 1.6105, + "loss_base2": 2.3235, + "loss_pixel": 0.1501, + "loss_text": 1.4604, + "ppl": 5.0053, + "step": 9805 + }, + { + "epoch": 0.05, + "global_step": 9806, + "learning_rate": 0.00045990818030050085, + "loss": 1.6133, + "loss_base2": 2.3275, + "loss_pixel": 0.1501, + "loss_text": 1.4632, + "ppl": 5.0193, + "step": 9806 + }, + { + "epoch": 0.05, + "global_step": 9807, + "learning_rate": 0.00045990400667779636, + "loss": 1.6027, + "loss_base2": 2.3122, + "loss_pixel": 0.1495, + "loss_text": 1.4532, + "ppl": 4.9664, + "step": 9807 + }, + { + "epoch": 0.05, + "global_step": 9808, + "learning_rate": 0.0004598998330550918, + "loss": 1.6419, + "loss_base2": 2.3688, + "loss_pixel": 0.1514, + "loss_text": 1.4905, + "ppl": 5.165, + "step": 9808 + }, + { + "epoch": 0.05, + "global_step": 9809, + "learning_rate": 0.0004598956594323873, + "loss": 1.615, + "loss_base2": 2.33, + "loss_pixel": 0.149, + "loss_text": 1.466, + "ppl": 5.0279, + "step": 9809 + }, + { + "epoch": 0.05, + "global_step": 9810, + "learning_rate": 0.0004598914858096828, + "loss": 1.6048, + "loss_base2": 2.3152, + "loss_pixel": 0.1504, + "loss_text": 1.4544, + "ppl": 4.9769, + "step": 9810 + }, + { + "epoch": 0.05, + "global_step": 9811, + "learning_rate": 0.00045988731218697833, + "loss": 1.6015, + "loss_base2": 2.3105, + "loss_pixel": 0.1499, + "loss_text": 1.4516, + "ppl": 4.9605, + "step": 9811 + }, + { + "epoch": 0.05, + "global_step": 9812, + "learning_rate": 0.0004598831385642738, + "loss": 1.6094, + "loss_base2": 2.3219, + "loss_pixel": 0.1501, + "loss_text": 1.4592, + "ppl": 4.9998, + "step": 9812 + }, + { + "epoch": 0.05, + "global_step": 9813, + "learning_rate": 0.0004598789649415693, + "loss": 1.5829, + "loss_base2": 2.2836, + "loss_pixel": 0.1501, + "loss_text": 1.4328, + "ppl": 4.8691, + "step": 9813 + }, + { + "epoch": 0.05, + "global_step": 9814, + "learning_rate": 0.0004598747913188648, + "loss": 1.5988, + "loss_base2": 2.3066, + "loss_pixel": 0.1513, + "loss_text": 1.4475, + "ppl": 4.9471, + "step": 9814 + }, + { + "epoch": 0.05, + "global_step": 9815, + "learning_rate": 0.0004598706176961603, + "loss": 1.6223, + "loss_base2": 2.3405, + "loss_pixel": 0.1497, + "loss_text": 1.4726, + "ppl": 5.0647, + "step": 9815 + }, + { + "epoch": 0.05, + "global_step": 9816, + "learning_rate": 0.0004598664440734558, + "loss": 1.6012, + "loss_base2": 2.31, + "loss_pixel": 0.1461, + "loss_text": 1.4551, + "ppl": 4.959, + "step": 9816 + }, + { + "epoch": 0.05, + "global_step": 9817, + "learning_rate": 0.00045986227045075127, + "loss": 1.6223, + "loss_base2": 2.3405, + "loss_pixel": 0.1475, + "loss_text": 1.4748, + "ppl": 5.0647, + "step": 9817 + }, + { + "epoch": 0.05, + "global_step": 9818, + "learning_rate": 0.0004598580968280467, + "loss": 1.624, + "loss_base2": 2.3429, + "loss_pixel": 0.1501, + "loss_text": 1.4739, + "ppl": 5.0733, + "step": 9818 + }, + { + "epoch": 0.05, + "global_step": 9819, + "learning_rate": 0.00045985392320534223, + "loss": 1.6263, + "loss_base2": 2.3463, + "loss_pixel": 0.1488, + "loss_text": 1.4776, + "ppl": 5.085, + "step": 9819 + }, + { + "epoch": 0.05, + "global_step": 9820, + "learning_rate": 0.00045984974958263774, + "loss": 1.6161, + "loss_base2": 2.3315, + "loss_pixel": 0.161, + "loss_text": 1.4551, + "ppl": 5.0334, + "step": 9820 + }, + { + "epoch": 0.05, + "global_step": 9821, + "learning_rate": 0.0004598455759599332, + "loss": 1.6272, + "loss_base2": 2.3476, + "loss_pixel": 0.1629, + "loss_text": 1.4643, + "ppl": 5.0896, + "step": 9821 + }, + { + "epoch": 0.05, + "global_step": 9822, + "learning_rate": 0.0004598414023372287, + "loss": 1.601, + "loss_base2": 2.3098, + "loss_pixel": 0.1631, + "loss_text": 1.4379, + "ppl": 4.958, + "step": 9822 + }, + { + "epoch": 0.05, + "global_step": 9823, + "learning_rate": 0.0004598372287145242, + "loss": 1.6207, + "loss_base2": 2.3382, + "loss_pixel": 0.1623, + "loss_text": 1.4584, + "ppl": 5.0566, + "step": 9823 + }, + { + "epoch": 0.05, + "global_step": 9824, + "learning_rate": 0.0004598330550918197, + "loss": 1.6321, + "loss_base2": 2.3546, + "loss_pixel": 0.1615, + "loss_text": 1.4706, + "ppl": 5.1146, + "step": 9824 + }, + { + "epoch": 0.05, + "global_step": 9825, + "learning_rate": 0.0004598288814691152, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.1624, + "loss_text": 1.4435, + "ppl": 4.9823, + "step": 9825 + }, + { + "epoch": 0.05, + "global_step": 9826, + "learning_rate": 0.00045982470784641067, + "loss": 1.6305, + "loss_base2": 2.3523, + "loss_pixel": 0.1632, + "loss_text": 1.4673, + "ppl": 5.1064, + "step": 9826 + }, + { + "epoch": 0.05, + "global_step": 9827, + "learning_rate": 0.0004598205342237062, + "loss": 1.602, + "loss_base2": 2.3112, + "loss_pixel": 0.1633, + "loss_text": 1.4387, + "ppl": 4.9629, + "step": 9827 + }, + { + "epoch": 0.05, + "global_step": 9828, + "learning_rate": 0.0004598163606010017, + "loss": 1.6177, + "loss_base2": 2.3338, + "loss_pixel": 0.1629, + "loss_text": 1.4548, + "ppl": 5.0415, + "step": 9828 + }, + { + "epoch": 0.05, + "global_step": 9829, + "learning_rate": 0.0004598121869782972, + "loss": 1.6133, + "loss_base2": 2.3275, + "loss_pixel": 0.162, + "loss_text": 1.4513, + "ppl": 5.0193, + "step": 9829 + }, + { + "epoch": 0.05, + "global_step": 9830, + "learning_rate": 0.0004598080133555927, + "loss": 1.632, + "loss_base2": 2.3545, + "loss_pixel": 0.1615, + "loss_text": 1.4706, + "ppl": 5.1141, + "step": 9830 + }, + { + "epoch": 0.05, + "global_step": 9831, + "learning_rate": 0.00045980383973288815, + "loss": 1.6211, + "loss_base2": 2.3388, + "loss_pixel": 0.1612, + "loss_text": 1.4599, + "ppl": 5.0587, + "step": 9831 + }, + { + "epoch": 0.05, + "global_step": 9832, + "learning_rate": 0.00045979966611018366, + "loss": 1.6134, + "loss_base2": 2.3276, + "loss_pixel": 0.1608, + "loss_text": 1.4526, + "ppl": 5.0198, + "step": 9832 + }, + { + "epoch": 0.05, + "global_step": 9833, + "learning_rate": 0.00045979549248747917, + "loss": 1.4386, + "loss_base2": 2.0755, + "loss_pixel": 0.1631, + "loss_text": 1.2755, + "ppl": 4.2148, + "step": 9833 + }, + { + "epoch": 0.05, + "global_step": 9834, + "learning_rate": 0.0004597913188647747, + "loss": 1.4165, + "loss_base2": 2.0436, + "loss_pixel": 0.1632, + "loss_text": 1.2533, + "ppl": 4.1227, + "step": 9834 + }, + { + "epoch": 0.05, + "global_step": 9835, + "learning_rate": 0.00045978714524207013, + "loss": 1.4007, + "loss_base2": 2.0208, + "loss_pixel": 0.1635, + "loss_text": 1.2372, + "ppl": 4.058, + "step": 9835 + }, + { + "epoch": 0.05, + "global_step": 9836, + "learning_rate": 0.00045978297161936564, + "loss": 1.3926, + "loss_base2": 2.0091, + "loss_pixel": 0.1632, + "loss_text": 1.2293, + "ppl": 4.0253, + "step": 9836 + }, + { + "epoch": 0.05, + "global_step": 9837, + "learning_rate": 0.0004597787979966611, + "loss": 1.402, + "loss_base2": 2.0227, + "loss_pixel": 0.1628, + "loss_text": 1.2392, + "ppl": 4.0633, + "step": 9837 + }, + { + "epoch": 0.05, + "global_step": 9838, + "learning_rate": 0.0004597746243739566, + "loss": 1.4101, + "loss_base2": 2.0343, + "loss_pixel": 0.1623, + "loss_text": 1.2478, + "ppl": 4.0964, + "step": 9838 + }, + { + "epoch": 0.05, + "global_step": 9839, + "learning_rate": 0.0004597704507512521, + "loss": 1.3953, + "loss_base2": 2.013, + "loss_pixel": 0.1623, + "loss_text": 1.233, + "ppl": 4.0362, + "step": 9839 + }, + { + "epoch": 0.05, + "global_step": 9840, + "learning_rate": 0.00045976627712854756, + "loss": 1.451, + "loss_base2": 2.0934, + "loss_pixel": 0.1631, + "loss_text": 1.2879, + "ppl": 4.2674, + "step": 9840 + }, + { + "epoch": 0.05, + "global_step": 9841, + "learning_rate": 0.00045976210350584306, + "loss": 1.5612, + "loss_base2": 2.2523, + "loss_pixel": 0.1625, + "loss_text": 1.3987, + "ppl": 4.7645, + "step": 9841 + }, + { + "epoch": 0.05, + "global_step": 9842, + "learning_rate": 0.00045975792988313857, + "loss": 1.5089, + "loss_base2": 2.1769, + "loss_pixel": 0.1626, + "loss_text": 1.3464, + "ppl": 4.5218, + "step": 9842 + }, + { + "epoch": 0.05, + "global_step": 9843, + "learning_rate": 0.0004597537562604341, + "loss": 1.4029, + "loss_base2": 2.024, + "loss_pixel": 0.1627, + "loss_text": 1.2402, + "ppl": 4.067, + "step": 9843 + }, + { + "epoch": 0.05, + "global_step": 9844, + "learning_rate": 0.00045974958263772953, + "loss": 1.4005, + "loss_base2": 2.0205, + "loss_pixel": 0.1611, + "loss_text": 1.2394, + "ppl": 4.0572, + "step": 9844 + }, + { + "epoch": 0.05, + "global_step": 9845, + "learning_rate": 0.00045974540901502504, + "loss": 1.4277, + "loss_base2": 2.0597, + "loss_pixel": 0.163, + "loss_text": 1.2647, + "ppl": 4.1691, + "step": 9845 + }, + { + "epoch": 0.05, + "global_step": 9846, + "learning_rate": 0.00045974123539232055, + "loss": 1.4091, + "loss_base2": 2.0329, + "loss_pixel": 0.1612, + "loss_text": 1.2479, + "ppl": 4.0923, + "step": 9846 + }, + { + "epoch": 0.05, + "global_step": 9847, + "learning_rate": 0.00045973706176961605, + "loss": 1.3857, + "loss_base2": 1.9991, + "loss_pixel": 0.1639, + "loss_text": 1.2218, + "ppl": 3.9976, + "step": 9847 + }, + { + "epoch": 0.05, + "global_step": 9848, + "learning_rate": 0.00045973288814691156, + "loss": 1.4031, + "loss_base2": 2.0242, + "loss_pixel": 0.1615, + "loss_text": 1.2416, + "ppl": 4.0678, + "step": 9848 + }, + { + "epoch": 0.05, + "global_step": 9849, + "learning_rate": 0.000459728714524207, + "loss": 1.3927, + "loss_base2": 2.0092, + "loss_pixel": 0.1605, + "loss_text": 1.2322, + "ppl": 4.0257, + "step": 9849 + }, + { + "epoch": 0.05, + "global_step": 9850, + "learning_rate": 0.0004597245409015025, + "loss": 1.3896, + "loss_base2": 2.0048, + "loss_pixel": 0.1625, + "loss_text": 1.2271, + "ppl": 4.0132, + "step": 9850 + }, + { + "epoch": 0.05, + "global_step": 9851, + "learning_rate": 0.00045972036727879803, + "loss": 1.5498, + "loss_base2": 2.2359, + "loss_pixel": 0.1622, + "loss_text": 1.3876, + "ppl": 4.7105, + "step": 9851 + }, + { + "epoch": 0.05, + "global_step": 9852, + "learning_rate": 0.00045971619365609354, + "loss": 1.6537, + "loss_base2": 2.3858, + "loss_pixel": 0.1625, + "loss_text": 1.4912, + "ppl": 5.2263, + "step": 9852 + }, + { + "epoch": 0.05, + "global_step": 9853, + "learning_rate": 0.000459712020033389, + "loss": 1.6583, + "loss_base2": 2.3924, + "loss_pixel": 0.1615, + "loss_text": 1.4968, + "ppl": 5.2504, + "step": 9853 + }, + { + "epoch": 0.05, + "global_step": 9854, + "learning_rate": 0.0004597078464106845, + "loss": 1.6318, + "loss_base2": 2.3542, + "loss_pixel": 0.1619, + "loss_text": 1.4699, + "ppl": 5.1131, + "step": 9854 + }, + { + "epoch": 0.05, + "global_step": 9855, + "learning_rate": 0.00045970367278797995, + "loss": 1.6342, + "loss_base2": 2.3577, + "loss_pixel": 0.1614, + "loss_text": 1.4728, + "ppl": 5.1254, + "step": 9855 + }, + { + "epoch": 0.05, + "global_step": 9856, + "learning_rate": 0.00045969949916527546, + "loss": 1.6122, + "loss_base2": 2.3259, + "loss_pixel": 0.1614, + "loss_text": 1.4508, + "ppl": 5.0138, + "step": 9856 + }, + { + "epoch": 0.05, + "global_step": 9857, + "learning_rate": 0.00045969532554257096, + "loss": 1.6455, + "loss_base2": 2.374, + "loss_pixel": 0.1627, + "loss_text": 1.4828, + "ppl": 5.1836, + "step": 9857 + }, + { + "epoch": 0.05, + "global_step": 9858, + "learning_rate": 0.0004596911519198664, + "loss": 1.6241, + "loss_base2": 2.3431, + "loss_pixel": 0.1615, + "loss_text": 1.4626, + "ppl": 5.0739, + "step": 9858 + }, + { + "epoch": 0.05, + "global_step": 9859, + "learning_rate": 0.0004596869782971619, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.1608, + "loss_text": 1.4572, + "ppl": 5.043, + "step": 9859 + }, + { + "epoch": 0.05, + "global_step": 9860, + "learning_rate": 0.00045968280467445743, + "loss": 1.6504, + "loss_base2": 2.381, + "loss_pixel": 0.1608, + "loss_text": 1.4896, + "ppl": 5.2091, + "step": 9860 + }, + { + "epoch": 0.05, + "global_step": 9861, + "learning_rate": 0.00045967863105175294, + "loss": 1.6261, + "loss_base2": 2.346, + "loss_pixel": 0.1611, + "loss_text": 1.465, + "ppl": 5.084, + "step": 9861 + }, + { + "epoch": 0.05, + "global_step": 9862, + "learning_rate": 0.0004596744574290484, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1609, + "loss_text": 1.4628, + "ppl": 5.0718, + "step": 9862 + }, + { + "epoch": 0.05, + "global_step": 9863, + "learning_rate": 0.0004596702838063439, + "loss": 1.6246, + "loss_base2": 2.3438, + "loss_pixel": 0.1606, + "loss_text": 1.464, + "ppl": 5.0764, + "step": 9863 + }, + { + "epoch": 0.05, + "global_step": 9864, + "learning_rate": 0.0004596661101836394, + "loss": 1.6243, + "loss_base2": 2.3434, + "loss_pixel": 0.1617, + "loss_text": 1.4626, + "ppl": 5.0749, + "step": 9864 + }, + { + "epoch": 0.05, + "global_step": 9865, + "learning_rate": 0.0004596619365609349, + "loss": 1.6131, + "loss_base2": 2.3272, + "loss_pixel": 0.161, + "loss_text": 1.4521, + "ppl": 5.0183, + "step": 9865 + }, + { + "epoch": 0.05, + "global_step": 9866, + "learning_rate": 0.0004596577629382304, + "loss": 1.6285, + "loss_base2": 2.3494, + "loss_pixel": 0.1619, + "loss_text": 1.4666, + "ppl": 5.0962, + "step": 9866 + }, + { + "epoch": 0.05, + "global_step": 9867, + "learning_rate": 0.0004596535893155259, + "loss": 1.6147, + "loss_base2": 2.3295, + "loss_pixel": 0.1616, + "loss_text": 1.4531, + "ppl": 5.0264, + "step": 9867 + }, + { + "epoch": 0.05, + "global_step": 9868, + "learning_rate": 0.0004596494156928214, + "loss": 1.622, + "loss_base2": 2.3401, + "loss_pixel": 0.1621, + "loss_text": 1.4599, + "ppl": 5.0632, + "step": 9868 + }, + { + "epoch": 0.05, + "global_step": 9869, + "learning_rate": 0.0004596452420701169, + "loss": 1.6356, + "loss_base2": 2.3597, + "loss_pixel": 0.16, + "loss_text": 1.4756, + "ppl": 5.1325, + "step": 9869 + }, + { + "epoch": 0.05, + "global_step": 9870, + "learning_rate": 0.0004596410684474124, + "loss": 1.5946, + "loss_base2": 2.3005, + "loss_pixel": 0.1615, + "loss_text": 1.4331, + "ppl": 4.9264, + "step": 9870 + }, + { + "epoch": 0.05, + "global_step": 9871, + "learning_rate": 0.00045963689482470785, + "loss": 1.6419, + "loss_base2": 2.3688, + "loss_pixel": 0.1604, + "loss_text": 1.4816, + "ppl": 5.165, + "step": 9871 + }, + { + "epoch": 0.05, + "global_step": 9872, + "learning_rate": 0.00045963272120200336, + "loss": 1.6342, + "loss_base2": 2.3577, + "loss_pixel": 0.1612, + "loss_text": 1.473, + "ppl": 5.1254, + "step": 9872 + }, + { + "epoch": 0.05, + "global_step": 9873, + "learning_rate": 0.00045962854757929886, + "loss": 1.6177, + "loss_base2": 2.3338, + "loss_pixel": 0.1612, + "loss_text": 1.4564, + "ppl": 5.0415, + "step": 9873 + }, + { + "epoch": 0.05, + "global_step": 9874, + "learning_rate": 0.0004596243739565943, + "loss": 1.6175, + "loss_base2": 2.3336, + "loss_pixel": 0.1613, + "loss_text": 1.4562, + "ppl": 5.0405, + "step": 9874 + }, + { + "epoch": 0.05, + "global_step": 9875, + "learning_rate": 0.0004596202003338898, + "loss": 1.61, + "loss_base2": 2.3227, + "loss_pixel": 0.1611, + "loss_text": 1.4489, + "ppl": 5.0028, + "step": 9875 + }, + { + "epoch": 0.05, + "global_step": 9876, + "learning_rate": 0.0004596160267111853, + "loss": 1.6265, + "loss_base2": 2.3465, + "loss_pixel": 0.1615, + "loss_text": 1.465, + "ppl": 5.086, + "step": 9876 + }, + { + "epoch": 0.05, + "global_step": 9877, + "learning_rate": 0.0004596118530884808, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1613, + "loss_text": 1.4411, + "ppl": 4.9649, + "step": 9877 + }, + { + "epoch": 0.05, + "global_step": 9878, + "learning_rate": 0.0004596076794657763, + "loss": 1.6154, + "loss_base2": 2.3305, + "loss_pixel": 0.1613, + "loss_text": 1.4541, + "ppl": 5.0299, + "step": 9878 + }, + { + "epoch": 0.05, + "global_step": 9879, + "learning_rate": 0.0004596035058430718, + "loss": 1.6333, + "loss_base2": 2.3564, + "loss_pixel": 0.1607, + "loss_text": 1.4727, + "ppl": 5.1207, + "step": 9879 + }, + { + "epoch": 0.05, + "global_step": 9880, + "learning_rate": 0.00045959933222036725, + "loss": 1.6354, + "loss_base2": 2.3594, + "loss_pixel": 0.1605, + "loss_text": 1.4749, + "ppl": 5.1315, + "step": 9880 + }, + { + "epoch": 0.05, + "global_step": 9881, + "learning_rate": 0.00045959515859766276, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.161, + "loss_text": 1.4673, + "ppl": 5.0952, + "step": 9881 + }, + { + "epoch": 0.05, + "global_step": 9882, + "learning_rate": 0.00045959098497495827, + "loss": 1.6398, + "loss_base2": 2.3657, + "loss_pixel": 0.16, + "loss_text": 1.4798, + "ppl": 5.1541, + "step": 9882 + }, + { + "epoch": 0.05, + "global_step": 9883, + "learning_rate": 0.0004595868113522538, + "loss": 1.6286, + "loss_base2": 2.3496, + "loss_pixel": 0.161, + "loss_text": 1.4676, + "ppl": 5.0967, + "step": 9883 + }, + { + "epoch": 0.05, + "global_step": 9884, + "learning_rate": 0.0004595826377295493, + "loss": 1.6077, + "loss_base2": 2.3194, + "loss_pixel": 0.1616, + "loss_text": 1.4462, + "ppl": 4.9913, + "step": 9884 + }, + { + "epoch": 0.05, + "global_step": 9885, + "learning_rate": 0.00045957846410684474, + "loss": 1.6277, + "loss_base2": 2.3483, + "loss_pixel": 0.1609, + "loss_text": 1.4668, + "ppl": 5.0921, + "step": 9885 + }, + { + "epoch": 0.05, + "global_step": 9886, + "learning_rate": 0.00045957429048414024, + "loss": 1.6227, + "loss_base2": 2.3411, + "loss_pixel": 0.1631, + "loss_text": 1.4597, + "ppl": 5.0668, + "step": 9886 + }, + { + "epoch": 0.05, + "global_step": 9887, + "learning_rate": 0.00045957011686143575, + "loss": 1.6291, + "loss_base2": 2.3503, + "loss_pixel": 0.1603, + "loss_text": 1.4689, + "ppl": 5.0993, + "step": 9887 + }, + { + "epoch": 0.05, + "global_step": 9888, + "learning_rate": 0.00045956594323873126, + "loss": 1.6121, + "loss_base2": 2.3258, + "loss_pixel": 0.161, + "loss_text": 1.4511, + "ppl": 5.0133, + "step": 9888 + }, + { + "epoch": 0.05, + "global_step": 9889, + "learning_rate": 0.00045956176961602676, + "loss": 1.6259, + "loss_base2": 2.3457, + "loss_pixel": 0.1626, + "loss_text": 1.4633, + "ppl": 5.083, + "step": 9889 + }, + { + "epoch": 0.05, + "global_step": 9890, + "learning_rate": 0.0004595575959933222, + "loss": 1.6175, + "loss_base2": 2.3336, + "loss_pixel": 0.1617, + "loss_text": 1.4558, + "ppl": 5.0405, + "step": 9890 + }, + { + "epoch": 0.05, + "global_step": 9891, + "learning_rate": 0.0004595534223706177, + "loss": 1.6003, + "loss_base2": 2.3087, + "loss_pixel": 0.1612, + "loss_text": 1.439, + "ppl": 4.9545, + "step": 9891 + }, + { + "epoch": 0.05, + "global_step": 9892, + "learning_rate": 0.00045954924874791323, + "loss": 1.6333, + "loss_base2": 2.3564, + "loss_pixel": 0.1603, + "loss_text": 1.473, + "ppl": 5.1207, + "step": 9892 + }, + { + "epoch": 0.05, + "global_step": 9893, + "learning_rate": 0.0004595450751252087, + "loss": 1.6249, + "loss_base2": 2.3442, + "loss_pixel": 0.1624, + "loss_text": 1.4625, + "ppl": 5.0779, + "step": 9893 + }, + { + "epoch": 0.05, + "global_step": 9894, + "learning_rate": 0.00045954090150250414, + "loss": 1.6067, + "loss_base2": 2.318, + "loss_pixel": 0.1612, + "loss_text": 1.4454, + "ppl": 4.9863, + "step": 9894 + }, + { + "epoch": 0.05, + "global_step": 9895, + "learning_rate": 0.00045953672787979965, + "loss": 1.5534, + "loss_base2": 2.2411, + "loss_pixel": 0.161, + "loss_text": 1.3924, + "ppl": 4.7275, + "step": 9895 + }, + { + "epoch": 0.05, + "global_step": 9896, + "learning_rate": 0.00045953255425709515, + "loss": 1.4318, + "loss_base2": 2.0657, + "loss_pixel": 0.1589, + "loss_text": 1.2729, + "ppl": 4.1862, + "step": 9896 + }, + { + "epoch": 0.05, + "global_step": 9897, + "learning_rate": 0.00045952838063439066, + "loss": 1.4084, + "loss_base2": 2.0319, + "loss_pixel": 0.161, + "loss_text": 1.2474, + "ppl": 4.0894, + "step": 9897 + }, + { + "epoch": 0.05, + "global_step": 9898, + "learning_rate": 0.00045952420701168617, + "loss": 1.4214, + "loss_base2": 2.0506, + "loss_pixel": 0.1606, + "loss_text": 1.2608, + "ppl": 4.1429, + "step": 9898 + }, + { + "epoch": 0.05, + "global_step": 9899, + "learning_rate": 0.0004595200333889816, + "loss": 1.4166, + "loss_base2": 2.0437, + "loss_pixel": 0.1611, + "loss_text": 1.2555, + "ppl": 4.1231, + "step": 9899 + }, + { + "epoch": 0.05, + "global_step": 9900, + "learning_rate": 0.00045951585976627713, + "loss": 1.4163, + "loss_base2": 2.0433, + "loss_pixel": 0.1599, + "loss_text": 1.2564, + "ppl": 4.1218, + "step": 9900 + }, + { + "epoch": 0.05, + "global_step": 9901, + "learning_rate": 0.00045951168614357264, + "loss": 1.3937, + "loss_base2": 2.0107, + "loss_pixel": 0.1603, + "loss_text": 1.2334, + "ppl": 4.0297, + "step": 9901 + }, + { + "epoch": 0.05, + "global_step": 9902, + "learning_rate": 0.00045950751252086814, + "loss": 1.3916, + "loss_base2": 2.0077, + "loss_pixel": 0.1623, + "loss_text": 1.2293, + "ppl": 4.0213, + "step": 9902 + }, + { + "epoch": 0.05, + "global_step": 9903, + "learning_rate": 0.0004595033388981636, + "loss": 1.4118, + "loss_base2": 2.0368, + "loss_pixel": 0.1607, + "loss_text": 1.2511, + "ppl": 4.1033, + "step": 9903 + }, + { + "epoch": 0.05, + "global_step": 9904, + "learning_rate": 0.0004594991652754591, + "loss": 1.6157, + "loss_base2": 2.331, + "loss_pixel": 0.1609, + "loss_text": 1.4548, + "ppl": 5.0314, + "step": 9904 + }, + { + "epoch": 0.05, + "global_step": 9905, + "learning_rate": 0.0004594949916527546, + "loss": 1.6563, + "loss_base2": 2.3895, + "loss_pixel": 0.1619, + "loss_text": 1.4944, + "ppl": 5.2399, + "step": 9905 + }, + { + "epoch": 0.05, + "global_step": 9906, + "learning_rate": 0.0004594908180300501, + "loss": 1.6518, + "loss_base2": 2.383, + "loss_pixel": 0.1619, + "loss_text": 1.4899, + "ppl": 5.2164, + "step": 9906 + }, + { + "epoch": 0.05, + "global_step": 9907, + "learning_rate": 0.0004594866444073456, + "loss": 1.633, + "loss_base2": 2.3559, + "loss_pixel": 0.161, + "loss_text": 1.4719, + "ppl": 5.1192, + "step": 9907 + }, + { + "epoch": 0.05, + "global_step": 9908, + "learning_rate": 0.0004594824707846411, + "loss": 1.6479, + "loss_base2": 2.3774, + "loss_pixel": 0.1609, + "loss_text": 1.487, + "ppl": 5.1961, + "step": 9908 + }, + { + "epoch": 0.05, + "global_step": 9909, + "learning_rate": 0.0004594782971619366, + "loss": 1.6349, + "loss_base2": 2.3587, + "loss_pixel": 0.1602, + "loss_text": 1.4746, + "ppl": 5.1289, + "step": 9909 + }, + { + "epoch": 0.05, + "global_step": 9910, + "learning_rate": 0.0004594741235392321, + "loss": 1.6194, + "loss_base2": 2.3363, + "loss_pixel": 0.1614, + "loss_text": 1.458, + "ppl": 5.0501, + "step": 9910 + }, + { + "epoch": 0.05, + "global_step": 9911, + "learning_rate": 0.0004594699499165276, + "loss": 1.6314, + "loss_base2": 2.3536, + "loss_pixel": 0.1615, + "loss_text": 1.4699, + "ppl": 5.111, + "step": 9911 + }, + { + "epoch": 0.05, + "global_step": 9912, + "learning_rate": 0.000459465776293823, + "loss": 1.631, + "loss_base2": 2.353, + "loss_pixel": 0.1608, + "loss_text": 1.4702, + "ppl": 5.109, + "step": 9912 + }, + { + "epoch": 0.05, + "global_step": 9913, + "learning_rate": 0.0004594616026711185, + "loss": 1.6405, + "loss_base2": 2.3667, + "loss_pixel": 0.1606, + "loss_text": 1.4799, + "ppl": 5.1577, + "step": 9913 + }, + { + "epoch": 0.05, + "global_step": 9914, + "learning_rate": 0.000459457429048414, + "loss": 1.6112, + "loss_base2": 2.3245, + "loss_pixel": 0.1601, + "loss_text": 1.451, + "ppl": 5.0088, + "step": 9914 + }, + { + "epoch": 0.05, + "global_step": 9915, + "learning_rate": 0.0004594532554257095, + "loss": 1.6338, + "loss_base2": 2.3571, + "loss_pixel": 0.1617, + "loss_text": 1.4721, + "ppl": 5.1233, + "step": 9915 + }, + { + "epoch": 0.05, + "global_step": 9916, + "learning_rate": 0.00045944908180300503, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1615, + "loss_text": 1.4554, + "ppl": 5.0374, + "step": 9916 + }, + { + "epoch": 0.05, + "global_step": 9917, + "learning_rate": 0.0004594449081803005, + "loss": 1.6485, + "loss_base2": 2.3783, + "loss_pixel": 0.1623, + "loss_text": 1.4862, + "ppl": 5.1992, + "step": 9917 + }, + { + "epoch": 0.05, + "global_step": 9918, + "learning_rate": 0.000459440734557596, + "loss": 1.6247, + "loss_base2": 2.3439, + "loss_pixel": 0.1615, + "loss_text": 1.4632, + "ppl": 5.0769, + "step": 9918 + }, + { + "epoch": 0.05, + "global_step": 9919, + "learning_rate": 0.0004594365609348915, + "loss": 1.6332, + "loss_base2": 2.3562, + "loss_pixel": 0.1617, + "loss_text": 1.4716, + "ppl": 5.1202, + "step": 9919 + }, + { + "epoch": 0.05, + "global_step": 9920, + "learning_rate": 0.000459432387312187, + "loss": 1.6215, + "loss_base2": 2.3393, + "loss_pixel": 0.1615, + "loss_text": 1.46, + "ppl": 5.0607, + "step": 9920 + }, + { + "epoch": 0.05, + "global_step": 9921, + "learning_rate": 0.00045942821368948246, + "loss": 1.6275, + "loss_base2": 2.348, + "loss_pixel": 0.1609, + "loss_text": 1.4666, + "ppl": 5.0911, + "step": 9921 + }, + { + "epoch": 0.05, + "global_step": 9922, + "learning_rate": 0.00045942404006677796, + "loss": 1.637, + "loss_base2": 2.3617, + "loss_pixel": 0.1606, + "loss_text": 1.4764, + "ppl": 5.1397, + "step": 9922 + }, + { + "epoch": 0.05, + "global_step": 9923, + "learning_rate": 0.00045941986644407347, + "loss": 1.6198, + "loss_base2": 2.3369, + "loss_pixel": 0.1595, + "loss_text": 1.4603, + "ppl": 5.0521, + "step": 9923 + }, + { + "epoch": 0.05, + "global_step": 9924, + "learning_rate": 0.000459415692821369, + "loss": 1.6297, + "loss_base2": 2.3512, + "loss_pixel": 0.1608, + "loss_text": 1.4689, + "ppl": 5.1023, + "step": 9924 + }, + { + "epoch": 0.05, + "global_step": 9925, + "learning_rate": 0.0004594115191986645, + "loss": 1.6427, + "loss_base2": 2.3699, + "loss_pixel": 0.1604, + "loss_text": 1.4822, + "ppl": 5.1691, + "step": 9925 + }, + { + "epoch": 0.05, + "global_step": 9926, + "learning_rate": 0.00045940734557595994, + "loss": 1.6251, + "loss_base2": 2.3445, + "loss_pixel": 0.1599, + "loss_text": 1.4652, + "ppl": 5.0789, + "step": 9926 + }, + { + "epoch": 0.05, + "global_step": 9927, + "learning_rate": 0.00045940317195325545, + "loss": 1.6353, + "loss_base2": 2.3592, + "loss_pixel": 0.1606, + "loss_text": 1.4747, + "ppl": 5.131, + "step": 9927 + }, + { + "epoch": 0.05, + "global_step": 9928, + "learning_rate": 0.00045939899833055095, + "loss": 1.6312, + "loss_base2": 2.3533, + "loss_pixel": 0.16, + "loss_text": 1.4712, + "ppl": 5.11, + "step": 9928 + }, + { + "epoch": 0.05, + "global_step": 9929, + "learning_rate": 0.00045939482470784646, + "loss": 1.6385, + "loss_base2": 2.3639, + "loss_pixel": 0.1592, + "loss_text": 1.4794, + "ppl": 5.1474, + "step": 9929 + }, + { + "epoch": 0.05, + "global_step": 9930, + "learning_rate": 0.00045939065108514186, + "loss": 1.6234, + "loss_base2": 2.3421, + "loss_pixel": 0.1605, + "loss_text": 1.4629, + "ppl": 5.0703, + "step": 9930 + }, + { + "epoch": 0.05, + "global_step": 9931, + "learning_rate": 0.00045938647746243737, + "loss": 1.6164, + "loss_base2": 2.332, + "loss_pixel": 0.1611, + "loss_text": 1.4553, + "ppl": 5.0349, + "step": 9931 + }, + { + "epoch": 0.05, + "global_step": 9932, + "learning_rate": 0.0004593823038397329, + "loss": 1.636, + "loss_base2": 2.3602, + "loss_pixel": 0.1599, + "loss_text": 1.476, + "ppl": 5.1346, + "step": 9932 + }, + { + "epoch": 0.05, + "global_step": 9933, + "learning_rate": 0.0004593781302170284, + "loss": 1.5956, + "loss_base2": 2.302, + "loss_pixel": 0.1609, + "loss_text": 1.4348, + "ppl": 4.9313, + "step": 9933 + }, + { + "epoch": 0.05, + "global_step": 9934, + "learning_rate": 0.0004593739565943239, + "loss": 1.6207, + "loss_base2": 2.3382, + "loss_pixel": 0.1624, + "loss_text": 1.4583, + "ppl": 5.0566, + "step": 9934 + }, + { + "epoch": 0.05, + "global_step": 9935, + "learning_rate": 0.00045936978297161934, + "loss": 1.6233, + "loss_base2": 2.3419, + "loss_pixel": 0.1604, + "loss_text": 1.4629, + "ppl": 5.0698, + "step": 9935 + }, + { + "epoch": 0.05, + "global_step": 9936, + "learning_rate": 0.00045936560934891485, + "loss": 1.6144, + "loss_base2": 2.3291, + "loss_pixel": 0.1608, + "loss_text": 1.4536, + "ppl": 5.0249, + "step": 9936 + }, + { + "epoch": 0.05, + "global_step": 9937, + "learning_rate": 0.00045936143572621036, + "loss": 1.6175, + "loss_base2": 2.3336, + "loss_pixel": 0.1613, + "loss_text": 1.4561, + "ppl": 5.0405, + "step": 9937 + }, + { + "epoch": 0.05, + "global_step": 9938, + "learning_rate": 0.00045935726210350586, + "loss": 1.6198, + "loss_base2": 2.3369, + "loss_pixel": 0.1618, + "loss_text": 1.458, + "ppl": 5.0521, + "step": 9938 + }, + { + "epoch": 0.05, + "global_step": 9939, + "learning_rate": 0.0004593530884808013, + "loss": 1.6222, + "loss_base2": 2.3403, + "loss_pixel": 0.1616, + "loss_text": 1.4606, + "ppl": 5.0642, + "step": 9939 + }, + { + "epoch": 0.05, + "global_step": 9940, + "learning_rate": 0.0004593489148580968, + "loss": 1.623, + "loss_base2": 2.3415, + "loss_pixel": 0.1618, + "loss_text": 1.4612, + "ppl": 5.0683, + "step": 9940 + }, + { + "epoch": 0.05, + "global_step": 9941, + "learning_rate": 0.00045934474123539233, + "loss": 1.6146, + "loss_base2": 2.3294, + "loss_pixel": 0.1614, + "loss_text": 1.4532, + "ppl": 5.0259, + "step": 9941 + }, + { + "epoch": 0.05, + "global_step": 9942, + "learning_rate": 0.00045934056761268784, + "loss": 1.634, + "loss_base2": 2.3574, + "loss_pixel": 0.1612, + "loss_text": 1.4728, + "ppl": 5.1243, + "step": 9942 + }, + { + "epoch": 0.05, + "global_step": 9943, + "learning_rate": 0.00045933639398998335, + "loss": 1.6098, + "loss_base2": 2.3225, + "loss_pixel": 0.1611, + "loss_text": 1.4487, + "ppl": 5.0018, + "step": 9943 + }, + { + "epoch": 0.05, + "global_step": 9944, + "learning_rate": 0.0004593322203672788, + "loss": 1.6056, + "loss_base2": 2.3164, + "loss_pixel": 0.1608, + "loss_text": 1.4448, + "ppl": 4.9808, + "step": 9944 + }, + { + "epoch": 0.05, + "global_step": 9945, + "learning_rate": 0.0004593280467445743, + "loss": 1.6374, + "loss_base2": 2.3623, + "loss_pixel": 0.1608, + "loss_text": 1.4767, + "ppl": 5.1418, + "step": 9945 + }, + { + "epoch": 0.05, + "global_step": 9946, + "learning_rate": 0.0004593238731218698, + "loss": 1.632, + "loss_base2": 2.3545, + "loss_pixel": 0.1602, + "loss_text": 1.4718, + "ppl": 5.1141, + "step": 9946 + }, + { + "epoch": 0.05, + "global_step": 9947, + "learning_rate": 0.0004593196994991653, + "loss": 1.6135, + "loss_base2": 2.3278, + "loss_pixel": 0.1607, + "loss_text": 1.4528, + "ppl": 5.0204, + "step": 9947 + }, + { + "epoch": 0.05, + "global_step": 9948, + "learning_rate": 0.00045931552587646083, + "loss": 1.6291, + "loss_base2": 2.3503, + "loss_pixel": 0.1615, + "loss_text": 1.4676, + "ppl": 5.0993, + "step": 9948 + }, + { + "epoch": 0.05, + "global_step": 9949, + "learning_rate": 0.00045931135225375623, + "loss": 1.614, + "loss_base2": 2.3285, + "loss_pixel": 0.1601, + "loss_text": 1.4539, + "ppl": 5.0229, + "step": 9949 + }, + { + "epoch": 0.05, + "global_step": 9950, + "learning_rate": 0.00045930717863105174, + "loss": 1.6245, + "loss_base2": 2.3437, + "loss_pixel": 0.1607, + "loss_text": 1.4639, + "ppl": 5.0759, + "step": 9950 + }, + { + "epoch": 0.05, + "global_step": 9951, + "learning_rate": 0.00045930300500834724, + "loss": 1.6105, + "loss_base2": 2.3235, + "loss_pixel": 0.1609, + "loss_text": 1.4496, + "ppl": 5.0053, + "step": 9951 + }, + { + "epoch": 0.05, + "global_step": 9952, + "learning_rate": 0.00045929883138564275, + "loss": 1.6393, + "loss_base2": 2.365, + "loss_pixel": 0.1597, + "loss_text": 1.4797, + "ppl": 5.1516, + "step": 9952 + }, + { + "epoch": 0.05, + "global_step": 9953, + "learning_rate": 0.0004592946577629382, + "loss": 1.6184, + "loss_base2": 2.3349, + "loss_pixel": 0.1589, + "loss_text": 1.4595, + "ppl": 5.045, + "step": 9953 + }, + { + "epoch": 0.05, + "global_step": 9954, + "learning_rate": 0.0004592904841402337, + "loss": 1.5577, + "loss_base2": 2.2473, + "loss_pixel": 0.1603, + "loss_text": 1.3974, + "ppl": 4.7479, + "step": 9954 + }, + { + "epoch": 0.05, + "global_step": 9955, + "learning_rate": 0.0004592863105175292, + "loss": 1.6218, + "loss_base2": 2.3398, + "loss_pixel": 0.1612, + "loss_text": 1.4606, + "ppl": 5.0622, + "step": 9955 + }, + { + "epoch": 0.05, + "global_step": 9956, + "learning_rate": 0.0004592821368948247, + "loss": 1.6236, + "loss_base2": 2.3424, + "loss_pixel": 0.162, + "loss_text": 1.4615, + "ppl": 5.0713, + "step": 9956 + }, + { + "epoch": 0.05, + "global_step": 9957, + "learning_rate": 0.00045927796327212023, + "loss": 1.6288, + "loss_base2": 2.3499, + "loss_pixel": 0.1634, + "loss_text": 1.4654, + "ppl": 5.0978, + "step": 9957 + }, + { + "epoch": 0.05, + "global_step": 9958, + "learning_rate": 0.0004592737896494157, + "loss": 1.6337, + "loss_base2": 2.3569, + "loss_pixel": 0.1628, + "loss_text": 1.4709, + "ppl": 5.1228, + "step": 9958 + }, + { + "epoch": 0.05, + "global_step": 9959, + "learning_rate": 0.0004592696160267112, + "loss": 1.6225, + "loss_base2": 2.3408, + "loss_pixel": 0.1611, + "loss_text": 1.4614, + "ppl": 5.0657, + "step": 9959 + }, + { + "epoch": 0.05, + "global_step": 9960, + "learning_rate": 0.0004592654424040067, + "loss": 1.6259, + "loss_base2": 2.3457, + "loss_pixel": 0.1619, + "loss_text": 1.464, + "ppl": 5.083, + "step": 9960 + }, + { + "epoch": 0.05, + "global_step": 9961, + "learning_rate": 0.0004592612687813022, + "loss": 1.6343, + "loss_base2": 2.3578, + "loss_pixel": 0.1617, + "loss_text": 1.4726, + "ppl": 5.1259, + "step": 9961 + }, + { + "epoch": 0.05, + "global_step": 9962, + "learning_rate": 0.00045925709515859766, + "loss": 1.6221, + "loss_base2": 2.3402, + "loss_pixel": 0.1612, + "loss_text": 1.461, + "ppl": 5.0637, + "step": 9962 + }, + { + "epoch": 0.05, + "global_step": 9963, + "learning_rate": 0.00045925292153589317, + "loss": 1.6161, + "loss_base2": 2.3315, + "loss_pixel": 0.1607, + "loss_text": 1.4554, + "ppl": 5.0334, + "step": 9963 + }, + { + "epoch": 0.05, + "global_step": 9964, + "learning_rate": 0.0004592487479131887, + "loss": 1.633, + "loss_base2": 2.3559, + "loss_pixel": 0.1628, + "loss_text": 1.4702, + "ppl": 5.1192, + "step": 9964 + }, + { + "epoch": 0.05, + "global_step": 9965, + "learning_rate": 0.0004592445742904842, + "loss": 1.611, + "loss_base2": 2.3242, + "loss_pixel": 0.1605, + "loss_text": 1.4504, + "ppl": 5.0078, + "step": 9965 + }, + { + "epoch": 0.05, + "global_step": 9966, + "learning_rate": 0.0004592404006677797, + "loss": 1.6253, + "loss_base2": 2.3448, + "loss_pixel": 0.162, + "loss_text": 1.4633, + "ppl": 5.0799, + "step": 9966 + }, + { + "epoch": 0.05, + "global_step": 9967, + "learning_rate": 0.00045923622704507514, + "loss": 1.6065, + "loss_base2": 2.3177, + "loss_pixel": 0.1643, + "loss_text": 1.4423, + "ppl": 4.9853, + "step": 9967 + }, + { + "epoch": 0.05, + "global_step": 9968, + "learning_rate": 0.0004592320534223706, + "loss": 1.6241, + "loss_base2": 2.3431, + "loss_pixel": 0.1637, + "loss_text": 1.4604, + "ppl": 5.0739, + "step": 9968 + }, + { + "epoch": 0.05, + "global_step": 9969, + "learning_rate": 0.0004592278797996661, + "loss": 1.6157, + "loss_base2": 2.331, + "loss_pixel": 0.1634, + "loss_text": 1.4523, + "ppl": 5.0314, + "step": 9969 + }, + { + "epoch": 0.05, + "global_step": 9970, + "learning_rate": 0.0004592237061769616, + "loss": 1.6104, + "loss_base2": 2.3233, + "loss_pixel": 0.1646, + "loss_text": 1.4457, + "ppl": 5.0048, + "step": 9970 + }, + { + "epoch": 0.05, + "global_step": 9971, + "learning_rate": 0.00045921953255425706, + "loss": 1.6214, + "loss_base2": 2.3392, + "loss_pixel": 0.1659, + "loss_text": 1.4555, + "ppl": 5.0602, + "step": 9971 + }, + { + "epoch": 0.05, + "global_step": 9972, + "learning_rate": 0.00045921535893155257, + "loss": 1.6263, + "loss_base2": 2.3463, + "loss_pixel": 0.164, + "loss_text": 1.4623, + "ppl": 5.085, + "step": 9972 + }, + { + "epoch": 0.05, + "global_step": 9973, + "learning_rate": 0.0004592111853088481, + "loss": 1.6139, + "loss_base2": 2.3284, + "loss_pixel": 0.1648, + "loss_text": 1.4492, + "ppl": 5.0224, + "step": 9973 + }, + { + "epoch": 0.05, + "global_step": 9974, + "learning_rate": 0.0004592070116861436, + "loss": 1.6338, + "loss_base2": 2.3571, + "loss_pixel": 0.1646, + "loss_text": 1.4692, + "ppl": 5.1233, + "step": 9974 + }, + { + "epoch": 0.05, + "global_step": 9975, + "learning_rate": 0.0004592028380634391, + "loss": 1.6299, + "loss_base2": 2.3514, + "loss_pixel": 0.1649, + "loss_text": 1.465, + "ppl": 5.1034, + "step": 9975 + }, + { + "epoch": 0.05, + "global_step": 9976, + "learning_rate": 0.00045919866444073455, + "loss": 1.4616, + "loss_base2": 2.1086, + "loss_pixel": 0.1661, + "loss_text": 1.2954, + "ppl": 4.3129, + "step": 9976 + }, + { + "epoch": 0.05, + "global_step": 9977, + "learning_rate": 0.00045919449081803005, + "loss": 1.4081, + "loss_base2": 2.0315, + "loss_pixel": 0.1645, + "loss_text": 1.2435, + "ppl": 4.0882, + "step": 9977 + }, + { + "epoch": 0.05, + "global_step": 9978, + "learning_rate": 0.00045919031719532556, + "loss": 1.4162, + "loss_base2": 2.0431, + "loss_pixel": 0.1644, + "loss_text": 1.2518, + "ppl": 4.1214, + "step": 9978 + }, + { + "epoch": 0.05, + "global_step": 9979, + "learning_rate": 0.00045918614357262107, + "loss": 1.4147, + "loss_base2": 2.041, + "loss_pixel": 0.1643, + "loss_text": 1.2503, + "ppl": 4.1153, + "step": 9979 + }, + { + "epoch": 0.05, + "global_step": 9980, + "learning_rate": 0.0004591819699499165, + "loss": 1.4065, + "loss_base2": 2.0292, + "loss_pixel": 0.1631, + "loss_text": 1.2434, + "ppl": 4.0816, + "step": 9980 + }, + { + "epoch": 0.05, + "global_step": 9981, + "learning_rate": 0.00045917779632721203, + "loss": 1.3946, + "loss_base2": 2.012, + "loss_pixel": 0.1615, + "loss_text": 1.2331, + "ppl": 4.0334, + "step": 9981 + }, + { + "epoch": 0.05, + "global_step": 9982, + "learning_rate": 0.00045917362270450754, + "loss": 1.4059, + "loss_base2": 2.0283, + "loss_pixel": 0.1633, + "loss_text": 1.2426, + "ppl": 4.0792, + "step": 9982 + }, + { + "epoch": 0.05, + "global_step": 9983, + "learning_rate": 0.00045916944908180304, + "loss": 1.5166, + "loss_base2": 2.188, + "loss_pixel": 0.1627, + "loss_text": 1.3539, + "ppl": 4.5567, + "step": 9983 + }, + { + "epoch": 0.05, + "global_step": 9984, + "learning_rate": 0.00045916527545909855, + "loss": 1.6297, + "loss_base2": 2.3512, + "loss_pixel": 0.1623, + "loss_text": 1.4674, + "ppl": 5.1023, + "step": 9984 + }, + { + "epoch": 0.05, + "global_step": 9985, + "learning_rate": 0.000459161101836394, + "loss": 1.6172, + "loss_base2": 2.3331, + "loss_pixel": 0.163, + "loss_text": 1.4542, + "ppl": 5.039, + "step": 9985 + }, + { + "epoch": 0.05, + "global_step": 9986, + "learning_rate": 0.0004591569282136895, + "loss": 1.6263, + "loss_base2": 2.3463, + "loss_pixel": 0.1627, + "loss_text": 1.4635, + "ppl": 5.085, + "step": 9986 + }, + { + "epoch": 0.05, + "global_step": 9987, + "learning_rate": 0.00045915275459098496, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.1627, + "loss_text": 1.4637, + "ppl": 5.0855, + "step": 9987 + }, + { + "epoch": 0.05, + "global_step": 9988, + "learning_rate": 0.00045914858096828047, + "loss": 1.6379, + "loss_base2": 2.363, + "loss_pixel": 0.1623, + "loss_text": 1.4756, + "ppl": 5.1444, + "step": 9988 + }, + { + "epoch": 0.05, + "global_step": 9989, + "learning_rate": 0.0004591444073455759, + "loss": 1.6284, + "loss_base2": 2.3493, + "loss_pixel": 0.1639, + "loss_text": 1.4646, + "ppl": 5.0957, + "step": 9989 + }, + { + "epoch": 0.05, + "global_step": 9990, + "learning_rate": 0.00045914023372287143, + "loss": 1.5973, + "loss_base2": 2.3044, + "loss_pixel": 0.1614, + "loss_text": 1.4359, + "ppl": 4.9397, + "step": 9990 + }, + { + "epoch": 0.05, + "global_step": 9991, + "learning_rate": 0.00045913606010016694, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.1607, + "loss_text": 1.4695, + "ppl": 5.1049, + "step": 9991 + }, + { + "epoch": 0.05, + "global_step": 9992, + "learning_rate": 0.00045913188647746245, + "loss": 1.6347, + "loss_base2": 2.3584, + "loss_pixel": 0.1617, + "loss_text": 1.473, + "ppl": 5.1279, + "step": 9992 + }, + { + "epoch": 0.05, + "global_step": 9993, + "learning_rate": 0.00045912771285475795, + "loss": 1.6266, + "loss_base2": 2.3467, + "loss_pixel": 0.1618, + "loss_text": 1.4648, + "ppl": 5.0866, + "step": 9993 + }, + { + "epoch": 0.05, + "global_step": 9994, + "learning_rate": 0.0004591235392320534, + "loss": 1.6081, + "loss_base2": 2.32, + "loss_pixel": 0.1629, + "loss_text": 1.4452, + "ppl": 4.9933, + "step": 9994 + }, + { + "epoch": 0.05, + "global_step": 9995, + "learning_rate": 0.0004591193656093489, + "loss": 1.6277, + "loss_base2": 2.3483, + "loss_pixel": 0.1622, + "loss_text": 1.4655, + "ppl": 5.0921, + "step": 9995 + }, + { + "epoch": 0.05, + "global_step": 9996, + "learning_rate": 0.0004591151919866444, + "loss": 1.6221, + "loss_base2": 2.3402, + "loss_pixel": 0.1626, + "loss_text": 1.4596, + "ppl": 5.0637, + "step": 9996 + }, + { + "epoch": 0.05, + "global_step": 9997, + "learning_rate": 0.00045911101836393993, + "loss": 1.62, + "loss_base2": 2.3372, + "loss_pixel": 0.1612, + "loss_text": 1.4588, + "ppl": 5.0531, + "step": 9997 + }, + { + "epoch": 0.05, + "global_step": 9998, + "learning_rate": 0.0004591068447412354, + "loss": 1.6225, + "loss_base2": 2.3408, + "loss_pixel": 0.1603, + "loss_text": 1.4622, + "ppl": 5.0657, + "step": 9998 + }, + { + "epoch": 0.05, + "global_step": 9999, + "learning_rate": 0.0004591026711185309, + "loss": 1.6306, + "loss_base2": 2.3525, + "loss_pixel": 0.1603, + "loss_text": 1.4703, + "ppl": 5.1069, + "step": 9999 + }, + { + "epoch": 0.05, + "global_step": 10000, + "learning_rate": 0.0004590984974958264, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.161, + "loss_text": 1.4654, + "ppl": 5.0855, + "step": 10000 + }, + { + "epoch": 0.05, + "global_step": 10001, + "learning_rate": 0.0004590943238731219, + "loss": 1.6167, + "loss_base2": 2.3324, + "loss_pixel": 0.1613, + "loss_text": 1.4553, + "ppl": 5.0364, + "step": 10001 + }, + { + "epoch": 0.05, + "global_step": 10002, + "learning_rate": 0.0004590901502504174, + "loss": 1.6191, + "loss_base2": 2.3359, + "loss_pixel": 0.1601, + "loss_text": 1.459, + "ppl": 5.0485, + "step": 10002 + }, + { + "epoch": 0.05, + "global_step": 10003, + "learning_rate": 0.00045908597662771286, + "loss": 1.6394, + "loss_base2": 2.3652, + "loss_pixel": 0.1641, + "loss_text": 1.4753, + "ppl": 5.1521, + "step": 10003 + }, + { + "epoch": 0.05, + "global_step": 10004, + "learning_rate": 0.00045908180300500837, + "loss": 1.6084, + "loss_base2": 2.3204, + "loss_pixel": 0.162, + "loss_text": 1.4464, + "ppl": 4.9948, + "step": 10004 + }, + { + "epoch": 0.05, + "global_step": 10005, + "learning_rate": 0.0004590776293823039, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.1616, + "loss_text": 1.4713, + "ppl": 5.1187, + "step": 10005 + }, + { + "epoch": 0.05, + "global_step": 10006, + "learning_rate": 0.00045907345575959933, + "loss": 1.6053, + "loss_base2": 2.316, + "loss_pixel": 0.1612, + "loss_text": 1.4441, + "ppl": 4.9794, + "step": 10006 + }, + { + "epoch": 0.05, + "global_step": 10007, + "learning_rate": 0.00045906928213689484, + "loss": 1.6249, + "loss_base2": 2.3442, + "loss_pixel": 0.1592, + "loss_text": 1.4656, + "ppl": 5.0779, + "step": 10007 + }, + { + "epoch": 0.05, + "global_step": 10008, + "learning_rate": 0.0004590651085141903, + "loss": 1.5656, + "loss_base2": 2.2587, + "loss_pixel": 0.1607, + "loss_text": 1.4049, + "ppl": 4.7855, + "step": 10008 + }, + { + "epoch": 0.05, + "global_step": 10009, + "learning_rate": 0.0004590609348914858, + "loss": 1.4307, + "loss_base2": 2.0641, + "loss_pixel": 0.1604, + "loss_text": 1.2704, + "ppl": 4.1816, + "step": 10009 + }, + { + "epoch": 0.05, + "global_step": 10010, + "learning_rate": 0.0004590567612687813, + "loss": 1.4209, + "loss_base2": 2.0499, + "loss_pixel": 0.1613, + "loss_text": 1.2596, + "ppl": 4.1408, + "step": 10010 + }, + { + "epoch": 0.05, + "global_step": 10011, + "learning_rate": 0.0004590525876460768, + "loss": 1.4131, + "loss_base2": 2.0387, + "loss_pixel": 0.1599, + "loss_text": 1.2532, + "ppl": 4.1087, + "step": 10011 + }, + { + "epoch": 0.05, + "global_step": 10012, + "learning_rate": 0.00045904841402337227, + "loss": 1.4058, + "loss_base2": 2.0281, + "loss_pixel": 0.1623, + "loss_text": 1.2435, + "ppl": 4.0788, + "step": 10012 + }, + { + "epoch": 0.05, + "global_step": 10013, + "learning_rate": 0.0004590442404006678, + "loss": 1.3916, + "loss_base2": 2.0077, + "loss_pixel": 0.1601, + "loss_text": 1.2316, + "ppl": 4.0213, + "step": 10013 + }, + { + "epoch": 0.05, + "global_step": 10014, + "learning_rate": 0.0004590400667779633, + "loss": 1.388, + "loss_base2": 2.0025, + "loss_pixel": 0.1612, + "loss_text": 1.2268, + "ppl": 4.0068, + "step": 10014 + }, + { + "epoch": 0.05, + "global_step": 10015, + "learning_rate": 0.0004590358931552588, + "loss": 1.4046, + "loss_base2": 2.0264, + "loss_pixel": 0.1626, + "loss_text": 1.2419, + "ppl": 4.0739, + "step": 10015 + }, + { + "epoch": 0.05, + "global_step": 10016, + "learning_rate": 0.0004590317195325543, + "loss": 1.4921, + "loss_base2": 2.1526, + "loss_pixel": 0.1615, + "loss_text": 1.3305, + "ppl": 4.4464, + "step": 10016 + }, + { + "epoch": 0.05, + "global_step": 10017, + "learning_rate": 0.00045902754590984975, + "loss": 1.6322, + "loss_base2": 2.3548, + "loss_pixel": 0.1601, + "loss_text": 1.4721, + "ppl": 5.1151, + "step": 10017 + }, + { + "epoch": 0.05, + "global_step": 10018, + "learning_rate": 0.00045902337228714526, + "loss": 1.6382, + "loss_base2": 2.3634, + "loss_pixel": 0.1596, + "loss_text": 1.4787, + "ppl": 5.1459, + "step": 10018 + }, + { + "epoch": 0.05, + "global_step": 10019, + "learning_rate": 0.00045901919866444076, + "loss": 1.6229, + "loss_base2": 2.3413, + "loss_pixel": 0.1592, + "loss_text": 1.4637, + "ppl": 5.0678, + "step": 10019 + }, + { + "epoch": 0.05, + "global_step": 10020, + "learning_rate": 0.00045901502504173627, + "loss": 1.6278, + "loss_base2": 2.3484, + "loss_pixel": 0.1606, + "loss_text": 1.4672, + "ppl": 5.0927, + "step": 10020 + }, + { + "epoch": 0.05, + "global_step": 10021, + "learning_rate": 0.0004590108514190317, + "loss": 1.6139, + "loss_base2": 2.3284, + "loss_pixel": 0.1594, + "loss_text": 1.4546, + "ppl": 5.0224, + "step": 10021 + }, + { + "epoch": 0.05, + "global_step": 10022, + "learning_rate": 0.00045900667779632723, + "loss": 1.6288, + "loss_base2": 2.3499, + "loss_pixel": 0.1599, + "loss_text": 1.4689, + "ppl": 5.0978, + "step": 10022 + }, + { + "epoch": 0.05, + "global_step": 10023, + "learning_rate": 0.00045900250417362274, + "loss": 1.633, + "loss_base2": 2.3559, + "loss_pixel": 0.1603, + "loss_text": 1.4727, + "ppl": 5.1192, + "step": 10023 + }, + { + "epoch": 0.05, + "global_step": 10024, + "learning_rate": 0.0004589983305509182, + "loss": 1.6341, + "loss_base2": 2.3575, + "loss_pixel": 0.1607, + "loss_text": 1.4734, + "ppl": 5.1248, + "step": 10024 + }, + { + "epoch": 0.05, + "global_step": 10025, + "learning_rate": 0.0004589941569282137, + "loss": 1.6364, + "loss_base2": 2.3608, + "loss_pixel": 0.1609, + "loss_text": 1.4755, + "ppl": 5.1366, + "step": 10025 + }, + { + "epoch": 0.05, + "global_step": 10026, + "learning_rate": 0.00045898998330550915, + "loss": 1.6244, + "loss_base2": 2.3435, + "loss_pixel": 0.1605, + "loss_text": 1.4639, + "ppl": 5.0754, + "step": 10026 + }, + { + "epoch": 0.05, + "global_step": 10027, + "learning_rate": 0.00045898580968280466, + "loss": 1.6345, + "loss_base2": 2.3581, + "loss_pixel": 0.1629, + "loss_text": 1.4717, + "ppl": 5.1269, + "step": 10027 + }, + { + "epoch": 0.05, + "global_step": 10028, + "learning_rate": 0.00045898163606010017, + "loss": 1.6075, + "loss_base2": 2.3191, + "loss_pixel": 0.1661, + "loss_text": 1.4414, + "ppl": 4.9903, + "step": 10028 + }, + { + "epoch": 0.05, + "global_step": 10029, + "learning_rate": 0.0004589774624373957, + "loss": 1.6405, + "loss_base2": 2.3667, + "loss_pixel": 0.1663, + "loss_text": 1.4743, + "ppl": 5.1577, + "step": 10029 + }, + { + "epoch": 0.05, + "global_step": 10030, + "learning_rate": 0.00045897328881469113, + "loss": 1.6288, + "loss_base2": 2.3499, + "loss_pixel": 0.1667, + "loss_text": 1.4621, + "ppl": 5.0978, + "step": 10030 + }, + { + "epoch": 0.05, + "global_step": 10031, + "learning_rate": 0.00045896911519198664, + "loss": 1.6407, + "loss_base2": 2.367, + "loss_pixel": 0.1668, + "loss_text": 1.4739, + "ppl": 5.1588, + "step": 10031 + }, + { + "epoch": 0.05, + "global_step": 10032, + "learning_rate": 0.00045896494156928214, + "loss": 1.6403, + "loss_base2": 2.3665, + "loss_pixel": 0.1652, + "loss_text": 1.4752, + "ppl": 5.1567, + "step": 10032 + }, + { + "epoch": 0.05, + "global_step": 10033, + "learning_rate": 0.00045896076794657765, + "loss": 1.6334, + "loss_base2": 2.3565, + "loss_pixel": 0.1624, + "loss_text": 1.4711, + "ppl": 5.1213, + "step": 10033 + }, + { + "epoch": 0.05, + "global_step": 10034, + "learning_rate": 0.00045895659432387316, + "loss": 1.6314, + "loss_base2": 2.3536, + "loss_pixel": 0.1627, + "loss_text": 1.4686, + "ppl": 5.111, + "step": 10034 + }, + { + "epoch": 0.05, + "global_step": 10035, + "learning_rate": 0.0004589524207011686, + "loss": 1.6183, + "loss_base2": 2.3347, + "loss_pixel": 0.163, + "loss_text": 1.4552, + "ppl": 5.0445, + "step": 10035 + }, + { + "epoch": 0.05, + "global_step": 10036, + "learning_rate": 0.0004589482470784641, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.1622, + "loss_text": 1.4558, + "ppl": 5.043, + "step": 10036 + }, + { + "epoch": 0.05, + "global_step": 10037, + "learning_rate": 0.0004589440734557596, + "loss": 1.617, + "loss_base2": 2.3328, + "loss_pixel": 0.1626, + "loss_text": 1.4544, + "ppl": 5.038, + "step": 10037 + }, + { + "epoch": 0.05, + "global_step": 10038, + "learning_rate": 0.00045893989983305513, + "loss": 1.6385, + "loss_base2": 2.3639, + "loss_pixel": 0.1607, + "loss_text": 1.4778, + "ppl": 5.1474, + "step": 10038 + }, + { + "epoch": 0.05, + "global_step": 10039, + "learning_rate": 0.0004589357262103506, + "loss": 1.6258, + "loss_base2": 2.3455, + "loss_pixel": 0.1614, + "loss_text": 1.4644, + "ppl": 5.0825, + "step": 10039 + }, + { + "epoch": 0.05, + "global_step": 10040, + "learning_rate": 0.0004589315525876461, + "loss": 1.5405, + "loss_base2": 2.2225, + "loss_pixel": 0.1617, + "loss_text": 1.3789, + "ppl": 4.6669, + "step": 10040 + }, + { + "epoch": 0.05, + "global_step": 10041, + "learning_rate": 0.0004589273789649416, + "loss": 1.4174, + "loss_base2": 2.0449, + "loss_pixel": 0.1617, + "loss_text": 1.2557, + "ppl": 4.1264, + "step": 10041 + }, + { + "epoch": 0.05, + "global_step": 10042, + "learning_rate": 0.0004589232053422371, + "loss": 1.4175, + "loss_base2": 2.045, + "loss_pixel": 0.162, + "loss_text": 1.2556, + "ppl": 4.1268, + "step": 10042 + }, + { + "epoch": 0.05, + "global_step": 10043, + "learning_rate": 0.00045891903171953256, + "loss": 1.4043, + "loss_base2": 2.026, + "loss_pixel": 0.161, + "loss_text": 1.2432, + "ppl": 4.0727, + "step": 10043 + }, + { + "epoch": 0.05, + "global_step": 10044, + "learning_rate": 0.000458914858096828, + "loss": 1.4112, + "loss_base2": 2.0359, + "loss_pixel": 0.1604, + "loss_text": 1.2508, + "ppl": 4.1009, + "step": 10044 + }, + { + "epoch": 0.05, + "global_step": 10045, + "learning_rate": 0.0004589106844741235, + "loss": 1.3985, + "loss_base2": 2.0176, + "loss_pixel": 0.1616, + "loss_text": 1.2369, + "ppl": 4.0491, + "step": 10045 + }, + { + "epoch": 0.05, + "global_step": 10046, + "learning_rate": 0.00045890651085141903, + "loss": 1.4119, + "loss_base2": 2.0369, + "loss_pixel": 0.1607, + "loss_text": 1.2513, + "ppl": 4.1037, + "step": 10046 + }, + { + "epoch": 0.05, + "global_step": 10047, + "learning_rate": 0.00045890233722871454, + "loss": 1.4274, + "loss_base2": 2.0593, + "loss_pixel": 0.1616, + "loss_text": 1.2659, + "ppl": 4.1678, + "step": 10047 + }, + { + "epoch": 0.05, + "global_step": 10048, + "learning_rate": 0.00045889816360601, + "loss": 1.4064, + "loss_base2": 2.029, + "loss_pixel": 0.1609, + "loss_text": 1.2455, + "ppl": 4.0812, + "step": 10048 + }, + { + "epoch": 0.05, + "global_step": 10049, + "learning_rate": 0.0004588939899833055, + "loss": 1.4059, + "loss_base2": 2.0283, + "loss_pixel": 0.162, + "loss_text": 1.2439, + "ppl": 4.0792, + "step": 10049 + }, + { + "epoch": 0.05, + "global_step": 10050, + "learning_rate": 0.000458889816360601, + "loss": 1.4067, + "loss_base2": 2.0294, + "loss_pixel": 0.161, + "loss_text": 1.2457, + "ppl": 4.0825, + "step": 10050 + }, + { + "epoch": 0.05, + "global_step": 10051, + "learning_rate": 0.0004588856427378965, + "loss": 1.4058, + "loss_base2": 2.0281, + "loss_pixel": 0.1604, + "loss_text": 1.2454, + "ppl": 4.0788, + "step": 10051 + }, + { + "epoch": 0.05, + "global_step": 10052, + "learning_rate": 0.000458881469115192, + "loss": 1.4312, + "loss_base2": 2.0648, + "loss_pixel": 0.1613, + "loss_text": 1.27, + "ppl": 4.1837, + "step": 10052 + }, + { + "epoch": 0.05, + "global_step": 10053, + "learning_rate": 0.00045887729549248747, + "loss": 1.4122, + "loss_base2": 2.0374, + "loss_pixel": 0.1631, + "loss_text": 1.2492, + "ppl": 4.105, + "step": 10053 + }, + { + "epoch": 0.05, + "global_step": 10054, + "learning_rate": 0.000458873121869783, + "loss": 1.4078, + "loss_base2": 2.031, + "loss_pixel": 0.1614, + "loss_text": 1.2464, + "ppl": 4.087, + "step": 10054 + }, + { + "epoch": 0.05, + "global_step": 10055, + "learning_rate": 0.0004588689482470785, + "loss": 1.4016, + "loss_base2": 2.0221, + "loss_pixel": 0.1599, + "loss_text": 1.2418, + "ppl": 4.0617, + "step": 10055 + }, + { + "epoch": 0.05, + "global_step": 10056, + "learning_rate": 0.000458864774624374, + "loss": 1.41, + "loss_base2": 2.0342, + "loss_pixel": 0.1607, + "loss_text": 1.2492, + "ppl": 4.096, + "step": 10056 + }, + { + "epoch": 0.05, + "global_step": 10057, + "learning_rate": 0.00045886060100166945, + "loss": 1.3957, + "loss_base2": 2.0136, + "loss_pixel": 0.1603, + "loss_text": 1.2354, + "ppl": 4.0378, + "step": 10057 + }, + { + "epoch": 0.05, + "global_step": 10058, + "learning_rate": 0.00045885642737896495, + "loss": 1.4135, + "loss_base2": 2.0392, + "loss_pixel": 0.1605, + "loss_text": 1.253, + "ppl": 4.1103, + "step": 10058 + }, + { + "epoch": 0.05, + "global_step": 10059, + "learning_rate": 0.00045885225375626046, + "loss": 1.397, + "loss_base2": 2.0154, + "loss_pixel": 0.1597, + "loss_text": 1.2372, + "ppl": 4.0431, + "step": 10059 + }, + { + "epoch": 0.05, + "global_step": 10060, + "learning_rate": 0.00045884808013355597, + "loss": 1.4065, + "loss_base2": 2.0292, + "loss_pixel": 0.1603, + "loss_text": 1.2462, + "ppl": 4.0816, + "step": 10060 + }, + { + "epoch": 0.05, + "global_step": 10061, + "learning_rate": 0.0004588439065108515, + "loss": 1.3999, + "loss_base2": 2.0196, + "loss_pixel": 0.16, + "loss_text": 1.24, + "ppl": 4.0548, + "step": 10061 + }, + { + "epoch": 0.05, + "global_step": 10062, + "learning_rate": 0.0004588397328881469, + "loss": 1.3817, + "loss_base2": 1.9934, + "loss_pixel": 0.1602, + "loss_text": 1.2215, + "ppl": 3.9817, + "step": 10062 + }, + { + "epoch": 0.05, + "global_step": 10063, + "learning_rate": 0.0004588355592654424, + "loss": 1.4072, + "loss_base2": 2.0302, + "loss_pixel": 0.1615, + "loss_text": 1.2457, + "ppl": 4.0845, + "step": 10063 + }, + { + "epoch": 0.05, + "global_step": 10064, + "learning_rate": 0.0004588313856427379, + "loss": 1.5444, + "loss_base2": 2.2281, + "loss_pixel": 0.1602, + "loss_text": 1.3841, + "ppl": 4.6852, + "step": 10064 + }, + { + "epoch": 0.05, + "global_step": 10065, + "learning_rate": 0.0004588272120200334, + "loss": 1.4314, + "loss_base2": 2.0651, + "loss_pixel": 0.1611, + "loss_text": 1.2703, + "ppl": 4.1846, + "step": 10065 + }, + { + "epoch": 0.05, + "global_step": 10066, + "learning_rate": 0.0004588230383973289, + "loss": 1.3994, + "loss_base2": 2.0189, + "loss_pixel": 0.1603, + "loss_text": 1.2391, + "ppl": 4.0528, + "step": 10066 + }, + { + "epoch": 0.05, + "global_step": 10067, + "learning_rate": 0.00045881886477462436, + "loss": 1.4109, + "loss_base2": 2.0355, + "loss_pixel": 0.1609, + "loss_text": 1.25, + "ppl": 4.0996, + "step": 10067 + }, + { + "epoch": 0.05, + "global_step": 10068, + "learning_rate": 0.00045881469115191986, + "loss": 1.4231, + "loss_base2": 2.0531, + "loss_pixel": 0.1601, + "loss_text": 1.2629, + "ppl": 4.15, + "step": 10068 + }, + { + "epoch": 0.05, + "global_step": 10069, + "learning_rate": 0.00045881051752921537, + "loss": 1.3866, + "loss_base2": 2.0004, + "loss_pixel": 0.1615, + "loss_text": 1.2251, + "ppl": 4.0012, + "step": 10069 + }, + { + "epoch": 0.05, + "global_step": 10070, + "learning_rate": 0.0004588063439065109, + "loss": 1.3964, + "loss_base2": 2.0146, + "loss_pixel": 0.1611, + "loss_text": 1.2353, + "ppl": 4.0406, + "step": 10070 + }, + { + "epoch": 0.05, + "global_step": 10071, + "learning_rate": 0.00045880217028380633, + "loss": 1.3947, + "loss_base2": 2.0121, + "loss_pixel": 0.1613, + "loss_text": 1.2333, + "ppl": 4.0338, + "step": 10071 + }, + { + "epoch": 0.05, + "global_step": 10072, + "learning_rate": 0.00045879799666110184, + "loss": 1.5095, + "loss_base2": 2.1777, + "loss_pixel": 0.1595, + "loss_text": 1.35, + "ppl": 4.5245, + "step": 10072 + }, + { + "epoch": 0.05, + "global_step": 10073, + "learning_rate": 0.00045879382303839735, + "loss": 1.6066, + "loss_base2": 2.3178, + "loss_pixel": 0.1603, + "loss_text": 1.4463, + "ppl": 4.9858, + "step": 10073 + }, + { + "epoch": 0.05, + "global_step": 10074, + "learning_rate": 0.00045878964941569285, + "loss": 1.6223, + "loss_base2": 2.3405, + "loss_pixel": 0.1598, + "loss_text": 1.4626, + "ppl": 5.0647, + "step": 10074 + }, + { + "epoch": 0.05, + "global_step": 10075, + "learning_rate": 0.00045878547579298836, + "loss": 1.4919, + "loss_base2": 2.1524, + "loss_pixel": 0.1604, + "loss_text": 1.3315, + "ppl": 4.4455, + "step": 10075 + }, + { + "epoch": 0.05, + "global_step": 10076, + "learning_rate": 0.0004587813021702838, + "loss": 1.4003, + "loss_base2": 2.0202, + "loss_pixel": 0.1605, + "loss_text": 1.2398, + "ppl": 4.0564, + "step": 10076 + }, + { + "epoch": 0.05, + "global_step": 10077, + "learning_rate": 0.0004587771285475793, + "loss": 1.4357, + "loss_base2": 2.0713, + "loss_pixel": 0.162, + "loss_text": 1.2737, + "ppl": 4.2026, + "step": 10077 + }, + { + "epoch": 0.05, + "global_step": 10078, + "learning_rate": 0.00045877295492487483, + "loss": 1.4215, + "loss_base2": 2.0508, + "loss_pixel": 0.1609, + "loss_text": 1.2606, + "ppl": 4.1433, + "step": 10078 + }, + { + "epoch": 0.05, + "global_step": 10079, + "learning_rate": 0.00045876878130217034, + "loss": 1.4158, + "loss_base2": 2.0426, + "loss_pixel": 0.1614, + "loss_text": 1.2544, + "ppl": 4.1198, + "step": 10079 + }, + { + "epoch": 0.05, + "global_step": 10080, + "learning_rate": 0.00045876460767946574, + "loss": 1.4316, + "loss_base2": 2.0654, + "loss_pixel": 0.1605, + "loss_text": 1.2711, + "ppl": 4.1854, + "step": 10080 + }, + { + "epoch": 0.05, + "global_step": 10081, + "learning_rate": 0.00045876043405676124, + "loss": 1.4094, + "loss_base2": 2.0333, + "loss_pixel": 0.1609, + "loss_text": 1.2485, + "ppl": 4.0935, + "step": 10081 + }, + { + "epoch": 0.05, + "global_step": 10082, + "learning_rate": 0.00045875626043405675, + "loss": 1.3967, + "loss_base2": 2.015, + "loss_pixel": 0.1597, + "loss_text": 1.2369, + "ppl": 4.0418, + "step": 10082 + }, + { + "epoch": 0.05, + "global_step": 10083, + "learning_rate": 0.00045875208681135226, + "loss": 1.3994, + "loss_base2": 2.0189, + "loss_pixel": 0.1591, + "loss_text": 1.2403, + "ppl": 4.0528, + "step": 10083 + }, + { + "epoch": 0.05, + "global_step": 10084, + "learning_rate": 0.00045874791318864776, + "loss": 1.4079, + "loss_base2": 2.0312, + "loss_pixel": 0.16, + "loss_text": 1.2479, + "ppl": 4.0874, + "step": 10084 + }, + { + "epoch": 0.05, + "global_step": 10085, + "learning_rate": 0.0004587437395659432, + "loss": 1.4179, + "loss_base2": 2.0456, + "loss_pixel": 0.1608, + "loss_text": 1.2571, + "ppl": 4.1284, + "step": 10085 + }, + { + "epoch": 0.05, + "global_step": 10086, + "learning_rate": 0.0004587395659432387, + "loss": 1.4015, + "loss_base2": 2.0219, + "loss_pixel": 0.1594, + "loss_text": 1.2421, + "ppl": 4.0613, + "step": 10086 + }, + { + "epoch": 0.05, + "global_step": 10087, + "learning_rate": 0.00045873539232053423, + "loss": 1.4052, + "loss_base2": 2.0273, + "loss_pixel": 0.161, + "loss_text": 1.2442, + "ppl": 4.0763, + "step": 10087 + }, + { + "epoch": 0.05, + "global_step": 10088, + "learning_rate": 0.00045873121869782974, + "loss": 1.3894, + "loss_base2": 2.0045, + "loss_pixel": 0.1594, + "loss_text": 1.23, + "ppl": 4.0124, + "step": 10088 + }, + { + "epoch": 0.05, + "global_step": 10089, + "learning_rate": 0.0004587270450751252, + "loss": 1.4002, + "loss_base2": 2.0201, + "loss_pixel": 0.1609, + "loss_text": 1.2392, + "ppl": 4.056, + "step": 10089 + }, + { + "epoch": 0.05, + "global_step": 10090, + "learning_rate": 0.0004587228714524207, + "loss": 1.5771, + "loss_base2": 2.2753, + "loss_pixel": 0.1619, + "loss_text": 1.4152, + "ppl": 4.8409, + "step": 10090 + }, + { + "epoch": 0.05, + "global_step": 10091, + "learning_rate": 0.0004587186978297162, + "loss": 1.6897, + "loss_base2": 2.4377, + "loss_pixel": 0.1619, + "loss_text": 1.5277, + "ppl": 5.4179, + "step": 10091 + }, + { + "epoch": 0.05, + "global_step": 10092, + "learning_rate": 0.0004587145242070117, + "loss": 1.6729, + "loss_base2": 2.4135, + "loss_pixel": 0.1617, + "loss_text": 1.5113, + "ppl": 5.3276, + "step": 10092 + }, + { + "epoch": 0.05, + "global_step": 10093, + "learning_rate": 0.0004587103505843072, + "loss": 1.6714, + "loss_base2": 2.4113, + "loss_pixel": 0.1615, + "loss_text": 1.5099, + "ppl": 5.3196, + "step": 10093 + }, + { + "epoch": 0.05, + "global_step": 10094, + "learning_rate": 0.0004587061769616027, + "loss": 1.6837, + "loss_base2": 2.4291, + "loss_pixel": 0.1629, + "loss_text": 1.5208, + "ppl": 5.3854, + "step": 10094 + }, + { + "epoch": 0.05, + "global_step": 10095, + "learning_rate": 0.0004587020033388982, + "loss": 1.6705, + "loss_base2": 2.41, + "loss_pixel": 0.1618, + "loss_text": 1.5086, + "ppl": 5.3148, + "step": 10095 + }, + { + "epoch": 0.05, + "global_step": 10096, + "learning_rate": 0.0004586978297161937, + "loss": 1.6685, + "loss_base2": 2.4071, + "loss_pixel": 0.1614, + "loss_text": 1.5071, + "ppl": 5.3042, + "step": 10096 + }, + { + "epoch": 0.05, + "global_step": 10097, + "learning_rate": 0.0004586936560934892, + "loss": 1.6484, + "loss_base2": 2.3781, + "loss_pixel": 0.1615, + "loss_text": 1.4869, + "ppl": 5.1987, + "step": 10097 + }, + { + "epoch": 0.05, + "global_step": 10098, + "learning_rate": 0.00045868948247078465, + "loss": 1.6587, + "loss_base2": 2.393, + "loss_pixel": 0.1615, + "loss_text": 1.4972, + "ppl": 5.2525, + "step": 10098 + }, + { + "epoch": 0.05, + "global_step": 10099, + "learning_rate": 0.0004586853088480801, + "loss": 1.6668, + "loss_base2": 2.4047, + "loss_pixel": 0.1611, + "loss_text": 1.5057, + "ppl": 5.2952, + "step": 10099 + }, + { + "epoch": 0.05, + "global_step": 10100, + "learning_rate": 0.0004586811352253756, + "loss": 1.636, + "loss_base2": 2.3602, + "loss_pixel": 0.162, + "loss_text": 1.4741, + "ppl": 5.1346, + "step": 10100 + }, + { + "epoch": 0.05, + "global_step": 10101, + "learning_rate": 0.0004586769616026711, + "loss": 1.6274, + "loss_base2": 2.3478, + "loss_pixel": 0.1616, + "loss_text": 1.4659, + "ppl": 5.0906, + "step": 10101 + }, + { + "epoch": 0.05, + "global_step": 10102, + "learning_rate": 0.0004586727879799666, + "loss": 1.6377, + "loss_base2": 2.3627, + "loss_pixel": 0.1616, + "loss_text": 1.4761, + "ppl": 5.1433, + "step": 10102 + }, + { + "epoch": 0.05, + "global_step": 10103, + "learning_rate": 0.0004586686143572621, + "loss": 1.6684, + "loss_base2": 2.407, + "loss_pixel": 0.1596, + "loss_text": 1.5088, + "ppl": 5.3037, + "step": 10103 + }, + { + "epoch": 0.05, + "global_step": 10104, + "learning_rate": 0.0004586644407345576, + "loss": 1.6522, + "loss_base2": 2.3836, + "loss_pixel": 0.1609, + "loss_text": 1.4914, + "ppl": 5.2184, + "step": 10104 + }, + { + "epoch": 0.05, + "global_step": 10105, + "learning_rate": 0.0004586602671118531, + "loss": 1.6511, + "loss_base2": 2.382, + "loss_pixel": 0.1606, + "loss_text": 1.4905, + "ppl": 5.2127, + "step": 10105 + }, + { + "epoch": 0.05, + "global_step": 10106, + "learning_rate": 0.0004586560934891486, + "loss": 1.6393, + "loss_base2": 2.365, + "loss_pixel": 0.1606, + "loss_text": 1.4786, + "ppl": 5.1516, + "step": 10106 + }, + { + "epoch": 0.05, + "global_step": 10107, + "learning_rate": 0.00045865191986644405, + "loss": 1.6454, + "loss_base2": 2.3738, + "loss_pixel": 0.1611, + "loss_text": 1.4843, + "ppl": 5.1831, + "step": 10107 + }, + { + "epoch": 0.05, + "global_step": 10108, + "learning_rate": 0.00045864774624373956, + "loss": 1.6427, + "loss_base2": 2.3699, + "loss_pixel": 0.1606, + "loss_text": 1.4821, + "ppl": 5.1691, + "step": 10108 + }, + { + "epoch": 0.05, + "global_step": 10109, + "learning_rate": 0.00045864357262103507, + "loss": 1.6189, + "loss_base2": 2.3356, + "loss_pixel": 0.1597, + "loss_text": 1.4592, + "ppl": 5.0475, + "step": 10109 + }, + { + "epoch": 0.05, + "global_step": 10110, + "learning_rate": 0.0004586393989983306, + "loss": 1.6291, + "loss_base2": 2.3503, + "loss_pixel": 0.1603, + "loss_text": 1.4689, + "ppl": 5.0993, + "step": 10110 + }, + { + "epoch": 0.05, + "global_step": 10111, + "learning_rate": 0.0004586352253756261, + "loss": 1.6253, + "loss_base2": 2.3448, + "loss_pixel": 0.1608, + "loss_text": 1.4645, + "ppl": 5.0799, + "step": 10111 + }, + { + "epoch": 0.05, + "global_step": 10112, + "learning_rate": 0.00045863105175292154, + "loss": 1.6193, + "loss_base2": 2.3362, + "loss_pixel": 0.1593, + "loss_text": 1.46, + "ppl": 5.0496, + "step": 10112 + }, + { + "epoch": 0.05, + "global_step": 10113, + "learning_rate": 0.00045862687813021704, + "loss": 1.6286, + "loss_base2": 2.3496, + "loss_pixel": 0.1604, + "loss_text": 1.4682, + "ppl": 5.0967, + "step": 10113 + }, + { + "epoch": 0.05, + "global_step": 10114, + "learning_rate": 0.00045862270450751255, + "loss": 1.6173, + "loss_base2": 2.3333, + "loss_pixel": 0.1606, + "loss_text": 1.4568, + "ppl": 5.0395, + "step": 10114 + }, + { + "epoch": 0.05, + "global_step": 10115, + "learning_rate": 0.00045861853088480806, + "loss": 1.6186, + "loss_base2": 2.3351, + "loss_pixel": 0.1609, + "loss_text": 1.4577, + "ppl": 5.046, + "step": 10115 + }, + { + "epoch": 0.05, + "global_step": 10116, + "learning_rate": 0.00045861435726210356, + "loss": 1.6418, + "loss_base2": 2.3686, + "loss_pixel": 0.1604, + "loss_text": 1.4814, + "ppl": 5.1645, + "step": 10116 + }, + { + "epoch": 0.05, + "global_step": 10117, + "learning_rate": 0.000458610183639399, + "loss": 1.6216, + "loss_base2": 2.3395, + "loss_pixel": 0.1597, + "loss_text": 1.4619, + "ppl": 5.0612, + "step": 10117 + }, + { + "epoch": 0.05, + "global_step": 10118, + "learning_rate": 0.00045860601001669447, + "loss": 1.6358, + "loss_base2": 2.36, + "loss_pixel": 0.1605, + "loss_text": 1.4753, + "ppl": 5.1336, + "step": 10118 + }, + { + "epoch": 0.05, + "global_step": 10119, + "learning_rate": 0.00045860183639399, + "loss": 1.6205, + "loss_base2": 2.3379, + "loss_pixel": 0.1602, + "loss_text": 1.4602, + "ppl": 5.0556, + "step": 10119 + }, + { + "epoch": 0.05, + "global_step": 10120, + "learning_rate": 0.0004585976627712855, + "loss": 1.6292, + "loss_base2": 2.3504, + "loss_pixel": 0.1609, + "loss_text": 1.4683, + "ppl": 5.0998, + "step": 10120 + }, + { + "epoch": 0.05, + "global_step": 10121, + "learning_rate": 0.00045859348914858094, + "loss": 1.6221, + "loss_base2": 2.3402, + "loss_pixel": 0.1616, + "loss_text": 1.4606, + "ppl": 5.0637, + "step": 10121 + }, + { + "epoch": 0.05, + "global_step": 10122, + "learning_rate": 0.00045858931552587645, + "loss": 1.6239, + "loss_base2": 2.3428, + "loss_pixel": 0.1611, + "loss_text": 1.4628, + "ppl": 5.0728, + "step": 10122 + }, + { + "epoch": 0.05, + "global_step": 10123, + "learning_rate": 0.00045858514190317195, + "loss": 1.6172, + "loss_base2": 2.3331, + "loss_pixel": 0.1597, + "loss_text": 1.4575, + "ppl": 5.039, + "step": 10123 + }, + { + "epoch": 0.05, + "global_step": 10124, + "learning_rate": 0.00045858096828046746, + "loss": 1.6186, + "loss_base2": 2.3351, + "loss_pixel": 0.1598, + "loss_text": 1.4589, + "ppl": 5.046, + "step": 10124 + }, + { + "epoch": 0.05, + "global_step": 10125, + "learning_rate": 0.00045857679465776297, + "loss": 1.6362, + "loss_base2": 2.3605, + "loss_pixel": 0.1613, + "loss_text": 1.4748, + "ppl": 5.1356, + "step": 10125 + }, + { + "epoch": 0.05, + "global_step": 10126, + "learning_rate": 0.0004585726210350584, + "loss": 1.6292, + "loss_base2": 2.3504, + "loss_pixel": 0.1621, + "loss_text": 1.4672, + "ppl": 5.0998, + "step": 10126 + }, + { + "epoch": 0.05, + "global_step": 10127, + "learning_rate": 0.00045856844741235393, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.1605, + "loss_text": 1.4724, + "ppl": 5.1187, + "step": 10127 + }, + { + "epoch": 0.05, + "global_step": 10128, + "learning_rate": 0.00045856427378964944, + "loss": 1.6319, + "loss_base2": 2.3543, + "loss_pixel": 0.1582, + "loss_text": 1.4738, + "ppl": 5.1136, + "step": 10128 + }, + { + "epoch": 0.05, + "global_step": 10129, + "learning_rate": 0.00045856010016694494, + "loss": 1.6191, + "loss_base2": 2.3359, + "loss_pixel": 0.1595, + "loss_text": 1.4595, + "ppl": 5.0485, + "step": 10129 + }, + { + "epoch": 0.05, + "global_step": 10130, + "learning_rate": 0.0004585559265442404, + "loss": 1.6194, + "loss_base2": 2.3363, + "loss_pixel": 0.1599, + "loss_text": 1.4595, + "ppl": 5.0501, + "step": 10130 + }, + { + "epoch": 0.05, + "global_step": 10131, + "learning_rate": 0.0004585517529215359, + "loss": 1.6358, + "loss_base2": 2.36, + "loss_pixel": 0.1595, + "loss_text": 1.4763, + "ppl": 5.1336, + "step": 10131 + }, + { + "epoch": 0.05, + "global_step": 10132, + "learning_rate": 0.0004585475792988314, + "loss": 1.6241, + "loss_base2": 2.3431, + "loss_pixel": 0.1588, + "loss_text": 1.4653, + "ppl": 5.0739, + "step": 10132 + }, + { + "epoch": 0.05, + "global_step": 10133, + "learning_rate": 0.0004585434056761269, + "loss": 1.6215, + "loss_base2": 2.3393, + "loss_pixel": 0.1599, + "loss_text": 1.4616, + "ppl": 5.0607, + "step": 10133 + }, + { + "epoch": 0.05, + "global_step": 10134, + "learning_rate": 0.0004585392320534224, + "loss": 1.6332, + "loss_base2": 2.3562, + "loss_pixel": 0.1597, + "loss_text": 1.4735, + "ppl": 5.1202, + "step": 10134 + }, + { + "epoch": 0.05, + "global_step": 10135, + "learning_rate": 0.0004585350584307179, + "loss": 1.6177, + "loss_base2": 2.3338, + "loss_pixel": 0.1609, + "loss_text": 1.4567, + "ppl": 5.0415, + "step": 10135 + }, + { + "epoch": 0.05, + "global_step": 10136, + "learning_rate": 0.0004585308848080134, + "loss": 1.6206, + "loss_base2": 2.338, + "loss_pixel": 0.1592, + "loss_text": 1.4613, + "ppl": 5.0561, + "step": 10136 + }, + { + "epoch": 0.05, + "global_step": 10137, + "learning_rate": 0.00045852671118530884, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.16, + "loss_text": 1.4552, + "ppl": 5.0284, + "step": 10137 + }, + { + "epoch": 0.05, + "global_step": 10138, + "learning_rate": 0.00045852253756260435, + "loss": 1.6241, + "loss_base2": 2.3431, + "loss_pixel": 0.1577, + "loss_text": 1.4664, + "ppl": 5.0739, + "step": 10138 + }, + { + "epoch": 0.05, + "global_step": 10139, + "learning_rate": 0.0004585183639398998, + "loss": 1.6233, + "loss_base2": 2.3419, + "loss_pixel": 0.159, + "loss_text": 1.4643, + "ppl": 5.0698, + "step": 10139 + }, + { + "epoch": 0.05, + "global_step": 10140, + "learning_rate": 0.0004585141903171953, + "loss": 1.6118, + "loss_base2": 2.3253, + "loss_pixel": 0.1593, + "loss_text": 1.4525, + "ppl": 5.0118, + "step": 10140 + }, + { + "epoch": 0.05, + "global_step": 10141, + "learning_rate": 0.0004585100166944908, + "loss": 1.6251, + "loss_base2": 2.3445, + "loss_pixel": 0.1594, + "loss_text": 1.4657, + "ppl": 5.0789, + "step": 10141 + }, + { + "epoch": 0.05, + "global_step": 10142, + "learning_rate": 0.0004585058430717863, + "loss": 1.6168, + "loss_base2": 2.3325, + "loss_pixel": 0.1593, + "loss_text": 1.4575, + "ppl": 5.0369, + "step": 10142 + }, + { + "epoch": 0.05, + "global_step": 10143, + "learning_rate": 0.00045850166944908183, + "loss": 1.6305, + "loss_base2": 2.3523, + "loss_pixel": 0.1604, + "loss_text": 1.4702, + "ppl": 5.1064, + "step": 10143 + }, + { + "epoch": 0.05, + "global_step": 10144, + "learning_rate": 0.0004584974958263773, + "loss": 1.6314, + "loss_base2": 2.3536, + "loss_pixel": 0.1595, + "loss_text": 1.4719, + "ppl": 5.111, + "step": 10144 + }, + { + "epoch": 0.05, + "global_step": 10145, + "learning_rate": 0.0004584933222036728, + "loss": 1.6026, + "loss_base2": 2.3121, + "loss_pixel": 0.1596, + "loss_text": 1.443, + "ppl": 4.9659, + "step": 10145 + }, + { + "epoch": 0.05, + "global_step": 10146, + "learning_rate": 0.0004584891485809683, + "loss": 1.6175, + "loss_base2": 2.3336, + "loss_pixel": 0.1594, + "loss_text": 1.4581, + "ppl": 5.0405, + "step": 10146 + }, + { + "epoch": 0.05, + "global_step": 10147, + "learning_rate": 0.0004584849749582638, + "loss": 1.6163, + "loss_base2": 2.3318, + "loss_pixel": 0.1588, + "loss_text": 1.4575, + "ppl": 5.0344, + "step": 10147 + }, + { + "epoch": 0.05, + "global_step": 10148, + "learning_rate": 0.00045848080133555926, + "loss": 1.5975, + "loss_base2": 2.3047, + "loss_pixel": 0.161, + "loss_text": 1.4365, + "ppl": 4.9407, + "step": 10148 + }, + { + "epoch": 0.05, + "global_step": 10149, + "learning_rate": 0.00045847662771285476, + "loss": 1.6279, + "loss_base2": 2.3486, + "loss_pixel": 0.1598, + "loss_text": 1.4681, + "ppl": 5.0932, + "step": 10149 + }, + { + "epoch": 0.05, + "global_step": 10150, + "learning_rate": 0.00045847245409015027, + "loss": 1.6207, + "loss_base2": 2.3382, + "loss_pixel": 0.1594, + "loss_text": 1.4613, + "ppl": 5.0566, + "step": 10150 + }, + { + "epoch": 0.05, + "global_step": 10151, + "learning_rate": 0.0004584682804674458, + "loss": 1.6126, + "loss_base2": 2.3265, + "loss_pixel": 0.1614, + "loss_text": 1.4511, + "ppl": 5.0158, + "step": 10151 + }, + { + "epoch": 0.05, + "global_step": 10152, + "learning_rate": 0.0004584641068447413, + "loss": 1.6156, + "loss_base2": 2.3308, + "loss_pixel": 0.1604, + "loss_text": 1.4552, + "ppl": 5.0309, + "step": 10152 + }, + { + "epoch": 0.05, + "global_step": 10153, + "learning_rate": 0.00045845993322203674, + "loss": 1.6224, + "loss_base2": 2.3406, + "loss_pixel": 0.1602, + "loss_text": 1.4622, + "ppl": 5.0652, + "step": 10153 + }, + { + "epoch": 0.05, + "global_step": 10154, + "learning_rate": 0.00045845575959933225, + "loss": 1.5988, + "loss_base2": 2.3066, + "loss_pixel": 0.159, + "loss_text": 1.4398, + "ppl": 4.9471, + "step": 10154 + }, + { + "epoch": 0.05, + "global_step": 10155, + "learning_rate": 0.00045845158597662775, + "loss": 1.6265, + "loss_base2": 2.3465, + "loss_pixel": 0.1616, + "loss_text": 1.4649, + "ppl": 5.086, + "step": 10155 + }, + { + "epoch": 0.05, + "global_step": 10156, + "learning_rate": 0.0004584474123539232, + "loss": 1.6385, + "loss_base2": 2.3639, + "loss_pixel": 0.1605, + "loss_text": 1.478, + "ppl": 5.1474, + "step": 10156 + }, + { + "epoch": 0.05, + "global_step": 10157, + "learning_rate": 0.00045844323873121866, + "loss": 1.6171, + "loss_base2": 2.333, + "loss_pixel": 0.1595, + "loss_text": 1.4576, + "ppl": 5.0385, + "step": 10157 + }, + { + "epoch": 0.05, + "global_step": 10158, + "learning_rate": 0.00045843906510851417, + "loss": 1.6105, + "loss_base2": 2.3235, + "loss_pixel": 0.1606, + "loss_text": 1.4498, + "ppl": 5.0053, + "step": 10158 + }, + { + "epoch": 0.05, + "global_step": 10159, + "learning_rate": 0.0004584348914858097, + "loss": 1.5627, + "loss_base2": 2.2545, + "loss_pixel": 0.1602, + "loss_text": 1.4025, + "ppl": 4.7717, + "step": 10159 + }, + { + "epoch": 0.05, + "global_step": 10160, + "learning_rate": 0.0004584307178631052, + "loss": 1.6111, + "loss_base2": 2.3243, + "loss_pixel": 0.1579, + "loss_text": 1.4532, + "ppl": 5.0083, + "step": 10160 + }, + { + "epoch": 0.05, + "global_step": 10161, + "learning_rate": 0.0004584265442404007, + "loss": 1.6268, + "loss_base2": 2.347, + "loss_pixel": 0.1597, + "loss_text": 1.4671, + "ppl": 5.0876, + "step": 10161 + }, + { + "epoch": 0.05, + "global_step": 10162, + "learning_rate": 0.00045842237061769614, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1605, + "loss_text": 1.4563, + "ppl": 5.0374, + "step": 10162 + }, + { + "epoch": 0.05, + "global_step": 10163, + "learning_rate": 0.00045841819699499165, + "loss": 1.6042, + "loss_base2": 2.3144, + "loss_pixel": 0.1595, + "loss_text": 1.4447, + "ppl": 4.9739, + "step": 10163 + }, + { + "epoch": 0.05, + "global_step": 10164, + "learning_rate": 0.00045841402337228716, + "loss": 1.6003, + "loss_base2": 2.3087, + "loss_pixel": 0.1584, + "loss_text": 1.4419, + "ppl": 4.9545, + "step": 10164 + }, + { + "epoch": 0.05, + "global_step": 10165, + "learning_rate": 0.00045840984974958266, + "loss": 1.6309, + "loss_base2": 2.3529, + "loss_pixel": 0.1595, + "loss_text": 1.4714, + "ppl": 5.1085, + "step": 10165 + }, + { + "epoch": 0.05, + "global_step": 10166, + "learning_rate": 0.0004584056761268781, + "loss": 1.6138, + "loss_base2": 2.3282, + "loss_pixel": 0.1597, + "loss_text": 1.4541, + "ppl": 5.0219, + "step": 10166 + }, + { + "epoch": 0.05, + "global_step": 10167, + "learning_rate": 0.0004584015025041736, + "loss": 1.6318, + "loss_base2": 2.3542, + "loss_pixel": 0.1593, + "loss_text": 1.4725, + "ppl": 5.1131, + "step": 10167 + }, + { + "epoch": 0.05, + "global_step": 10168, + "learning_rate": 0.00045839732888146913, + "loss": 1.6238, + "loss_base2": 2.3426, + "loss_pixel": 0.1604, + "loss_text": 1.4634, + "ppl": 5.0723, + "step": 10168 + }, + { + "epoch": 0.05, + "global_step": 10169, + "learning_rate": 0.00045839315525876464, + "loss": 1.6206, + "loss_base2": 2.338, + "loss_pixel": 0.16, + "loss_text": 1.4607, + "ppl": 5.0561, + "step": 10169 + }, + { + "epoch": 0.05, + "global_step": 10170, + "learning_rate": 0.00045838898163606015, + "loss": 1.6292, + "loss_base2": 2.3504, + "loss_pixel": 0.1598, + "loss_text": 1.4694, + "ppl": 5.0998, + "step": 10170 + }, + { + "epoch": 0.05, + "global_step": 10171, + "learning_rate": 0.0004583848080133556, + "loss": 1.6155, + "loss_base2": 2.3307, + "loss_pixel": 0.1593, + "loss_text": 1.4562, + "ppl": 5.0304, + "step": 10171 + }, + { + "epoch": 0.05, + "global_step": 10172, + "learning_rate": 0.0004583806343906511, + "loss": 1.6378, + "loss_base2": 2.3628, + "loss_pixel": 0.1589, + "loss_text": 1.4788, + "ppl": 5.1438, + "step": 10172 + }, + { + "epoch": 0.05, + "global_step": 10173, + "learning_rate": 0.0004583764607679466, + "loss": 1.6366, + "loss_base2": 2.3611, + "loss_pixel": 0.1591, + "loss_text": 1.4775, + "ppl": 5.1377, + "step": 10173 + }, + { + "epoch": 0.05, + "global_step": 10174, + "learning_rate": 0.0004583722871452421, + "loss": 1.6229, + "loss_base2": 2.3413, + "loss_pixel": 0.1592, + "loss_text": 1.4637, + "ppl": 5.0678, + "step": 10174 + }, + { + "epoch": 0.05, + "global_step": 10175, + "learning_rate": 0.0004583681135225376, + "loss": 1.6235, + "loss_base2": 2.3422, + "loss_pixel": 0.1587, + "loss_text": 1.4648, + "ppl": 5.0708, + "step": 10175 + }, + { + "epoch": 0.05, + "global_step": 10176, + "learning_rate": 0.00045836393989983303, + "loss": 1.6322, + "loss_base2": 2.3548, + "loss_pixel": 0.1603, + "loss_text": 1.4719, + "ppl": 5.1151, + "step": 10176 + }, + { + "epoch": 0.05, + "global_step": 10177, + "learning_rate": 0.00045835976627712854, + "loss": 1.6145, + "loss_base2": 2.3292, + "loss_pixel": 0.1604, + "loss_text": 1.4542, + "ppl": 5.0254, + "step": 10177 + }, + { + "epoch": 0.05, + "global_step": 10178, + "learning_rate": 0.00045835559265442404, + "loss": 1.6114, + "loss_base2": 2.3248, + "loss_pixel": 0.1603, + "loss_text": 1.4512, + "ppl": 5.0098, + "step": 10178 + }, + { + "epoch": 0.05, + "global_step": 10179, + "learning_rate": 0.00045835141903171955, + "loss": 1.6167, + "loss_base2": 2.3324, + "loss_pixel": 0.161, + "loss_text": 1.4557, + "ppl": 5.0364, + "step": 10179 + }, + { + "epoch": 0.05, + "global_step": 10180, + "learning_rate": 0.000458347245409015, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1607, + "loss_text": 1.4562, + "ppl": 5.0374, + "step": 10180 + }, + { + "epoch": 0.05, + "global_step": 10181, + "learning_rate": 0.0004583430717863105, + "loss": 1.6194, + "loss_base2": 2.3363, + "loss_pixel": 0.16, + "loss_text": 1.4594, + "ppl": 5.0501, + "step": 10181 + }, + { + "epoch": 0.05, + "global_step": 10182, + "learning_rate": 0.000458338898163606, + "loss": 1.6268, + "loss_base2": 2.347, + "loss_pixel": 0.1612, + "loss_text": 1.4656, + "ppl": 5.0876, + "step": 10182 + }, + { + "epoch": 0.05, + "global_step": 10183, + "learning_rate": 0.0004583347245409015, + "loss": 1.4355, + "loss_base2": 2.071, + "loss_pixel": 0.1592, + "loss_text": 1.2763, + "ppl": 4.2017, + "step": 10183 + }, + { + "epoch": 0.05, + "global_step": 10184, + "learning_rate": 0.00045833055091819703, + "loss": 1.4212, + "loss_base2": 2.0504, + "loss_pixel": 0.1604, + "loss_text": 1.2608, + "ppl": 4.1421, + "step": 10184 + }, + { + "epoch": 0.05, + "global_step": 10185, + "learning_rate": 0.0004583263772954925, + "loss": 1.3878, + "loss_base2": 2.0022, + "loss_pixel": 0.1606, + "loss_text": 1.2272, + "ppl": 4.006, + "step": 10185 + }, + { + "epoch": 0.05, + "global_step": 10186, + "learning_rate": 0.000458322203672788, + "loss": 1.4163, + "loss_base2": 2.0433, + "loss_pixel": 0.1599, + "loss_text": 1.2564, + "ppl": 4.1218, + "step": 10186 + }, + { + "epoch": 0.05, + "global_step": 10187, + "learning_rate": 0.0004583180300500835, + "loss": 1.4014, + "loss_base2": 2.0218, + "loss_pixel": 0.1591, + "loss_text": 1.2423, + "ppl": 4.0609, + "step": 10187 + }, + { + "epoch": 0.05, + "global_step": 10188, + "learning_rate": 0.000458313856427379, + "loss": 1.4221, + "loss_base2": 2.0517, + "loss_pixel": 0.1599, + "loss_text": 1.2622, + "ppl": 4.1458, + "step": 10188 + }, + { + "epoch": 0.05, + "global_step": 10189, + "learning_rate": 0.00045830968280467446, + "loss": 1.3934, + "loss_base2": 2.0103, + "loss_pixel": 0.1607, + "loss_text": 1.2327, + "ppl": 4.0285, + "step": 10189 + }, + { + "epoch": 0.05, + "global_step": 10190, + "learning_rate": 0.00045830550918196997, + "loss": 1.4023, + "loss_base2": 2.0231, + "loss_pixel": 0.1596, + "loss_text": 1.2428, + "ppl": 4.0645, + "step": 10190 + }, + { + "epoch": 0.05, + "global_step": 10191, + "learning_rate": 0.0004583013355592655, + "loss": 1.5397, + "loss_base2": 2.2213, + "loss_pixel": 0.1594, + "loss_text": 1.3802, + "ppl": 4.6632, + "step": 10191 + }, + { + "epoch": 0.05, + "global_step": 10192, + "learning_rate": 0.000458297161936561, + "loss": 1.6451, + "loss_base2": 2.3734, + "loss_pixel": 0.1598, + "loss_text": 1.4853, + "ppl": 5.1815, + "step": 10192 + }, + { + "epoch": 0.05, + "global_step": 10193, + "learning_rate": 0.00045829298831385644, + "loss": 1.6309, + "loss_base2": 2.3529, + "loss_pixel": 0.1616, + "loss_text": 1.4693, + "ppl": 5.1085, + "step": 10193 + }, + { + "epoch": 0.05, + "global_step": 10194, + "learning_rate": 0.0004582888146911519, + "loss": 1.6274, + "loss_base2": 2.3478, + "loss_pixel": 0.1607, + "loss_text": 1.4667, + "ppl": 5.0906, + "step": 10194 + }, + { + "epoch": 0.05, + "global_step": 10195, + "learning_rate": 0.0004582846410684474, + "loss": 1.6254, + "loss_base2": 2.345, + "loss_pixel": 0.1601, + "loss_text": 1.4653, + "ppl": 5.0805, + "step": 10195 + }, + { + "epoch": 0.05, + "global_step": 10196, + "learning_rate": 0.0004582804674457429, + "loss": 1.6427, + "loss_base2": 2.3699, + "loss_pixel": 0.1593, + "loss_text": 1.4833, + "ppl": 5.1691, + "step": 10196 + }, + { + "epoch": 0.05, + "global_step": 10197, + "learning_rate": 0.0004582762938230384, + "loss": 1.6085, + "loss_base2": 2.3206, + "loss_pixel": 0.1579, + "loss_text": 1.4506, + "ppl": 4.9953, + "step": 10197 + }, + { + "epoch": 0.05, + "global_step": 10198, + "learning_rate": 0.00045827212020033386, + "loss": 1.6085, + "loss_base2": 2.3206, + "loss_pixel": 0.1601, + "loss_text": 1.4484, + "ppl": 4.9953, + "step": 10198 + }, + { + "epoch": 0.05, + "global_step": 10199, + "learning_rate": 0.00045826794657762937, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1609, + "loss_text": 1.4627, + "ppl": 5.0718, + "step": 10199 + }, + { + "epoch": 0.05, + "global_step": 10200, + "learning_rate": 0.0004582637729549249, + "loss": 1.6371, + "loss_base2": 2.3618, + "loss_pixel": 0.1584, + "loss_text": 1.4787, + "ppl": 5.1402, + "step": 10200 + }, + { + "epoch": 0.05, + "global_step": 10201, + "learning_rate": 0.0004582595993322204, + "loss": 1.6066, + "loss_base2": 2.3178, + "loss_pixel": 0.1601, + "loss_text": 1.4465, + "ppl": 4.9858, + "step": 10201 + }, + { + "epoch": 0.05, + "global_step": 10202, + "learning_rate": 0.0004582554257095159, + "loss": 1.6156, + "loss_base2": 2.3308, + "loss_pixel": 0.1603, + "loss_text": 1.4553, + "ppl": 5.0309, + "step": 10202 + }, + { + "epoch": 0.05, + "global_step": 10203, + "learning_rate": 0.00045825125208681135, + "loss": 1.605, + "loss_base2": 2.3155, + "loss_pixel": 0.1603, + "loss_text": 1.4447, + "ppl": 4.9779, + "step": 10203 + }, + { + "epoch": 0.05, + "global_step": 10204, + "learning_rate": 0.00045824707846410685, + "loss": 1.6282, + "loss_base2": 2.349, + "loss_pixel": 0.1591, + "loss_text": 1.4691, + "ppl": 5.0947, + "step": 10204 + }, + { + "epoch": 0.05, + "global_step": 10205, + "learning_rate": 0.00045824290484140236, + "loss": 1.6246, + "loss_base2": 2.3438, + "loss_pixel": 0.1593, + "loss_text": 1.4654, + "ppl": 5.0764, + "step": 10205 + }, + { + "epoch": 0.05, + "global_step": 10206, + "learning_rate": 0.00045823873121869787, + "loss": 1.6144, + "loss_base2": 2.3291, + "loss_pixel": 0.1595, + "loss_text": 1.4549, + "ppl": 5.0249, + "step": 10206 + }, + { + "epoch": 0.05, + "global_step": 10207, + "learning_rate": 0.0004582345575959933, + "loss": 1.6236, + "loss_base2": 2.3424, + "loss_pixel": 0.1588, + "loss_text": 1.4649, + "ppl": 5.0713, + "step": 10207 + }, + { + "epoch": 0.05, + "global_step": 10208, + "learning_rate": 0.00045823038397328883, + "loss": 1.6244, + "loss_base2": 2.3435, + "loss_pixel": 0.1597, + "loss_text": 1.4647, + "ppl": 5.0754, + "step": 10208 + }, + { + "epoch": 0.05, + "global_step": 10209, + "learning_rate": 0.00045822621035058434, + "loss": 1.6172, + "loss_base2": 2.3331, + "loss_pixel": 0.1597, + "loss_text": 1.4575, + "ppl": 5.039, + "step": 10209 + }, + { + "epoch": 0.05, + "global_step": 10210, + "learning_rate": 0.00045822203672787984, + "loss": 1.6286, + "loss_base2": 2.3496, + "loss_pixel": 0.1599, + "loss_text": 1.4686, + "ppl": 5.0967, + "step": 10210 + }, + { + "epoch": 0.05, + "global_step": 10211, + "learning_rate": 0.00045821786310517535, + "loss": 1.6241, + "loss_base2": 2.3431, + "loss_pixel": 0.1588, + "loss_text": 1.4652, + "ppl": 5.0739, + "step": 10211 + }, + { + "epoch": 0.05, + "global_step": 10212, + "learning_rate": 0.00045821368948247075, + "loss": 1.616, + "loss_base2": 2.3314, + "loss_pixel": 0.1583, + "loss_text": 1.4577, + "ppl": 5.0329, + "step": 10212 + }, + { + "epoch": 0.05, + "global_step": 10213, + "learning_rate": 0.00045820951585976626, + "loss": 1.6235, + "loss_base2": 2.3422, + "loss_pixel": 0.1602, + "loss_text": 1.4634, + "ppl": 5.0708, + "step": 10213 + }, + { + "epoch": 0.05, + "global_step": 10214, + "learning_rate": 0.00045820534223706176, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1586, + "loss_text": 1.4674, + "ppl": 5.0835, + "step": 10214 + }, + { + "epoch": 0.05, + "global_step": 10215, + "learning_rate": 0.00045820116861435727, + "loss": 1.6248, + "loss_base2": 2.3441, + "loss_pixel": 0.1591, + "loss_text": 1.4658, + "ppl": 5.0774, + "step": 10215 + }, + { + "epoch": 0.05, + "global_step": 10216, + "learning_rate": 0.0004581969949916527, + "loss": 1.5896, + "loss_base2": 2.2933, + "loss_pixel": 0.1604, + "loss_text": 1.4292, + "ppl": 4.9018, + "step": 10216 + }, + { + "epoch": 0.05, + "global_step": 10217, + "learning_rate": 0.00045819282136894823, + "loss": 1.6365, + "loss_base2": 2.361, + "loss_pixel": 0.1577, + "loss_text": 1.4788, + "ppl": 5.1372, + "step": 10217 + }, + { + "epoch": 0.05, + "global_step": 10218, + "learning_rate": 0.00045818864774624374, + "loss": 1.6105, + "loss_base2": 2.3235, + "loss_pixel": 0.1599, + "loss_text": 1.4505, + "ppl": 5.0053, + "step": 10218 + }, + { + "epoch": 0.05, + "global_step": 10219, + "learning_rate": 0.00045818447412353925, + "loss": 1.614, + "loss_base2": 2.3285, + "loss_pixel": 0.1588, + "loss_text": 1.4552, + "ppl": 5.0229, + "step": 10219 + }, + { + "epoch": 0.05, + "global_step": 10220, + "learning_rate": 0.00045818030050083475, + "loss": 1.6236, + "loss_base2": 2.3424, + "loss_pixel": 0.1594, + "loss_text": 1.4641, + "ppl": 5.0713, + "step": 10220 + }, + { + "epoch": 0.05, + "global_step": 10221, + "learning_rate": 0.0004581761268781302, + "loss": 1.6278, + "loss_base2": 2.3484, + "loss_pixel": 0.1595, + "loss_text": 1.4683, + "ppl": 5.0927, + "step": 10221 + }, + { + "epoch": 0.05, + "global_step": 10222, + "learning_rate": 0.0004581719532554257, + "loss": 1.5978, + "loss_base2": 2.3051, + "loss_pixel": 0.1594, + "loss_text": 1.4384, + "ppl": 4.9421, + "step": 10222 + }, + { + "epoch": 0.05, + "global_step": 10223, + "learning_rate": 0.0004581677796327212, + "loss": 1.6273, + "loss_base2": 2.3477, + "loss_pixel": 0.1599, + "loss_text": 1.4674, + "ppl": 5.0901, + "step": 10223 + }, + { + "epoch": 0.05, + "global_step": 10224, + "learning_rate": 0.00045816360601001673, + "loss": 1.6138, + "loss_base2": 2.3282, + "loss_pixel": 0.1596, + "loss_text": 1.4542, + "ppl": 5.0219, + "step": 10224 + }, + { + "epoch": 0.05, + "global_step": 10225, + "learning_rate": 0.0004581594323873122, + "loss": 1.6278, + "loss_base2": 2.3484, + "loss_pixel": 0.16, + "loss_text": 1.4678, + "ppl": 5.0927, + "step": 10225 + }, + { + "epoch": 0.05, + "global_step": 10226, + "learning_rate": 0.0004581552587646077, + "loss": 1.6147, + "loss_base2": 2.3295, + "loss_pixel": 0.1591, + "loss_text": 1.4556, + "ppl": 5.0264, + "step": 10226 + }, + { + "epoch": 0.05, + "global_step": 10227, + "learning_rate": 0.0004581510851419032, + "loss": 1.6123, + "loss_base2": 2.3261, + "loss_pixel": 0.1584, + "loss_text": 1.4539, + "ppl": 5.0143, + "step": 10227 + }, + { + "epoch": 0.05, + "global_step": 10228, + "learning_rate": 0.0004581469115191987, + "loss": 1.6161, + "loss_base2": 2.3315, + "loss_pixel": 0.1595, + "loss_text": 1.4566, + "ppl": 5.0334, + "step": 10228 + }, + { + "epoch": 0.05, + "global_step": 10229, + "learning_rate": 0.0004581427378964942, + "loss": 1.6074, + "loss_base2": 2.319, + "loss_pixel": 0.1604, + "loss_text": 1.447, + "ppl": 4.9898, + "step": 10229 + }, + { + "epoch": 0.05, + "global_step": 10230, + "learning_rate": 0.00045813856427378966, + "loss": 1.6225, + "loss_base2": 2.3408, + "loss_pixel": 0.1595, + "loss_text": 1.4631, + "ppl": 5.0657, + "step": 10230 + }, + { + "epoch": 0.05, + "global_step": 10231, + "learning_rate": 0.0004581343906510851, + "loss": 1.6274, + "loss_base2": 2.3478, + "loss_pixel": 0.1607, + "loss_text": 1.4667, + "ppl": 5.0906, + "step": 10231 + }, + { + "epoch": 0.05, + "global_step": 10232, + "learning_rate": 0.0004581302170283806, + "loss": 1.6204, + "loss_base2": 2.3377, + "loss_pixel": 0.1601, + "loss_text": 1.4603, + "ppl": 5.0551, + "step": 10232 + }, + { + "epoch": 0.05, + "global_step": 10233, + "learning_rate": 0.00045812604340567613, + "loss": 1.6037, + "loss_base2": 2.3137, + "loss_pixel": 0.1602, + "loss_text": 1.4435, + "ppl": 4.9714, + "step": 10233 + }, + { + "epoch": 0.05, + "global_step": 10234, + "learning_rate": 0.00045812186978297164, + "loss": 1.6295, + "loss_base2": 2.3509, + "loss_pixel": 0.1653, + "loss_text": 1.4642, + "ppl": 5.1013, + "step": 10234 + }, + { + "epoch": 0.05, + "global_step": 10235, + "learning_rate": 0.0004581176961602671, + "loss": 1.6271, + "loss_base2": 2.3474, + "loss_pixel": 0.1856, + "loss_text": 1.4415, + "ppl": 5.0891, + "step": 10235 + }, + { + "epoch": 0.05, + "global_step": 10236, + "learning_rate": 0.0004581135225375626, + "loss": 1.7151, + "loss_base2": 2.4744, + "loss_pixel": 0.264, + "loss_text": 1.4511, + "ppl": 5.5572, + "step": 10236 + }, + { + "epoch": 0.05, + "global_step": 10237, + "learning_rate": 0.0004581093489148581, + "loss": 1.7809, + "loss_base2": 2.5693, + "loss_pixel": 0.3268, + "loss_text": 1.4541, + "ppl": 5.9352, + "step": 10237 + }, + { + "epoch": 0.05, + "global_step": 10238, + "learning_rate": 0.0004581051752921536, + "loss": 1.7946, + "loss_base2": 2.5891, + "loss_pixel": 0.318, + "loss_text": 1.4766, + "ppl": 6.0171, + "step": 10238 + }, + { + "epoch": 0.05, + "global_step": 10239, + "learning_rate": 0.00045810100166944907, + "loss": 1.7888, + "loss_base2": 2.5807, + "loss_pixel": 0.3322, + "loss_text": 1.4567, + "ppl": 5.9823, + "step": 10239 + }, + { + "epoch": 0.05, + "global_step": 10240, + "learning_rate": 0.0004580968280467446, + "loss": 1.825, + "loss_base2": 2.6329, + "loss_pixel": 0.3643, + "loss_text": 1.4607, + "ppl": 6.2028, + "step": 10240 + }, + { + "epoch": 0.05, + "global_step": 10241, + "learning_rate": 0.0004580926544240401, + "loss": 1.999, + "loss_base2": 2.8839, + "loss_pixel": 0.5276, + "loss_text": 1.4714, + "ppl": 7.3817, + "step": 10241 + }, + { + "epoch": 0.05, + "global_step": 10242, + "learning_rate": 0.0004580884808013356, + "loss": 1.8992, + "loss_base2": 2.74, + "loss_pixel": 0.4207, + "loss_text": 1.4785, + "ppl": 6.6805, + "step": 10242 + }, + { + "epoch": 0.05, + "global_step": 10243, + "learning_rate": 0.0004580843071786311, + "loss": 3.1755, + "loss_base2": 4.5813, + "loss_pixel": 0.3909, + "loss_text": 2.7846, + "ppl": 23.9388, + "step": 10243 + }, + { + "epoch": 0.05, + "global_step": 10244, + "learning_rate": 0.00045808013355592655, + "loss": 1.9908, + "loss_base2": 2.8721, + "loss_pixel": 0.4007, + "loss_text": 1.59, + "ppl": 7.3214, + "step": 10244 + }, + { + "epoch": 0.05, + "global_step": 10245, + "learning_rate": 0.00045807595993322206, + "loss": 2.0647, + "loss_base2": 2.9787, + "loss_pixel": 0.3845, + "loss_text": 1.6802, + "ppl": 7.8829, + "step": 10245 + }, + { + "epoch": 0.05, + "global_step": 10246, + "learning_rate": 0.00045807178631051756, + "loss": 2.3418, + "loss_base2": 3.3785, + "loss_pixel": 0.3774, + "loss_text": 1.9644, + "ppl": 10.3999, + "step": 10246 + }, + { + "epoch": 0.05, + "global_step": 10247, + "learning_rate": 0.00045806761268781307, + "loss": 2.1428, + "loss_base2": 3.0914, + "loss_pixel": 0.3734, + "loss_text": 1.7695, + "ppl": 8.5233, + "step": 10247 + }, + { + "epoch": 0.05, + "global_step": 10248, + "learning_rate": 0.0004580634390651085, + "loss": 2.1566, + "loss_base2": 3.1113, + "loss_pixel": 0.3695, + "loss_text": 1.7871, + "ppl": 8.6417, + "step": 10248 + }, + { + "epoch": 0.05, + "global_step": 10249, + "learning_rate": 0.000458059265442404, + "loss": 2.0995, + "loss_base2": 3.0289, + "loss_pixel": 0.3642, + "loss_text": 1.7352, + "ppl": 8.1621, + "step": 10249 + }, + { + "epoch": 0.05, + "global_step": 10250, + "learning_rate": 0.0004580550918196995, + "loss": 2.1066, + "loss_base2": 3.0392, + "loss_pixel": 0.3785, + "loss_text": 1.7281, + "ppl": 8.2202, + "step": 10250 + }, + { + "epoch": 0.05, + "global_step": 10251, + "learning_rate": 0.000458050918196995, + "loss": 2.1481, + "loss_base2": 3.0991, + "loss_pixel": 0.3896, + "loss_text": 1.7584, + "ppl": 8.5686, + "step": 10251 + }, + { + "epoch": 0.05, + "global_step": 10252, + "learning_rate": 0.0004580467445742905, + "loss": 2.2478, + "loss_base2": 3.2429, + "loss_pixel": 0.4189, + "loss_text": 1.8288, + "ppl": 9.4669, + "step": 10252 + }, + { + "epoch": 0.05, + "global_step": 10253, + "learning_rate": 0.00045804257095158595, + "loss": 2.1524, + "loss_base2": 3.1053, + "loss_pixel": 0.381, + "loss_text": 1.7714, + "ppl": 8.6055, + "step": 10253 + }, + { + "epoch": 0.05, + "global_step": 10254, + "learning_rate": 0.00045803839732888146, + "loss": 2.2621, + "loss_base2": 3.2635, + "loss_pixel": 0.4025, + "loss_text": 1.8596, + "ppl": 9.6032, + "step": 10254 + }, + { + "epoch": 0.05, + "global_step": 10255, + "learning_rate": 0.00045803422370617697, + "loss": 2.2272, + "loss_base2": 3.2132, + "loss_pixel": 0.3859, + "loss_text": 1.8413, + "ppl": 9.2739, + "step": 10255 + }, + { + "epoch": 0.05, + "global_step": 10256, + "learning_rate": 0.0004580300500834725, + "loss": 2.2254, + "loss_base2": 3.2106, + "loss_pixel": 0.3858, + "loss_text": 1.8396, + "ppl": 9.2572, + "step": 10256 + }, + { + "epoch": 0.05, + "global_step": 10257, + "learning_rate": 0.00045802587646076793, + "loss": 2.2007, + "loss_base2": 3.1749, + "loss_pixel": 0.3836, + "loss_text": 1.8171, + "ppl": 9.0313, + "step": 10257 + }, + { + "epoch": 0.05, + "global_step": 10258, + "learning_rate": 0.00045802170283806344, + "loss": 2.1631, + "loss_base2": 3.1207, + "loss_pixel": 0.3854, + "loss_text": 1.7777, + "ppl": 8.6981, + "step": 10258 + }, + { + "epoch": 0.05, + "global_step": 10259, + "learning_rate": 0.00045801752921535894, + "loss": 2.138, + "loss_base2": 3.0845, + "loss_pixel": 0.3786, + "loss_text": 1.7594, + "ppl": 8.4825, + "step": 10259 + }, + { + "epoch": 0.05, + "global_step": 10260, + "learning_rate": 0.00045801335559265445, + "loss": 2.1293, + "loss_base2": 3.0719, + "loss_pixel": 0.3833, + "loss_text": 1.746, + "ppl": 8.409, + "step": 10260 + }, + { + "epoch": 0.05, + "global_step": 10261, + "learning_rate": 0.00045800918196994996, + "loss": 2.102, + "loss_base2": 3.0325, + "loss_pixel": 0.375, + "loss_text": 1.7271, + "ppl": 8.1825, + "step": 10261 + }, + { + "epoch": 0.05, + "global_step": 10262, + "learning_rate": 0.0004580050083472454, + "loss": 2.0947, + "loss_base2": 3.022, + "loss_pixel": 0.3733, + "loss_text": 1.7214, + "ppl": 8.123, + "step": 10262 + }, + { + "epoch": 0.05, + "global_step": 10263, + "learning_rate": 0.0004580008347245409, + "loss": 2.0847, + "loss_base2": 3.0076, + "loss_pixel": 0.3719, + "loss_text": 1.7128, + "ppl": 8.0422, + "step": 10263 + }, + { + "epoch": 0.05, + "global_step": 10264, + "learning_rate": 0.0004579966611018364, + "loss": 2.078, + "loss_base2": 2.9979, + "loss_pixel": 0.3675, + "loss_text": 1.7106, + "ppl": 7.9885, + "step": 10264 + }, + { + "epoch": 0.05, + "global_step": 10265, + "learning_rate": 0.00045799248747913193, + "loss": 2.1951, + "loss_base2": 3.1669, + "loss_pixel": 0.3668, + "loss_text": 1.8283, + "ppl": 8.9809, + "step": 10265 + }, + { + "epoch": 0.05, + "global_step": 10266, + "learning_rate": 0.0004579883138564274, + "loss": 2.1254, + "loss_base2": 3.0663, + "loss_pixel": 0.3627, + "loss_text": 1.7627, + "ppl": 8.3762, + "step": 10266 + }, + { + "epoch": 0.05, + "global_step": 10267, + "learning_rate": 0.0004579841402337229, + "loss": 2.1594, + "loss_base2": 3.1154, + "loss_pixel": 0.3603, + "loss_text": 1.7991, + "ppl": 8.6659, + "step": 10267 + }, + { + "epoch": 0.05, + "global_step": 10268, + "learning_rate": 0.00045797996661101835, + "loss": 2.16, + "loss_base2": 3.1162, + "loss_pixel": 0.3563, + "loss_text": 1.8036, + "ppl": 8.6711, + "step": 10268 + }, + { + "epoch": 0.05, + "global_step": 10269, + "learning_rate": 0.00045797579298831385, + "loss": 2.1401, + "loss_base2": 3.0875, + "loss_pixel": 0.353, + "loss_text": 1.7871, + "ppl": 8.5003, + "step": 10269 + }, + { + "epoch": 0.05, + "global_step": 10270, + "learning_rate": 0.00045797161936560936, + "loss": 2.1068, + "loss_base2": 3.0395, + "loss_pixel": 0.3495, + "loss_text": 1.7573, + "ppl": 8.2219, + "step": 10270 + }, + { + "epoch": 0.05, + "global_step": 10271, + "learning_rate": 0.0004579674457429048, + "loss": 2.092, + "loss_base2": 3.0181, + "loss_pixel": 0.3498, + "loss_text": 1.7422, + "ppl": 8.1011, + "step": 10271 + }, + { + "epoch": 0.05, + "global_step": 10272, + "learning_rate": 0.0004579632721202003, + "loss": 2.0912, + "loss_base2": 3.017, + "loss_pixel": 0.3502, + "loss_text": 1.7409, + "ppl": 8.0946, + "step": 10272 + }, + { + "epoch": 0.05, + "global_step": 10273, + "learning_rate": 0.00045795909849749583, + "loss": 2.0878, + "loss_base2": 3.0121, + "loss_pixel": 0.375, + "loss_text": 1.7128, + "ppl": 8.0671, + "step": 10273 + }, + { + "epoch": 0.05, + "global_step": 10274, + "learning_rate": 0.00045795492487479134, + "loss": 2.0887, + "loss_base2": 3.0134, + "loss_pixel": 0.3887, + "loss_text": 1.7, + "ppl": 8.0744, + "step": 10274 + }, + { + "epoch": 0.05, + "global_step": 10275, + "learning_rate": 0.0004579507512520868, + "loss": 2.0726, + "loss_base2": 2.9901, + "loss_pixel": 0.375, + "loss_text": 1.6976, + "ppl": 7.9455, + "step": 10275 + }, + { + "epoch": 0.05, + "global_step": 10276, + "learning_rate": 0.0004579465776293823, + "loss": 2.065, + "loss_base2": 2.9792, + "loss_pixel": 0.382, + "loss_text": 1.683, + "ppl": 7.8853, + "step": 10276 + }, + { + "epoch": 0.05, + "global_step": 10277, + "learning_rate": 0.0004579424040066778, + "loss": 2.0739, + "loss_base2": 2.992, + "loss_pixel": 0.3821, + "loss_text": 1.6918, + "ppl": 7.9558, + "step": 10277 + }, + { + "epoch": 0.05, + "global_step": 10278, + "learning_rate": 0.0004579382303839733, + "loss": 2.0417, + "loss_base2": 2.9456, + "loss_pixel": 0.3743, + "loss_text": 1.6674, + "ppl": 7.7037, + "step": 10278 + }, + { + "epoch": 0.05, + "global_step": 10279, + "learning_rate": 0.0004579340567612688, + "loss": 2.031, + "loss_base2": 2.9301, + "loss_pixel": 0.3751, + "loss_text": 1.6559, + "ppl": 7.6217, + "step": 10279 + }, + { + "epoch": 0.05, + "global_step": 10280, + "learning_rate": 0.00045792988313856427, + "loss": 2.0189, + "loss_base2": 2.9127, + "loss_pixel": 0.3719, + "loss_text": 1.6469, + "ppl": 7.53, + "step": 10280 + }, + { + "epoch": 0.05, + "global_step": 10281, + "learning_rate": 0.0004579257095158598, + "loss": 2.0331, + "loss_base2": 2.9331, + "loss_pixel": 0.3745, + "loss_text": 1.6585, + "ppl": 7.6377, + "step": 10281 + }, + { + "epoch": 0.05, + "global_step": 10282, + "learning_rate": 0.0004579215358931553, + "loss": 1.9917, + "loss_base2": 2.8734, + "loss_pixel": 0.3689, + "loss_text": 1.6228, + "ppl": 7.328, + "step": 10282 + }, + { + "epoch": 0.05, + "global_step": 10283, + "learning_rate": 0.0004579173622704508, + "loss": 1.997, + "loss_base2": 2.8811, + "loss_pixel": 0.3709, + "loss_text": 1.6261, + "ppl": 7.3669, + "step": 10283 + }, + { + "epoch": 0.05, + "global_step": 10284, + "learning_rate": 0.00045791318864774625, + "loss": 1.863, + "loss_base2": 2.6877, + "loss_pixel": 0.373, + "loss_text": 1.49, + "ppl": 6.443, + "step": 10284 + }, + { + "epoch": 0.05, + "global_step": 10285, + "learning_rate": 0.00045790901502504175, + "loss": 1.7612, + "loss_base2": 2.5409, + "loss_pixel": 0.3658, + "loss_text": 1.3953, + "ppl": 5.8194, + "step": 10285 + }, + { + "epoch": 0.05, + "global_step": 10286, + "learning_rate": 0.00045790484140233726, + "loss": 1.7749, + "loss_base2": 2.5606, + "loss_pixel": 0.3729, + "loss_text": 1.402, + "ppl": 5.8997, + "step": 10286 + }, + { + "epoch": 0.05, + "global_step": 10287, + "learning_rate": 0.0004579006677796327, + "loss": 1.7797, + "loss_base2": 2.5676, + "loss_pixel": 0.3809, + "loss_text": 1.3988, + "ppl": 5.9281, + "step": 10287 + }, + { + "epoch": 0.05, + "global_step": 10288, + "learning_rate": 0.0004578964941569282, + "loss": 1.7786, + "loss_base2": 2.566, + "loss_pixel": 0.3847, + "loss_text": 1.3939, + "ppl": 5.9216, + "step": 10288 + }, + { + "epoch": 0.05, + "global_step": 10289, + "learning_rate": 0.0004578923205342237, + "loss": 1.7673, + "loss_base2": 2.5497, + "loss_pixel": 0.3804, + "loss_text": 1.3869, + "ppl": 5.855, + "step": 10289 + }, + { + "epoch": 0.05, + "global_step": 10290, + "learning_rate": 0.0004578881469115192, + "loss": 1.7583, + "loss_base2": 2.5367, + "loss_pixel": 0.3755, + "loss_text": 1.3829, + "ppl": 5.8026, + "step": 10290 + }, + { + "epoch": 0.05, + "global_step": 10291, + "learning_rate": 0.0004578839732888147, + "loss": 1.8285, + "loss_base2": 2.638, + "loss_pixel": 0.3758, + "loss_text": 1.4528, + "ppl": 6.2245, + "step": 10291 + }, + { + "epoch": 0.05, + "global_step": 10292, + "learning_rate": 0.0004578797996661102, + "loss": 1.9966, + "loss_base2": 2.8805, + "loss_pixel": 0.3751, + "loss_text": 1.6215, + "ppl": 7.364, + "step": 10292 + }, + { + "epoch": 0.05, + "global_step": 10293, + "learning_rate": 0.0004578756260434057, + "loss": 1.9721, + "loss_base2": 2.8451, + "loss_pixel": 0.3714, + "loss_text": 1.6007, + "ppl": 7.1858, + "step": 10293 + }, + { + "epoch": 0.05, + "global_step": 10294, + "learning_rate": 0.00045787145242070116, + "loss": 1.9723, + "loss_base2": 2.8454, + "loss_pixel": 0.3704, + "loss_text": 1.6019, + "ppl": 7.1872, + "step": 10294 + }, + { + "epoch": 0.05, + "global_step": 10295, + "learning_rate": 0.00045786727879799666, + "loss": 1.96, + "loss_base2": 2.8277, + "loss_pixel": 0.3675, + "loss_text": 1.5925, + "ppl": 7.0993, + "step": 10295 + }, + { + "epoch": 0.05, + "global_step": 10296, + "learning_rate": 0.00045786310517529217, + "loss": 1.9699, + "loss_base2": 2.842, + "loss_pixel": 0.3662, + "loss_text": 1.6036, + "ppl": 7.17, + "step": 10296 + }, + { + "epoch": 0.05, + "global_step": 10297, + "learning_rate": 0.0004578589315525877, + "loss": 1.9508, + "loss_base2": 2.8144, + "loss_pixel": 0.3652, + "loss_text": 1.5856, + "ppl": 7.0343, + "step": 10297 + }, + { + "epoch": 0.05, + "global_step": 10298, + "learning_rate": 0.00045785475792988313, + "loss": 1.936, + "loss_base2": 2.7931, + "loss_pixel": 0.3645, + "loss_text": 1.5715, + "ppl": 6.931, + "step": 10298 + }, + { + "epoch": 0.05, + "global_step": 10299, + "learning_rate": 0.00045785058430717864, + "loss": 1.9509, + "loss_base2": 2.8146, + "loss_pixel": 0.3626, + "loss_text": 1.5883, + "ppl": 7.035, + "step": 10299 + }, + { + "epoch": 0.05, + "global_step": 10300, + "learning_rate": 0.00045784641068447415, + "loss": 1.9274, + "loss_base2": 2.7807, + "loss_pixel": 0.3585, + "loss_text": 1.5689, + "ppl": 6.8716, + "step": 10300 + }, + { + "epoch": 0.05, + "global_step": 10301, + "learning_rate": 0.00045784223706176965, + "loss": 1.941, + "loss_base2": 2.8003, + "loss_pixel": 0.3561, + "loss_text": 1.5848, + "ppl": 6.9657, + "step": 10301 + }, + { + "epoch": 0.05, + "global_step": 10302, + "learning_rate": 0.00045783806343906516, + "loss": 1.8793, + "loss_base2": 2.7113, + "loss_pixel": 0.354, + "loss_text": 1.5253, + "ppl": 6.5489, + "step": 10302 + }, + { + "epoch": 0.05, + "global_step": 10303, + "learning_rate": 0.0004578338898163606, + "loss": 1.9086, + "loss_base2": 2.7535, + "loss_pixel": 0.3515, + "loss_text": 1.557, + "ppl": 6.7436, + "step": 10303 + }, + { + "epoch": 0.05, + "global_step": 10304, + "learning_rate": 0.0004578297161936561, + "loss": 1.9184, + "loss_base2": 2.7677, + "loss_pixel": 0.3519, + "loss_text": 1.5665, + "ppl": 6.8101, + "step": 10304 + }, + { + "epoch": 0.05, + "global_step": 10305, + "learning_rate": 0.00045782554257095163, + "loss": 1.9171, + "loss_base2": 2.7658, + "loss_pixel": 0.3494, + "loss_text": 1.5676, + "ppl": 6.8012, + "step": 10305 + }, + { + "epoch": 0.05, + "global_step": 10306, + "learning_rate": 0.0004578213689482471, + "loss": 1.8964, + "loss_base2": 2.7359, + "loss_pixel": 0.3476, + "loss_text": 1.5487, + "ppl": 6.6619, + "step": 10306 + }, + { + "epoch": 0.05, + "global_step": 10307, + "learning_rate": 0.00045781719532554254, + "loss": 1.8892, + "loss_base2": 2.7255, + "loss_pixel": 0.3464, + "loss_text": 1.5428, + "ppl": 6.6141, + "step": 10307 + }, + { + "epoch": 0.05, + "global_step": 10308, + "learning_rate": 0.00045781302170283804, + "loss": 1.893, + "loss_base2": 2.731, + "loss_pixel": 0.3455, + "loss_text": 1.5475, + "ppl": 6.6393, + "step": 10308 + }, + { + "epoch": 0.05, + "global_step": 10309, + "learning_rate": 0.00045780884808013355, + "loss": 1.8998, + "loss_base2": 2.7408, + "loss_pixel": 0.3437, + "loss_text": 1.5561, + "ppl": 6.6846, + "step": 10309 + }, + { + "epoch": 0.05, + "global_step": 10310, + "learning_rate": 0.00045780467445742906, + "loss": 1.8819, + "loss_base2": 2.715, + "loss_pixel": 0.343, + "loss_text": 1.5389, + "ppl": 6.566, + "step": 10310 + }, + { + "epoch": 0.05, + "global_step": 10311, + "learning_rate": 0.00045780050083472456, + "loss": 1.9056, + "loss_base2": 2.7492, + "loss_pixel": 0.3428, + "loss_text": 1.5628, + "ppl": 6.7234, + "step": 10311 + }, + { + "epoch": 0.05, + "global_step": 10312, + "learning_rate": 0.00045779632721202, + "loss": 1.8833, + "loss_base2": 2.717, + "loss_pixel": 0.3423, + "loss_text": 1.541, + "ppl": 6.5752, + "step": 10312 + }, + { + "epoch": 0.05, + "global_step": 10313, + "learning_rate": 0.0004577921535893155, + "loss": 1.885, + "loss_base2": 2.7195, + "loss_pixel": 0.3442, + "loss_text": 1.5408, + "ppl": 6.5864, + "step": 10313 + }, + { + "epoch": 0.05, + "global_step": 10314, + "learning_rate": 0.00045778797996661103, + "loss": 1.8575, + "loss_base2": 2.6798, + "loss_pixel": 0.3409, + "loss_text": 1.5166, + "ppl": 6.4077, + "step": 10314 + }, + { + "epoch": 0.05, + "global_step": 10315, + "learning_rate": 0.00045778380634390654, + "loss": 1.8756, + "loss_base2": 2.7059, + "loss_pixel": 0.3439, + "loss_text": 1.5317, + "ppl": 6.5247, + "step": 10315 + }, + { + "epoch": 0.05, + "global_step": 10316, + "learning_rate": 0.000457779632721202, + "loss": 1.6724, + "loss_base2": 2.4128, + "loss_pixel": 0.3468, + "loss_text": 1.3256, + "ppl": 5.3249, + "step": 10316 + }, + { + "epoch": 0.05, + "global_step": 10317, + "learning_rate": 0.0004577754590984975, + "loss": 1.6673, + "loss_base2": 2.4054, + "loss_pixel": 0.3489, + "loss_text": 1.3183, + "ppl": 5.2978, + "step": 10317 + }, + { + "epoch": 0.05, + "global_step": 10318, + "learning_rate": 0.000457771285475793, + "loss": 1.6813, + "loss_base2": 2.4256, + "loss_pixel": 0.3448, + "loss_text": 1.3365, + "ppl": 5.3725, + "step": 10318 + }, + { + "epoch": 0.05, + "global_step": 10319, + "learning_rate": 0.0004577671118530885, + "loss": 1.6452, + "loss_base2": 2.3735, + "loss_pixel": 0.3435, + "loss_text": 1.3016, + "ppl": 5.182, + "step": 10319 + }, + { + "epoch": 0.05, + "global_step": 10320, + "learning_rate": 0.000457762938230384, + "loss": 1.6513, + "loss_base2": 2.3823, + "loss_pixel": 0.3439, + "loss_text": 1.3074, + "ppl": 5.2138, + "step": 10320 + }, + { + "epoch": 0.05, + "global_step": 10321, + "learning_rate": 0.0004577587646076795, + "loss": 1.6471, + "loss_base2": 2.3763, + "loss_pixel": 0.3423, + "loss_text": 1.3048, + "ppl": 5.1919, + "step": 10321 + }, + { + "epoch": 0.05, + "global_step": 10322, + "learning_rate": 0.000457754590984975, + "loss": 1.6541, + "loss_base2": 2.3864, + "loss_pixel": 0.3408, + "loss_text": 1.3133, + "ppl": 5.2284, + "step": 10322 + }, + { + "epoch": 0.05, + "global_step": 10323, + "learning_rate": 0.0004577504173622705, + "loss": 1.7532, + "loss_base2": 2.5293, + "loss_pixel": 0.3421, + "loss_text": 1.4111, + "ppl": 5.773, + "step": 10323 + }, + { + "epoch": 0.05, + "global_step": 10324, + "learning_rate": 0.000457746243739566, + "loss": 1.8951, + "loss_base2": 2.7341, + "loss_pixel": 0.3402, + "loss_text": 1.5549, + "ppl": 6.6532, + "step": 10324 + }, + { + "epoch": 0.05, + "global_step": 10325, + "learning_rate": 0.0004577420701168614, + "loss": 1.8791, + "loss_base2": 2.711, + "loss_pixel": 0.3403, + "loss_text": 1.5388, + "ppl": 6.5476, + "step": 10325 + }, + { + "epoch": 0.05, + "global_step": 10326, + "learning_rate": 0.0004577378964941569, + "loss": 1.8926, + "loss_base2": 2.7304, + "loss_pixel": 0.3387, + "loss_text": 1.554, + "ppl": 6.6366, + "step": 10326 + }, + { + "epoch": 0.05, + "global_step": 10327, + "learning_rate": 0.0004577337228714524, + "loss": 1.8669, + "loss_base2": 2.6934, + "loss_pixel": 0.3371, + "loss_text": 1.5298, + "ppl": 6.4682, + "step": 10327 + }, + { + "epoch": 0.05, + "global_step": 10328, + "learning_rate": 0.0004577295492487479, + "loss": 1.8664, + "loss_base2": 2.6926, + "loss_pixel": 0.3366, + "loss_text": 1.5298, + "ppl": 6.465, + "step": 10328 + }, + { + "epoch": 0.05, + "global_step": 10329, + "learning_rate": 0.0004577253756260434, + "loss": 1.8517, + "loss_base2": 2.6714, + "loss_pixel": 0.336, + "loss_text": 1.5157, + "ppl": 6.3706, + "step": 10329 + }, + { + "epoch": 0.05, + "global_step": 10330, + "learning_rate": 0.0004577212020033389, + "loss": 1.858, + "loss_base2": 2.6805, + "loss_pixel": 0.3362, + "loss_text": 1.5218, + "ppl": 6.4109, + "step": 10330 + }, + { + "epoch": 0.05, + "global_step": 10331, + "learning_rate": 0.0004577170283806344, + "loss": 1.857, + "loss_base2": 2.6791, + "loss_pixel": 0.3348, + "loss_text": 1.5222, + "ppl": 6.4045, + "step": 10331 + }, + { + "epoch": 0.05, + "global_step": 10332, + "learning_rate": 0.0004577128547579299, + "loss": 1.8636, + "loss_base2": 2.6886, + "loss_pixel": 0.3339, + "loss_text": 1.5297, + "ppl": 6.4469, + "step": 10332 + }, + { + "epoch": 0.05, + "global_step": 10333, + "learning_rate": 0.0004577086811352254, + "loss": 1.8631, + "loss_base2": 2.6879, + "loss_pixel": 0.3321, + "loss_text": 1.531, + "ppl": 6.4437, + "step": 10333 + }, + { + "epoch": 0.05, + "global_step": 10334, + "learning_rate": 0.00045770450751252085, + "loss": 1.85, + "loss_base2": 2.669, + "loss_pixel": 0.3315, + "loss_text": 1.5185, + "ppl": 6.3598, + "step": 10334 + }, + { + "epoch": 0.05, + "global_step": 10335, + "learning_rate": 0.00045770033388981636, + "loss": 1.8627, + "loss_base2": 2.6873, + "loss_pixel": 0.3361, + "loss_text": 1.5266, + "ppl": 6.4411, + "step": 10335 + }, + { + "epoch": 0.05, + "global_step": 10336, + "learning_rate": 0.00045769616026711187, + "loss": 1.8492, + "loss_base2": 2.6678, + "loss_pixel": 0.3383, + "loss_text": 1.5109, + "ppl": 6.3547, + "step": 10336 + }, + { + "epoch": 0.05, + "global_step": 10337, + "learning_rate": 0.0004576919866444074, + "loss": 1.8638, + "loss_base2": 2.6889, + "loss_pixel": 0.3334, + "loss_text": 1.5304, + "ppl": 6.4482, + "step": 10337 + }, + { + "epoch": 0.05, + "global_step": 10338, + "learning_rate": 0.0004576878130217029, + "loss": 1.8321, + "loss_base2": 2.6432, + "loss_pixel": 0.3346, + "loss_text": 1.4974, + "ppl": 6.247, + "step": 10338 + }, + { + "epoch": 0.05, + "global_step": 10339, + "learning_rate": 0.00045768363939899834, + "loss": 1.8389, + "loss_base2": 2.653, + "loss_pixel": 0.3303, + "loss_text": 1.5086, + "ppl": 6.2896, + "step": 10339 + }, + { + "epoch": 0.05, + "global_step": 10340, + "learning_rate": 0.00045767946577629384, + "loss": 1.8467, + "loss_base2": 2.6642, + "loss_pixel": 0.3296, + "loss_text": 1.5171, + "ppl": 6.3389, + "step": 10340 + }, + { + "epoch": 0.05, + "global_step": 10341, + "learning_rate": 0.00045767529215358935, + "loss": 1.848, + "loss_base2": 2.6661, + "loss_pixel": 0.3301, + "loss_text": 1.5179, + "ppl": 6.3471, + "step": 10341 + }, + { + "epoch": 0.05, + "global_step": 10342, + "learning_rate": 0.00045767111853088486, + "loss": 1.8417, + "loss_base2": 2.657, + "loss_pixel": 0.3291, + "loss_text": 1.5126, + "ppl": 6.3073, + "step": 10342 + }, + { + "epoch": 0.05, + "global_step": 10343, + "learning_rate": 0.00045766694490818026, + "loss": 1.8429, + "loss_base2": 2.6587, + "loss_pixel": 0.3282, + "loss_text": 1.5147, + "ppl": 6.3148, + "step": 10343 + }, + { + "epoch": 0.05, + "global_step": 10344, + "learning_rate": 0.00045766277128547576, + "loss": 1.8278, + "loss_base2": 2.637, + "loss_pixel": 0.3269, + "loss_text": 1.5009, + "ppl": 6.2202, + "step": 10344 + }, + { + "epoch": 0.05, + "global_step": 10345, + "learning_rate": 0.00045765859766277127, + "loss": 1.8587, + "loss_base2": 2.6815, + "loss_pixel": 0.3318, + "loss_text": 1.527, + "ppl": 6.4154, + "step": 10345 + }, + { + "epoch": 0.05, + "global_step": 10346, + "learning_rate": 0.0004576544240400668, + "loss": 1.835, + "loss_base2": 2.6473, + "loss_pixel": 0.3255, + "loss_text": 1.5095, + "ppl": 6.2651, + "step": 10346 + }, + { + "epoch": 0.05, + "global_step": 10347, + "learning_rate": 0.0004576502504173623, + "loss": 1.8191, + "loss_base2": 2.6244, + "loss_pixel": 0.3265, + "loss_text": 1.4926, + "ppl": 6.1663, + "step": 10347 + }, + { + "epoch": 0.05, + "global_step": 10348, + "learning_rate": 0.00045764607679465774, + "loss": 1.8159, + "loss_base2": 2.6198, + "loss_pixel": 0.3266, + "loss_text": 1.4893, + "ppl": 6.1466, + "step": 10348 + }, + { + "epoch": 0.05, + "global_step": 10349, + "learning_rate": 0.00045764190317195325, + "loss": 1.845, + "loss_base2": 2.6618, + "loss_pixel": 0.3238, + "loss_text": 1.5213, + "ppl": 6.3281, + "step": 10349 + }, + { + "epoch": 0.05, + "global_step": 10350, + "learning_rate": 0.00045763772954924875, + "loss": 1.8454, + "loss_base2": 2.6623, + "loss_pixel": 0.3325, + "loss_text": 1.5129, + "ppl": 6.3306, + "step": 10350 + }, + { + "epoch": 0.05, + "global_step": 10351, + "learning_rate": 0.00045763355592654426, + "loss": 1.8302, + "loss_base2": 2.6404, + "loss_pixel": 0.3236, + "loss_text": 1.5066, + "ppl": 6.2351, + "step": 10351 + }, + { + "epoch": 0.05, + "global_step": 10352, + "learning_rate": 0.00045762938230383977, + "loss": 1.8142, + "loss_base2": 2.6173, + "loss_pixel": 0.3231, + "loss_text": 1.4911, + "ppl": 6.1362, + "step": 10352 + }, + { + "epoch": 0.05, + "global_step": 10353, + "learning_rate": 0.0004576252086811352, + "loss": 1.8494, + "loss_base2": 2.6681, + "loss_pixel": 0.3219, + "loss_text": 1.5275, + "ppl": 6.356, + "step": 10353 + }, + { + "epoch": 0.05, + "global_step": 10354, + "learning_rate": 0.00045762103505843073, + "loss": 1.8138, + "loss_base2": 2.6168, + "loss_pixel": 0.3222, + "loss_text": 1.4916, + "ppl": 6.1337, + "step": 10354 + }, + { + "epoch": 0.05, + "global_step": 10355, + "learning_rate": 0.00045761686143572624, + "loss": 1.823, + "loss_base2": 2.63, + "loss_pixel": 0.3197, + "loss_text": 1.5033, + "ppl": 6.1904, + "step": 10355 + }, + { + "epoch": 0.05, + "global_step": 10356, + "learning_rate": 0.00045761268781302174, + "loss": 1.8201, + "loss_base2": 2.6258, + "loss_pixel": 0.322, + "loss_text": 1.4981, + "ppl": 6.1725, + "step": 10356 + }, + { + "epoch": 0.05, + "global_step": 10357, + "learning_rate": 0.0004576085141903172, + "loss": 1.8073, + "loss_base2": 2.6074, + "loss_pixel": 0.3188, + "loss_text": 1.4885, + "ppl": 6.094, + "step": 10357 + }, + { + "epoch": 0.05, + "global_step": 10358, + "learning_rate": 0.0004576043405676127, + "loss": 1.8109, + "loss_base2": 2.6126, + "loss_pixel": 0.3196, + "loss_text": 1.4914, + "ppl": 6.1159, + "step": 10358 + }, + { + "epoch": 0.05, + "global_step": 10359, + "learning_rate": 0.0004576001669449082, + "loss": 1.8074, + "loss_base2": 2.6075, + "loss_pixel": 0.315, + "loss_text": 1.4924, + "ppl": 6.0946, + "step": 10359 + }, + { + "epoch": 0.05, + "global_step": 10360, + "learning_rate": 0.0004575959933222037, + "loss": 1.8016, + "loss_base2": 2.5992, + "loss_pixel": 0.314, + "loss_text": 1.4876, + "ppl": 6.0593, + "step": 10360 + }, + { + "epoch": 0.05, + "global_step": 10361, + "learning_rate": 0.0004575918196994992, + "loss": 1.8243, + "loss_base2": 2.6319, + "loss_pixel": 0.3118, + "loss_text": 1.5125, + "ppl": 6.1985, + "step": 10361 + }, + { + "epoch": 0.05, + "global_step": 10362, + "learning_rate": 0.0004575876460767946, + "loss": 1.8132, + "loss_base2": 2.6159, + "loss_pixel": 0.3112, + "loss_text": 1.502, + "ppl": 6.13, + "step": 10362 + }, + { + "epoch": 0.05, + "global_step": 10363, + "learning_rate": 0.00045758347245409013, + "loss": 1.8125, + "loss_base2": 2.6149, + "loss_pixel": 0.3102, + "loss_text": 1.5024, + "ppl": 6.1257, + "step": 10363 + }, + { + "epoch": 0.05, + "global_step": 10364, + "learning_rate": 0.00045757929883138564, + "loss": 1.8039, + "loss_base2": 2.6025, + "loss_pixel": 0.3145, + "loss_text": 1.4894, + "ppl": 6.0733, + "step": 10364 + }, + { + "epoch": 0.05, + "global_step": 10365, + "learning_rate": 0.00045757512520868115, + "loss": 1.8033, + "loss_base2": 2.6016, + "loss_pixel": 0.3182, + "loss_text": 1.485, + "ppl": 6.0696, + "step": 10365 + }, + { + "epoch": 0.05, + "global_step": 10366, + "learning_rate": 0.0004575709515859766, + "loss": 1.7995, + "loss_base2": 2.5961, + "loss_pixel": 0.3156, + "loss_text": 1.4839, + "ppl": 6.0466, + "step": 10366 + }, + { + "epoch": 0.05, + "global_step": 10367, + "learning_rate": 0.0004575667779632721, + "loss": 1.7996, + "loss_base2": 2.5963, + "loss_pixel": 0.3126, + "loss_text": 1.4869, + "ppl": 6.0472, + "step": 10367 + }, + { + "epoch": 0.05, + "global_step": 10368, + "learning_rate": 0.0004575626043405676, + "loss": 1.7894, + "loss_base2": 2.5816, + "loss_pixel": 0.3114, + "loss_text": 1.478, + "ppl": 5.9859, + "step": 10368 + }, + { + "epoch": 0.05, + "global_step": 10369, + "learning_rate": 0.0004575584307178631, + "loss": 1.7846, + "loss_base2": 2.5746, + "loss_pixel": 0.3077, + "loss_text": 1.4769, + "ppl": 5.9572, + "step": 10369 + }, + { + "epoch": 0.05, + "global_step": 10370, + "learning_rate": 0.00045755425709515863, + "loss": 1.7893, + "loss_base2": 2.5814, + "loss_pixel": 0.3061, + "loss_text": 1.4833, + "ppl": 5.9853, + "step": 10370 + }, + { + "epoch": 0.05, + "global_step": 10371, + "learning_rate": 0.0004575500834724541, + "loss": 1.7943, + "loss_base2": 2.5886, + "loss_pixel": 0.3059, + "loss_text": 1.4884, + "ppl": 6.0153, + "step": 10371 + }, + { + "epoch": 0.05, + "global_step": 10372, + "learning_rate": 0.0004575459098497496, + "loss": 1.8012, + "loss_base2": 2.5986, + "loss_pixel": 0.3045, + "loss_text": 1.4966, + "ppl": 6.0569, + "step": 10372 + }, + { + "epoch": 0.05, + "global_step": 10373, + "learning_rate": 0.0004575417362270451, + "loss": 1.783, + "loss_base2": 2.5723, + "loss_pixel": 0.3031, + "loss_text": 1.4799, + "ppl": 5.9477, + "step": 10373 + }, + { + "epoch": 0.05, + "global_step": 10374, + "learning_rate": 0.0004575375626043406, + "loss": 1.7926, + "loss_base2": 2.5862, + "loss_pixel": 0.3024, + "loss_text": 1.4902, + "ppl": 6.005, + "step": 10374 + }, + { + "epoch": 0.05, + "global_step": 10375, + "learning_rate": 0.00045753338898163606, + "loss": 1.7833, + "loss_base2": 2.5728, + "loss_pixel": 0.3045, + "loss_text": 1.4788, + "ppl": 5.9495, + "step": 10375 + }, + { + "epoch": 0.05, + "global_step": 10376, + "learning_rate": 0.00045752921535893156, + "loss": 1.7906, + "loss_base2": 2.5833, + "loss_pixel": 0.3065, + "loss_text": 1.4842, + "ppl": 5.993, + "step": 10376 + }, + { + "epoch": 0.05, + "global_step": 10377, + "learning_rate": 0.00045752504173622707, + "loss": 1.7926, + "loss_base2": 2.5862, + "loss_pixel": 0.304, + "loss_text": 1.4886, + "ppl": 6.005, + "step": 10377 + }, + { + "epoch": 0.05, + "global_step": 10378, + "learning_rate": 0.0004575208681135226, + "loss": 1.7797, + "loss_base2": 2.5676, + "loss_pixel": 0.3016, + "loss_text": 1.4781, + "ppl": 5.9281, + "step": 10378 + }, + { + "epoch": 0.05, + "global_step": 10379, + "learning_rate": 0.0004575166944908181, + "loss": 1.7886, + "loss_base2": 2.5804, + "loss_pixel": 0.3065, + "loss_text": 1.4821, + "ppl": 5.9811, + "step": 10379 + }, + { + "epoch": 0.05, + "global_step": 10380, + "learning_rate": 0.00045751252086811354, + "loss": 1.7991, + "loss_base2": 2.5956, + "loss_pixel": 0.3047, + "loss_text": 1.4944, + "ppl": 6.0442, + "step": 10380 + }, + { + "epoch": 0.05, + "global_step": 10381, + "learning_rate": 0.000457508347245409, + "loss": 1.7734, + "loss_base2": 2.5585, + "loss_pixel": 0.3, + "loss_text": 1.4733, + "ppl": 5.8908, + "step": 10381 + }, + { + "epoch": 0.05, + "global_step": 10382, + "learning_rate": 0.0004575041736227045, + "loss": 1.7902, + "loss_base2": 2.5827, + "loss_pixel": 0.3006, + "loss_text": 1.4896, + "ppl": 5.9907, + "step": 10382 + }, + { + "epoch": 0.05, + "global_step": 10383, + "learning_rate": 0.0004575, + "loss": 1.7662, + "loss_base2": 2.5481, + "loss_pixel": 0.2984, + "loss_text": 1.4677, + "ppl": 5.8486, + "step": 10383 + }, + { + "epoch": 0.05, + "global_step": 10384, + "learning_rate": 0.00045749582637729546, + "loss": 1.7966, + "loss_base2": 2.5919, + "loss_pixel": 0.2984, + "loss_text": 1.4981, + "ppl": 6.0291, + "step": 10384 + }, + { + "epoch": 0.05, + "global_step": 10385, + "learning_rate": 0.00045749165275459097, + "loss": 1.7746, + "loss_base2": 2.5602, + "loss_pixel": 0.2963, + "loss_text": 1.4783, + "ppl": 5.8979, + "step": 10385 + }, + { + "epoch": 0.05, + "global_step": 10386, + "learning_rate": 0.0004574874791318865, + "loss": 1.7722, + "loss_base2": 2.5567, + "loss_pixel": 0.2966, + "loss_text": 1.4756, + "ppl": 5.8838, + "step": 10386 + }, + { + "epoch": 0.05, + "global_step": 10387, + "learning_rate": 0.000457483305509182, + "loss": 1.77, + "loss_base2": 2.5536, + "loss_pixel": 0.2958, + "loss_text": 1.4742, + "ppl": 5.8709, + "step": 10387 + }, + { + "epoch": 0.05, + "global_step": 10388, + "learning_rate": 0.0004574791318864775, + "loss": 1.7824, + "loss_base2": 2.5715, + "loss_pixel": 0.2946, + "loss_text": 1.4878, + "ppl": 5.9441, + "step": 10388 + }, + { + "epoch": 0.05, + "global_step": 10389, + "learning_rate": 0.00045747495826377294, + "loss": 1.7822, + "loss_base2": 2.5712, + "loss_pixel": 0.2934, + "loss_text": 1.4887, + "ppl": 5.9429, + "step": 10389 + }, + { + "epoch": 0.05, + "global_step": 10390, + "learning_rate": 0.00045747078464106845, + "loss": 1.7939, + "loss_base2": 2.5881, + "loss_pixel": 0.2928, + "loss_text": 1.5011, + "ppl": 6.0129, + "step": 10390 + }, + { + "epoch": 0.05, + "global_step": 10391, + "learning_rate": 0.00045746661101836396, + "loss": 1.7962, + "loss_base2": 2.5914, + "loss_pixel": 0.2938, + "loss_text": 1.5023, + "ppl": 6.0267, + "step": 10391 + }, + { + "epoch": 0.05, + "global_step": 10392, + "learning_rate": 0.00045746243739565946, + "loss": 1.775, + "loss_base2": 2.5608, + "loss_pixel": 0.2915, + "loss_text": 1.4835, + "ppl": 5.9003, + "step": 10392 + }, + { + "epoch": 0.05, + "global_step": 10393, + "learning_rate": 0.0004574582637729549, + "loss": 1.7785, + "loss_base2": 2.5658, + "loss_pixel": 0.2935, + "loss_text": 1.485, + "ppl": 5.921, + "step": 10393 + }, + { + "epoch": 0.05, + "global_step": 10394, + "learning_rate": 0.0004574540901502504, + "loss": 1.772, + "loss_base2": 2.5565, + "loss_pixel": 0.2905, + "loss_text": 1.4816, + "ppl": 5.8826, + "step": 10394 + }, + { + "epoch": 0.05, + "global_step": 10395, + "learning_rate": 0.00045744991652754593, + "loss": 1.7846, + "loss_base2": 2.5746, + "loss_pixel": 0.2891, + "loss_text": 1.4955, + "ppl": 5.9572, + "step": 10395 + }, + { + "epoch": 0.05, + "global_step": 10396, + "learning_rate": 0.00045744574290484144, + "loss": 1.7784, + "loss_base2": 2.5657, + "loss_pixel": 0.2885, + "loss_text": 1.4899, + "ppl": 5.9204, + "step": 10396 + }, + { + "epoch": 0.05, + "global_step": 10397, + "learning_rate": 0.00045744156928213695, + "loss": 1.746, + "loss_base2": 2.5189, + "loss_pixel": 0.2883, + "loss_text": 1.4577, + "ppl": 5.7316, + "step": 10397 + }, + { + "epoch": 0.05, + "global_step": 10398, + "learning_rate": 0.0004574373956594324, + "loss": 1.5687, + "loss_base2": 2.2632, + "loss_pixel": 0.2865, + "loss_text": 1.2822, + "ppl": 4.8004, + "step": 10398 + }, + { + "epoch": 0.05, + "global_step": 10399, + "learning_rate": 0.0004574332220367279, + "loss": 1.5801, + "loss_base2": 2.2796, + "loss_pixel": 0.2875, + "loss_text": 1.2925, + "ppl": 4.8554, + "step": 10399 + }, + { + "epoch": 0.05, + "global_step": 10400, + "learning_rate": 0.00045742904841402336, + "loss": 1.5631, + "loss_base2": 2.2551, + "loss_pixel": 0.2875, + "loss_text": 1.2755, + "ppl": 4.7736, + "step": 10400 + }, + { + "epoch": 0.05, + "global_step": 10401, + "learning_rate": 0.00045742487479131887, + "loss": 1.5547, + "loss_base2": 2.243, + "loss_pixel": 0.2875, + "loss_text": 1.2672, + "ppl": 4.7337, + "step": 10401 + }, + { + "epoch": 0.05, + "global_step": 10402, + "learning_rate": 0.0004574207011686143, + "loss": 1.6057, + "loss_base2": 2.3165, + "loss_pixel": 0.2992, + "loss_text": 1.3065, + "ppl": 4.9813, + "step": 10402 + }, + { + "epoch": 0.05, + "global_step": 10403, + "learning_rate": 0.00045741652754590983, + "loss": 1.5812, + "loss_base2": 2.2812, + "loss_pixel": 0.3137, + "loss_text": 1.2675, + "ppl": 4.8608, + "step": 10403 + }, + { + "epoch": 0.05, + "global_step": 10404, + "learning_rate": 0.00045741235392320534, + "loss": 1.5862, + "loss_base2": 2.2884, + "loss_pixel": 0.3109, + "loss_text": 1.2753, + "ppl": 4.8852, + "step": 10404 + }, + { + "epoch": 0.05, + "global_step": 10405, + "learning_rate": 0.00045740818030050084, + "loss": 1.643, + "loss_base2": 2.3703, + "loss_pixel": 0.3146, + "loss_text": 1.3284, + "ppl": 5.1707, + "step": 10405 + }, + { + "epoch": 0.05, + "global_step": 10406, + "learning_rate": 0.00045740400667779635, + "loss": 1.7266, + "loss_base2": 2.491, + "loss_pixel": 0.3065, + "loss_text": 1.4201, + "ppl": 5.6215, + "step": 10406 + }, + { + "epoch": 0.05, + "global_step": 10407, + "learning_rate": 0.0004573998330550918, + "loss": 1.753, + "loss_base2": 2.529, + "loss_pixel": 0.3052, + "loss_text": 1.4477, + "ppl": 5.7719, + "step": 10407 + }, + { + "epoch": 0.05, + "global_step": 10408, + "learning_rate": 0.0004573956594323873, + "loss": 1.7936, + "loss_base2": 2.5876, + "loss_pixel": 0.3015, + "loss_text": 1.4921, + "ppl": 6.0111, + "step": 10408 + }, + { + "epoch": 0.05, + "global_step": 10409, + "learning_rate": 0.0004573914858096828, + "loss": 1.8178, + "loss_base2": 2.6225, + "loss_pixel": 0.2988, + "loss_text": 1.519, + "ppl": 6.1583, + "step": 10409 + }, + { + "epoch": 0.05, + "global_step": 10410, + "learning_rate": 0.0004573873121869783, + "loss": 1.7868, + "loss_base2": 2.5778, + "loss_pixel": 0.2993, + "loss_text": 1.4875, + "ppl": 5.9703, + "step": 10410 + }, + { + "epoch": 0.05, + "global_step": 10411, + "learning_rate": 0.00045738313856427383, + "loss": 1.7995, + "loss_base2": 2.5961, + "loss_pixel": 0.2964, + "loss_text": 1.5032, + "ppl": 6.0466, + "step": 10411 + }, + { + "epoch": 0.05, + "global_step": 10412, + "learning_rate": 0.0004573789649415693, + "loss": 1.7801, + "loss_base2": 2.5681, + "loss_pixel": 0.2971, + "loss_text": 1.483, + "ppl": 5.9304, + "step": 10412 + }, + { + "epoch": 0.05, + "global_step": 10413, + "learning_rate": 0.0004573747913188648, + "loss": 1.7779, + "loss_base2": 2.565, + "loss_pixel": 0.2942, + "loss_text": 1.4837, + "ppl": 5.9174, + "step": 10413 + }, + { + "epoch": 0.05, + "global_step": 10414, + "learning_rate": 0.0004573706176961603, + "loss": 1.7853, + "loss_base2": 2.5756, + "loss_pixel": 0.2938, + "loss_text": 1.4915, + "ppl": 5.9614, + "step": 10414 + }, + { + "epoch": 0.05, + "global_step": 10415, + "learning_rate": 0.0004573664440734558, + "loss": 1.7679, + "loss_base2": 2.5505, + "loss_pixel": 0.2917, + "loss_text": 1.4762, + "ppl": 5.8585, + "step": 10415 + }, + { + "epoch": 0.05, + "global_step": 10416, + "learning_rate": 0.00045736227045075126, + "loss": 1.7866, + "loss_base2": 2.5775, + "loss_pixel": 0.2919, + "loss_text": 1.4947, + "ppl": 5.9691, + "step": 10416 + }, + { + "epoch": 0.05, + "global_step": 10417, + "learning_rate": 0.00045735809682804677, + "loss": 1.7791, + "loss_base2": 2.5667, + "loss_pixel": 0.2913, + "loss_text": 1.4878, + "ppl": 5.9245, + "step": 10417 + }, + { + "epoch": 0.05, + "global_step": 10418, + "learning_rate": 0.0004573539232053422, + "loss": 1.7773, + "loss_base2": 2.5641, + "loss_pixel": 0.2901, + "loss_text": 1.4872, + "ppl": 5.9139, + "step": 10418 + }, + { + "epoch": 0.05, + "global_step": 10419, + "learning_rate": 0.00045734974958263773, + "loss": 1.7707, + "loss_base2": 2.5546, + "loss_pixel": 0.2887, + "loss_text": 1.482, + "ppl": 5.875, + "step": 10419 + }, + { + "epoch": 0.05, + "global_step": 10420, + "learning_rate": 0.00045734557595993324, + "loss": 1.7813, + "loss_base2": 2.5699, + "loss_pixel": 0.2888, + "loss_text": 1.4926, + "ppl": 5.9376, + "step": 10420 + }, + { + "epoch": 0.05, + "global_step": 10421, + "learning_rate": 0.0004573414023372287, + "loss": 1.7713, + "loss_base2": 2.5554, + "loss_pixel": 0.2882, + "loss_text": 1.4831, + "ppl": 5.8785, + "step": 10421 + }, + { + "epoch": 0.05, + "global_step": 10422, + "learning_rate": 0.0004573372287145242, + "loss": 1.7773, + "loss_base2": 2.5641, + "loss_pixel": 0.2897, + "loss_text": 1.4876, + "ppl": 5.9139, + "step": 10422 + }, + { + "epoch": 0.05, + "global_step": 10423, + "learning_rate": 0.0004573330550918197, + "loss": 1.7833, + "loss_base2": 2.5728, + "loss_pixel": 0.2865, + "loss_text": 1.4969, + "ppl": 5.9495, + "step": 10423 + }, + { + "epoch": 0.05, + "global_step": 10424, + "learning_rate": 0.0004573288814691152, + "loss": 1.7761, + "loss_base2": 2.5624, + "loss_pixel": 0.287, + "loss_text": 1.4891, + "ppl": 5.9068, + "step": 10424 + }, + { + "epoch": 0.05, + "global_step": 10425, + "learning_rate": 0.00045732470784641066, + "loss": 1.7505, + "loss_base2": 2.5254, + "loss_pixel": 0.2869, + "loss_text": 1.4636, + "ppl": 5.7575, + "step": 10425 + }, + { + "epoch": 0.05, + "global_step": 10426, + "learning_rate": 0.00045732053422370617, + "loss": 1.7674, + "loss_base2": 2.5498, + "loss_pixel": 0.2848, + "loss_text": 1.4826, + "ppl": 5.8556, + "step": 10426 + }, + { + "epoch": 0.05, + "global_step": 10427, + "learning_rate": 0.0004573163606010017, + "loss": 1.7794, + "loss_base2": 2.5671, + "loss_pixel": 0.2868, + "loss_text": 1.4926, + "ppl": 5.9263, + "step": 10427 + }, + { + "epoch": 0.05, + "global_step": 10428, + "learning_rate": 0.0004573121869782972, + "loss": 1.7479, + "loss_base2": 2.5217, + "loss_pixel": 0.2871, + "loss_text": 1.4608, + "ppl": 5.7425, + "step": 10428 + }, + { + "epoch": 0.05, + "global_step": 10429, + "learning_rate": 0.0004573080133555927, + "loss": 1.764, + "loss_base2": 2.5449, + "loss_pixel": 0.2943, + "loss_text": 1.4697, + "ppl": 5.8357, + "step": 10429 + }, + { + "epoch": 0.05, + "global_step": 10430, + "learning_rate": 0.00045730383973288815, + "loss": 1.7569, + "loss_base2": 2.5347, + "loss_pixel": 0.288, + "loss_text": 1.4689, + "ppl": 5.7944, + "step": 10430 + }, + { + "epoch": 0.05, + "global_step": 10431, + "learning_rate": 0.00045729966611018365, + "loss": 1.7666, + "loss_base2": 2.5487, + "loss_pixel": 0.2882, + "loss_text": 1.4784, + "ppl": 5.8509, + "step": 10431 + }, + { + "epoch": 0.05, + "global_step": 10432, + "learning_rate": 0.00045729549248747916, + "loss": 1.7723, + "loss_base2": 2.5569, + "loss_pixel": 0.2876, + "loss_text": 1.4847, + "ppl": 5.8844, + "step": 10432 + }, + { + "epoch": 0.05, + "global_step": 10433, + "learning_rate": 0.00045729131886477467, + "loss": 1.7842, + "loss_base2": 2.5741, + "loss_pixel": 0.2863, + "loss_text": 1.4979, + "ppl": 5.9548, + "step": 10433 + }, + { + "epoch": 0.05, + "global_step": 10434, + "learning_rate": 0.0004572871452420701, + "loss": 1.7797, + "loss_base2": 2.5676, + "loss_pixel": 0.286, + "loss_text": 1.4937, + "ppl": 5.9281, + "step": 10434 + }, + { + "epoch": 0.05, + "global_step": 10435, + "learning_rate": 0.00045728297161936563, + "loss": 1.7743, + "loss_base2": 2.5598, + "loss_pixel": 0.287, + "loss_text": 1.4874, + "ppl": 5.8962, + "step": 10435 + }, + { + "epoch": 0.05, + "global_step": 10436, + "learning_rate": 0.00045727879799666114, + "loss": 1.7536, + "loss_base2": 2.5299, + "loss_pixel": 0.2893, + "loss_text": 1.4643, + "ppl": 5.7754, + "step": 10436 + }, + { + "epoch": 0.05, + "global_step": 10437, + "learning_rate": 0.0004572746243739566, + "loss": 1.7392, + "loss_base2": 2.5091, + "loss_pixel": 0.2851, + "loss_text": 1.4541, + "ppl": 5.6928, + "step": 10437 + }, + { + "epoch": 0.05, + "global_step": 10438, + "learning_rate": 0.0004572704507512521, + "loss": 1.7429, + "loss_base2": 2.5145, + "loss_pixel": 0.2847, + "loss_text": 1.4582, + "ppl": 5.7139, + "step": 10438 + }, + { + "epoch": 0.05, + "global_step": 10439, + "learning_rate": 0.00045726627712854755, + "loss": 1.7721, + "loss_base2": 2.5566, + "loss_pixel": 0.2853, + "loss_text": 1.4867, + "ppl": 5.8832, + "step": 10439 + }, + { + "epoch": 0.05, + "global_step": 10440, + "learning_rate": 0.00045726210350584306, + "loss": 1.7571, + "loss_base2": 2.535, + "loss_pixel": 0.2862, + "loss_text": 1.4709, + "ppl": 5.7956, + "step": 10440 + }, + { + "epoch": 0.05, + "global_step": 10441, + "learning_rate": 0.00045725792988313856, + "loss": 1.7466, + "loss_base2": 2.5198, + "loss_pixel": 0.2827, + "loss_text": 1.464, + "ppl": 5.7351, + "step": 10441 + }, + { + "epoch": 0.05, + "global_step": 10442, + "learning_rate": 0.00045725375626043407, + "loss": 1.76, + "loss_base2": 2.5391, + "loss_pixel": 0.2826, + "loss_text": 1.4774, + "ppl": 5.8124, + "step": 10442 + }, + { + "epoch": 0.05, + "global_step": 10443, + "learning_rate": 0.0004572495826377295, + "loss": 1.7662, + "loss_base2": 2.5481, + "loss_pixel": 0.2813, + "loss_text": 1.4849, + "ppl": 5.8486, + "step": 10443 + }, + { + "epoch": 0.05, + "global_step": 10444, + "learning_rate": 0.00045724540901502503, + "loss": 1.7436, + "loss_base2": 2.5155, + "loss_pixel": 0.2806, + "loss_text": 1.4631, + "ppl": 5.7179, + "step": 10444 + }, + { + "epoch": 0.05, + "global_step": 10445, + "learning_rate": 0.00045724123539232054, + "loss": 1.7476, + "loss_base2": 2.5213, + "loss_pixel": 0.2803, + "loss_text": 1.4673, + "ppl": 5.7408, + "step": 10445 + }, + { + "epoch": 0.05, + "global_step": 10446, + "learning_rate": 0.00045723706176961605, + "loss": 1.7479, + "loss_base2": 2.5217, + "loss_pixel": 0.279, + "loss_text": 1.4688, + "ppl": 5.7425, + "step": 10446 + }, + { + "epoch": 0.05, + "global_step": 10447, + "learning_rate": 0.00045723288814691155, + "loss": 1.7675, + "loss_base2": 2.55, + "loss_pixel": 0.2785, + "loss_text": 1.489, + "ppl": 5.8562, + "step": 10447 + }, + { + "epoch": 0.05, + "global_step": 10448, + "learning_rate": 0.000457228714524207, + "loss": 1.7593, + "loss_base2": 2.5381, + "loss_pixel": 0.2775, + "loss_text": 1.4819, + "ppl": 5.8084, + "step": 10448 + }, + { + "epoch": 0.05, + "global_step": 10449, + "learning_rate": 0.0004572245409015025, + "loss": 1.754, + "loss_base2": 2.5305, + "loss_pixel": 0.2762, + "loss_text": 1.4778, + "ppl": 5.7777, + "step": 10449 + }, + { + "epoch": 0.06, + "global_step": 10450, + "learning_rate": 0.000457220367278798, + "loss": 1.7458, + "loss_base2": 2.5187, + "loss_pixel": 0.2764, + "loss_text": 1.4694, + "ppl": 5.7305, + "step": 10450 + }, + { + "epoch": 0.06, + "global_step": 10451, + "learning_rate": 0.00045721619365609353, + "loss": 1.7506, + "loss_base2": 2.5256, + "loss_pixel": 0.2755, + "loss_text": 1.4751, + "ppl": 5.7581, + "step": 10451 + }, + { + "epoch": 0.06, + "global_step": 10452, + "learning_rate": 0.000457212020033389, + "loss": 1.7265, + "loss_base2": 2.4908, + "loss_pixel": 0.2749, + "loss_text": 1.4515, + "ppl": 5.6209, + "step": 10452 + }, + { + "epoch": 0.06, + "global_step": 10453, + "learning_rate": 0.0004572078464106845, + "loss": 1.6847, + "loss_base2": 2.4305, + "loss_pixel": 0.275, + "loss_text": 1.4097, + "ppl": 5.3908, + "step": 10453 + }, + { + "epoch": 0.06, + "global_step": 10454, + "learning_rate": 0.00045720367278798, + "loss": 1.5235, + "loss_base2": 2.1979, + "loss_pixel": 0.2748, + "loss_text": 1.2488, + "ppl": 4.5883, + "step": 10454 + }, + { + "epoch": 0.06, + "global_step": 10455, + "learning_rate": 0.0004571994991652755, + "loss": 1.5439, + "loss_base2": 2.2274, + "loss_pixel": 0.2753, + "loss_text": 1.2686, + "ppl": 4.6828, + "step": 10455 + }, + { + "epoch": 0.06, + "global_step": 10456, + "learning_rate": 0.00045719532554257096, + "loss": 1.5723, + "loss_base2": 2.2683, + "loss_pixel": 0.2765, + "loss_text": 1.2958, + "ppl": 4.8177, + "step": 10456 + }, + { + "epoch": 0.06, + "global_step": 10457, + "learning_rate": 0.0004571911519198664, + "loss": 1.5474, + "loss_base2": 2.2324, + "loss_pixel": 0.2776, + "loss_text": 1.2697, + "ppl": 4.6992, + "step": 10457 + }, + { + "epoch": 0.06, + "global_step": 10458, + "learning_rate": 0.0004571869782971619, + "loss": 1.5435, + "loss_base2": 2.2268, + "loss_pixel": 0.2752, + "loss_text": 1.2683, + "ppl": 4.6809, + "step": 10458 + }, + { + "epoch": 0.06, + "global_step": 10459, + "learning_rate": 0.0004571828046744574, + "loss": 1.5168, + "loss_base2": 2.1883, + "loss_pixel": 0.2751, + "loss_text": 1.2418, + "ppl": 4.5576, + "step": 10459 + }, + { + "epoch": 0.06, + "global_step": 10460, + "learning_rate": 0.00045717863105175293, + "loss": 1.5385, + "loss_base2": 2.2196, + "loss_pixel": 0.2779, + "loss_text": 1.2606, + "ppl": 4.6576, + "step": 10460 + }, + { + "epoch": 0.06, + "global_step": 10461, + "learning_rate": 0.0004571744574290484, + "loss": 1.5412, + "loss_base2": 2.2235, + "loss_pixel": 0.2787, + "loss_text": 1.2625, + "ppl": 4.6702, + "step": 10461 + }, + { + "epoch": 0.06, + "global_step": 10462, + "learning_rate": 0.0004571702838063439, + "loss": 1.5632, + "loss_base2": 2.2552, + "loss_pixel": 0.2757, + "loss_text": 1.2875, + "ppl": 4.7741, + "step": 10462 + }, + { + "epoch": 0.06, + "global_step": 10463, + "learning_rate": 0.0004571661101836394, + "loss": 1.5382, + "loss_base2": 2.2192, + "loss_pixel": 0.2757, + "loss_text": 1.2624, + "ppl": 4.6562, + "step": 10463 + }, + { + "epoch": 0.06, + "global_step": 10464, + "learning_rate": 0.0004571619365609349, + "loss": 1.5534, + "loss_base2": 2.2411, + "loss_pixel": 0.2769, + "loss_text": 1.2764, + "ppl": 4.7275, + "step": 10464 + }, + { + "epoch": 0.06, + "global_step": 10465, + "learning_rate": 0.0004571577629382304, + "loss": 1.5276, + "loss_base2": 2.2039, + "loss_pixel": 0.2754, + "loss_text": 1.2522, + "ppl": 4.6071, + "step": 10465 + }, + { + "epoch": 0.06, + "global_step": 10466, + "learning_rate": 0.00045715358931552587, + "loss": 1.5454, + "loss_base2": 2.2295, + "loss_pixel": 0.2742, + "loss_text": 1.2712, + "ppl": 4.6898, + "step": 10466 + }, + { + "epoch": 0.06, + "global_step": 10467, + "learning_rate": 0.0004571494156928214, + "loss": 1.5262, + "loss_base2": 2.2018, + "loss_pixel": 0.2737, + "loss_text": 1.2525, + "ppl": 4.6007, + "step": 10467 + }, + { + "epoch": 0.06, + "global_step": 10468, + "learning_rate": 0.0004571452420701169, + "loss": 1.5113, + "loss_base2": 2.1803, + "loss_pixel": 0.2716, + "loss_text": 1.2397, + "ppl": 4.5326, + "step": 10468 + }, + { + "epoch": 0.06, + "global_step": 10469, + "learning_rate": 0.0004571410684474124, + "loss": 1.5276, + "loss_base2": 2.2039, + "loss_pixel": 0.271, + "loss_text": 1.2565, + "ppl": 4.6071, + "step": 10469 + }, + { + "epoch": 0.06, + "global_step": 10470, + "learning_rate": 0.0004571368948247079, + "loss": 1.5149, + "loss_base2": 2.1855, + "loss_pixel": 0.2709, + "loss_text": 1.244, + "ppl": 4.549, + "step": 10470 + }, + { + "epoch": 0.06, + "global_step": 10471, + "learning_rate": 0.00045713272120200335, + "loss": 1.5129, + "loss_base2": 2.1827, + "loss_pixel": 0.2701, + "loss_text": 1.2428, + "ppl": 4.5399, + "step": 10471 + }, + { + "epoch": 0.06, + "global_step": 10472, + "learning_rate": 0.00045712854757929886, + "loss": 1.5252, + "loss_base2": 2.2004, + "loss_pixel": 0.2695, + "loss_text": 1.2557, + "ppl": 4.5961, + "step": 10472 + }, + { + "epoch": 0.06, + "global_step": 10473, + "learning_rate": 0.00045712437395659436, + "loss": 1.5442, + "loss_base2": 2.2278, + "loss_pixel": 0.2738, + "loss_text": 1.2704, + "ppl": 4.6842, + "step": 10473 + }, + { + "epoch": 0.06, + "global_step": 10474, + "learning_rate": 0.00045712020033388987, + "loss": 1.5185, + "loss_base2": 2.1907, + "loss_pixel": 0.273, + "loss_text": 1.2455, + "ppl": 4.5654, + "step": 10474 + }, + { + "epoch": 0.06, + "global_step": 10475, + "learning_rate": 0.00045711602671118527, + "loss": 1.5281, + "loss_base2": 2.2046, + "loss_pixel": 0.2743, + "loss_text": 1.2538, + "ppl": 4.6094, + "step": 10475 + }, + { + "epoch": 0.06, + "global_step": 10476, + "learning_rate": 0.0004571118530884808, + "loss": 1.5427, + "loss_base2": 2.2256, + "loss_pixel": 0.2695, + "loss_text": 1.2732, + "ppl": 4.6772, + "step": 10476 + }, + { + "epoch": 0.06, + "global_step": 10477, + "learning_rate": 0.0004571076794657763, + "loss": 1.5191, + "loss_base2": 2.1916, + "loss_pixel": 0.2709, + "loss_text": 1.2482, + "ppl": 4.5681, + "step": 10477 + }, + { + "epoch": 0.06, + "global_step": 10478, + "learning_rate": 0.0004571035058430718, + "loss": 1.542, + "loss_base2": 2.2246, + "loss_pixel": 0.2686, + "loss_text": 1.2735, + "ppl": 4.6739, + "step": 10478 + }, + { + "epoch": 0.06, + "global_step": 10479, + "learning_rate": 0.0004570993322203673, + "loss": 1.5138, + "loss_base2": 2.184, + "loss_pixel": 0.2695, + "loss_text": 1.2444, + "ppl": 4.544, + "step": 10479 + }, + { + "epoch": 0.06, + "global_step": 10480, + "learning_rate": 0.00045709515859766275, + "loss": 1.5237, + "loss_base2": 2.1982, + "loss_pixel": 0.2702, + "loss_text": 1.2535, + "ppl": 4.5892, + "step": 10480 + }, + { + "epoch": 0.06, + "global_step": 10481, + "learning_rate": 0.00045709098497495826, + "loss": 1.5382, + "loss_base2": 2.2192, + "loss_pixel": 0.2678, + "loss_text": 1.2704, + "ppl": 4.6562, + "step": 10481 + }, + { + "epoch": 0.06, + "global_step": 10482, + "learning_rate": 0.00045708681135225377, + "loss": 1.5243, + "loss_base2": 2.1991, + "loss_pixel": 0.2668, + "loss_text": 1.2575, + "ppl": 4.5919, + "step": 10482 + }, + { + "epoch": 0.06, + "global_step": 10483, + "learning_rate": 0.0004570826377295493, + "loss": 1.5037, + "loss_base2": 2.1694, + "loss_pixel": 0.2659, + "loss_text": 1.2378, + "ppl": 4.4983, + "step": 10483 + }, + { + "epoch": 0.06, + "global_step": 10484, + "learning_rate": 0.00045707846410684473, + "loss": 1.5244, + "loss_base2": 2.1992, + "loss_pixel": 0.2678, + "loss_text": 1.2566, + "ppl": 4.5924, + "step": 10484 + }, + { + "epoch": 0.06, + "global_step": 10485, + "learning_rate": 0.00045707429048414024, + "loss": 1.6408, + "loss_base2": 2.3672, + "loss_pixel": 0.2686, + "loss_text": 1.3723, + "ppl": 5.1593, + "step": 10485 + }, + { + "epoch": 0.06, + "global_step": 10486, + "learning_rate": 0.00045707011686143574, + "loss": 1.7842, + "loss_base2": 2.5741, + "loss_pixel": 0.2674, + "loss_text": 1.5167, + "ppl": 5.9548, + "step": 10486 + }, + { + "epoch": 0.06, + "global_step": 10487, + "learning_rate": 0.00045706594323873125, + "loss": 1.762, + "loss_base2": 2.542, + "loss_pixel": 0.2692, + "loss_text": 1.4929, + "ppl": 5.8241, + "step": 10487 + }, + { + "epoch": 0.06, + "global_step": 10488, + "learning_rate": 0.00045706176961602676, + "loss": 1.7548, + "loss_base2": 2.5316, + "loss_pixel": 0.2663, + "loss_text": 1.4886, + "ppl": 5.7823, + "step": 10488 + }, + { + "epoch": 0.06, + "global_step": 10489, + "learning_rate": 0.0004570575959933222, + "loss": 1.7494, + "loss_base2": 2.5239, + "loss_pixel": 0.2652, + "loss_text": 1.4842, + "ppl": 5.7512, + "step": 10489 + }, + { + "epoch": 0.06, + "global_step": 10490, + "learning_rate": 0.0004570534223706177, + "loss": 1.7372, + "loss_base2": 2.5062, + "loss_pixel": 0.2647, + "loss_text": 1.4725, + "ppl": 5.6814, + "step": 10490 + }, + { + "epoch": 0.06, + "global_step": 10491, + "learning_rate": 0.0004570492487479132, + "loss": 1.754, + "loss_base2": 2.5305, + "loss_pixel": 0.2656, + "loss_text": 1.4884, + "ppl": 5.7777, + "step": 10491 + }, + { + "epoch": 0.06, + "global_step": 10492, + "learning_rate": 0.00045704507512520873, + "loss": 1.7421, + "loss_base2": 2.5133, + "loss_pixel": 0.2672, + "loss_text": 1.4749, + "ppl": 5.7093, + "step": 10492 + }, + { + "epoch": 0.06, + "global_step": 10493, + "learning_rate": 0.00045704090150250413, + "loss": 1.7344, + "loss_base2": 2.5022, + "loss_pixel": 0.2666, + "loss_text": 1.4678, + "ppl": 5.6655, + "step": 10493 + }, + { + "epoch": 0.06, + "global_step": 10494, + "learning_rate": 0.00045703672787979964, + "loss": 1.7435, + "loss_base2": 2.5153, + "loss_pixel": 0.2641, + "loss_text": 1.4794, + "ppl": 5.7173, + "step": 10494 + }, + { + "epoch": 0.06, + "global_step": 10495, + "learning_rate": 0.00045703255425709515, + "loss": 1.7568, + "loss_base2": 2.5345, + "loss_pixel": 0.2667, + "loss_text": 1.4901, + "ppl": 5.7939, + "step": 10495 + }, + { + "epoch": 0.06, + "global_step": 10496, + "learning_rate": 0.00045702838063439065, + "loss": 1.7398, + "loss_base2": 2.51, + "loss_pixel": 0.2656, + "loss_text": 1.4741, + "ppl": 5.6962, + "step": 10496 + }, + { + "epoch": 0.06, + "global_step": 10497, + "learning_rate": 0.00045702420701168616, + "loss": 1.7497, + "loss_base2": 2.5243, + "loss_pixel": 0.2666, + "loss_text": 1.4831, + "ppl": 5.7529, + "step": 10497 + }, + { + "epoch": 0.06, + "global_step": 10498, + "learning_rate": 0.0004570200333889816, + "loss": 1.734, + "loss_base2": 2.5016, + "loss_pixel": 0.2667, + "loss_text": 1.4674, + "ppl": 5.6633, + "step": 10498 + }, + { + "epoch": 0.06, + "global_step": 10499, + "learning_rate": 0.0004570158597662771, + "loss": 1.7392, + "loss_base2": 2.5091, + "loss_pixel": 0.2638, + "loss_text": 1.4754, + "ppl": 5.6928, + "step": 10499 + }, + { + "epoch": 0.06, + "global_step": 10500, + "learning_rate": 0.00045701168614357263, + "loss": 1.7374, + "loss_base2": 2.5065, + "loss_pixel": 0.2633, + "loss_text": 1.4741, + "ppl": 5.6825, + "step": 10500 + }, + { + "epoch": 0.06, + "global_step": 10501, + "learning_rate": 0.00045700751252086814, + "loss": 1.753, + "loss_base2": 2.529, + "loss_pixel": 0.262, + "loss_text": 1.491, + "ppl": 5.7719, + "step": 10501 + }, + { + "epoch": 0.06, + "global_step": 10502, + "learning_rate": 0.0004570033388981636, + "loss": 1.7224, + "loss_base2": 2.4849, + "loss_pixel": 0.2622, + "loss_text": 1.4603, + "ppl": 5.5979, + "step": 10502 + }, + { + "epoch": 0.06, + "global_step": 10503, + "learning_rate": 0.0004569991652754591, + "loss": 1.7323, + "loss_base2": 2.4992, + "loss_pixel": 0.2605, + "loss_text": 1.4719, + "ppl": 5.6536, + "step": 10503 + }, + { + "epoch": 0.06, + "global_step": 10504, + "learning_rate": 0.0004569949916527546, + "loss": 1.7295, + "loss_base2": 2.4951, + "loss_pixel": 0.2614, + "loss_text": 1.4681, + "ppl": 5.6378, + "step": 10504 + }, + { + "epoch": 0.06, + "global_step": 10505, + "learning_rate": 0.0004569908180300501, + "loss": 1.7348, + "loss_base2": 2.5028, + "loss_pixel": 0.2609, + "loss_text": 1.4739, + "ppl": 5.6678, + "step": 10505 + }, + { + "epoch": 0.06, + "global_step": 10506, + "learning_rate": 0.0004569866444073456, + "loss": 1.738, + "loss_base2": 2.5074, + "loss_pixel": 0.2585, + "loss_text": 1.4795, + "ppl": 5.686, + "step": 10506 + }, + { + "epoch": 0.06, + "global_step": 10507, + "learning_rate": 0.00045698247078464107, + "loss": 1.729, + "loss_base2": 2.4944, + "loss_pixel": 0.2596, + "loss_text": 1.4694, + "ppl": 5.635, + "step": 10507 + }, + { + "epoch": 0.06, + "global_step": 10508, + "learning_rate": 0.0004569782971619366, + "loss": 1.7217, + "loss_base2": 2.4839, + "loss_pixel": 0.258, + "loss_text": 1.4636, + "ppl": 5.594, + "step": 10508 + }, + { + "epoch": 0.06, + "global_step": 10509, + "learning_rate": 0.0004569741235392321, + "loss": 1.7232, + "loss_base2": 2.4861, + "loss_pixel": 0.2614, + "loss_text": 1.4618, + "ppl": 5.6024, + "step": 10509 + }, + { + "epoch": 0.06, + "global_step": 10510, + "learning_rate": 0.0004569699499165276, + "loss": 1.7357, + "loss_base2": 2.5041, + "loss_pixel": 0.2629, + "loss_text": 1.4728, + "ppl": 5.6729, + "step": 10510 + }, + { + "epoch": 0.06, + "global_step": 10511, + "learning_rate": 0.00045696577629382305, + "loss": 1.7348, + "loss_base2": 2.5028, + "loss_pixel": 0.2647, + "loss_text": 1.4701, + "ppl": 5.6678, + "step": 10511 + }, + { + "epoch": 0.06, + "global_step": 10512, + "learning_rate": 0.0004569616026711185, + "loss": 1.7426, + "loss_base2": 2.514, + "loss_pixel": 0.2653, + "loss_text": 1.4773, + "ppl": 5.7122, + "step": 10512 + }, + { + "epoch": 0.06, + "global_step": 10513, + "learning_rate": 0.000456957429048414, + "loss": 1.7506, + "loss_base2": 2.5256, + "loss_pixel": 0.2682, + "loss_text": 1.4824, + "ppl": 5.7581, + "step": 10513 + }, + { + "epoch": 0.06, + "global_step": 10514, + "learning_rate": 0.0004569532554257095, + "loss": 1.7327, + "loss_base2": 2.4998, + "loss_pixel": 0.2654, + "loss_text": 1.4673, + "ppl": 5.6559, + "step": 10514 + }, + { + "epoch": 0.06, + "global_step": 10515, + "learning_rate": 0.000456949081803005, + "loss": 1.7218, + "loss_base2": 2.484, + "loss_pixel": 0.2638, + "loss_text": 1.458, + "ppl": 5.5946, + "step": 10515 + }, + { + "epoch": 0.06, + "global_step": 10516, + "learning_rate": 0.0004569449081803005, + "loss": 1.7444, + "loss_base2": 2.5166, + "loss_pixel": 0.2635, + "loss_text": 1.4809, + "ppl": 5.7225, + "step": 10516 + }, + { + "epoch": 0.06, + "global_step": 10517, + "learning_rate": 0.000456940734557596, + "loss": 1.7136, + "loss_base2": 2.4722, + "loss_pixel": 0.2622, + "loss_text": 1.4514, + "ppl": 5.5489, + "step": 10517 + }, + { + "epoch": 0.06, + "global_step": 10518, + "learning_rate": 0.0004569365609348915, + "loss": 1.7287, + "loss_base2": 2.494, + "loss_pixel": 0.2626, + "loss_text": 1.4661, + "ppl": 5.6333, + "step": 10518 + }, + { + "epoch": 0.06, + "global_step": 10519, + "learning_rate": 0.000456932387312187, + "loss": 1.7436, + "loss_base2": 2.5155, + "loss_pixel": 0.2594, + "loss_text": 1.4842, + "ppl": 5.7179, + "step": 10519 + }, + { + "epoch": 0.06, + "global_step": 10520, + "learning_rate": 0.00045692821368948245, + "loss": 1.7148, + "loss_base2": 2.4739, + "loss_pixel": 0.2585, + "loss_text": 1.4562, + "ppl": 5.5556, + "step": 10520 + }, + { + "epoch": 0.06, + "global_step": 10521, + "learning_rate": 0.00045692404006677796, + "loss": 1.7127, + "loss_base2": 2.4709, + "loss_pixel": 0.2591, + "loss_text": 1.4536, + "ppl": 5.5439, + "step": 10521 + }, + { + "epoch": 0.06, + "global_step": 10522, + "learning_rate": 0.00045691986644407346, + "loss": 1.7348, + "loss_base2": 2.5028, + "loss_pixel": 0.2571, + "loss_text": 1.4776, + "ppl": 5.6678, + "step": 10522 + }, + { + "epoch": 0.06, + "global_step": 10523, + "learning_rate": 0.00045691569282136897, + "loss": 1.7269, + "loss_base2": 2.4914, + "loss_pixel": 0.2575, + "loss_text": 1.4695, + "ppl": 5.6232, + "step": 10523 + }, + { + "epoch": 0.06, + "global_step": 10524, + "learning_rate": 0.0004569115191986645, + "loss": 1.7199, + "loss_base2": 2.4813, + "loss_pixel": 0.2559, + "loss_text": 1.4641, + "ppl": 5.584, + "step": 10524 + }, + { + "epoch": 0.06, + "global_step": 10525, + "learning_rate": 0.00045690734557595993, + "loss": 1.7275, + "loss_base2": 2.4923, + "loss_pixel": 0.2572, + "loss_text": 1.4703, + "ppl": 5.6266, + "step": 10525 + }, + { + "epoch": 0.06, + "global_step": 10526, + "learning_rate": 0.00045690317195325544, + "loss": 1.7357, + "loss_base2": 2.5041, + "loss_pixel": 0.257, + "loss_text": 1.4787, + "ppl": 5.6729, + "step": 10526 + }, + { + "epoch": 0.06, + "global_step": 10527, + "learning_rate": 0.00045689899833055095, + "loss": 1.7232, + "loss_base2": 2.4861, + "loss_pixel": 0.2553, + "loss_text": 1.4679, + "ppl": 5.6024, + "step": 10527 + }, + { + "epoch": 0.06, + "global_step": 10528, + "learning_rate": 0.00045689482470784645, + "loss": 1.737, + "loss_base2": 2.506, + "loss_pixel": 0.2545, + "loss_text": 1.4825, + "ppl": 5.6803, + "step": 10528 + }, + { + "epoch": 0.06, + "global_step": 10529, + "learning_rate": 0.00045689065108514196, + "loss": 1.7205, + "loss_base2": 2.4822, + "loss_pixel": 0.253, + "loss_text": 1.4675, + "ppl": 5.5873, + "step": 10529 + }, + { + "epoch": 0.06, + "global_step": 10530, + "learning_rate": 0.0004568864774624374, + "loss": 1.7097, + "loss_base2": 2.4666, + "loss_pixel": 0.2529, + "loss_text": 1.4568, + "ppl": 5.5273, + "step": 10530 + }, + { + "epoch": 0.06, + "global_step": 10531, + "learning_rate": 0.00045688230383973287, + "loss": 1.7141, + "loss_base2": 2.4729, + "loss_pixel": 0.2532, + "loss_text": 1.4609, + "ppl": 5.5517, + "step": 10531 + }, + { + "epoch": 0.06, + "global_step": 10532, + "learning_rate": 0.0004568781302170284, + "loss": 1.7352, + "loss_base2": 2.5034, + "loss_pixel": 0.2512, + "loss_text": 1.4841, + "ppl": 5.6701, + "step": 10532 + }, + { + "epoch": 0.06, + "global_step": 10533, + "learning_rate": 0.0004568739565943239, + "loss": 1.723, + "loss_base2": 2.4858, + "loss_pixel": 0.2513, + "loss_text": 1.4717, + "ppl": 5.6013, + "step": 10533 + }, + { + "epoch": 0.06, + "global_step": 10534, + "learning_rate": 0.00045686978297161934, + "loss": 1.7108, + "loss_base2": 2.4682, + "loss_pixel": 0.2513, + "loss_text": 1.4594, + "ppl": 5.5334, + "step": 10534 + }, + { + "epoch": 0.06, + "global_step": 10535, + "learning_rate": 0.00045686560934891484, + "loss": 1.7348, + "loss_base2": 2.5028, + "loss_pixel": 0.2506, + "loss_text": 1.4843, + "ppl": 5.6678, + "step": 10535 + }, + { + "epoch": 0.06, + "global_step": 10536, + "learning_rate": 0.00045686143572621035, + "loss": 1.7178, + "loss_base2": 2.4783, + "loss_pixel": 0.2498, + "loss_text": 1.468, + "ppl": 5.5723, + "step": 10536 + }, + { + "epoch": 0.06, + "global_step": 10537, + "learning_rate": 0.00045685726210350586, + "loss": 1.7315, + "loss_base2": 2.498, + "loss_pixel": 0.2503, + "loss_text": 1.4812, + "ppl": 5.6491, + "step": 10537 + }, + { + "epoch": 0.06, + "global_step": 10538, + "learning_rate": 0.00045685308848080136, + "loss": 1.7118, + "loss_base2": 2.4696, + "loss_pixel": 0.2495, + "loss_text": 1.4623, + "ppl": 5.5389, + "step": 10538 + }, + { + "epoch": 0.06, + "global_step": 10539, + "learning_rate": 0.0004568489148580968, + "loss": 1.7073, + "loss_base2": 2.4631, + "loss_pixel": 0.248, + "loss_text": 1.4593, + "ppl": 5.5141, + "step": 10539 + }, + { + "epoch": 0.06, + "global_step": 10540, + "learning_rate": 0.0004568447412353923, + "loss": 1.7109, + "loss_base2": 2.4683, + "loss_pixel": 0.2482, + "loss_text": 1.4627, + "ppl": 5.5339, + "step": 10540 + }, + { + "epoch": 0.06, + "global_step": 10541, + "learning_rate": 0.00045684056761268783, + "loss": 1.7247, + "loss_base2": 2.4882, + "loss_pixel": 0.2477, + "loss_text": 1.477, + "ppl": 5.6108, + "step": 10541 + }, + { + "epoch": 0.06, + "global_step": 10542, + "learning_rate": 0.00045683639398998334, + "loss": 1.7056, + "loss_base2": 2.4607, + "loss_pixel": 0.2484, + "loss_text": 1.4573, + "ppl": 5.5047, + "step": 10542 + }, + { + "epoch": 0.06, + "global_step": 10543, + "learning_rate": 0.0004568322203672788, + "loss": 1.7196, + "loss_base2": 2.4809, + "loss_pixel": 0.2488, + "loss_text": 1.4709, + "ppl": 5.5823, + "step": 10543 + }, + { + "epoch": 0.06, + "global_step": 10544, + "learning_rate": 0.0004568280467445743, + "loss": 1.7241, + "loss_base2": 2.4874, + "loss_pixel": 0.2527, + "loss_text": 1.4714, + "ppl": 5.6075, + "step": 10544 + }, + { + "epoch": 0.06, + "global_step": 10545, + "learning_rate": 0.0004568238731218698, + "loss": 1.7596, + "loss_base2": 2.5386, + "loss_pixel": 0.2792, + "loss_text": 1.4804, + "ppl": 5.8101, + "step": 10545 + }, + { + "epoch": 0.06, + "global_step": 10546, + "learning_rate": 0.0004568196994991653, + "loss": 1.7691, + "loss_base2": 2.5523, + "loss_pixel": 0.3199, + "loss_text": 1.4492, + "ppl": 5.8656, + "step": 10546 + }, + { + "epoch": 0.06, + "global_step": 10547, + "learning_rate": 0.0004568155258764608, + "loss": 1.8464, + "loss_base2": 2.6638, + "loss_pixel": 0.3796, + "loss_text": 1.4667, + "ppl": 6.337, + "step": 10547 + }, + { + "epoch": 0.06, + "global_step": 10548, + "learning_rate": 0.0004568113522537563, + "loss": 1.8327, + "loss_base2": 2.644, + "loss_pixel": 0.3599, + "loss_text": 1.4728, + "ppl": 6.2507, + "step": 10548 + }, + { + "epoch": 0.06, + "global_step": 10549, + "learning_rate": 0.0004568071786310518, + "loss": 1.8261, + "loss_base2": 2.6345, + "loss_pixel": 0.3538, + "loss_text": 1.4723, + "ppl": 6.2096, + "step": 10549 + }, + { + "epoch": 0.06, + "global_step": 10550, + "learning_rate": 0.00045680300500834724, + "loss": 1.8144, + "loss_base2": 2.6176, + "loss_pixel": 0.3492, + "loss_text": 1.4653, + "ppl": 6.1374, + "step": 10550 + }, + { + "epoch": 0.06, + "global_step": 10551, + "learning_rate": 0.00045679883138564274, + "loss": 1.8317, + "loss_base2": 2.6426, + "loss_pixel": 0.3426, + "loss_text": 1.4891, + "ppl": 6.2445, + "step": 10551 + }, + { + "epoch": 0.06, + "global_step": 10552, + "learning_rate": 0.0004567946577629382, + "loss": 1.8194, + "loss_base2": 2.6248, + "loss_pixel": 0.3403, + "loss_text": 1.4792, + "ppl": 6.1682, + "step": 10552 + }, + { + "epoch": 0.06, + "global_step": 10553, + "learning_rate": 0.0004567904841402337, + "loss": 1.8163, + "loss_base2": 2.6204, + "loss_pixel": 0.3343, + "loss_text": 1.482, + "ppl": 6.1491, + "step": 10553 + }, + { + "epoch": 0.06, + "global_step": 10554, + "learning_rate": 0.0004567863105175292, + "loss": 1.7965, + "loss_base2": 2.5918, + "loss_pixel": 0.3263, + "loss_text": 1.4702, + "ppl": 6.0285, + "step": 10554 + }, + { + "epoch": 0.06, + "global_step": 10555, + "learning_rate": 0.0004567821368948247, + "loss": 1.7893, + "loss_base2": 2.5814, + "loss_pixel": 0.3231, + "loss_text": 1.4662, + "ppl": 5.9853, + "step": 10555 + }, + { + "epoch": 0.06, + "global_step": 10556, + "learning_rate": 0.0004567779632721202, + "loss": 1.7907, + "loss_base2": 2.5834, + "loss_pixel": 0.3207, + "loss_text": 1.47, + "ppl": 5.9936, + "step": 10556 + }, + { + "epoch": 0.06, + "global_step": 10557, + "learning_rate": 0.0004567737896494157, + "loss": 1.5824, + "loss_base2": 2.2829, + "loss_pixel": 0.3213, + "loss_text": 1.2611, + "ppl": 4.8666, + "step": 10557 + }, + { + "epoch": 0.06, + "global_step": 10558, + "learning_rate": 0.0004567696160267112, + "loss": 1.5971, + "loss_base2": 2.3041, + "loss_pixel": 0.342, + "loss_text": 1.255, + "ppl": 4.9387, + "step": 10558 + }, + { + "epoch": 0.06, + "global_step": 10559, + "learning_rate": 0.0004567654424040067, + "loss": 1.588, + "loss_base2": 2.291, + "loss_pixel": 0.3288, + "loss_text": 1.2592, + "ppl": 4.894, + "step": 10559 + }, + { + "epoch": 0.06, + "global_step": 10560, + "learning_rate": 0.0004567612687813022, + "loss": 1.5944, + "loss_base2": 2.3002, + "loss_pixel": 0.3258, + "loss_text": 1.2686, + "ppl": 4.9254, + "step": 10560 + }, + { + "epoch": 0.06, + "global_step": 10561, + "learning_rate": 0.00045675709515859765, + "loss": 1.5675, + "loss_base2": 2.2614, + "loss_pixel": 0.3188, + "loss_text": 1.2487, + "ppl": 4.7946, + "step": 10561 + }, + { + "epoch": 0.06, + "global_step": 10562, + "learning_rate": 0.00045675292153589316, + "loss": 1.5624, + "loss_base2": 2.2541, + "loss_pixel": 0.3135, + "loss_text": 1.2489, + "ppl": 4.7703, + "step": 10562 + }, + { + "epoch": 0.06, + "global_step": 10563, + "learning_rate": 0.00045674874791318867, + "loss": 1.5542, + "loss_base2": 2.2422, + "loss_pixel": 0.3096, + "loss_text": 1.2445, + "ppl": 4.7313, + "step": 10563 + }, + { + "epoch": 0.06, + "global_step": 10564, + "learning_rate": 0.0004567445742904842, + "loss": 1.5481, + "loss_base2": 2.2334, + "loss_pixel": 0.3044, + "loss_text": 1.2437, + "ppl": 4.7025, + "step": 10564 + }, + { + "epoch": 0.06, + "global_step": 10565, + "learning_rate": 0.0004567404006677797, + "loss": 1.5298, + "loss_base2": 2.207, + "loss_pixel": 0.3016, + "loss_text": 1.2281, + "ppl": 4.6173, + "step": 10565 + }, + { + "epoch": 0.06, + "global_step": 10566, + "learning_rate": 0.00045673622704507514, + "loss": 1.5463, + "loss_base2": 2.2308, + "loss_pixel": 0.2983, + "loss_text": 1.2481, + "ppl": 4.6941, + "step": 10566 + }, + { + "epoch": 0.06, + "global_step": 10567, + "learning_rate": 0.00045673205342237064, + "loss": 1.5436, + "loss_base2": 2.2269, + "loss_pixel": 0.2965, + "loss_text": 1.2471, + "ppl": 4.6814, + "step": 10567 + }, + { + "epoch": 0.06, + "global_step": 10568, + "learning_rate": 0.00045672787979966615, + "loss": 1.5376, + "loss_base2": 2.2183, + "loss_pixel": 0.2958, + "loss_text": 1.2418, + "ppl": 4.6534, + "step": 10568 + }, + { + "epoch": 0.06, + "global_step": 10569, + "learning_rate": 0.0004567237061769616, + "loss": 1.5439, + "loss_base2": 2.2274, + "loss_pixel": 0.2924, + "loss_text": 1.2515, + "ppl": 4.6828, + "step": 10569 + }, + { + "epoch": 0.06, + "global_step": 10570, + "learning_rate": 0.00045671953255425706, + "loss": 1.5282, + "loss_base2": 2.2047, + "loss_pixel": 0.291, + "loss_text": 1.2372, + "ppl": 4.6099, + "step": 10570 + }, + { + "epoch": 0.06, + "global_step": 10571, + "learning_rate": 0.00045671535893155256, + "loss": 1.5225, + "loss_base2": 2.1965, + "loss_pixel": 0.2898, + "loss_text": 1.2327, + "ppl": 4.5837, + "step": 10571 + }, + { + "epoch": 0.06, + "global_step": 10572, + "learning_rate": 0.00045671118530884807, + "loss": 1.5417, + "loss_base2": 2.2242, + "loss_pixel": 0.2894, + "loss_text": 1.2524, + "ppl": 4.6725, + "step": 10572 + }, + { + "epoch": 0.06, + "global_step": 10573, + "learning_rate": 0.0004567070116861436, + "loss": 1.6066, + "loss_base2": 2.3178, + "loss_pixel": 0.2896, + "loss_text": 1.3169, + "ppl": 4.9858, + "step": 10573 + }, + { + "epoch": 0.06, + "global_step": 10574, + "learning_rate": 0.0004567028380634391, + "loss": 1.756, + "loss_base2": 2.5334, + "loss_pixel": 0.2894, + "loss_text": 1.4666, + "ppl": 5.7892, + "step": 10574 + }, + { + "epoch": 0.06, + "global_step": 10575, + "learning_rate": 0.00045669866444073454, + "loss": 1.7856, + "loss_base2": 2.5761, + "loss_pixel": 0.2874, + "loss_text": 1.4982, + "ppl": 5.9632, + "step": 10575 + }, + { + "epoch": 0.06, + "global_step": 10576, + "learning_rate": 0.00045669449081803005, + "loss": 1.7728, + "loss_base2": 2.5576, + "loss_pixel": 0.2832, + "loss_text": 1.4896, + "ppl": 5.8873, + "step": 10576 + }, + { + "epoch": 0.06, + "global_step": 10577, + "learning_rate": 0.00045669031719532555, + "loss": 1.7521, + "loss_base2": 2.5277, + "loss_pixel": 0.2816, + "loss_text": 1.4705, + "ppl": 5.7667, + "step": 10577 + }, + { + "epoch": 0.06, + "global_step": 10578, + "learning_rate": 0.00045668614357262106, + "loss": 1.7683, + "loss_base2": 2.5511, + "loss_pixel": 0.2806, + "loss_text": 1.4877, + "ppl": 5.8609, + "step": 10578 + }, + { + "epoch": 0.06, + "global_step": 10579, + "learning_rate": 0.00045668196994991657, + "loss": 1.7499, + "loss_base2": 2.5246, + "loss_pixel": 0.2767, + "loss_text": 1.4732, + "ppl": 5.754, + "step": 10579 + }, + { + "epoch": 0.06, + "global_step": 10580, + "learning_rate": 0.000456677796327212, + "loss": 1.7536, + "loss_base2": 2.5299, + "loss_pixel": 0.2786, + "loss_text": 1.475, + "ppl": 5.7754, + "step": 10580 + }, + { + "epoch": 0.06, + "global_step": 10581, + "learning_rate": 0.00045667362270450753, + "loss": 1.7471, + "loss_base2": 2.5205, + "loss_pixel": 0.2763, + "loss_text": 1.4708, + "ppl": 5.7379, + "step": 10581 + }, + { + "epoch": 0.06, + "global_step": 10582, + "learning_rate": 0.00045666944908180304, + "loss": 1.7572, + "loss_base2": 2.5351, + "loss_pixel": 0.2738, + "loss_text": 1.4834, + "ppl": 5.7962, + "step": 10582 + }, + { + "epoch": 0.06, + "global_step": 10583, + "learning_rate": 0.00045666527545909854, + "loss": 1.7518, + "loss_base2": 2.5273, + "loss_pixel": 0.272, + "loss_text": 1.4798, + "ppl": 5.765, + "step": 10583 + }, + { + "epoch": 0.06, + "global_step": 10584, + "learning_rate": 0.000456661101836394, + "loss": 1.7487, + "loss_base2": 2.5228, + "loss_pixel": 0.2712, + "loss_text": 1.4774, + "ppl": 5.7471, + "step": 10584 + }, + { + "epoch": 0.06, + "global_step": 10585, + "learning_rate": 0.0004566569282136895, + "loss": 1.7455, + "loss_base2": 2.5182, + "loss_pixel": 0.2705, + "loss_text": 1.475, + "ppl": 5.7288, + "step": 10585 + }, + { + "epoch": 0.06, + "global_step": 10586, + "learning_rate": 0.000456652754590985, + "loss": 1.737, + "loss_base2": 2.506, + "loss_pixel": 0.2718, + "loss_text": 1.4651, + "ppl": 5.6803, + "step": 10586 + }, + { + "epoch": 0.06, + "global_step": 10587, + "learning_rate": 0.00045664858096828046, + "loss": 1.7523, + "loss_base2": 2.528, + "loss_pixel": 0.2713, + "loss_text": 1.481, + "ppl": 5.7679, + "step": 10587 + }, + { + "epoch": 0.06, + "global_step": 10588, + "learning_rate": 0.00045664440734557597, + "loss": 1.7348, + "loss_base2": 2.5028, + "loss_pixel": 0.2683, + "loss_text": 1.4666, + "ppl": 5.6678, + "step": 10588 + }, + { + "epoch": 0.06, + "global_step": 10589, + "learning_rate": 0.0004566402337228714, + "loss": 1.7446, + "loss_base2": 2.5169, + "loss_pixel": 0.2694, + "loss_text": 1.4752, + "ppl": 5.7236, + "step": 10589 + }, + { + "epoch": 0.06, + "global_step": 10590, + "learning_rate": 0.00045663606010016693, + "loss": 1.7414, + "loss_base2": 2.5123, + "loss_pixel": 0.2688, + "loss_text": 1.4726, + "ppl": 5.7053, + "step": 10590 + }, + { + "epoch": 0.06, + "global_step": 10591, + "learning_rate": 0.00045663188647746244, + "loss": 1.7415, + "loss_base2": 2.5125, + "loss_pixel": 0.2676, + "loss_text": 1.474, + "ppl": 5.7059, + "step": 10591 + }, + { + "epoch": 0.06, + "global_step": 10592, + "learning_rate": 0.00045662771285475795, + "loss": 1.7263, + "loss_base2": 2.4905, + "loss_pixel": 0.2654, + "loss_text": 1.4609, + "ppl": 5.6198, + "step": 10592 + }, + { + "epoch": 0.06, + "global_step": 10593, + "learning_rate": 0.0004566235392320534, + "loss": 1.7308, + "loss_base2": 2.497, + "loss_pixel": 0.2648, + "loss_text": 1.4661, + "ppl": 5.6452, + "step": 10593 + }, + { + "epoch": 0.06, + "global_step": 10594, + "learning_rate": 0.0004566193656093489, + "loss": 1.7165, + "loss_base2": 2.4764, + "loss_pixel": 0.2622, + "loss_text": 1.4543, + "ppl": 5.565, + "step": 10594 + }, + { + "epoch": 0.06, + "global_step": 10595, + "learning_rate": 0.0004566151919866444, + "loss": 1.7194, + "loss_base2": 2.4806, + "loss_pixel": 0.2614, + "loss_text": 1.458, + "ppl": 5.5812, + "step": 10595 + }, + { + "epoch": 0.06, + "global_step": 10596, + "learning_rate": 0.0004566110183639399, + "loss": 1.7447, + "loss_base2": 2.5171, + "loss_pixel": 0.2629, + "loss_text": 1.4818, + "ppl": 5.7242, + "step": 10596 + }, + { + "epoch": 0.06, + "global_step": 10597, + "learning_rate": 0.00045660684474123543, + "loss": 1.7387, + "loss_base2": 2.5084, + "loss_pixel": 0.2588, + "loss_text": 1.4799, + "ppl": 5.6899, + "step": 10597 + }, + { + "epoch": 0.06, + "global_step": 10598, + "learning_rate": 0.0004566026711185309, + "loss": 1.7133, + "loss_base2": 2.4718, + "loss_pixel": 0.2574, + "loss_text": 1.4559, + "ppl": 5.5472, + "step": 10598 + }, + { + "epoch": 0.06, + "global_step": 10599, + "learning_rate": 0.0004565984974958264, + "loss": 1.7182, + "loss_base2": 2.4788, + "loss_pixel": 0.2568, + "loss_text": 1.4614, + "ppl": 5.5745, + "step": 10599 + }, + { + "epoch": 0.06, + "global_step": 10600, + "learning_rate": 0.0004565943238731219, + "loss": 1.7252, + "loss_base2": 2.4889, + "loss_pixel": 0.2557, + "loss_text": 1.4695, + "ppl": 5.6136, + "step": 10600 + }, + { + "epoch": 0.06, + "global_step": 10601, + "learning_rate": 0.0004565901502504174, + "loss": 1.7186, + "loss_base2": 2.4794, + "loss_pixel": 0.2547, + "loss_text": 1.4639, + "ppl": 5.5767, + "step": 10601 + }, + { + "epoch": 0.06, + "global_step": 10602, + "learning_rate": 0.00045658597662771286, + "loss": 1.7411, + "loss_base2": 2.5119, + "loss_pixel": 0.2543, + "loss_text": 1.4867, + "ppl": 5.7036, + "step": 10602 + }, + { + "epoch": 0.06, + "global_step": 10603, + "learning_rate": 0.00045658180300500836, + "loss": 1.7369, + "loss_base2": 2.5058, + "loss_pixel": 0.2551, + "loss_text": 1.4818, + "ppl": 5.6797, + "step": 10603 + }, + { + "epoch": 0.06, + "global_step": 10604, + "learning_rate": 0.00045657762938230387, + "loss": 1.7118, + "loss_base2": 2.4696, + "loss_pixel": 0.2525, + "loss_text": 1.4592, + "ppl": 5.5389, + "step": 10604 + }, + { + "epoch": 0.06, + "global_step": 10605, + "learning_rate": 0.0004565734557595994, + "loss": 1.729, + "loss_base2": 2.4944, + "loss_pixel": 0.2525, + "loss_text": 1.4765, + "ppl": 5.635, + "step": 10605 + }, + { + "epoch": 0.06, + "global_step": 10606, + "learning_rate": 0.00045656928213689483, + "loss": 1.7362, + "loss_base2": 2.5048, + "loss_pixel": 0.252, + "loss_text": 1.4842, + "ppl": 5.6757, + "step": 10606 + }, + { + "epoch": 0.06, + "global_step": 10607, + "learning_rate": 0.0004565651085141903, + "loss": 1.7222, + "loss_base2": 2.4846, + "loss_pixel": 0.2514, + "loss_text": 1.4708, + "ppl": 5.5968, + "step": 10607 + }, + { + "epoch": 0.06, + "global_step": 10608, + "learning_rate": 0.0004565609348914858, + "loss": 1.7312, + "loss_base2": 2.4976, + "loss_pixel": 0.2512, + "loss_text": 1.48, + "ppl": 5.6474, + "step": 10608 + }, + { + "epoch": 0.06, + "global_step": 10609, + "learning_rate": 0.0004565567612687813, + "loss": 1.7232, + "loss_base2": 2.4861, + "loss_pixel": 0.2568, + "loss_text": 1.4664, + "ppl": 5.6024, + "step": 10609 + }, + { + "epoch": 0.06, + "global_step": 10610, + "learning_rate": 0.0004565525876460768, + "loss": 1.7655, + "loss_base2": 2.5471, + "loss_pixel": 0.2763, + "loss_text": 1.4892, + "ppl": 5.8445, + "step": 10610 + }, + { + "epoch": 0.06, + "global_step": 10611, + "learning_rate": 0.00045654841402337226, + "loss": 1.7509, + "loss_base2": 2.526, + "loss_pixel": 0.2814, + "loss_text": 1.4695, + "ppl": 5.7598, + "step": 10611 + }, + { + "epoch": 0.06, + "global_step": 10612, + "learning_rate": 0.00045654424040066777, + "loss": 1.7631, + "loss_base2": 2.5436, + "loss_pixel": 0.2896, + "loss_text": 1.4735, + "ppl": 5.8305, + "step": 10612 + }, + { + "epoch": 0.06, + "global_step": 10613, + "learning_rate": 0.0004565400667779633, + "loss": 1.7507, + "loss_base2": 2.5257, + "loss_pixel": 0.2838, + "loss_text": 1.4669, + "ppl": 5.7586, + "step": 10613 + }, + { + "epoch": 0.06, + "global_step": 10614, + "learning_rate": 0.0004565358931552588, + "loss": 1.7255, + "loss_base2": 2.4894, + "loss_pixel": 0.282, + "loss_text": 1.4435, + "ppl": 5.6153, + "step": 10614 + }, + { + "epoch": 0.06, + "global_step": 10615, + "learning_rate": 0.0004565317195325543, + "loss": 1.7578, + "loss_base2": 2.536, + "loss_pixel": 0.273, + "loss_text": 1.4848, + "ppl": 5.7997, + "step": 10615 + }, + { + "epoch": 0.06, + "global_step": 10616, + "learning_rate": 0.00045652754590984974, + "loss": 1.7353, + "loss_base2": 2.5035, + "loss_pixel": 0.2726, + "loss_text": 1.4628, + "ppl": 5.6706, + "step": 10616 + }, + { + "epoch": 0.06, + "global_step": 10617, + "learning_rate": 0.00045652337228714525, + "loss": 1.7138, + "loss_base2": 2.4725, + "loss_pixel": 0.2717, + "loss_text": 1.4421, + "ppl": 5.55, + "step": 10617 + }, + { + "epoch": 0.06, + "global_step": 10618, + "learning_rate": 0.00045651919866444076, + "loss": 1.512, + "loss_base2": 2.1814, + "loss_pixel": 0.27, + "loss_text": 1.242, + "ppl": 4.5358, + "step": 10618 + }, + { + "epoch": 0.06, + "global_step": 10619, + "learning_rate": 0.00045651502504173627, + "loss": 1.5387, + "loss_base2": 2.2199, + "loss_pixel": 0.268, + "loss_text": 1.2707, + "ppl": 4.6585, + "step": 10619 + }, + { + "epoch": 0.06, + "global_step": 10620, + "learning_rate": 0.0004565108514190317, + "loss": 1.5212, + "loss_base2": 2.1946, + "loss_pixel": 0.2657, + "loss_text": 1.2555, + "ppl": 4.5777, + "step": 10620 + }, + { + "epoch": 0.06, + "global_step": 10621, + "learning_rate": 0.0004565066777963272, + "loss": 1.5156, + "loss_base2": 2.1865, + "loss_pixel": 0.2651, + "loss_text": 1.2506, + "ppl": 4.5522, + "step": 10621 + }, + { + "epoch": 0.06, + "global_step": 10622, + "learning_rate": 0.00045650250417362273, + "loss": 1.5156, + "loss_base2": 2.1865, + "loss_pixel": 0.2632, + "loss_text": 1.2523, + "ppl": 4.5522, + "step": 10622 + }, + { + "epoch": 0.06, + "global_step": 10623, + "learning_rate": 0.00045649833055091824, + "loss": 1.5092, + "loss_base2": 2.1773, + "loss_pixel": 0.2616, + "loss_text": 1.2476, + "ppl": 4.5231, + "step": 10623 + }, + { + "epoch": 0.06, + "global_step": 10624, + "learning_rate": 0.00045649415692821375, + "loss": 1.4987, + "loss_base2": 2.1622, + "loss_pixel": 0.2612, + "loss_text": 1.2375, + "ppl": 4.4759, + "step": 10624 + }, + { + "epoch": 0.06, + "global_step": 10625, + "learning_rate": 0.00045648998330550915, + "loss": 1.4981, + "loss_base2": 2.1613, + "loss_pixel": 0.2603, + "loss_text": 1.2379, + "ppl": 4.4732, + "step": 10625 + }, + { + "epoch": 0.06, + "global_step": 10626, + "learning_rate": 0.00045648580968280465, + "loss": 1.4929, + "loss_base2": 2.1538, + "loss_pixel": 0.2592, + "loss_text": 1.2336, + "ppl": 4.45, + "step": 10626 + }, + { + "epoch": 0.06, + "global_step": 10627, + "learning_rate": 0.00045648163606010016, + "loss": 1.5179, + "loss_base2": 2.1899, + "loss_pixel": 0.2573, + "loss_text": 1.2605, + "ppl": 4.5626, + "step": 10627 + }, + { + "epoch": 0.06, + "global_step": 10628, + "learning_rate": 0.00045647746243739567, + "loss": 1.5057, + "loss_base2": 2.1723, + "loss_pixel": 0.2561, + "loss_text": 1.2496, + "ppl": 4.5073, + "step": 10628 + }, + { + "epoch": 0.06, + "global_step": 10629, + "learning_rate": 0.0004564732888146911, + "loss": 1.5066, + "loss_base2": 2.1736, + "loss_pixel": 0.255, + "loss_text": 1.2516, + "ppl": 4.5114, + "step": 10629 + }, + { + "epoch": 0.06, + "global_step": 10630, + "learning_rate": 0.00045646911519198663, + "loss": 1.5157, + "loss_base2": 2.1867, + "loss_pixel": 0.2539, + "loss_text": 1.2618, + "ppl": 4.5526, + "step": 10630 + }, + { + "epoch": 0.06, + "global_step": 10631, + "learning_rate": 0.00045646494156928214, + "loss": 1.4895, + "loss_base2": 2.1489, + "loss_pixel": 0.2538, + "loss_text": 1.2357, + "ppl": 4.4349, + "step": 10631 + }, + { + "epoch": 0.06, + "global_step": 10632, + "learning_rate": 0.00045646076794657764, + "loss": 1.4969, + "loss_base2": 2.1596, + "loss_pixel": 0.2532, + "loss_text": 1.2437, + "ppl": 4.4678, + "step": 10632 + }, + { + "epoch": 0.06, + "global_step": 10633, + "learning_rate": 0.00045645659432387315, + "loss": 1.4854, + "loss_base2": 2.143, + "loss_pixel": 0.2519, + "loss_text": 1.2335, + "ppl": 4.4167, + "step": 10633 + }, + { + "epoch": 0.06, + "global_step": 10634, + "learning_rate": 0.0004564524207011686, + "loss": 1.5032, + "loss_base2": 2.1687, + "loss_pixel": 0.2511, + "loss_text": 1.2521, + "ppl": 4.4961, + "step": 10634 + }, + { + "epoch": 0.06, + "global_step": 10635, + "learning_rate": 0.0004564482470784641, + "loss": 1.4914, + "loss_base2": 2.1516, + "loss_pixel": 0.2499, + "loss_text": 1.2415, + "ppl": 4.4433, + "step": 10635 + }, + { + "epoch": 0.06, + "global_step": 10636, + "learning_rate": 0.0004564440734557596, + "loss": 1.5221, + "loss_base2": 2.1959, + "loss_pixel": 0.2494, + "loss_text": 1.2727, + "ppl": 4.5818, + "step": 10636 + }, + { + "epoch": 0.06, + "global_step": 10637, + "learning_rate": 0.0004564398998330551, + "loss": 1.5158, + "loss_base2": 2.1868, + "loss_pixel": 0.2488, + "loss_text": 1.2671, + "ppl": 4.5531, + "step": 10637 + }, + { + "epoch": 0.06, + "global_step": 10638, + "learning_rate": 0.00045643572621035063, + "loss": 1.4844, + "loss_base2": 2.1415, + "loss_pixel": 0.2483, + "loss_text": 1.236, + "ppl": 4.4123, + "step": 10638 + }, + { + "epoch": 0.06, + "global_step": 10639, + "learning_rate": 0.0004564315525876461, + "loss": 1.4735, + "loss_base2": 2.1258, + "loss_pixel": 0.249, + "loss_text": 1.2245, + "ppl": 4.3645, + "step": 10639 + }, + { + "epoch": 0.06, + "global_step": 10640, + "learning_rate": 0.0004564273789649416, + "loss": 1.4677, + "loss_base2": 2.1174, + "loss_pixel": 0.2489, + "loss_text": 1.2188, + "ppl": 4.3392, + "step": 10640 + }, + { + "epoch": 0.06, + "global_step": 10641, + "learning_rate": 0.0004564232053422371, + "loss": 1.582, + "loss_base2": 2.2823, + "loss_pixel": 0.2504, + "loss_text": 1.3317, + "ppl": 4.8647, + "step": 10641 + }, + { + "epoch": 0.06, + "global_step": 10642, + "learning_rate": 0.0004564190317195326, + "loss": 1.7349, + "loss_base2": 2.5029, + "loss_pixel": 0.2511, + "loss_text": 1.4837, + "ppl": 5.6684, + "step": 10642 + }, + { + "epoch": 0.06, + "global_step": 10643, + "learning_rate": 0.000456414858096828, + "loss": 1.7216, + "loss_base2": 2.4837, + "loss_pixel": 0.2491, + "loss_text": 1.4725, + "ppl": 5.5935, + "step": 10643 + }, + { + "epoch": 0.06, + "global_step": 10644, + "learning_rate": 0.0004564106844741235, + "loss": 1.7191, + "loss_base2": 2.4801, + "loss_pixel": 0.2503, + "loss_text": 1.4688, + "ppl": 5.5795, + "step": 10644 + }, + { + "epoch": 0.06, + "global_step": 10645, + "learning_rate": 0.000456406510851419, + "loss": 1.7373, + "loss_base2": 2.5064, + "loss_pixel": 0.2471, + "loss_text": 1.4901, + "ppl": 5.682, + "step": 10645 + }, + { + "epoch": 0.06, + "global_step": 10646, + "learning_rate": 0.00045640233722871453, + "loss": 1.7196, + "loss_base2": 2.4809, + "loss_pixel": 0.2471, + "loss_text": 1.4725, + "ppl": 5.5823, + "step": 10646 + }, + { + "epoch": 0.06, + "global_step": 10647, + "learning_rate": 0.00045639816360601004, + "loss": 1.7216, + "loss_base2": 2.4837, + "loss_pixel": 0.2465, + "loss_text": 1.4751, + "ppl": 5.5935, + "step": 10647 + }, + { + "epoch": 0.06, + "global_step": 10648, + "learning_rate": 0.0004563939899833055, + "loss": 1.7203, + "loss_base2": 2.4819, + "loss_pixel": 0.2458, + "loss_text": 1.4746, + "ppl": 5.5862, + "step": 10648 + }, + { + "epoch": 0.06, + "global_step": 10649, + "learning_rate": 0.000456389816360601, + "loss": 1.7082, + "loss_base2": 2.4644, + "loss_pixel": 0.245, + "loss_text": 1.4633, + "ppl": 5.519, + "step": 10649 + }, + { + "epoch": 0.06, + "global_step": 10650, + "learning_rate": 0.0004563856427378965, + "loss": 1.722, + "loss_base2": 2.4843, + "loss_pixel": 0.2443, + "loss_text": 1.4778, + "ppl": 5.5957, + "step": 10650 + }, + { + "epoch": 0.06, + "global_step": 10651, + "learning_rate": 0.000456381469115192, + "loss": 1.7276, + "loss_base2": 2.4924, + "loss_pixel": 0.2451, + "loss_text": 1.4825, + "ppl": 5.6271, + "step": 10651 + }, + { + "epoch": 0.06, + "global_step": 10652, + "learning_rate": 0.00045637729549248746, + "loss": 1.7399, + "loss_base2": 2.5101, + "loss_pixel": 0.2432, + "loss_text": 1.4967, + "ppl": 5.6968, + "step": 10652 + }, + { + "epoch": 0.06, + "global_step": 10653, + "learning_rate": 0.00045637312186978297, + "loss": 1.7145, + "loss_base2": 2.4735, + "loss_pixel": 0.2432, + "loss_text": 1.4713, + "ppl": 5.5539, + "step": 10653 + }, + { + "epoch": 0.06, + "global_step": 10654, + "learning_rate": 0.0004563689482470785, + "loss": 1.7277, + "loss_base2": 2.4925, + "loss_pixel": 0.2424, + "loss_text": 1.4853, + "ppl": 5.6277, + "step": 10654 + }, + { + "epoch": 0.06, + "global_step": 10655, + "learning_rate": 0.000456364774624374, + "loss": 1.7076, + "loss_base2": 2.4635, + "loss_pixel": 0.2433, + "loss_text": 1.4644, + "ppl": 5.5157, + "step": 10655 + }, + { + "epoch": 0.06, + "global_step": 10656, + "learning_rate": 0.0004563606010016695, + "loss": 1.7001, + "loss_base2": 2.4527, + "loss_pixel": 0.2415, + "loss_text": 1.4586, + "ppl": 5.4745, + "step": 10656 + }, + { + "epoch": 0.06, + "global_step": 10657, + "learning_rate": 0.00045635642737896495, + "loss": 1.7142, + "loss_base2": 2.4731, + "loss_pixel": 0.2411, + "loss_text": 1.4731, + "ppl": 5.5522, + "step": 10657 + }, + { + "epoch": 0.06, + "global_step": 10658, + "learning_rate": 0.00045635225375626045, + "loss": 1.7217, + "loss_base2": 2.4839, + "loss_pixel": 0.2412, + "loss_text": 1.4805, + "ppl": 5.594, + "step": 10658 + }, + { + "epoch": 0.06, + "global_step": 10659, + "learning_rate": 0.00045634808013355596, + "loss": 1.7165, + "loss_base2": 2.4764, + "loss_pixel": 0.2414, + "loss_text": 1.4751, + "ppl": 5.565, + "step": 10659 + }, + { + "epoch": 0.06, + "global_step": 10660, + "learning_rate": 0.00045634390651085147, + "loss": 1.7102, + "loss_base2": 2.4673, + "loss_pixel": 0.2411, + "loss_text": 1.4691, + "ppl": 5.5301, + "step": 10660 + }, + { + "epoch": 0.06, + "global_step": 10661, + "learning_rate": 0.0004563397328881469, + "loss": 1.7106, + "loss_base2": 2.4679, + "loss_pixel": 0.2411, + "loss_text": 1.4695, + "ppl": 5.5323, + "step": 10661 + }, + { + "epoch": 0.06, + "global_step": 10662, + "learning_rate": 0.0004563355592654424, + "loss": 1.7024, + "loss_base2": 2.456, + "loss_pixel": 0.2391, + "loss_text": 1.4633, + "ppl": 5.4871, + "step": 10662 + }, + { + "epoch": 0.06, + "global_step": 10663, + "learning_rate": 0.0004563313856427379, + "loss": 1.72, + "loss_base2": 2.4814, + "loss_pixel": 0.2406, + "loss_text": 1.4794, + "ppl": 5.5845, + "step": 10663 + }, + { + "epoch": 0.06, + "global_step": 10664, + "learning_rate": 0.0004563272120200334, + "loss": 1.6982, + "loss_base2": 2.45, + "loss_pixel": 0.2413, + "loss_text": 1.4568, + "ppl": 5.4641, + "step": 10664 + }, + { + "epoch": 0.06, + "global_step": 10665, + "learning_rate": 0.0004563230383973289, + "loss": 1.5953, + "loss_base2": 2.3015, + "loss_pixel": 0.2387, + "loss_text": 1.3565, + "ppl": 4.9298, + "step": 10665 + }, + { + "epoch": 0.06, + "global_step": 10666, + "learning_rate": 0.00045631886477462435, + "loss": 1.4796, + "loss_base2": 2.1346, + "loss_pixel": 0.2388, + "loss_text": 1.2408, + "ppl": 4.3912, + "step": 10666 + }, + { + "epoch": 0.06, + "global_step": 10667, + "learning_rate": 0.00045631469115191986, + "loss": 1.4823, + "loss_base2": 2.1385, + "loss_pixel": 0.238, + "loss_text": 1.2443, + "ppl": 4.4031, + "step": 10667 + }, + { + "epoch": 0.06, + "global_step": 10668, + "learning_rate": 0.00045631051752921536, + "loss": 1.5015, + "loss_base2": 2.1662, + "loss_pixel": 0.2378, + "loss_text": 1.2638, + "ppl": 4.4884, + "step": 10668 + }, + { + "epoch": 0.06, + "global_step": 10669, + "learning_rate": 0.00045630634390651087, + "loss": 1.4906, + "loss_base2": 2.1505, + "loss_pixel": 0.2372, + "loss_text": 1.2534, + "ppl": 4.4398, + "step": 10669 + }, + { + "epoch": 0.06, + "global_step": 10670, + "learning_rate": 0.0004563021702838063, + "loss": 1.4972, + "loss_base2": 2.16, + "loss_pixel": 0.2367, + "loss_text": 1.2605, + "ppl": 4.4692, + "step": 10670 + }, + { + "epoch": 0.06, + "global_step": 10671, + "learning_rate": 0.00045629799666110183, + "loss": 1.4838, + "loss_base2": 2.1407, + "loss_pixel": 0.2378, + "loss_text": 1.246, + "ppl": 4.4097, + "step": 10671 + }, + { + "epoch": 0.06, + "global_step": 10672, + "learning_rate": 0.00045629382303839734, + "loss": 1.4666, + "loss_base2": 2.1159, + "loss_pixel": 0.2364, + "loss_text": 1.2302, + "ppl": 4.3345, + "step": 10672 + }, + { + "epoch": 0.06, + "global_step": 10673, + "learning_rate": 0.00045628964941569285, + "loss": 1.4605, + "loss_base2": 2.1071, + "loss_pixel": 0.236, + "loss_text": 1.2245, + "ppl": 4.3081, + "step": 10673 + }, + { + "epoch": 0.06, + "global_step": 10674, + "learning_rate": 0.00045628547579298835, + "loss": 1.4709, + "loss_base2": 2.1221, + "loss_pixel": 0.2371, + "loss_text": 1.2338, + "ppl": 4.3532, + "step": 10674 + }, + { + "epoch": 0.06, + "global_step": 10675, + "learning_rate": 0.0004562813021702838, + "loss": 1.4676, + "loss_base2": 2.1173, + "loss_pixel": 0.2358, + "loss_text": 1.2318, + "ppl": 4.3388, + "step": 10675 + }, + { + "epoch": 0.06, + "global_step": 10676, + "learning_rate": 0.0004562771285475793, + "loss": 1.4657, + "loss_base2": 2.1146, + "loss_pixel": 0.2344, + "loss_text": 1.2313, + "ppl": 4.3306, + "step": 10676 + }, + { + "epoch": 0.06, + "global_step": 10677, + "learning_rate": 0.0004562729549248748, + "loss": 1.502, + "loss_base2": 2.1669, + "loss_pixel": 0.235, + "loss_text": 1.267, + "ppl": 4.4907, + "step": 10677 + }, + { + "epoch": 0.06, + "global_step": 10678, + "learning_rate": 0.00045626878130217033, + "loss": 1.4787, + "loss_base2": 2.1333, + "loss_pixel": 0.2359, + "loss_text": 1.2428, + "ppl": 4.3872, + "step": 10678 + }, + { + "epoch": 0.06, + "global_step": 10679, + "learning_rate": 0.0004562646076794658, + "loss": 1.4702, + "loss_base2": 2.1211, + "loss_pixel": 0.2355, + "loss_text": 1.2347, + "ppl": 4.3501, + "step": 10679 + }, + { + "epoch": 0.06, + "global_step": 10680, + "learning_rate": 0.0004562604340567613, + "loss": 1.4821, + "loss_base2": 2.1382, + "loss_pixel": 0.237, + "loss_text": 1.2452, + "ppl": 4.4022, + "step": 10680 + }, + { + "epoch": 0.06, + "global_step": 10681, + "learning_rate": 0.00045625626043405674, + "loss": 1.4825, + "loss_base2": 2.1388, + "loss_pixel": 0.2375, + "loss_text": 1.245, + "ppl": 4.4039, + "step": 10681 + }, + { + "epoch": 0.06, + "global_step": 10682, + "learning_rate": 0.00045625208681135225, + "loss": 1.4787, + "loss_base2": 2.1333, + "loss_pixel": 0.2353, + "loss_text": 1.2434, + "ppl": 4.3872, + "step": 10682 + }, + { + "epoch": 0.06, + "global_step": 10683, + "learning_rate": 0.00045624791318864776, + "loss": 1.4644, + "loss_base2": 2.1127, + "loss_pixel": 0.2358, + "loss_text": 1.2286, + "ppl": 4.3249, + "step": 10683 + }, + { + "epoch": 0.06, + "global_step": 10684, + "learning_rate": 0.0004562437395659432, + "loss": 1.4679, + "loss_base2": 2.1177, + "loss_pixel": 0.2354, + "loss_text": 1.2325, + "ppl": 4.3401, + "step": 10684 + }, + { + "epoch": 0.06, + "global_step": 10685, + "learning_rate": 0.0004562395659432387, + "loss": 1.4808, + "loss_base2": 2.1363, + "loss_pixel": 0.2349, + "loss_text": 1.2459, + "ppl": 4.3965, + "step": 10685 + }, + { + "epoch": 0.06, + "global_step": 10686, + "learning_rate": 0.0004562353923205342, + "loss": 1.4728, + "loss_base2": 2.1248, + "loss_pixel": 0.2327, + "loss_text": 1.24, + "ppl": 4.3614, + "step": 10686 + }, + { + "epoch": 0.06, + "global_step": 10687, + "learning_rate": 0.00045623121869782973, + "loss": 1.4679, + "loss_base2": 2.1177, + "loss_pixel": 0.233, + "loss_text": 1.2349, + "ppl": 4.3401, + "step": 10687 + }, + { + "epoch": 0.06, + "global_step": 10688, + "learning_rate": 0.0004562270450751252, + "loss": 1.4817, + "loss_base2": 2.1376, + "loss_pixel": 0.234, + "loss_text": 1.2477, + "ppl": 4.4004, + "step": 10688 + }, + { + "epoch": 0.06, + "global_step": 10689, + "learning_rate": 0.0004562228714524207, + "loss": 1.4761, + "loss_base2": 2.1296, + "loss_pixel": 0.2322, + "loss_text": 1.244, + "ppl": 4.3758, + "step": 10689 + }, + { + "epoch": 0.06, + "global_step": 10690, + "learning_rate": 0.0004562186978297162, + "loss": 1.479, + "loss_base2": 2.1337, + "loss_pixel": 0.2315, + "loss_text": 1.2475, + "ppl": 4.3886, + "step": 10690 + }, + { + "epoch": 0.06, + "global_step": 10691, + "learning_rate": 0.0004562145242070117, + "loss": 1.4602, + "loss_base2": 2.1066, + "loss_pixel": 0.2331, + "loss_text": 1.2271, + "ppl": 4.3068, + "step": 10691 + }, + { + "epoch": 0.06, + "global_step": 10692, + "learning_rate": 0.0004562103505843072, + "loss": 1.4764, + "loss_base2": 2.13, + "loss_pixel": 0.2314, + "loss_text": 1.245, + "ppl": 4.3772, + "step": 10692 + }, + { + "epoch": 0.06, + "global_step": 10693, + "learning_rate": 0.00045620617696160267, + "loss": 1.4757, + "loss_base2": 2.129, + "loss_pixel": 0.2311, + "loss_text": 1.2446, + "ppl": 4.3741, + "step": 10693 + }, + { + "epoch": 0.06, + "global_step": 10694, + "learning_rate": 0.0004562020033388982, + "loss": 1.474, + "loss_base2": 2.1265, + "loss_pixel": 0.2314, + "loss_text": 1.2426, + "ppl": 4.3667, + "step": 10694 + }, + { + "epoch": 0.06, + "global_step": 10695, + "learning_rate": 0.0004561978297161937, + "loss": 1.4659, + "loss_base2": 2.1148, + "loss_pixel": 0.2295, + "loss_text": 1.2364, + "ppl": 4.3314, + "step": 10695 + }, + { + "epoch": 0.06, + "global_step": 10696, + "learning_rate": 0.0004561936560934892, + "loss": 1.4693, + "loss_base2": 2.1198, + "loss_pixel": 0.2291, + "loss_text": 1.2402, + "ppl": 4.3462, + "step": 10696 + }, + { + "epoch": 0.06, + "global_step": 10697, + "learning_rate": 0.0004561894824707847, + "loss": 1.474, + "loss_base2": 2.1265, + "loss_pixel": 0.2285, + "loss_text": 1.2455, + "ppl": 4.3667, + "step": 10697 + }, + { + "epoch": 0.06, + "global_step": 10698, + "learning_rate": 0.00045618530884808015, + "loss": 1.4696, + "loss_base2": 2.1202, + "loss_pixel": 0.2296, + "loss_text": 1.24, + "ppl": 4.3475, + "step": 10698 + }, + { + "epoch": 0.06, + "global_step": 10699, + "learning_rate": 0.00045618113522537566, + "loss": 1.4657, + "loss_base2": 2.1146, + "loss_pixel": 0.2291, + "loss_text": 1.2367, + "ppl": 4.3306, + "step": 10699 + }, + { + "epoch": 0.06, + "global_step": 10700, + "learning_rate": 0.0004561769616026711, + "loss": 1.4463, + "loss_base2": 2.0866, + "loss_pixel": 0.2326, + "loss_text": 1.2137, + "ppl": 4.2474, + "step": 10700 + }, + { + "epoch": 0.06, + "global_step": 10701, + "learning_rate": 0.0004561727879799666, + "loss": 1.4896, + "loss_base2": 2.149, + "loss_pixel": 0.2425, + "loss_text": 1.2471, + "ppl": 4.4353, + "step": 10701 + }, + { + "epoch": 0.06, + "global_step": 10702, + "learning_rate": 0.00045616861435726207, + "loss": 1.5544, + "loss_base2": 2.2425, + "loss_pixel": 0.3154, + "loss_text": 1.239, + "ppl": 4.7322, + "step": 10702 + }, + { + "epoch": 0.06, + "global_step": 10703, + "learning_rate": 0.0004561644407345576, + "loss": 1.5827, + "loss_base2": 2.2834, + "loss_pixel": 0.2927, + "loss_text": 1.2901, + "ppl": 4.8681, + "step": 10703 + }, + { + "epoch": 0.06, + "global_step": 10704, + "learning_rate": 0.0004561602671118531, + "loss": 1.7478, + "loss_base2": 2.5215, + "loss_pixel": 0.2835, + "loss_text": 1.4643, + "ppl": 5.742, + "step": 10704 + }, + { + "epoch": 0.06, + "global_step": 10705, + "learning_rate": 0.0004561560934891486, + "loss": 1.7537, + "loss_base2": 2.5301, + "loss_pixel": 0.2805, + "loss_text": 1.4733, + "ppl": 5.7759, + "step": 10705 + }, + { + "epoch": 0.06, + "global_step": 10706, + "learning_rate": 0.0004561519198664441, + "loss": 1.758, + "loss_base2": 2.5363, + "loss_pixel": 0.2727, + "loss_text": 1.4853, + "ppl": 5.8008, + "step": 10706 + }, + { + "epoch": 0.06, + "global_step": 10707, + "learning_rate": 0.00045614774624373955, + "loss": 1.7584, + "loss_base2": 2.5368, + "loss_pixel": 0.2683, + "loss_text": 1.4901, + "ppl": 5.8031, + "step": 10707 + }, + { + "epoch": 0.06, + "global_step": 10708, + "learning_rate": 0.00045614357262103506, + "loss": 1.7438, + "loss_base2": 2.5158, + "loss_pixel": 0.2639, + "loss_text": 1.4799, + "ppl": 5.719, + "step": 10708 + }, + { + "epoch": 0.06, + "global_step": 10709, + "learning_rate": 0.00045613939899833057, + "loss": 1.7581, + "loss_base2": 2.5364, + "loss_pixel": 0.262, + "loss_text": 1.4961, + "ppl": 5.8014, + "step": 10709 + }, + { + "epoch": 0.06, + "global_step": 10710, + "learning_rate": 0.0004561352253756261, + "loss": 1.7478, + "loss_base2": 2.5215, + "loss_pixel": 0.2618, + "loss_text": 1.486, + "ppl": 5.742, + "step": 10710 + }, + { + "epoch": 0.06, + "global_step": 10711, + "learning_rate": 0.00045613105175292153, + "loss": 1.7306, + "loss_base2": 2.4967, + "loss_pixel": 0.2574, + "loss_text": 1.4732, + "ppl": 5.644, + "step": 10711 + }, + { + "epoch": 0.06, + "global_step": 10712, + "learning_rate": 0.00045612687813021704, + "loss": 1.7507, + "loss_base2": 2.5257, + "loss_pixel": 0.2552, + "loss_text": 1.4956, + "ppl": 5.7586, + "step": 10712 + }, + { + "epoch": 0.06, + "global_step": 10713, + "learning_rate": 0.00045612270450751254, + "loss": 1.7164, + "loss_base2": 2.4762, + "loss_pixel": 0.2539, + "loss_text": 1.4625, + "ppl": 5.5645, + "step": 10713 + }, + { + "epoch": 0.06, + "global_step": 10714, + "learning_rate": 0.00045611853088480805, + "loss": 1.7196, + "loss_base2": 2.4809, + "loss_pixel": 0.2515, + "loss_text": 1.4681, + "ppl": 5.5823, + "step": 10714 + }, + { + "epoch": 0.06, + "global_step": 10715, + "learning_rate": 0.00045611435726210356, + "loss": 1.7128, + "loss_base2": 2.471, + "loss_pixel": 0.2509, + "loss_text": 1.4619, + "ppl": 5.5445, + "step": 10715 + }, + { + "epoch": 0.06, + "global_step": 10716, + "learning_rate": 0.000456110183639399, + "loss": 1.7441, + "loss_base2": 2.5162, + "loss_pixel": 0.2483, + "loss_text": 1.4958, + "ppl": 5.7208, + "step": 10716 + }, + { + "epoch": 0.06, + "global_step": 10717, + "learning_rate": 0.0004561060100166945, + "loss": 1.7055, + "loss_base2": 2.4605, + "loss_pixel": 0.2462, + "loss_text": 1.4593, + "ppl": 5.5041, + "step": 10717 + }, + { + "epoch": 0.06, + "global_step": 10718, + "learning_rate": 0.00045610183639399, + "loss": 1.7206, + "loss_base2": 2.4823, + "loss_pixel": 0.2449, + "loss_text": 1.4757, + "ppl": 5.5879, + "step": 10718 + }, + { + "epoch": 0.06, + "global_step": 10719, + "learning_rate": 0.0004560976627712855, + "loss": 1.7102, + "loss_base2": 2.4673, + "loss_pixel": 0.2441, + "loss_text": 1.4661, + "ppl": 5.5301, + "step": 10719 + }, + { + "epoch": 0.06, + "global_step": 10720, + "learning_rate": 0.00045609348914858093, + "loss": 1.7231, + "loss_base2": 2.4859, + "loss_pixel": 0.2423, + "loss_text": 1.4808, + "ppl": 5.6019, + "step": 10720 + }, + { + "epoch": 0.06, + "global_step": 10721, + "learning_rate": 0.00045608931552587644, + "loss": 1.7103, + "loss_base2": 2.4674, + "loss_pixel": 0.2422, + "loss_text": 1.468, + "ppl": 5.5306, + "step": 10721 + }, + { + "epoch": 0.06, + "global_step": 10722, + "learning_rate": 0.00045608514190317195, + "loss": 1.7177, + "loss_base2": 2.4781, + "loss_pixel": 0.2407, + "loss_text": 1.477, + "ppl": 5.5717, + "step": 10722 + }, + { + "epoch": 0.06, + "global_step": 10723, + "learning_rate": 0.00045608096828046745, + "loss": 1.7179, + "loss_base2": 2.4784, + "loss_pixel": 0.2432, + "loss_text": 1.4747, + "ppl": 5.5728, + "step": 10723 + }, + { + "epoch": 0.06, + "global_step": 10724, + "learning_rate": 0.00045607679465776296, + "loss": 1.7302, + "loss_base2": 2.4962, + "loss_pixel": 0.2522, + "loss_text": 1.4781, + "ppl": 5.6418, + "step": 10724 + }, + { + "epoch": 0.06, + "global_step": 10725, + "learning_rate": 0.0004560726210350584, + "loss": 1.724, + "loss_base2": 2.4872, + "loss_pixel": 0.2477, + "loss_text": 1.4763, + "ppl": 5.6069, + "step": 10725 + }, + { + "epoch": 0.06, + "global_step": 10726, + "learning_rate": 0.0004560684474123539, + "loss": 1.6984, + "loss_base2": 2.4503, + "loss_pixel": 0.2449, + "loss_text": 1.4536, + "ppl": 5.4652, + "step": 10726 + }, + { + "epoch": 0.06, + "global_step": 10727, + "learning_rate": 0.00045606427378964943, + "loss": 1.712, + "loss_base2": 2.4699, + "loss_pixel": 0.2412, + "loss_text": 1.4708, + "ppl": 5.54, + "step": 10727 + }, + { + "epoch": 0.06, + "global_step": 10728, + "learning_rate": 0.00045606010016694494, + "loss": 1.5939, + "loss_base2": 2.2995, + "loss_pixel": 0.2426, + "loss_text": 1.3514, + "ppl": 4.9229, + "step": 10728 + }, + { + "epoch": 0.06, + "global_step": 10729, + "learning_rate": 0.0004560559265442404, + "loss": 1.4785, + "loss_base2": 2.133, + "loss_pixel": 0.24, + "loss_text": 1.2385, + "ppl": 4.3864, + "step": 10729 + }, + { + "epoch": 0.06, + "global_step": 10730, + "learning_rate": 0.0004560517529215359, + "loss": 1.4753, + "loss_base2": 2.1284, + "loss_pixel": 0.2375, + "loss_text": 1.2378, + "ppl": 4.3723, + "step": 10730 + }, + { + "epoch": 0.06, + "global_step": 10731, + "learning_rate": 0.0004560475792988314, + "loss": 1.4722, + "loss_base2": 2.1239, + "loss_pixel": 0.2376, + "loss_text": 1.2346, + "ppl": 4.3588, + "step": 10731 + }, + { + "epoch": 0.06, + "global_step": 10732, + "learning_rate": 0.0004560434056761269, + "loss": 1.4776, + "loss_base2": 2.1317, + "loss_pixel": 0.2372, + "loss_text": 1.2404, + "ppl": 4.3824, + "step": 10732 + }, + { + "epoch": 0.06, + "global_step": 10733, + "learning_rate": 0.0004560392320534224, + "loss": 1.4814, + "loss_base2": 2.1372, + "loss_pixel": 0.2361, + "loss_text": 1.2453, + "ppl": 4.3991, + "step": 10733 + }, + { + "epoch": 0.06, + "global_step": 10734, + "learning_rate": 0.00045603505843071787, + "loss": 1.4804, + "loss_base2": 2.1358, + "loss_pixel": 0.2342, + "loss_text": 1.2462, + "ppl": 4.3947, + "step": 10734 + }, + { + "epoch": 0.06, + "global_step": 10735, + "learning_rate": 0.0004560308848080134, + "loss": 1.462, + "loss_base2": 2.1092, + "loss_pixel": 0.2324, + "loss_text": 1.2297, + "ppl": 4.3146, + "step": 10735 + }, + { + "epoch": 0.06, + "global_step": 10736, + "learning_rate": 0.0004560267111853089, + "loss": 1.4898, + "loss_base2": 2.1493, + "loss_pixel": 0.2329, + "loss_text": 1.2569, + "ppl": 4.4362, + "step": 10736 + }, + { + "epoch": 0.06, + "global_step": 10737, + "learning_rate": 0.0004560225375626044, + "loss": 1.4568, + "loss_base2": 2.1017, + "loss_pixel": 0.2312, + "loss_text": 1.2256, + "ppl": 4.2922, + "step": 10737 + }, + { + "epoch": 0.06, + "global_step": 10738, + "learning_rate": 0.0004560183639398998, + "loss": 1.4931, + "loss_base2": 2.1541, + "loss_pixel": 0.2308, + "loss_text": 1.2623, + "ppl": 4.4509, + "step": 10738 + }, + { + "epoch": 0.06, + "global_step": 10739, + "learning_rate": 0.0004560141903171953, + "loss": 1.4691, + "loss_base2": 2.1195, + "loss_pixel": 0.2286, + "loss_text": 1.2405, + "ppl": 4.3453, + "step": 10739 + }, + { + "epoch": 0.06, + "global_step": 10740, + "learning_rate": 0.0004560100166944908, + "loss": 1.4568, + "loss_base2": 2.1017, + "loss_pixel": 0.2273, + "loss_text": 1.2295, + "ppl": 4.2922, + "step": 10740 + }, + { + "epoch": 0.06, + "global_step": 10741, + "learning_rate": 0.0004560058430717863, + "loss": 1.4497, + "loss_base2": 2.0915, + "loss_pixel": 0.2273, + "loss_text": 1.2224, + "ppl": 4.2618, + "step": 10741 + }, + { + "epoch": 0.06, + "global_step": 10742, + "learning_rate": 0.0004560016694490818, + "loss": 1.4642, + "loss_base2": 2.1124, + "loss_pixel": 0.2348, + "loss_text": 1.2293, + "ppl": 4.3241, + "step": 10742 + }, + { + "epoch": 0.06, + "global_step": 10743, + "learning_rate": 0.0004559974958263773, + "loss": 1.5776, + "loss_base2": 2.276, + "loss_pixel": 0.2335, + "loss_text": 1.344, + "ppl": 4.8433, + "step": 10743 + }, + { + "epoch": 0.06, + "global_step": 10744, + "learning_rate": 0.0004559933222036728, + "loss": 1.6917, + "loss_base2": 2.4406, + "loss_pixel": 0.2298, + "loss_text": 1.4619, + "ppl": 5.4287, + "step": 10744 + }, + { + "epoch": 0.06, + "global_step": 10745, + "learning_rate": 0.0004559891485809683, + "loss": 1.7305, + "loss_base2": 2.4966, + "loss_pixel": 0.229, + "loss_text": 1.5015, + "ppl": 5.6435, + "step": 10745 + }, + { + "epoch": 0.06, + "global_step": 10746, + "learning_rate": 0.0004559849749582638, + "loss": 1.7283, + "loss_base2": 2.4934, + "loss_pixel": 0.2289, + "loss_text": 1.4994, + "ppl": 5.6311, + "step": 10746 + }, + { + "epoch": 0.06, + "global_step": 10747, + "learning_rate": 0.00045598080133555925, + "loss": 1.7115, + "loss_base2": 2.4692, + "loss_pixel": 0.2282, + "loss_text": 1.4832, + "ppl": 5.5373, + "step": 10747 + }, + { + "epoch": 0.06, + "global_step": 10748, + "learning_rate": 0.00045597662771285476, + "loss": 1.7147, + "loss_base2": 2.4738, + "loss_pixel": 0.2281, + "loss_text": 1.4866, + "ppl": 5.555, + "step": 10748 + }, + { + "epoch": 0.06, + "global_step": 10749, + "learning_rate": 0.00045597245409015026, + "loss": 1.69, + "loss_base2": 2.4382, + "loss_pixel": 0.2276, + "loss_text": 1.4625, + "ppl": 5.4195, + "step": 10749 + }, + { + "epoch": 0.06, + "global_step": 10750, + "learning_rate": 0.00045596828046744577, + "loss": 1.7024, + "loss_base2": 2.456, + "loss_pixel": 0.2262, + "loss_text": 1.4762, + "ppl": 5.4871, + "step": 10750 + }, + { + "epoch": 0.06, + "global_step": 10751, + "learning_rate": 0.0004559641068447413, + "loss": 1.6972, + "loss_base2": 2.4485, + "loss_pixel": 0.227, + "loss_text": 1.4702, + "ppl": 5.4586, + "step": 10751 + }, + { + "epoch": 0.06, + "global_step": 10752, + "learning_rate": 0.00045595993322203673, + "loss": 1.7041, + "loss_base2": 2.4585, + "loss_pixel": 0.2259, + "loss_text": 1.4782, + "ppl": 5.4964, + "step": 10752 + }, + { + "epoch": 0.06, + "global_step": 10753, + "learning_rate": 0.00045595575959933224, + "loss": 1.6888, + "loss_base2": 2.4364, + "loss_pixel": 0.2262, + "loss_text": 1.4626, + "ppl": 5.413, + "step": 10753 + }, + { + "epoch": 0.06, + "global_step": 10754, + "learning_rate": 0.00045595158597662775, + "loss": 1.6971, + "loss_base2": 2.4484, + "loss_pixel": 0.2246, + "loss_text": 1.4726, + "ppl": 5.4581, + "step": 10754 + }, + { + "epoch": 0.06, + "global_step": 10755, + "learning_rate": 0.00045594741235392325, + "loss": 1.7096, + "loss_base2": 2.4664, + "loss_pixel": 0.2237, + "loss_text": 1.4859, + "ppl": 5.5268, + "step": 10755 + }, + { + "epoch": 0.06, + "global_step": 10756, + "learning_rate": 0.0004559432387312187, + "loss": 1.7021, + "loss_base2": 2.4556, + "loss_pixel": 0.2224, + "loss_text": 1.4797, + "ppl": 5.4855, + "step": 10756 + }, + { + "epoch": 0.06, + "global_step": 10757, + "learning_rate": 0.00045593906510851416, + "loss": 1.6727, + "loss_base2": 2.4132, + "loss_pixel": 0.2228, + "loss_text": 1.4499, + "ppl": 5.3265, + "step": 10757 + }, + { + "epoch": 0.06, + "global_step": 10758, + "learning_rate": 0.00045593489148580967, + "loss": 1.7005, + "loss_base2": 2.4533, + "loss_pixel": 0.2224, + "loss_text": 1.478, + "ppl": 5.4767, + "step": 10758 + }, + { + "epoch": 0.06, + "global_step": 10759, + "learning_rate": 0.0004559307178631052, + "loss": 1.6971, + "loss_base2": 2.4484, + "loss_pixel": 0.2229, + "loss_text": 1.4742, + "ppl": 5.4581, + "step": 10759 + }, + { + "epoch": 0.06, + "global_step": 10760, + "learning_rate": 0.0004559265442404007, + "loss": 1.6903, + "loss_base2": 2.4386, + "loss_pixel": 0.2228, + "loss_text": 1.4675, + "ppl": 5.4211, + "step": 10760 + }, + { + "epoch": 0.06, + "global_step": 10761, + "learning_rate": 0.00045592237061769614, + "loss": 1.6867, + "loss_base2": 2.4334, + "loss_pixel": 0.2218, + "loss_text": 1.4649, + "ppl": 5.4016, + "step": 10761 + }, + { + "epoch": 0.06, + "global_step": 10762, + "learning_rate": 0.00045591819699499164, + "loss": 1.6906, + "loss_base2": 2.439, + "loss_pixel": 0.2216, + "loss_text": 1.469, + "ppl": 5.4227, + "step": 10762 + }, + { + "epoch": 0.06, + "global_step": 10763, + "learning_rate": 0.00045591402337228715, + "loss": 1.6805, + "loss_base2": 2.4244, + "loss_pixel": 0.2205, + "loss_text": 1.46, + "ppl": 5.3682, + "step": 10763 + }, + { + "epoch": 0.06, + "global_step": 10764, + "learning_rate": 0.00045590984974958266, + "loss": 1.6838, + "loss_base2": 2.4292, + "loss_pixel": 0.2225, + "loss_text": 1.4614, + "ppl": 5.386, + "step": 10764 + }, + { + "epoch": 0.06, + "global_step": 10765, + "learning_rate": 0.00045590567612687817, + "loss": 1.6951, + "loss_base2": 2.4455, + "loss_pixel": 0.2193, + "loss_text": 1.4757, + "ppl": 5.4472, + "step": 10765 + }, + { + "epoch": 0.06, + "global_step": 10766, + "learning_rate": 0.0004559015025041736, + "loss": 1.6779, + "loss_base2": 2.4207, + "loss_pixel": 0.2188, + "loss_text": 1.4591, + "ppl": 5.3543, + "step": 10766 + }, + { + "epoch": 0.06, + "global_step": 10767, + "learning_rate": 0.0004558973288814691, + "loss": 1.465, + "loss_base2": 2.1135, + "loss_pixel": 0.2191, + "loss_text": 1.2459, + "ppl": 4.3275, + "step": 10767 + }, + { + "epoch": 0.06, + "global_step": 10768, + "learning_rate": 0.00045589315525876463, + "loss": 1.4691, + "loss_base2": 2.1195, + "loss_pixel": 0.2178, + "loss_text": 1.2513, + "ppl": 4.3453, + "step": 10768 + }, + { + "epoch": 0.06, + "global_step": 10769, + "learning_rate": 0.00045588898163606014, + "loss": 1.4492, + "loss_base2": 2.0908, + "loss_pixel": 0.2171, + "loss_text": 1.2322, + "ppl": 4.2597, + "step": 10769 + }, + { + "epoch": 0.06, + "global_step": 10770, + "learning_rate": 0.0004558848080133556, + "loss": 1.4598, + "loss_base2": 2.106, + "loss_pixel": 0.2165, + "loss_text": 1.2432, + "ppl": 4.3051, + "step": 10770 + }, + { + "epoch": 0.06, + "global_step": 10771, + "learning_rate": 0.0004558806343906511, + "loss": 1.4576, + "loss_base2": 2.1029, + "loss_pixel": 0.2174, + "loss_text": 1.2403, + "ppl": 4.2956, + "step": 10771 + }, + { + "epoch": 0.06, + "global_step": 10772, + "learning_rate": 0.0004558764607679466, + "loss": 1.4608, + "loss_base2": 2.1075, + "loss_pixel": 0.2162, + "loss_text": 1.2446, + "ppl": 4.3094, + "step": 10772 + }, + { + "epoch": 0.06, + "global_step": 10773, + "learning_rate": 0.0004558722871452421, + "loss": 1.4484, + "loss_base2": 2.0896, + "loss_pixel": 0.2159, + "loss_text": 1.2325, + "ppl": 4.2563, + "step": 10773 + }, + { + "epoch": 0.06, + "global_step": 10774, + "learning_rate": 0.0004558681135225376, + "loss": 1.4475, + "loss_base2": 2.0883, + "loss_pixel": 0.2153, + "loss_text": 1.2322, + "ppl": 4.2525, + "step": 10774 + }, + { + "epoch": 0.06, + "global_step": 10775, + "learning_rate": 0.000455863939899833, + "loss": 1.4296, + "loss_base2": 2.0625, + "loss_pixel": 0.2151, + "loss_text": 1.2144, + "ppl": 4.177, + "step": 10775 + }, + { + "epoch": 0.06, + "global_step": 10776, + "learning_rate": 0.00045585976627712853, + "loss": 1.4653, + "loss_base2": 2.114, + "loss_pixel": 0.2136, + "loss_text": 1.2517, + "ppl": 4.3288, + "step": 10776 + }, + { + "epoch": 0.06, + "global_step": 10777, + "learning_rate": 0.00045585559265442404, + "loss": 1.4471, + "loss_base2": 2.0877, + "loss_pixel": 0.2139, + "loss_text": 1.2332, + "ppl": 4.2508, + "step": 10777 + }, + { + "epoch": 0.06, + "global_step": 10778, + "learning_rate": 0.00045585141903171954, + "loss": 1.4478, + "loss_base2": 2.0887, + "loss_pixel": 0.2148, + "loss_text": 1.233, + "ppl": 4.2537, + "step": 10778 + }, + { + "epoch": 0.06, + "global_step": 10779, + "learning_rate": 0.000455847245409015, + "loss": 1.4547, + "loss_base2": 2.0987, + "loss_pixel": 0.2137, + "loss_text": 1.241, + "ppl": 4.2832, + "step": 10779 + }, + { + "epoch": 0.06, + "global_step": 10780, + "learning_rate": 0.0004558430717863105, + "loss": 1.4433, + "loss_base2": 2.0822, + "loss_pixel": 0.2141, + "loss_text": 1.2292, + "ppl": 4.2346, + "step": 10780 + }, + { + "epoch": 0.06, + "global_step": 10781, + "learning_rate": 0.000455838898163606, + "loss": 1.4317, + "loss_base2": 2.0655, + "loss_pixel": 0.2131, + "loss_text": 1.2186, + "ppl": 4.1858, + "step": 10781 + }, + { + "epoch": 0.06, + "global_step": 10782, + "learning_rate": 0.0004558347245409015, + "loss": 1.4526, + "loss_base2": 2.0957, + "loss_pixel": 0.2138, + "loss_text": 1.2387, + "ppl": 4.2742, + "step": 10782 + }, + { + "epoch": 0.06, + "global_step": 10783, + "learning_rate": 0.000455830550918197, + "loss": 1.4449, + "loss_base2": 2.0846, + "loss_pixel": 0.2127, + "loss_text": 1.2321, + "ppl": 4.2414, + "step": 10783 + }, + { + "epoch": 0.06, + "global_step": 10784, + "learning_rate": 0.0004558263772954925, + "loss": 1.4618, + "loss_base2": 2.1089, + "loss_pixel": 0.2131, + "loss_text": 1.2488, + "ppl": 4.3137, + "step": 10784 + }, + { + "epoch": 0.06, + "global_step": 10785, + "learning_rate": 0.000455822203672788, + "loss": 1.4651, + "loss_base2": 2.1137, + "loss_pixel": 0.2157, + "loss_text": 1.2494, + "ppl": 4.328, + "step": 10785 + }, + { + "epoch": 0.06, + "global_step": 10786, + "learning_rate": 0.0004558180300500835, + "loss": 1.4511, + "loss_base2": 2.0935, + "loss_pixel": 0.2134, + "loss_text": 1.2377, + "ppl": 4.2678, + "step": 10786 + }, + { + "epoch": 0.06, + "global_step": 10787, + "learning_rate": 0.000455813856427379, + "loss": 1.4494, + "loss_base2": 2.091, + "loss_pixel": 0.2127, + "loss_text": 1.2367, + "ppl": 4.2606, + "step": 10787 + }, + { + "epoch": 0.06, + "global_step": 10788, + "learning_rate": 0.00045580968280467445, + "loss": 1.4519, + "loss_base2": 2.0946, + "loss_pixel": 0.2144, + "loss_text": 1.2375, + "ppl": 4.2712, + "step": 10788 + }, + { + "epoch": 0.06, + "global_step": 10789, + "learning_rate": 0.00045580550918196996, + "loss": 1.4589, + "loss_base2": 2.1047, + "loss_pixel": 0.218, + "loss_text": 1.2409, + "ppl": 4.3012, + "step": 10789 + }, + { + "epoch": 0.06, + "global_step": 10790, + "learning_rate": 0.00045580133555926547, + "loss": 1.4644, + "loss_base2": 2.1127, + "loss_pixel": 0.2175, + "loss_text": 1.2469, + "ppl": 4.3249, + "step": 10790 + }, + { + "epoch": 0.06, + "global_step": 10791, + "learning_rate": 0.000455797161936561, + "loss": 1.4386, + "loss_base2": 2.0755, + "loss_pixel": 0.2167, + "loss_text": 1.2219, + "ppl": 4.2148, + "step": 10791 + }, + { + "epoch": 0.06, + "global_step": 10792, + "learning_rate": 0.0004557929883138565, + "loss": 1.473, + "loss_base2": 2.1251, + "loss_pixel": 0.2158, + "loss_text": 1.2572, + "ppl": 4.3623, + "step": 10792 + }, + { + "epoch": 0.06, + "global_step": 10793, + "learning_rate": 0.00045578881469115194, + "loss": 1.4452, + "loss_base2": 2.085, + "loss_pixel": 0.2143, + "loss_text": 1.2309, + "ppl": 4.2427, + "step": 10793 + }, + { + "epoch": 0.06, + "global_step": 10794, + "learning_rate": 0.0004557846410684474, + "loss": 1.4625, + "loss_base2": 2.1099, + "loss_pixel": 0.213, + "loss_text": 1.2495, + "ppl": 4.3167, + "step": 10794 + }, + { + "epoch": 0.06, + "global_step": 10795, + "learning_rate": 0.0004557804674457429, + "loss": 1.4587, + "loss_base2": 2.1045, + "loss_pixel": 0.2125, + "loss_text": 1.2462, + "ppl": 4.3004, + "step": 10795 + }, + { + "epoch": 0.06, + "global_step": 10796, + "learning_rate": 0.0004557762938230384, + "loss": 1.4352, + "loss_base2": 2.0706, + "loss_pixel": 0.211, + "loss_text": 1.2242, + "ppl": 4.2005, + "step": 10796 + }, + { + "epoch": 0.06, + "global_step": 10797, + "learning_rate": 0.00045577212020033386, + "loss": 1.4354, + "loss_base2": 2.0708, + "loss_pixel": 0.2107, + "loss_text": 1.2247, + "ppl": 4.2013, + "step": 10797 + }, + { + "epoch": 0.06, + "global_step": 10798, + "learning_rate": 0.00045576794657762936, + "loss": 1.4657, + "loss_base2": 2.1146, + "loss_pixel": 0.2095, + "loss_text": 1.2563, + "ppl": 4.3306, + "step": 10798 + }, + { + "epoch": 0.06, + "global_step": 10799, + "learning_rate": 0.00045576377295492487, + "loss": 1.7105, + "loss_base2": 2.4677, + "loss_pixel": 0.2103, + "loss_text": 1.5002, + "ppl": 5.5317, + "step": 10799 + }, + { + "epoch": 0.06, + "global_step": 10800, + "learning_rate": 0.0004557595993322204, + "loss": 1.6937, + "loss_base2": 2.4435, + "loss_pixel": 0.2083, + "loss_text": 1.4854, + "ppl": 5.4396, + "step": 10800 + }, + { + "epoch": 0.06, + "global_step": 10801, + "learning_rate": 0.0004557554257095159, + "loss": 1.7029, + "loss_base2": 2.4568, + "loss_pixel": 0.2077, + "loss_text": 1.4952, + "ppl": 5.4898, + "step": 10801 + }, + { + "epoch": 0.06, + "global_step": 10802, + "learning_rate": 0.00045575125208681134, + "loss": 1.6828, + "loss_base2": 2.4278, + "loss_pixel": 0.207, + "loss_text": 1.4758, + "ppl": 5.3806, + "step": 10802 + }, + { + "epoch": 0.06, + "global_step": 10803, + "learning_rate": 0.00045574707846410685, + "loss": 1.7013, + "loss_base2": 2.4545, + "loss_pixel": 0.2073, + "loss_text": 1.494, + "ppl": 5.4811, + "step": 10803 + }, + { + "epoch": 0.06, + "global_step": 10804, + "learning_rate": 0.00045574290484140235, + "loss": 1.6845, + "loss_base2": 2.4302, + "loss_pixel": 0.2069, + "loss_text": 1.4776, + "ppl": 5.3898, + "step": 10804 + }, + { + "epoch": 0.06, + "global_step": 10805, + "learning_rate": 0.00045573873121869786, + "loss": 1.6754, + "loss_base2": 2.4171, + "loss_pixel": 0.2056, + "loss_text": 1.4698, + "ppl": 5.3409, + "step": 10805 + }, + { + "epoch": 0.06, + "global_step": 10806, + "learning_rate": 0.0004557345575959933, + "loss": 1.675, + "loss_base2": 2.4165, + "loss_pixel": 0.2053, + "loss_text": 1.4698, + "ppl": 5.3388, + "step": 10806 + }, + { + "epoch": 0.06, + "global_step": 10807, + "learning_rate": 0.0004557303839732888, + "loss": 1.6876, + "loss_base2": 2.4347, + "loss_pixel": 0.2049, + "loss_text": 1.4827, + "ppl": 5.4065, + "step": 10807 + }, + { + "epoch": 0.06, + "global_step": 10808, + "learning_rate": 0.00045572621035058433, + "loss": 1.6814, + "loss_base2": 2.4257, + "loss_pixel": 0.2042, + "loss_text": 1.4772, + "ppl": 5.3731, + "step": 10808 + }, + { + "epoch": 0.06, + "global_step": 10809, + "learning_rate": 0.00045572203672787984, + "loss": 1.6868, + "loss_base2": 2.4335, + "loss_pixel": 0.2039, + "loss_text": 1.4829, + "ppl": 5.4022, + "step": 10809 + }, + { + "epoch": 0.06, + "global_step": 10810, + "learning_rate": 0.00045571786310517534, + "loss": 1.6568, + "loss_base2": 2.3903, + "loss_pixel": 0.2028, + "loss_text": 1.454, + "ppl": 5.2425, + "step": 10810 + }, + { + "epoch": 0.06, + "global_step": 10811, + "learning_rate": 0.0004557136894824708, + "loss": 1.6823, + "loss_base2": 2.427, + "loss_pixel": 0.2036, + "loss_text": 1.4786, + "ppl": 5.3779, + "step": 10811 + }, + { + "epoch": 0.06, + "global_step": 10812, + "learning_rate": 0.00045570951585976625, + "loss": 1.6798, + "loss_base2": 2.4234, + "loss_pixel": 0.2064, + "loss_text": 1.4733, + "ppl": 5.3645, + "step": 10812 + }, + { + "epoch": 0.06, + "global_step": 10813, + "learning_rate": 0.00045570534223706176, + "loss": 1.6785, + "loss_base2": 2.4216, + "loss_pixel": 0.2123, + "loss_text": 1.4663, + "ppl": 5.3575, + "step": 10813 + }, + { + "epoch": 0.06, + "global_step": 10814, + "learning_rate": 0.00045570116861435726, + "loss": 1.6782, + "loss_base2": 2.4211, + "loss_pixel": 0.2101, + "loss_text": 1.4681, + "ppl": 5.3559, + "step": 10814 + }, + { + "epoch": 0.06, + "global_step": 10815, + "learning_rate": 0.00045569699499165277, + "loss": 1.677, + "loss_base2": 2.4194, + "loss_pixel": 0.2026, + "loss_text": 1.4744, + "ppl": 5.3495, + "step": 10815 + }, + { + "epoch": 0.06, + "global_step": 10816, + "learning_rate": 0.0004556928213689482, + "loss": 1.6783, + "loss_base2": 2.4213, + "loss_pixel": 0.2008, + "loss_text": 1.4775, + "ppl": 5.3564, + "step": 10816 + }, + { + "epoch": 0.06, + "global_step": 10817, + "learning_rate": 0.00045568864774624373, + "loss": 1.6588, + "loss_base2": 2.3931, + "loss_pixel": 0.2003, + "loss_text": 1.4585, + "ppl": 5.253, + "step": 10817 + }, + { + "epoch": 0.06, + "global_step": 10818, + "learning_rate": 0.00045568447412353924, + "loss": 1.6754, + "loss_base2": 2.4171, + "loss_pixel": 0.2015, + "loss_text": 1.474, + "ppl": 5.3409, + "step": 10818 + }, + { + "epoch": 0.06, + "global_step": 10819, + "learning_rate": 0.00045568030050083475, + "loss": 1.6626, + "loss_base2": 2.3986, + "loss_pixel": 0.1966, + "loss_text": 1.466, + "ppl": 5.273, + "step": 10819 + }, + { + "epoch": 0.06, + "global_step": 10820, + "learning_rate": 0.0004556761268781302, + "loss": 1.6602, + "loss_base2": 2.3952, + "loss_pixel": 0.1969, + "loss_text": 1.4633, + "ppl": 5.2604, + "step": 10820 + }, + { + "epoch": 0.06, + "global_step": 10821, + "learning_rate": 0.0004556719532554257, + "loss": 1.6427, + "loss_base2": 2.3699, + "loss_pixel": 0.1931, + "loss_text": 1.4496, + "ppl": 5.1691, + "step": 10821 + }, + { + "epoch": 0.06, + "global_step": 10822, + "learning_rate": 0.0004556677796327212, + "loss": 1.6612, + "loss_base2": 2.3966, + "loss_pixel": 0.1927, + "loss_text": 1.4685, + "ppl": 5.2656, + "step": 10822 + }, + { + "epoch": 0.06, + "global_step": 10823, + "learning_rate": 0.0004556636060100167, + "loss": 1.6479, + "loss_base2": 2.3774, + "loss_pixel": 0.1935, + "loss_text": 1.4544, + "ppl": 5.1961, + "step": 10823 + }, + { + "epoch": 0.06, + "global_step": 10824, + "learning_rate": 0.00045565943238731223, + "loss": 1.6753, + "loss_base2": 2.4169, + "loss_pixel": 0.1931, + "loss_text": 1.4822, + "ppl": 5.3404, + "step": 10824 + }, + { + "epoch": 0.06, + "global_step": 10825, + "learning_rate": 0.0004556552587646077, + "loss": 1.651, + "loss_base2": 2.3819, + "loss_pixel": 0.1909, + "loss_text": 1.4601, + "ppl": 5.2122, + "step": 10825 + }, + { + "epoch": 0.06, + "global_step": 10826, + "learning_rate": 0.0004556510851419032, + "loss": 1.6633, + "loss_base2": 2.3996, + "loss_pixel": 0.1898, + "loss_text": 1.4734, + "ppl": 5.2767, + "step": 10826 + }, + { + "epoch": 0.06, + "global_step": 10827, + "learning_rate": 0.0004556469115191987, + "loss": 1.6414, + "loss_base2": 2.368, + "loss_pixel": 0.1899, + "loss_text": 1.4515, + "ppl": 5.1624, + "step": 10827 + }, + { + "epoch": 0.06, + "global_step": 10828, + "learning_rate": 0.0004556427378964942, + "loss": 1.6409, + "loss_base2": 2.3673, + "loss_pixel": 0.1906, + "loss_text": 1.4502, + "ppl": 5.1598, + "step": 10828 + }, + { + "epoch": 0.06, + "global_step": 10829, + "learning_rate": 0.00045563856427378966, + "loss": 1.6721, + "loss_base2": 2.4123, + "loss_pixel": 0.1927, + "loss_text": 1.4794, + "ppl": 5.3233, + "step": 10829 + }, + { + "epoch": 0.06, + "global_step": 10830, + "learning_rate": 0.00045563439065108517, + "loss": 1.6492, + "loss_base2": 2.3793, + "loss_pixel": 0.1917, + "loss_text": 1.4575, + "ppl": 5.2028, + "step": 10830 + }, + { + "epoch": 0.06, + "global_step": 10831, + "learning_rate": 0.0004556302170283806, + "loss": 1.6668, + "loss_base2": 2.4047, + "loss_pixel": 0.1932, + "loss_text": 1.4737, + "ppl": 5.2952, + "step": 10831 + }, + { + "epoch": 0.06, + "global_step": 10832, + "learning_rate": 0.0004556260434056761, + "loss": 1.6617, + "loss_base2": 2.3973, + "loss_pixel": 0.1893, + "loss_text": 1.4724, + "ppl": 5.2683, + "step": 10832 + }, + { + "epoch": 0.06, + "global_step": 10833, + "learning_rate": 0.00045562186978297163, + "loss": 1.6516, + "loss_base2": 2.3828, + "loss_pixel": 0.1894, + "loss_text": 1.4623, + "ppl": 5.2153, + "step": 10833 + }, + { + "epoch": 0.06, + "global_step": 10834, + "learning_rate": 0.0004556176961602671, + "loss": 1.6714, + "loss_base2": 2.4113, + "loss_pixel": 0.1874, + "loss_text": 1.484, + "ppl": 5.3196, + "step": 10834 + }, + { + "epoch": 0.06, + "global_step": 10835, + "learning_rate": 0.0004556135225375626, + "loss": 1.6626, + "loss_base2": 2.3986, + "loss_pixel": 0.1888, + "loss_text": 1.4738, + "ppl": 5.273, + "step": 10835 + }, + { + "epoch": 0.06, + "global_step": 10836, + "learning_rate": 0.0004556093489148581, + "loss": 1.6563, + "loss_base2": 2.3895, + "loss_pixel": 0.1865, + "loss_text": 1.4698, + "ppl": 5.2399, + "step": 10836 + }, + { + "epoch": 0.06, + "global_step": 10837, + "learning_rate": 0.0004556051752921536, + "loss": 1.6263, + "loss_base2": 2.3463, + "loss_pixel": 0.1876, + "loss_text": 1.4388, + "ppl": 5.085, + "step": 10837 + }, + { + "epoch": 0.06, + "global_step": 10838, + "learning_rate": 0.00045560100166944906, + "loss": 1.6601, + "loss_base2": 2.395, + "loss_pixel": 0.1834, + "loss_text": 1.4767, + "ppl": 5.2598, + "step": 10838 + }, + { + "epoch": 0.06, + "global_step": 10839, + "learning_rate": 0.00045559682804674457, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.1849, + "loss_text": 1.4547, + "ppl": 5.1531, + "step": 10839 + }, + { + "epoch": 0.06, + "global_step": 10840, + "learning_rate": 0.0004555926544240401, + "loss": 1.6614, + "loss_base2": 2.3969, + "loss_pixel": 0.1839, + "loss_text": 1.4775, + "ppl": 5.2667, + "step": 10840 + }, + { + "epoch": 0.06, + "global_step": 10841, + "learning_rate": 0.0004555884808013356, + "loss": 1.6219, + "loss_base2": 2.3399, + "loss_pixel": 0.1814, + "loss_text": 1.4406, + "ppl": 5.0627, + "step": 10841 + }, + { + "epoch": 0.06, + "global_step": 10842, + "learning_rate": 0.0004555843071786311, + "loss": 1.6631, + "loss_base2": 2.3993, + "loss_pixel": 0.1823, + "loss_text": 1.4807, + "ppl": 5.2756, + "step": 10842 + }, + { + "epoch": 0.06, + "global_step": 10843, + "learning_rate": 0.00045558013355592654, + "loss": 1.6155, + "loss_base2": 2.3307, + "loss_pixel": 0.18, + "loss_text": 1.4355, + "ppl": 5.0304, + "step": 10843 + }, + { + "epoch": 0.06, + "global_step": 10844, + "learning_rate": 0.00045557595993322205, + "loss": 1.643, + "loss_base2": 2.3703, + "loss_pixel": 0.1802, + "loss_text": 1.4628, + "ppl": 5.1707, + "step": 10844 + }, + { + "epoch": 0.06, + "global_step": 10845, + "learning_rate": 0.00045557178631051756, + "loss": 1.637, + "loss_base2": 2.3617, + "loss_pixel": 0.1811, + "loss_text": 1.4558, + "ppl": 5.1397, + "step": 10845 + }, + { + "epoch": 0.06, + "global_step": 10846, + "learning_rate": 0.00045556761268781307, + "loss": 1.6328, + "loss_base2": 2.3556, + "loss_pixel": 0.1774, + "loss_text": 1.4554, + "ppl": 5.1182, + "step": 10846 + }, + { + "epoch": 0.06, + "global_step": 10847, + "learning_rate": 0.0004555634390651085, + "loss": 1.6505, + "loss_base2": 2.3812, + "loss_pixel": 0.1791, + "loss_text": 1.4714, + "ppl": 5.2096, + "step": 10847 + }, + { + "epoch": 0.06, + "global_step": 10848, + "learning_rate": 0.000455559265442404, + "loss": 1.6634, + "loss_base2": 2.3998, + "loss_pixel": 0.1781, + "loss_text": 1.4853, + "ppl": 5.2772, + "step": 10848 + }, + { + "epoch": 0.06, + "global_step": 10849, + "learning_rate": 0.00045555509181969953, + "loss": 1.6613, + "loss_base2": 2.3967, + "loss_pixel": 0.1766, + "loss_text": 1.4847, + "ppl": 5.2662, + "step": 10849 + }, + { + "epoch": 0.06, + "global_step": 10850, + "learning_rate": 0.000455550918196995, + "loss": 1.6368, + "loss_base2": 2.3614, + "loss_pixel": 0.1737, + "loss_text": 1.4631, + "ppl": 5.1387, + "step": 10850 + }, + { + "epoch": 0.06, + "global_step": 10851, + "learning_rate": 0.0004555467445742905, + "loss": 1.6374, + "loss_base2": 2.3623, + "loss_pixel": 0.1735, + "loss_text": 1.4639, + "ppl": 5.1418, + "step": 10851 + }, + { + "epoch": 0.06, + "global_step": 10852, + "learning_rate": 0.00045554257095158595, + "loss": 1.6446, + "loss_base2": 2.3727, + "loss_pixel": 0.1773, + "loss_text": 1.4674, + "ppl": 5.1789, + "step": 10852 + }, + { + "epoch": 0.06, + "global_step": 10853, + "learning_rate": 0.00045553839732888145, + "loss": 1.6326, + "loss_base2": 2.3553, + "loss_pixel": 0.1749, + "loss_text": 1.4576, + "ppl": 5.1172, + "step": 10853 + }, + { + "epoch": 0.06, + "global_step": 10854, + "learning_rate": 0.00045553422370617696, + "loss": 1.6442, + "loss_base2": 2.3721, + "loss_pixel": 0.1732, + "loss_text": 1.471, + "ppl": 5.1769, + "step": 10854 + }, + { + "epoch": 0.06, + "global_step": 10855, + "learning_rate": 0.00045553005008347247, + "loss": 1.6184, + "loss_base2": 2.3349, + "loss_pixel": 0.1752, + "loss_text": 1.4432, + "ppl": 5.045, + "step": 10855 + }, + { + "epoch": 0.06, + "global_step": 10856, + "learning_rate": 0.0004555258764607679, + "loss": 1.6397, + "loss_base2": 2.3656, + "loss_pixel": 0.1721, + "loss_text": 1.4676, + "ppl": 5.1536, + "step": 10856 + }, + { + "epoch": 0.06, + "global_step": 10857, + "learning_rate": 0.00045552170283806343, + "loss": 1.6119, + "loss_base2": 2.3255, + "loss_pixel": 0.1707, + "loss_text": 1.4411, + "ppl": 5.0123, + "step": 10857 + }, + { + "epoch": 0.06, + "global_step": 10858, + "learning_rate": 0.00045551752921535894, + "loss": 1.642, + "loss_base2": 2.3689, + "loss_pixel": 0.1738, + "loss_text": 1.4682, + "ppl": 5.1655, + "step": 10858 + }, + { + "epoch": 0.06, + "global_step": 10859, + "learning_rate": 0.00045551335559265444, + "loss": 1.6373, + "loss_base2": 2.3621, + "loss_pixel": 0.1706, + "loss_text": 1.4667, + "ppl": 5.1413, + "step": 10859 + }, + { + "epoch": 0.06, + "global_step": 10860, + "learning_rate": 0.00045550918196994995, + "loss": 1.643, + "loss_base2": 2.3703, + "loss_pixel": 0.1703, + "loss_text": 1.4727, + "ppl": 5.1707, + "step": 10860 + }, + { + "epoch": 0.06, + "global_step": 10861, + "learning_rate": 0.0004555050083472454, + "loss": 1.6326, + "loss_base2": 2.3553, + "loss_pixel": 0.1714, + "loss_text": 1.4612, + "ppl": 5.1172, + "step": 10861 + }, + { + "epoch": 0.06, + "global_step": 10862, + "learning_rate": 0.0004555008347245409, + "loss": 1.6407, + "loss_base2": 2.367, + "loss_pixel": 0.1672, + "loss_text": 1.4736, + "ppl": 5.1588, + "step": 10862 + }, + { + "epoch": 0.06, + "global_step": 10863, + "learning_rate": 0.0004554966611018364, + "loss": 1.6321, + "loss_base2": 2.3546, + "loss_pixel": 0.1697, + "loss_text": 1.4625, + "ppl": 5.1146, + "step": 10863 + }, + { + "epoch": 0.06, + "global_step": 10864, + "learning_rate": 0.0004554924874791319, + "loss": 1.6464, + "loss_base2": 2.3753, + "loss_pixel": 0.1889, + "loss_text": 1.4574, + "ppl": 5.1883, + "step": 10864 + }, + { + "epoch": 0.06, + "global_step": 10865, + "learning_rate": 0.0004554883138564274, + "loss": 1.6387, + "loss_base2": 2.3641, + "loss_pixel": 0.1929, + "loss_text": 1.4458, + "ppl": 5.1485, + "step": 10865 + }, + { + "epoch": 0.06, + "global_step": 10866, + "learning_rate": 0.0004554841402337229, + "loss": 1.6677, + "loss_base2": 2.406, + "loss_pixel": 0.1909, + "loss_text": 1.4768, + "ppl": 5.3, + "step": 10866 + }, + { + "epoch": 0.06, + "global_step": 10867, + "learning_rate": 0.0004554799666110184, + "loss": 1.6436, + "loss_base2": 2.3712, + "loss_pixel": 0.1865, + "loss_text": 1.4571, + "ppl": 5.1738, + "step": 10867 + }, + { + "epoch": 0.06, + "global_step": 10868, + "learning_rate": 0.0004554757929883139, + "loss": 1.6398, + "loss_base2": 2.3657, + "loss_pixel": 0.1852, + "loss_text": 1.4546, + "ppl": 5.1541, + "step": 10868 + }, + { + "epoch": 0.06, + "global_step": 10869, + "learning_rate": 0.00045547161936560935, + "loss": 1.6434, + "loss_base2": 2.3709, + "loss_pixel": 0.1849, + "loss_text": 1.4585, + "ppl": 5.1727, + "step": 10869 + }, + { + "epoch": 0.06, + "global_step": 10870, + "learning_rate": 0.0004554674457429048, + "loss": 1.6397, + "loss_base2": 2.3656, + "loss_pixel": 0.1844, + "loss_text": 1.4553, + "ppl": 5.1536, + "step": 10870 + }, + { + "epoch": 0.06, + "global_step": 10871, + "learning_rate": 0.0004554632721202003, + "loss": 1.6457, + "loss_base2": 2.3742, + "loss_pixel": 0.1858, + "loss_text": 1.4599, + "ppl": 5.1846, + "step": 10871 + }, + { + "epoch": 0.06, + "global_step": 10872, + "learning_rate": 0.0004554590984974958, + "loss": 1.6485, + "loss_base2": 2.3783, + "loss_pixel": 0.1831, + "loss_text": 1.4654, + "ppl": 5.1992, + "step": 10872 + }, + { + "epoch": 0.06, + "global_step": 10873, + "learning_rate": 0.00045545492487479133, + "loss": 1.661, + "loss_base2": 2.3963, + "loss_pixel": 0.1826, + "loss_text": 1.4784, + "ppl": 5.2646, + "step": 10873 + }, + { + "epoch": 0.06, + "global_step": 10874, + "learning_rate": 0.00045545075125208684, + "loss": 1.6392, + "loss_base2": 2.3649, + "loss_pixel": 0.1841, + "loss_text": 1.4552, + "ppl": 5.151, + "step": 10874 + }, + { + "epoch": 0.06, + "global_step": 10875, + "learning_rate": 0.0004554465776293823, + "loss": 1.6433, + "loss_base2": 2.3708, + "loss_pixel": 0.1823, + "loss_text": 1.461, + "ppl": 5.1722, + "step": 10875 + }, + { + "epoch": 0.06, + "global_step": 10876, + "learning_rate": 0.0004554424040066778, + "loss": 1.65, + "loss_base2": 2.3804, + "loss_pixel": 0.1824, + "loss_text": 1.4676, + "ppl": 5.207, + "step": 10876 + }, + { + "epoch": 0.06, + "global_step": 10877, + "learning_rate": 0.0004554382303839733, + "loss": 1.6506, + "loss_base2": 2.3813, + "loss_pixel": 0.1824, + "loss_text": 1.4682, + "ppl": 5.2101, + "step": 10877 + }, + { + "epoch": 0.06, + "global_step": 10878, + "learning_rate": 0.0004554340567612688, + "loss": 1.6312, + "loss_base2": 2.3533, + "loss_pixel": 0.1808, + "loss_text": 1.4504, + "ppl": 5.11, + "step": 10878 + }, + { + "epoch": 0.06, + "global_step": 10879, + "learning_rate": 0.00045542988313856426, + "loss": 1.6352, + "loss_base2": 2.3591, + "loss_pixel": 0.18, + "loss_text": 1.4552, + "ppl": 5.1305, + "step": 10879 + }, + { + "epoch": 0.06, + "global_step": 10880, + "learning_rate": 0.00045542570951585977, + "loss": 1.6403, + "loss_base2": 2.3665, + "loss_pixel": 0.1807, + "loss_text": 1.4596, + "ppl": 5.1567, + "step": 10880 + }, + { + "epoch": 0.06, + "global_step": 10881, + "learning_rate": 0.0004554215358931553, + "loss": 1.6563, + "loss_base2": 2.3895, + "loss_pixel": 0.1792, + "loss_text": 1.4772, + "ppl": 5.2399, + "step": 10881 + }, + { + "epoch": 0.06, + "global_step": 10882, + "learning_rate": 0.0004554173622704508, + "loss": 1.6393, + "loss_base2": 2.365, + "loss_pixel": 0.1792, + "loss_text": 1.4602, + "ppl": 5.1516, + "step": 10882 + }, + { + "epoch": 0.06, + "global_step": 10883, + "learning_rate": 0.0004554131886477463, + "loss": 1.6315, + "loss_base2": 2.3538, + "loss_pixel": 0.1787, + "loss_text": 1.4528, + "ppl": 5.1115, + "step": 10883 + }, + { + "epoch": 0.06, + "global_step": 10884, + "learning_rate": 0.00045540901502504175, + "loss": 1.6353, + "loss_base2": 2.3592, + "loss_pixel": 0.178, + "loss_text": 1.4572, + "ppl": 5.131, + "step": 10884 + }, + { + "epoch": 0.06, + "global_step": 10885, + "learning_rate": 0.00045540484140233725, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.1786, + "loss_text": 1.4542, + "ppl": 5.1187, + "step": 10885 + }, + { + "epoch": 0.06, + "global_step": 10886, + "learning_rate": 0.00045540066777963276, + "loss": 1.6361, + "loss_base2": 2.3604, + "loss_pixel": 0.1791, + "loss_text": 1.4571, + "ppl": 5.1351, + "step": 10886 + }, + { + "epoch": 0.06, + "global_step": 10887, + "learning_rate": 0.00045539649415692827, + "loss": 1.6358, + "loss_base2": 2.36, + "loss_pixel": 0.1771, + "loss_text": 1.4587, + "ppl": 5.1336, + "step": 10887 + }, + { + "epoch": 0.06, + "global_step": 10888, + "learning_rate": 0.00045539232053422367, + "loss": 1.6299, + "loss_base2": 2.3514, + "loss_pixel": 0.1767, + "loss_text": 1.4532, + "ppl": 5.1034, + "step": 10888 + }, + { + "epoch": 0.06, + "global_step": 10889, + "learning_rate": 0.0004553881469115192, + "loss": 1.6354, + "loss_base2": 2.3594, + "loss_pixel": 0.178, + "loss_text": 1.4573, + "ppl": 5.1315, + "step": 10889 + }, + { + "epoch": 0.06, + "global_step": 10890, + "learning_rate": 0.0004553839732888147, + "loss": 1.6214, + "loss_base2": 2.3392, + "loss_pixel": 0.1759, + "loss_text": 1.4455, + "ppl": 5.0602, + "step": 10890 + }, + { + "epoch": 0.06, + "global_step": 10891, + "learning_rate": 0.0004553797996661102, + "loss": 1.6309, + "loss_base2": 2.3529, + "loss_pixel": 0.1769, + "loss_text": 1.454, + "ppl": 5.1085, + "step": 10891 + }, + { + "epoch": 0.06, + "global_step": 10892, + "learning_rate": 0.0004553756260434057, + "loss": 1.6741, + "loss_base2": 2.4152, + "loss_pixel": 0.1771, + "loss_text": 1.497, + "ppl": 5.334, + "step": 10892 + }, + { + "epoch": 0.06, + "global_step": 10893, + "learning_rate": 0.00045537145242070115, + "loss": 1.6352, + "loss_base2": 2.3591, + "loss_pixel": 0.1751, + "loss_text": 1.4601, + "ppl": 5.1305, + "step": 10893 + }, + { + "epoch": 0.06, + "global_step": 10894, + "learning_rate": 0.00045536727879799666, + "loss": 1.639, + "loss_base2": 2.3646, + "loss_pixel": 0.1766, + "loss_text": 1.4624, + "ppl": 5.15, + "step": 10894 + }, + { + "epoch": 0.06, + "global_step": 10895, + "learning_rate": 0.00045536310517529217, + "loss": 1.6333, + "loss_base2": 2.3564, + "loss_pixel": 0.1755, + "loss_text": 1.4578, + "ppl": 5.1207, + "step": 10895 + }, + { + "epoch": 0.06, + "global_step": 10896, + "learning_rate": 0.00045535893155258767, + "loss": 1.6269, + "loss_base2": 2.3471, + "loss_pixel": 0.1741, + "loss_text": 1.4528, + "ppl": 5.0881, + "step": 10896 + }, + { + "epoch": 0.06, + "global_step": 10897, + "learning_rate": 0.0004553547579298831, + "loss": 1.6425, + "loss_base2": 2.3696, + "loss_pixel": 0.1749, + "loss_text": 1.4676, + "ppl": 5.1681, + "step": 10897 + }, + { + "epoch": 0.06, + "global_step": 10898, + "learning_rate": 0.00045535058430717863, + "loss": 1.6344, + "loss_base2": 2.3579, + "loss_pixel": 0.1765, + "loss_text": 1.4578, + "ppl": 5.1264, + "step": 10898 + }, + { + "epoch": 0.06, + "global_step": 10899, + "learning_rate": 0.00045534641068447414, + "loss": 1.5516, + "loss_base2": 2.2385, + "loss_pixel": 0.1755, + "loss_text": 1.3761, + "ppl": 4.719, + "step": 10899 + }, + { + "epoch": 0.06, + "global_step": 10900, + "learning_rate": 0.00045534223706176965, + "loss": 1.4203, + "loss_base2": 2.0491, + "loss_pixel": 0.1743, + "loss_text": 1.246, + "ppl": 4.1384, + "step": 10900 + }, + { + "epoch": 0.06, + "global_step": 10901, + "learning_rate": 0.00045533806343906515, + "loss": 1.4367, + "loss_base2": 2.0727, + "loss_pixel": 0.1746, + "loss_text": 1.2621, + "ppl": 4.2068, + "step": 10901 + }, + { + "epoch": 0.06, + "global_step": 10902, + "learning_rate": 0.0004553338898163606, + "loss": 1.4191, + "loss_base2": 2.0473, + "loss_pixel": 0.1757, + "loss_text": 1.2433, + "ppl": 4.1334, + "step": 10902 + }, + { + "epoch": 0.06, + "global_step": 10903, + "learning_rate": 0.0004553297161936561, + "loss": 1.4112, + "loss_base2": 2.0359, + "loss_pixel": 0.1741, + "loss_text": 1.2371, + "ppl": 4.1009, + "step": 10903 + }, + { + "epoch": 0.06, + "global_step": 10904, + "learning_rate": 0.0004553255425709516, + "loss": 1.3981, + "loss_base2": 2.017, + "loss_pixel": 0.1747, + "loss_text": 1.2234, + "ppl": 4.0475, + "step": 10904 + }, + { + "epoch": 0.06, + "global_step": 10905, + "learning_rate": 0.00045532136894824713, + "loss": 1.3981, + "loss_base2": 2.017, + "loss_pixel": 0.1731, + "loss_text": 1.225, + "ppl": 4.0475, + "step": 10905 + }, + { + "epoch": 0.06, + "global_step": 10906, + "learning_rate": 0.00045531719532554253, + "loss": 1.4097, + "loss_base2": 2.0338, + "loss_pixel": 0.1741, + "loss_text": 1.2355, + "ppl": 4.0947, + "step": 10906 + }, + { + "epoch": 0.06, + "global_step": 10907, + "learning_rate": 0.00045531302170283804, + "loss": 1.5183, + "loss_base2": 2.1904, + "loss_pixel": 0.1732, + "loss_text": 1.3451, + "ppl": 4.5645, + "step": 10907 + }, + { + "epoch": 0.06, + "global_step": 10908, + "learning_rate": 0.00045530884808013354, + "loss": 1.6375, + "loss_base2": 2.3624, + "loss_pixel": 0.1737, + "loss_text": 1.4637, + "ppl": 5.1423, + "step": 10908 + }, + { + "epoch": 0.06, + "global_step": 10909, + "learning_rate": 0.00045530467445742905, + "loss": 1.6497, + "loss_base2": 2.38, + "loss_pixel": 0.1733, + "loss_text": 1.4764, + "ppl": 5.2054, + "step": 10909 + }, + { + "epoch": 0.06, + "global_step": 10910, + "learning_rate": 0.00045530050083472456, + "loss": 1.6402, + "loss_base2": 2.3663, + "loss_pixel": 0.1723, + "loss_text": 1.4679, + "ppl": 5.1562, + "step": 10910 + }, + { + "epoch": 0.06, + "global_step": 10911, + "learning_rate": 0.00045529632721202, + "loss": 1.662, + "loss_base2": 2.3978, + "loss_pixel": 0.1744, + "loss_text": 1.4875, + "ppl": 5.2698, + "step": 10911 + }, + { + "epoch": 0.06, + "global_step": 10912, + "learning_rate": 0.0004552921535893155, + "loss": 1.6471, + "loss_base2": 2.3763, + "loss_pixel": 0.1736, + "loss_text": 1.4735, + "ppl": 5.1919, + "step": 10912 + }, + { + "epoch": 0.06, + "global_step": 10913, + "learning_rate": 0.000455287979966611, + "loss": 1.6417, + "loss_base2": 2.3685, + "loss_pixel": 0.1737, + "loss_text": 1.468, + "ppl": 5.1639, + "step": 10913 + }, + { + "epoch": 0.06, + "global_step": 10914, + "learning_rate": 0.00045528380634390653, + "loss": 1.6469, + "loss_base2": 2.376, + "loss_pixel": 0.1727, + "loss_text": 1.4741, + "ppl": 5.1909, + "step": 10914 + }, + { + "epoch": 0.06, + "global_step": 10915, + "learning_rate": 0.000455279632721202, + "loss": 1.6457, + "loss_base2": 2.3742, + "loss_pixel": 0.1726, + "loss_text": 1.473, + "ppl": 5.1846, + "step": 10915 + }, + { + "epoch": 0.06, + "global_step": 10916, + "learning_rate": 0.0004552754590984975, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1711, + "loss_text": 1.4458, + "ppl": 5.0374, + "step": 10916 + }, + { + "epoch": 0.06, + "global_step": 10917, + "learning_rate": 0.000455271285475793, + "loss": 1.635, + "loss_base2": 2.3588, + "loss_pixel": 0.1721, + "loss_text": 1.4629, + "ppl": 5.1295, + "step": 10917 + }, + { + "epoch": 0.06, + "global_step": 10918, + "learning_rate": 0.0004552671118530885, + "loss": 1.6281, + "loss_base2": 2.3489, + "loss_pixel": 0.1711, + "loss_text": 1.457, + "ppl": 5.0942, + "step": 10918 + }, + { + "epoch": 0.06, + "global_step": 10919, + "learning_rate": 0.000455262938230384, + "loss": 1.6403, + "loss_base2": 2.3665, + "loss_pixel": 0.1725, + "loss_text": 1.4678, + "ppl": 5.1567, + "step": 10919 + }, + { + "epoch": 0.06, + "global_step": 10920, + "learning_rate": 0.00045525876460767947, + "loss": 1.6185, + "loss_base2": 2.335, + "loss_pixel": 0.1729, + "loss_text": 1.4456, + "ppl": 5.0455, + "step": 10920 + }, + { + "epoch": 0.06, + "global_step": 10921, + "learning_rate": 0.000455254590984975, + "loss": 1.6336, + "loss_base2": 2.3568, + "loss_pixel": 0.1725, + "loss_text": 1.4611, + "ppl": 5.1223, + "step": 10921 + }, + { + "epoch": 0.06, + "global_step": 10922, + "learning_rate": 0.0004552504173622705, + "loss": 1.6458, + "loss_base2": 2.3744, + "loss_pixel": 0.1722, + "loss_text": 1.4736, + "ppl": 5.1852, + "step": 10922 + }, + { + "epoch": 0.06, + "global_step": 10923, + "learning_rate": 0.000455246243739566, + "loss": 1.6184, + "loss_base2": 2.3349, + "loss_pixel": 0.1704, + "loss_text": 1.4481, + "ppl": 5.045, + "step": 10923 + }, + { + "epoch": 0.06, + "global_step": 10924, + "learning_rate": 0.00045524207011686144, + "loss": 1.6149, + "loss_base2": 2.3298, + "loss_pixel": 0.173, + "loss_text": 1.442, + "ppl": 5.0274, + "step": 10924 + }, + { + "epoch": 0.06, + "global_step": 10925, + "learning_rate": 0.0004552378964941569, + "loss": 1.62, + "loss_base2": 2.3372, + "loss_pixel": 0.1709, + "loss_text": 1.4491, + "ppl": 5.0531, + "step": 10925 + }, + { + "epoch": 0.06, + "global_step": 10926, + "learning_rate": 0.0004552337228714524, + "loss": 1.637, + "loss_base2": 2.3617, + "loss_pixel": 0.171, + "loss_text": 1.466, + "ppl": 5.1397, + "step": 10926 + }, + { + "epoch": 0.06, + "global_step": 10927, + "learning_rate": 0.0004552295492487479, + "loss": 1.6244, + "loss_base2": 2.3435, + "loss_pixel": 0.1701, + "loss_text": 1.4544, + "ppl": 5.0754, + "step": 10927 + }, + { + "epoch": 0.06, + "global_step": 10928, + "learning_rate": 0.0004552253756260434, + "loss": 1.6289, + "loss_base2": 2.35, + "loss_pixel": 0.1711, + "loss_text": 1.4578, + "ppl": 5.0983, + "step": 10928 + }, + { + "epoch": 0.06, + "global_step": 10929, + "learning_rate": 0.00045522120200333887, + "loss": 1.6163, + "loss_base2": 2.3318, + "loss_pixel": 0.1704, + "loss_text": 1.4459, + "ppl": 5.0344, + "step": 10929 + }, + { + "epoch": 0.06, + "global_step": 10930, + "learning_rate": 0.0004552170283806344, + "loss": 1.6057, + "loss_base2": 2.3165, + "loss_pixel": 0.1725, + "loss_text": 1.4332, + "ppl": 4.9813, + "step": 10930 + }, + { + "epoch": 0.06, + "global_step": 10931, + "learning_rate": 0.0004552128547579299, + "loss": 1.6354, + "loss_base2": 2.3594, + "loss_pixel": 0.1706, + "loss_text": 1.4648, + "ppl": 5.1315, + "step": 10931 + }, + { + "epoch": 0.06, + "global_step": 10932, + "learning_rate": 0.0004552086811352254, + "loss": 1.6167, + "loss_base2": 2.3324, + "loss_pixel": 0.1705, + "loss_text": 1.4462, + "ppl": 5.0364, + "step": 10932 + }, + { + "epoch": 0.06, + "global_step": 10933, + "learning_rate": 0.0004552045075125209, + "loss": 1.6267, + "loss_base2": 2.3468, + "loss_pixel": 0.1724, + "loss_text": 1.4543, + "ppl": 5.0871, + "step": 10933 + }, + { + "epoch": 0.06, + "global_step": 10934, + "learning_rate": 0.00045520033388981635, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.17, + "loss_text": 1.4629, + "ppl": 5.1187, + "step": 10934 + }, + { + "epoch": 0.06, + "global_step": 10935, + "learning_rate": 0.00045519616026711186, + "loss": 1.6317, + "loss_base2": 2.354, + "loss_pixel": 0.1697, + "loss_text": 1.462, + "ppl": 5.1126, + "step": 10935 + }, + { + "epoch": 0.06, + "global_step": 10936, + "learning_rate": 0.00045519198664440737, + "loss": 1.6276, + "loss_base2": 2.3481, + "loss_pixel": 0.1708, + "loss_text": 1.4568, + "ppl": 5.0916, + "step": 10936 + }, + { + "epoch": 0.06, + "global_step": 10937, + "learning_rate": 0.0004551878130217029, + "loss": 1.6225, + "loss_base2": 2.3408, + "loss_pixel": 0.1709, + "loss_text": 1.4516, + "ppl": 5.0657, + "step": 10937 + }, + { + "epoch": 0.06, + "global_step": 10938, + "learning_rate": 0.00045518363939899833, + "loss": 1.6295, + "loss_base2": 2.3509, + "loss_pixel": 0.1702, + "loss_text": 1.4593, + "ppl": 5.1013, + "step": 10938 + }, + { + "epoch": 0.06, + "global_step": 10939, + "learning_rate": 0.00045517946577629384, + "loss": 1.6198, + "loss_base2": 2.3369, + "loss_pixel": 0.1705, + "loss_text": 1.4493, + "ppl": 5.0521, + "step": 10939 + }, + { + "epoch": 0.06, + "global_step": 10940, + "learning_rate": 0.00045517529215358934, + "loss": 1.6347, + "loss_base2": 2.3584, + "loss_pixel": 0.1677, + "loss_text": 1.467, + "ppl": 5.1279, + "step": 10940 + }, + { + "epoch": 0.06, + "global_step": 10941, + "learning_rate": 0.00045517111853088485, + "loss": 1.6294, + "loss_base2": 2.3507, + "loss_pixel": 0.1712, + "loss_text": 1.4583, + "ppl": 5.1008, + "step": 10941 + }, + { + "epoch": 0.06, + "global_step": 10942, + "learning_rate": 0.00045516694490818036, + "loss": 1.6238, + "loss_base2": 2.3426, + "loss_pixel": 0.1712, + "loss_text": 1.4527, + "ppl": 5.0723, + "step": 10942 + }, + { + "epoch": 0.06, + "global_step": 10943, + "learning_rate": 0.0004551627712854758, + "loss": 1.6404, + "loss_base2": 2.3666, + "loss_pixel": 0.1684, + "loss_text": 1.472, + "ppl": 5.1572, + "step": 10943 + }, + { + "epoch": 0.06, + "global_step": 10944, + "learning_rate": 0.00045515859766277126, + "loss": 1.6192, + "loss_base2": 2.336, + "loss_pixel": 0.1702, + "loss_text": 1.449, + "ppl": 5.049, + "step": 10944 + }, + { + "epoch": 0.06, + "global_step": 10945, + "learning_rate": 0.00045515442404006677, + "loss": 1.6267, + "loss_base2": 2.3468, + "loss_pixel": 0.1685, + "loss_text": 1.4582, + "ppl": 5.0871, + "step": 10945 + }, + { + "epoch": 0.06, + "global_step": 10946, + "learning_rate": 0.0004551502504173623, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.1691, + "loss_text": 1.4592, + "ppl": 5.0952, + "step": 10946 + }, + { + "epoch": 0.06, + "global_step": 10947, + "learning_rate": 0.00045514607679465773, + "loss": 1.6104, + "loss_base2": 2.3233, + "loss_pixel": 0.1695, + "loss_text": 1.4409, + "ppl": 5.0048, + "step": 10947 + }, + { + "epoch": 0.06, + "global_step": 10948, + "learning_rate": 0.00045514190317195324, + "loss": 1.6298, + "loss_base2": 2.3513, + "loss_pixel": 0.1698, + "loss_text": 1.46, + "ppl": 5.1029, + "step": 10948 + }, + { + "epoch": 0.06, + "global_step": 10949, + "learning_rate": 0.00045513772954924875, + "loss": 1.6288, + "loss_base2": 2.3499, + "loss_pixel": 0.1696, + "loss_text": 1.4593, + "ppl": 5.0978, + "step": 10949 + }, + { + "epoch": 0.06, + "global_step": 10950, + "learning_rate": 0.00045513355592654425, + "loss": 1.5603, + "loss_base2": 2.251, + "loss_pixel": 0.1695, + "loss_text": 1.3908, + "ppl": 4.7602, + "step": 10950 + }, + { + "epoch": 0.06, + "global_step": 10951, + "learning_rate": 0.00045512938230383976, + "loss": 1.6188, + "loss_base2": 2.3354, + "loss_pixel": 0.1704, + "loss_text": 1.4484, + "ppl": 5.047, + "step": 10951 + }, + { + "epoch": 0.06, + "global_step": 10952, + "learning_rate": 0.0004551252086811352, + "loss": 1.6295, + "loss_base2": 2.3509, + "loss_pixel": 0.171, + "loss_text": 1.4585, + "ppl": 5.1013, + "step": 10952 + }, + { + "epoch": 0.06, + "global_step": 10953, + "learning_rate": 0.0004551210350584307, + "loss": 1.6195, + "loss_base2": 2.3364, + "loss_pixel": 0.1682, + "loss_text": 1.4513, + "ppl": 5.0506, + "step": 10953 + }, + { + "epoch": 0.06, + "global_step": 10954, + "learning_rate": 0.00045511686143572623, + "loss": 1.6462, + "loss_base2": 2.375, + "loss_pixel": 0.1693, + "loss_text": 1.4769, + "ppl": 5.1872, + "step": 10954 + }, + { + "epoch": 0.06, + "global_step": 10955, + "learning_rate": 0.00045511268781302174, + "loss": 1.6256, + "loss_base2": 2.3452, + "loss_pixel": 0.1675, + "loss_text": 1.4581, + "ppl": 5.0815, + "step": 10955 + }, + { + "epoch": 0.06, + "global_step": 10956, + "learning_rate": 0.0004551085141903172, + "loss": 1.6204, + "loss_base2": 2.3377, + "loss_pixel": 0.1683, + "loss_text": 1.452, + "ppl": 5.0551, + "step": 10956 + }, + { + "epoch": 0.06, + "global_step": 10957, + "learning_rate": 0.0004551043405676127, + "loss": 1.6232, + "loss_base2": 2.3418, + "loss_pixel": 0.1699, + "loss_text": 1.4533, + "ppl": 5.0693, + "step": 10957 + }, + { + "epoch": 0.06, + "global_step": 10958, + "learning_rate": 0.0004551001669449082, + "loss": 1.6371, + "loss_base2": 2.3618, + "loss_pixel": 0.1686, + "loss_text": 1.4685, + "ppl": 5.1402, + "step": 10958 + }, + { + "epoch": 0.06, + "global_step": 10959, + "learning_rate": 0.0004550959933222037, + "loss": 1.6158, + "loss_base2": 2.3311, + "loss_pixel": 0.1702, + "loss_text": 1.4456, + "ppl": 5.0319, + "step": 10959 + }, + { + "epoch": 0.06, + "global_step": 10960, + "learning_rate": 0.0004550918196994992, + "loss": 1.6227, + "loss_base2": 2.3411, + "loss_pixel": 0.1696, + "loss_text": 1.4531, + "ppl": 5.0668, + "step": 10960 + }, + { + "epoch": 0.06, + "global_step": 10961, + "learning_rate": 0.00045508764607679467, + "loss": 1.6012, + "loss_base2": 2.31, + "loss_pixel": 0.1694, + "loss_text": 1.4319, + "ppl": 4.959, + "step": 10961 + }, + { + "epoch": 0.06, + "global_step": 10962, + "learning_rate": 0.0004550834724540902, + "loss": 1.6145, + "loss_base2": 2.3292, + "loss_pixel": 0.1671, + "loss_text": 1.4474, + "ppl": 5.0254, + "step": 10962 + }, + { + "epoch": 0.06, + "global_step": 10963, + "learning_rate": 0.00045507929883138563, + "loss": 1.631, + "loss_base2": 2.353, + "loss_pixel": 0.1698, + "loss_text": 1.4612, + "ppl": 5.109, + "step": 10963 + }, + { + "epoch": 0.06, + "global_step": 10964, + "learning_rate": 0.00045507512520868114, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1685, + "loss_text": 1.4574, + "ppl": 5.0835, + "step": 10964 + }, + { + "epoch": 0.06, + "global_step": 10965, + "learning_rate": 0.0004550709515859766, + "loss": 1.6277, + "loss_base2": 2.3483, + "loss_pixel": 0.1696, + "loss_text": 1.458, + "ppl": 5.0921, + "step": 10965 + }, + { + "epoch": 0.06, + "global_step": 10966, + "learning_rate": 0.0004550667779632721, + "loss": 1.6214, + "loss_base2": 2.3392, + "loss_pixel": 0.1691, + "loss_text": 1.4524, + "ppl": 5.0602, + "step": 10966 + }, + { + "epoch": 0.06, + "global_step": 10967, + "learning_rate": 0.0004550626043405676, + "loss": 1.6249, + "loss_base2": 2.3442, + "loss_pixel": 0.1693, + "loss_text": 1.4556, + "ppl": 5.0779, + "step": 10967 + }, + { + "epoch": 0.06, + "global_step": 10968, + "learning_rate": 0.0004550584307178631, + "loss": 1.6197, + "loss_base2": 2.3367, + "loss_pixel": 0.1686, + "loss_text": 1.4511, + "ppl": 5.0516, + "step": 10968 + }, + { + "epoch": 0.06, + "global_step": 10969, + "learning_rate": 0.0004550542570951586, + "loss": 1.6251, + "loss_base2": 2.3445, + "loss_pixel": 0.168, + "loss_text": 1.4571, + "ppl": 5.0789, + "step": 10969 + }, + { + "epoch": 0.06, + "global_step": 10970, + "learning_rate": 0.0004550500834724541, + "loss": 1.6253, + "loss_base2": 2.3448, + "loss_pixel": 0.1683, + "loss_text": 1.457, + "ppl": 5.0799, + "step": 10970 + }, + { + "epoch": 0.06, + "global_step": 10971, + "learning_rate": 0.0004550459098497496, + "loss": 1.6277, + "loss_base2": 2.3483, + "loss_pixel": 0.1691, + "loss_text": 1.4586, + "ppl": 5.0921, + "step": 10971 + }, + { + "epoch": 0.06, + "global_step": 10972, + "learning_rate": 0.0004550417362270451, + "loss": 1.6138, + "loss_base2": 2.3282, + "loss_pixel": 0.1689, + "loss_text": 1.4449, + "ppl": 5.0219, + "step": 10972 + }, + { + "epoch": 0.06, + "global_step": 10973, + "learning_rate": 0.0004550375626043406, + "loss": 1.6162, + "loss_base2": 2.3317, + "loss_pixel": 0.1673, + "loss_text": 1.4489, + "ppl": 5.0339, + "step": 10973 + }, + { + "epoch": 0.06, + "global_step": 10974, + "learning_rate": 0.00045503338898163605, + "loss": 1.6079, + "loss_base2": 2.3197, + "loss_pixel": 0.17, + "loss_text": 1.438, + "ppl": 4.9923, + "step": 10974 + }, + { + "epoch": 0.06, + "global_step": 10975, + "learning_rate": 0.00045502921535893156, + "loss": 1.6183, + "loss_base2": 2.3347, + "loss_pixel": 0.1676, + "loss_text": 1.4507, + "ppl": 5.0445, + "step": 10975 + }, + { + "epoch": 0.06, + "global_step": 10976, + "learning_rate": 0.00045502504173622707, + "loss": 1.4829, + "loss_base2": 2.1394, + "loss_pixel": 0.1689, + "loss_text": 1.314, + "ppl": 4.4057, + "step": 10976 + }, + { + "epoch": 0.06, + "global_step": 10977, + "learning_rate": 0.00045502086811352257, + "loss": 1.3968, + "loss_base2": 2.0152, + "loss_pixel": 0.1678, + "loss_text": 1.229, + "ppl": 4.0422, + "step": 10977 + }, + { + "epoch": 0.06, + "global_step": 10978, + "learning_rate": 0.0004550166944908181, + "loss": 1.4238, + "loss_base2": 2.0541, + "loss_pixel": 0.1682, + "loss_text": 1.2556, + "ppl": 4.1529, + "step": 10978 + }, + { + "epoch": 0.06, + "global_step": 10979, + "learning_rate": 0.00045501252086811353, + "loss": 1.41, + "loss_base2": 2.0342, + "loss_pixel": 0.1673, + "loss_text": 1.2427, + "ppl": 4.096, + "step": 10979 + }, + { + "epoch": 0.06, + "global_step": 10980, + "learning_rate": 0.00045500834724540904, + "loss": 1.4031, + "loss_base2": 2.0242, + "loss_pixel": 0.1674, + "loss_text": 1.2357, + "ppl": 4.0678, + "step": 10980 + }, + { + "epoch": 0.06, + "global_step": 10981, + "learning_rate": 0.0004550041736227045, + "loss": 1.3962, + "loss_base2": 2.0143, + "loss_pixel": 0.1668, + "loss_text": 1.2294, + "ppl": 4.0398, + "step": 10981 + }, + { + "epoch": 0.06, + "global_step": 10982, + "learning_rate": 0.000455, + "loss": 1.3787, + "loss_base2": 1.989, + "loss_pixel": 0.1674, + "loss_text": 1.2113, + "ppl": 3.9697, + "step": 10982 + }, + { + "epoch": 0.06, + "global_step": 10983, + "learning_rate": 0.00045499582637729545, + "loss": 1.3966, + "loss_base2": 2.0149, + "loss_pixel": 0.1678, + "loss_text": 1.2288, + "ppl": 4.0414, + "step": 10983 + }, + { + "epoch": 0.06, + "global_step": 10984, + "learning_rate": 0.00045499165275459096, + "loss": 1.4579, + "loss_base2": 2.1033, + "loss_pixel": 0.1679, + "loss_text": 1.2901, + "ppl": 4.2969, + "step": 10984 + }, + { + "epoch": 0.06, + "global_step": 10985, + "learning_rate": 0.00045498747913188647, + "loss": 1.5638, + "loss_base2": 2.2561, + "loss_pixel": 0.1672, + "loss_text": 1.3966, + "ppl": 4.7769, + "step": 10985 + }, + { + "epoch": 0.06, + "global_step": 10986, + "learning_rate": 0.000454983305509182, + "loss": 1.4968, + "loss_base2": 2.1594, + "loss_pixel": 0.1663, + "loss_text": 1.3305, + "ppl": 4.4674, + "step": 10986 + }, + { + "epoch": 0.06, + "global_step": 10987, + "learning_rate": 0.0004549791318864775, + "loss": 1.4015, + "loss_base2": 2.0219, + "loss_pixel": 0.1664, + "loss_text": 1.2351, + "ppl": 4.0613, + "step": 10987 + }, + { + "epoch": 0.06, + "global_step": 10988, + "learning_rate": 0.00045497495826377294, + "loss": 1.4057, + "loss_base2": 2.028, + "loss_pixel": 0.1675, + "loss_text": 1.2382, + "ppl": 4.0784, + "step": 10988 + }, + { + "epoch": 0.06, + "global_step": 10989, + "learning_rate": 0.00045497078464106844, + "loss": 1.3951, + "loss_base2": 2.0127, + "loss_pixel": 0.1707, + "loss_text": 1.2245, + "ppl": 4.0354, + "step": 10989 + }, + { + "epoch": 0.06, + "global_step": 10990, + "learning_rate": 0.00045496661101836395, + "loss": 1.4006, + "loss_base2": 2.0206, + "loss_pixel": 0.1703, + "loss_text": 1.2303, + "ppl": 4.0576, + "step": 10990 + }, + { + "epoch": 0.06, + "global_step": 10991, + "learning_rate": 0.00045496243739565946, + "loss": 1.4221, + "loss_base2": 2.0517, + "loss_pixel": 0.1747, + "loss_text": 1.2474, + "ppl": 4.1458, + "step": 10991 + }, + { + "epoch": 0.06, + "global_step": 10992, + "learning_rate": 0.00045495826377295497, + "loss": 1.3955, + "loss_base2": 2.0133, + "loss_pixel": 0.175, + "loss_text": 1.2205, + "ppl": 4.037, + "step": 10992 + }, + { + "epoch": 0.06, + "global_step": 10993, + "learning_rate": 0.0004549540901502504, + "loss": 1.3859, + "loss_base2": 1.9994, + "loss_pixel": 0.174, + "loss_text": 1.2119, + "ppl": 3.9984, + "step": 10993 + }, + { + "epoch": 0.06, + "global_step": 10994, + "learning_rate": 0.0004549499165275459, + "loss": 1.4065, + "loss_base2": 2.0292, + "loss_pixel": 0.175, + "loss_text": 1.2315, + "ppl": 4.0816, + "step": 10994 + }, + { + "epoch": 0.06, + "global_step": 10995, + "learning_rate": 0.00045494574290484143, + "loss": 1.4104, + "loss_base2": 2.0348, + "loss_pixel": 0.1743, + "loss_text": 1.2361, + "ppl": 4.0976, + "step": 10995 + }, + { + "epoch": 0.06, + "global_step": 10996, + "learning_rate": 0.00045494156928213694, + "loss": 1.4277, + "loss_base2": 2.0597, + "loss_pixel": 0.1722, + "loss_text": 1.2555, + "ppl": 4.1691, + "step": 10996 + }, + { + "epoch": 0.06, + "global_step": 10997, + "learning_rate": 0.0004549373956594324, + "loss": 1.3828, + "loss_base2": 1.995, + "loss_pixel": 0.1735, + "loss_text": 1.2093, + "ppl": 3.986, + "step": 10997 + }, + { + "epoch": 0.06, + "global_step": 10998, + "learning_rate": 0.0004549332220367279, + "loss": 1.4179, + "loss_base2": 2.0456, + "loss_pixel": 0.1715, + "loss_text": 1.2464, + "ppl": 4.1284, + "step": 10998 + }, + { + "epoch": 0.06, + "global_step": 10999, + "learning_rate": 0.0004549290484140234, + "loss": 1.416, + "loss_base2": 2.0429, + "loss_pixel": 0.172, + "loss_text": 1.2441, + "ppl": 4.1206, + "step": 10999 + }, + { + "epoch": 0.06, + "global_step": 11000, + "learning_rate": 0.00045492487479131886, + "loss": 1.4156, + "loss_base2": 2.0423, + "loss_pixel": 0.173, + "loss_text": 1.2427, + "ppl": 4.119, + "step": 11000 + }, + { + "epoch": 0.06, + "global_step": 11001, + "learning_rate": 0.00045492070116861437, + "loss": 1.405, + "loss_base2": 2.027, + "loss_pixel": 0.1726, + "loss_text": 1.2323, + "ppl": 4.0755, + "step": 11001 + }, + { + "epoch": 0.06, + "global_step": 11002, + "learning_rate": 0.0004549165275459098, + "loss": 1.4163, + "loss_base2": 2.0433, + "loss_pixel": 0.1784, + "loss_text": 1.2379, + "ppl": 4.1218, + "step": 11002 + }, + { + "epoch": 0.06, + "global_step": 11003, + "learning_rate": 0.00045491235392320533, + "loss": 1.4082, + "loss_base2": 2.0316, + "loss_pixel": 0.1787, + "loss_text": 1.2295, + "ppl": 4.0886, + "step": 11003 + }, + { + "epoch": 0.06, + "global_step": 11004, + "learning_rate": 0.00045490818030050084, + "loss": 1.4155, + "loss_base2": 2.0421, + "loss_pixel": 0.1764, + "loss_text": 1.2391, + "ppl": 4.1185, + "step": 11004 + }, + { + "epoch": 0.06, + "global_step": 11005, + "learning_rate": 0.00045490400667779634, + "loss": 1.4054, + "loss_base2": 2.0276, + "loss_pixel": 0.1707, + "loss_text": 1.2347, + "ppl": 4.0772, + "step": 11005 + }, + { + "epoch": 0.06, + "global_step": 11006, + "learning_rate": 0.0004548998330550918, + "loss": 1.3956, + "loss_base2": 2.0134, + "loss_pixel": 0.1699, + "loss_text": 1.2257, + "ppl": 4.0374, + "step": 11006 + }, + { + "epoch": 0.06, + "global_step": 11007, + "learning_rate": 0.0004548956594323873, + "loss": 1.3986, + "loss_base2": 2.0178, + "loss_pixel": 0.1686, + "loss_text": 1.23, + "ppl": 4.0495, + "step": 11007 + }, + { + "epoch": 0.06, + "global_step": 11008, + "learning_rate": 0.0004548914858096828, + "loss": 1.4092, + "loss_base2": 2.033, + "loss_pixel": 0.1684, + "loss_text": 1.2407, + "ppl": 4.0927, + "step": 11008 + }, + { + "epoch": 0.06, + "global_step": 11009, + "learning_rate": 0.0004548873121869783, + "loss": 1.4136, + "loss_base2": 2.0394, + "loss_pixel": 0.1708, + "loss_text": 1.2428, + "ppl": 4.1107, + "step": 11009 + }, + { + "epoch": 0.06, + "global_step": 11010, + "learning_rate": 0.0004548831385642738, + "loss": 1.4108, + "loss_base2": 2.0354, + "loss_pixel": 0.1692, + "loss_text": 1.2416, + "ppl": 4.0992, + "step": 11010 + }, + { + "epoch": 0.06, + "global_step": 11011, + "learning_rate": 0.0004548789649415693, + "loss": 1.4772, + "loss_base2": 2.1311, + "loss_pixel": 0.1684, + "loss_text": 1.3089, + "ppl": 4.3807, + "step": 11011 + }, + { + "epoch": 0.06, + "global_step": 11012, + "learning_rate": 0.0004548747913188648, + "loss": 1.4758, + "loss_base2": 2.1291, + "loss_pixel": 0.1702, + "loss_text": 1.3056, + "ppl": 4.3745, + "step": 11012 + }, + { + "epoch": 0.06, + "global_step": 11013, + "learning_rate": 0.0004548706176961603, + "loss": 1.4054, + "loss_base2": 2.0276, + "loss_pixel": 0.1674, + "loss_text": 1.238, + "ppl": 4.0772, + "step": 11013 + }, + { + "epoch": 0.06, + "global_step": 11014, + "learning_rate": 0.0004548664440734558, + "loss": 1.3979, + "loss_base2": 2.0167, + "loss_pixel": 0.1679, + "loss_text": 1.23, + "ppl": 4.0467, + "step": 11014 + }, + { + "epoch": 0.06, + "global_step": 11015, + "learning_rate": 0.00045486227045075125, + "loss": 1.4057, + "loss_base2": 2.028, + "loss_pixel": 0.1678, + "loss_text": 1.238, + "ppl": 4.0784, + "step": 11015 + }, + { + "epoch": 0.06, + "global_step": 11016, + "learning_rate": 0.00045485809682804676, + "loss": 1.4002, + "loss_base2": 2.0201, + "loss_pixel": 0.1698, + "loss_text": 1.2304, + "ppl": 4.056, + "step": 11016 + }, + { + "epoch": 0.06, + "global_step": 11017, + "learning_rate": 0.00045485392320534227, + "loss": 1.3833, + "loss_base2": 1.9957, + "loss_pixel": 0.1676, + "loss_text": 1.2157, + "ppl": 3.988, + "step": 11017 + }, + { + "epoch": 0.06, + "global_step": 11018, + "learning_rate": 0.0004548497495826378, + "loss": 1.395, + "loss_base2": 2.0126, + "loss_pixel": 0.1677, + "loss_text": 1.2273, + "ppl": 4.035, + "step": 11018 + }, + { + "epoch": 0.06, + "global_step": 11019, + "learning_rate": 0.00045484557595993323, + "loss": 1.3812, + "loss_base2": 1.9927, + "loss_pixel": 0.1663, + "loss_text": 1.2149, + "ppl": 3.9797, + "step": 11019 + }, + { + "epoch": 0.06, + "global_step": 11020, + "learning_rate": 0.0004548414023372287, + "loss": 1.3984, + "loss_base2": 2.0175, + "loss_pixel": 0.1683, + "loss_text": 1.2302, + "ppl": 4.0487, + "step": 11020 + }, + { + "epoch": 0.06, + "global_step": 11021, + "learning_rate": 0.0004548372287145242, + "loss": 1.4154, + "loss_base2": 2.042, + "loss_pixel": 0.1668, + "loss_text": 1.2486, + "ppl": 4.1181, + "step": 11021 + }, + { + "epoch": 0.06, + "global_step": 11022, + "learning_rate": 0.0004548330550918197, + "loss": 1.3992, + "loss_base2": 2.0186, + "loss_pixel": 0.167, + "loss_text": 1.2323, + "ppl": 4.052, + "step": 11022 + }, + { + "epoch": 0.06, + "global_step": 11023, + "learning_rate": 0.0004548288814691152, + "loss": 1.3933, + "loss_base2": 2.0101, + "loss_pixel": 0.1672, + "loss_text": 1.2262, + "ppl": 4.0281, + "step": 11023 + }, + { + "epoch": 0.06, + "global_step": 11024, + "learning_rate": 0.00045482470784641066, + "loss": 1.3865, + "loss_base2": 2.0003, + "loss_pixel": 0.1672, + "loss_text": 1.2193, + "ppl": 4.0008, + "step": 11024 + }, + { + "epoch": 0.06, + "global_step": 11025, + "learning_rate": 0.00045482053422370616, + "loss": 1.3932, + "loss_base2": 2.01, + "loss_pixel": 0.1649, + "loss_text": 1.2283, + "ppl": 4.0277, + "step": 11025 + }, + { + "epoch": 0.06, + "global_step": 11026, + "learning_rate": 0.00045481636060100167, + "loss": 1.4004, + "loss_base2": 2.0204, + "loss_pixel": 0.166, + "loss_text": 1.2345, + "ppl": 4.0568, + "step": 11026 + }, + { + "epoch": 0.06, + "global_step": 11027, + "learning_rate": 0.0004548121869782972, + "loss": 1.405, + "loss_base2": 2.027, + "loss_pixel": 0.1658, + "loss_text": 1.2392, + "ppl": 4.0755, + "step": 11027 + }, + { + "epoch": 0.06, + "global_step": 11028, + "learning_rate": 0.0004548080133555927, + "loss": 1.3794, + "loss_base2": 1.9901, + "loss_pixel": 0.1664, + "loss_text": 1.213, + "ppl": 3.9725, + "step": 11028 + }, + { + "epoch": 0.06, + "global_step": 11029, + "learning_rate": 0.00045480383973288814, + "loss": 1.389, + "loss_base2": 2.0039, + "loss_pixel": 0.1673, + "loss_text": 1.2217, + "ppl": 4.0108, + "step": 11029 + }, + { + "epoch": 0.06, + "global_step": 11030, + "learning_rate": 0.00045479966611018365, + "loss": 1.3826, + "loss_base2": 1.9947, + "loss_pixel": 0.1666, + "loss_text": 1.216, + "ppl": 3.9852, + "step": 11030 + }, + { + "epoch": 0.06, + "global_step": 11031, + "learning_rate": 0.00045479549248747915, + "loss": 1.3943, + "loss_base2": 2.0115, + "loss_pixel": 0.1661, + "loss_text": 1.2282, + "ppl": 4.0322, + "step": 11031 + }, + { + "epoch": 0.06, + "global_step": 11032, + "learning_rate": 0.00045479131886477466, + "loss": 1.4007, + "loss_base2": 2.0208, + "loss_pixel": 0.1662, + "loss_text": 1.2346, + "ppl": 4.058, + "step": 11032 + }, + { + "epoch": 0.06, + "global_step": 11033, + "learning_rate": 0.0004547871452420701, + "loss": 1.4104, + "loss_base2": 2.0348, + "loss_pixel": 0.1666, + "loss_text": 1.2438, + "ppl": 4.0976, + "step": 11033 + }, + { + "epoch": 0.06, + "global_step": 11034, + "learning_rate": 0.0004547829716193656, + "loss": 1.3925, + "loss_base2": 2.009, + "loss_pixel": 0.1663, + "loss_text": 1.2261, + "ppl": 4.0249, + "step": 11034 + }, + { + "epoch": 0.06, + "global_step": 11035, + "learning_rate": 0.00045477879799666113, + "loss": 1.3972, + "loss_base2": 2.0157, + "loss_pixel": 0.1665, + "loss_text": 1.2307, + "ppl": 4.0439, + "step": 11035 + }, + { + "epoch": 0.06, + "global_step": 11036, + "learning_rate": 0.00045477462437395664, + "loss": 1.4541, + "loss_base2": 2.0978, + "loss_pixel": 0.165, + "loss_text": 1.289, + "ppl": 4.2806, + "step": 11036 + }, + { + "epoch": 0.06, + "global_step": 11037, + "learning_rate": 0.00045477045075125214, + "loss": 1.5857, + "loss_base2": 2.2877, + "loss_pixel": 0.1663, + "loss_text": 1.4194, + "ppl": 4.8827, + "step": 11037 + }, + { + "epoch": 0.06, + "global_step": 11038, + "learning_rate": 0.00045476627712854754, + "loss": 1.6459, + "loss_base2": 2.3745, + "loss_pixel": 0.1648, + "loss_text": 1.4811, + "ppl": 5.1857, + "step": 11038 + }, + { + "epoch": 0.06, + "global_step": 11039, + "learning_rate": 0.00045476210350584305, + "loss": 1.6323, + "loss_base2": 2.3549, + "loss_pixel": 0.1674, + "loss_text": 1.4649, + "ppl": 5.1156, + "step": 11039 + }, + { + "epoch": 0.06, + "global_step": 11040, + "learning_rate": 0.00045475792988313856, + "loss": 1.6402, + "loss_base2": 2.3663, + "loss_pixel": 0.1659, + "loss_text": 1.4743, + "ppl": 5.1562, + "step": 11040 + }, + { + "epoch": 0.06, + "global_step": 11041, + "learning_rate": 0.00045475375626043407, + "loss": 1.6359, + "loss_base2": 2.3601, + "loss_pixel": 0.1685, + "loss_text": 1.4675, + "ppl": 5.1341, + "step": 11041 + }, + { + "epoch": 0.06, + "global_step": 11042, + "learning_rate": 0.00045474958263772957, + "loss": 1.6199, + "loss_base2": 2.337, + "loss_pixel": 0.1663, + "loss_text": 1.4536, + "ppl": 5.0526, + "step": 11042 + }, + { + "epoch": 0.06, + "global_step": 11043, + "learning_rate": 0.000454745409015025, + "loss": 1.6444, + "loss_base2": 2.3724, + "loss_pixel": 0.1664, + "loss_text": 1.478, + "ppl": 5.1779, + "step": 11043 + }, + { + "epoch": 0.06, + "global_step": 11044, + "learning_rate": 0.00045474123539232053, + "loss": 1.6328, + "loss_base2": 2.3556, + "loss_pixel": 0.1674, + "loss_text": 1.4654, + "ppl": 5.1182, + "step": 11044 + }, + { + "epoch": 0.06, + "global_step": 11045, + "learning_rate": 0.00045473706176961604, + "loss": 1.6509, + "loss_base2": 2.3817, + "loss_pixel": 0.1666, + "loss_text": 1.4843, + "ppl": 5.2117, + "step": 11045 + }, + { + "epoch": 0.06, + "global_step": 11046, + "learning_rate": 0.00045473288814691155, + "loss": 1.6247, + "loss_base2": 2.3439, + "loss_pixel": 0.1664, + "loss_text": 1.4583, + "ppl": 5.0769, + "step": 11046 + }, + { + "epoch": 0.06, + "global_step": 11047, + "learning_rate": 0.000454728714524207, + "loss": 1.6444, + "loss_base2": 2.3724, + "loss_pixel": 0.1674, + "loss_text": 1.4771, + "ppl": 5.1779, + "step": 11047 + }, + { + "epoch": 0.06, + "global_step": 11048, + "learning_rate": 0.0004547245409015025, + "loss": 1.6213, + "loss_base2": 2.339, + "loss_pixel": 0.1647, + "loss_text": 1.4565, + "ppl": 5.0597, + "step": 11048 + }, + { + "epoch": 0.06, + "global_step": 11049, + "learning_rate": 0.000454720367278798, + "loss": 1.6222, + "loss_base2": 2.3403, + "loss_pixel": 0.1663, + "loss_text": 1.4559, + "ppl": 5.0642, + "step": 11049 + }, + { + "epoch": 0.06, + "global_step": 11050, + "learning_rate": 0.0004547161936560935, + "loss": 1.6305, + "loss_base2": 2.3523, + "loss_pixel": 0.1656, + "loss_text": 1.4649, + "ppl": 5.1064, + "step": 11050 + }, + { + "epoch": 0.06, + "global_step": 11051, + "learning_rate": 0.00045471202003338903, + "loss": 1.6384, + "loss_base2": 2.3637, + "loss_pixel": 0.1659, + "loss_text": 1.4724, + "ppl": 5.1469, + "step": 11051 + }, + { + "epoch": 0.06, + "global_step": 11052, + "learning_rate": 0.0004547078464106845, + "loss": 1.6162, + "loss_base2": 2.3317, + "loss_pixel": 0.1659, + "loss_text": 1.4503, + "ppl": 5.0339, + "step": 11052 + }, + { + "epoch": 0.06, + "global_step": 11053, + "learning_rate": 0.00045470367278798, + "loss": 1.6211, + "loss_base2": 2.3388, + "loss_pixel": 0.1655, + "loss_text": 1.4556, + "ppl": 5.0587, + "step": 11053 + }, + { + "epoch": 0.06, + "global_step": 11054, + "learning_rate": 0.0004546994991652755, + "loss": 1.6274, + "loss_base2": 2.3478, + "loss_pixel": 0.1656, + "loss_text": 1.4618, + "ppl": 5.0906, + "step": 11054 + }, + { + "epoch": 0.06, + "global_step": 11055, + "learning_rate": 0.000454695325542571, + "loss": 1.622, + "loss_base2": 2.3401, + "loss_pixel": 0.167, + "loss_text": 1.455, + "ppl": 5.0632, + "step": 11055 + }, + { + "epoch": 0.06, + "global_step": 11056, + "learning_rate": 0.0004546911519198664, + "loss": 1.6302, + "loss_base2": 2.3519, + "loss_pixel": 0.1657, + "loss_text": 1.4645, + "ppl": 5.1049, + "step": 11056 + }, + { + "epoch": 0.06, + "global_step": 11057, + "learning_rate": 0.0004546869782971619, + "loss": 1.6108, + "loss_base2": 2.3239, + "loss_pixel": 0.1664, + "loss_text": 1.4444, + "ppl": 5.0068, + "step": 11057 + }, + { + "epoch": 0.06, + "global_step": 11058, + "learning_rate": 0.0004546828046744574, + "loss": 1.6355, + "loss_base2": 2.3595, + "loss_pixel": 0.1658, + "loss_text": 1.4697, + "ppl": 5.132, + "step": 11058 + }, + { + "epoch": 0.06, + "global_step": 11059, + "learning_rate": 0.0004546786310517529, + "loss": 1.4261, + "loss_base2": 2.0574, + "loss_pixel": 0.1651, + "loss_text": 1.261, + "ppl": 4.1624, + "step": 11059 + }, + { + "epoch": 0.06, + "global_step": 11060, + "learning_rate": 0.00045467445742904843, + "loss": 1.4039, + "loss_base2": 2.0254, + "loss_pixel": 0.1661, + "loss_text": 1.2378, + "ppl": 4.071, + "step": 11060 + }, + { + "epoch": 0.06, + "global_step": 11061, + "learning_rate": 0.0004546702838063439, + "loss": 1.4143, + "loss_base2": 2.0404, + "loss_pixel": 0.1649, + "loss_text": 1.2494, + "ppl": 4.1136, + "step": 11061 + }, + { + "epoch": 0.06, + "global_step": 11062, + "learning_rate": 0.0004546661101836394, + "loss": 1.4081, + "loss_base2": 2.0315, + "loss_pixel": 0.165, + "loss_text": 1.2431, + "ppl": 4.0882, + "step": 11062 + }, + { + "epoch": 0.06, + "global_step": 11063, + "learning_rate": 0.0004546619365609349, + "loss": 1.3792, + "loss_base2": 1.9898, + "loss_pixel": 0.1684, + "loss_text": 1.2107, + "ppl": 3.9717, + "step": 11063 + }, + { + "epoch": 0.06, + "global_step": 11064, + "learning_rate": 0.0004546577629382304, + "loss": 1.3959, + "loss_base2": 2.0139, + "loss_pixel": 0.165, + "loss_text": 1.2309, + "ppl": 4.0386, + "step": 11064 + }, + { + "epoch": 0.06, + "global_step": 11065, + "learning_rate": 0.00045465358931552586, + "loss": 1.3883, + "loss_base2": 2.0029, + "loss_pixel": 0.1651, + "loss_text": 1.2232, + "ppl": 4.008, + "step": 11065 + }, + { + "epoch": 0.06, + "global_step": 11066, + "learning_rate": 0.00045464941569282137, + "loss": 1.5268, + "loss_base2": 2.2027, + "loss_pixel": 0.1647, + "loss_text": 1.3621, + "ppl": 4.6034, + "step": 11066 + }, + { + "epoch": 0.06, + "global_step": 11067, + "learning_rate": 0.0004546452420701169, + "loss": 1.627, + "loss_base2": 2.3473, + "loss_pixel": 0.1647, + "loss_text": 1.4622, + "ppl": 5.0886, + "step": 11067 + }, + { + "epoch": 0.06, + "global_step": 11068, + "learning_rate": 0.0004546410684474124, + "loss": 1.6228, + "loss_base2": 2.3412, + "loss_pixel": 0.1679, + "loss_text": 1.4548, + "ppl": 5.0673, + "step": 11068 + }, + { + "epoch": 0.06, + "global_step": 11069, + "learning_rate": 0.0004546368948247079, + "loss": 1.6276, + "loss_base2": 2.3481, + "loss_pixel": 0.1702, + "loss_text": 1.4575, + "ppl": 5.0916, + "step": 11069 + }, + { + "epoch": 0.06, + "global_step": 11070, + "learning_rate": 0.00045463272120200334, + "loss": 1.6523, + "loss_base2": 2.3838, + "loss_pixel": 0.1719, + "loss_text": 1.4804, + "ppl": 5.219, + "step": 11070 + }, + { + "epoch": 0.06, + "global_step": 11071, + "learning_rate": 0.00045462854757929885, + "loss": 1.6376, + "loss_base2": 2.3626, + "loss_pixel": 0.1665, + "loss_text": 1.4711, + "ppl": 5.1428, + "step": 11071 + }, + { + "epoch": 0.06, + "global_step": 11072, + "learning_rate": 0.00045462437395659436, + "loss": 1.6312, + "loss_base2": 2.3533, + "loss_pixel": 0.1657, + "loss_text": 1.4654, + "ppl": 5.11, + "step": 11072 + }, + { + "epoch": 0.06, + "global_step": 11073, + "learning_rate": 0.00045462020033388987, + "loss": 1.6242, + "loss_base2": 2.3432, + "loss_pixel": 0.1651, + "loss_text": 1.4591, + "ppl": 5.0744, + "step": 11073 + }, + { + "epoch": 0.06, + "global_step": 11074, + "learning_rate": 0.0004546160267111853, + "loss": 1.6367, + "loss_base2": 2.3613, + "loss_pixel": 0.1651, + "loss_text": 1.4715, + "ppl": 5.1382, + "step": 11074 + }, + { + "epoch": 0.06, + "global_step": 11075, + "learning_rate": 0.00045461185308848077, + "loss": 1.634, + "loss_base2": 2.3574, + "loss_pixel": 0.1651, + "loss_text": 1.4689, + "ppl": 5.1243, + "step": 11075 + }, + { + "epoch": 0.06, + "global_step": 11076, + "learning_rate": 0.0004546076794657763, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.1641, + "loss_text": 1.4689, + "ppl": 5.1187, + "step": 11076 + }, + { + "epoch": 0.06, + "global_step": 11077, + "learning_rate": 0.0004546035058430718, + "loss": 1.615, + "loss_base2": 2.33, + "loss_pixel": 0.1641, + "loss_text": 1.4509, + "ppl": 5.0279, + "step": 11077 + }, + { + "epoch": 0.06, + "global_step": 11078, + "learning_rate": 0.0004545993322203673, + "loss": 1.6209, + "loss_base2": 2.3385, + "loss_pixel": 0.1665, + "loss_text": 1.4544, + "ppl": 5.0576, + "step": 11078 + }, + { + "epoch": 0.06, + "global_step": 11079, + "learning_rate": 0.00045459515859766275, + "loss": 1.6327, + "loss_base2": 2.3555, + "loss_pixel": 0.1652, + "loss_text": 1.4675, + "ppl": 5.1177, + "step": 11079 + }, + { + "epoch": 0.06, + "global_step": 11080, + "learning_rate": 0.00045459098497495825, + "loss": 1.6232, + "loss_base2": 2.3418, + "loss_pixel": 0.1641, + "loss_text": 1.4591, + "ppl": 5.0693, + "step": 11080 + }, + { + "epoch": 0.06, + "global_step": 11081, + "learning_rate": 0.00045458681135225376, + "loss": 1.6306, + "loss_base2": 2.3525, + "loss_pixel": 0.1655, + "loss_text": 1.465, + "ppl": 5.1069, + "step": 11081 + }, + { + "epoch": 0.06, + "global_step": 11082, + "learning_rate": 0.00045458263772954927, + "loss": 1.6006, + "loss_base2": 2.3092, + "loss_pixel": 0.1643, + "loss_text": 1.4364, + "ppl": 4.956, + "step": 11082 + }, + { + "epoch": 0.06, + "global_step": 11083, + "learning_rate": 0.0004545784641068447, + "loss": 1.6088, + "loss_base2": 2.321, + "loss_pixel": 0.1634, + "loss_text": 1.4454, + "ppl": 4.9968, + "step": 11083 + }, + { + "epoch": 0.06, + "global_step": 11084, + "learning_rate": 0.00045457429048414023, + "loss": 1.6228, + "loss_base2": 2.3412, + "loss_pixel": 0.1642, + "loss_text": 1.4587, + "ppl": 5.0673, + "step": 11084 + }, + { + "epoch": 0.06, + "global_step": 11085, + "learning_rate": 0.00045457011686143574, + "loss": 1.5967, + "loss_base2": 2.3036, + "loss_pixel": 0.1642, + "loss_text": 1.4325, + "ppl": 4.9367, + "step": 11085 + }, + { + "epoch": 0.06, + "global_step": 11086, + "learning_rate": 0.00045456594323873124, + "loss": 1.622, + "loss_base2": 2.3401, + "loss_pixel": 0.1645, + "loss_text": 1.4575, + "ppl": 5.0632, + "step": 11086 + }, + { + "epoch": 0.06, + "global_step": 11087, + "learning_rate": 0.00045456176961602675, + "loss": 1.5638, + "loss_base2": 2.2561, + "loss_pixel": 0.164, + "loss_text": 1.3999, + "ppl": 4.7769, + "step": 11087 + }, + { + "epoch": 0.06, + "global_step": 11088, + "learning_rate": 0.0004545575959933222, + "loss": 1.4157, + "loss_base2": 2.0424, + "loss_pixel": 0.1663, + "loss_text": 1.2494, + "ppl": 4.1194, + "step": 11088 + }, + { + "epoch": 0.06, + "global_step": 11089, + "learning_rate": 0.0004545534223706177, + "loss": 1.4214, + "loss_base2": 2.0506, + "loss_pixel": 0.1635, + "loss_text": 1.2579, + "ppl": 4.1429, + "step": 11089 + }, + { + "epoch": 0.06, + "global_step": 11090, + "learning_rate": 0.0004545492487479132, + "loss": 1.4097, + "loss_base2": 2.0338, + "loss_pixel": 0.1647, + "loss_text": 1.245, + "ppl": 4.0947, + "step": 11090 + }, + { + "epoch": 0.06, + "global_step": 11091, + "learning_rate": 0.0004545450751252087, + "loss": 1.4177, + "loss_base2": 2.0453, + "loss_pixel": 0.1646, + "loss_text": 1.2531, + "ppl": 4.1276, + "step": 11091 + }, + { + "epoch": 0.06, + "global_step": 11092, + "learning_rate": 0.0004545409015025042, + "loss": 1.3927, + "loss_base2": 2.0092, + "loss_pixel": 0.1639, + "loss_text": 1.2288, + "ppl": 4.0257, + "step": 11092 + }, + { + "epoch": 0.06, + "global_step": 11093, + "learning_rate": 0.0004545367278797997, + "loss": 1.397, + "loss_base2": 2.0154, + "loss_pixel": 0.1658, + "loss_text": 1.2312, + "ppl": 4.0431, + "step": 11093 + }, + { + "epoch": 0.06, + "global_step": 11094, + "learning_rate": 0.00045453255425709514, + "loss": 1.3815, + "loss_base2": 1.9931, + "loss_pixel": 0.1646, + "loss_text": 1.217, + "ppl": 3.9809, + "step": 11094 + }, + { + "epoch": 0.06, + "global_step": 11095, + "learning_rate": 0.00045452838063439065, + "loss": 1.3975, + "loss_base2": 2.0162, + "loss_pixel": 0.1633, + "loss_text": 1.2341, + "ppl": 4.0451, + "step": 11095 + }, + { + "epoch": 0.06, + "global_step": 11096, + "learning_rate": 0.00045452420701168615, + "loss": 1.6435, + "loss_base2": 2.3711, + "loss_pixel": 0.1647, + "loss_text": 1.4788, + "ppl": 5.1732, + "step": 11096 + }, + { + "epoch": 0.06, + "global_step": 11097, + "learning_rate": 0.0004545200333889816, + "loss": 1.6425, + "loss_base2": 2.3696, + "loss_pixel": 0.1628, + "loss_text": 1.4797, + "ppl": 5.1681, + "step": 11097 + }, + { + "epoch": 0.06, + "global_step": 11098, + "learning_rate": 0.0004545158597662771, + "loss": 1.6427, + "loss_base2": 2.3699, + "loss_pixel": 0.1645, + "loss_text": 1.4782, + "ppl": 5.1691, + "step": 11098 + }, + { + "epoch": 0.06, + "global_step": 11099, + "learning_rate": 0.0004545116861435726, + "loss": 1.6326, + "loss_base2": 2.3553, + "loss_pixel": 0.1639, + "loss_text": 1.4687, + "ppl": 5.1172, + "step": 11099 + }, + { + "epoch": 0.06, + "global_step": 11100, + "learning_rate": 0.00045450751252086813, + "loss": 1.6034, + "loss_base2": 2.3132, + "loss_pixel": 0.1635, + "loss_text": 1.4399, + "ppl": 4.9699, + "step": 11100 + }, + { + "epoch": 0.06, + "global_step": 11101, + "learning_rate": 0.00045450333889816364, + "loss": 1.6396, + "loss_base2": 2.3654, + "loss_pixel": 0.1642, + "loss_text": 1.4754, + "ppl": 5.1531, + "step": 11101 + }, + { + "epoch": 0.06, + "global_step": 11102, + "learning_rate": 0.0004544991652754591, + "loss": 1.6173, + "loss_base2": 2.3333, + "loss_pixel": 0.1638, + "loss_text": 1.4535, + "ppl": 5.0395, + "step": 11102 + }, + { + "epoch": 0.06, + "global_step": 11103, + "learning_rate": 0.0004544949916527546, + "loss": 1.6279, + "loss_base2": 2.3486, + "loss_pixel": 0.164, + "loss_text": 1.4639, + "ppl": 5.0932, + "step": 11103 + }, + { + "epoch": 0.06, + "global_step": 11104, + "learning_rate": 0.0004544908180300501, + "loss": 1.6334, + "loss_base2": 2.3565, + "loss_pixel": 0.1633, + "loss_text": 1.4701, + "ppl": 5.1213, + "step": 11104 + }, + { + "epoch": 0.06, + "global_step": 11105, + "learning_rate": 0.0004544866444073456, + "loss": 1.6277, + "loss_base2": 2.3483, + "loss_pixel": 0.1635, + "loss_text": 1.4642, + "ppl": 5.0921, + "step": 11105 + }, + { + "epoch": 0.06, + "global_step": 11106, + "learning_rate": 0.00045448247078464107, + "loss": 1.6324, + "loss_base2": 2.3551, + "loss_pixel": 0.1644, + "loss_text": 1.468, + "ppl": 5.1161, + "step": 11106 + }, + { + "epoch": 0.06, + "global_step": 11107, + "learning_rate": 0.00045447829716193657, + "loss": 1.6332, + "loss_base2": 2.3562, + "loss_pixel": 0.1639, + "loss_text": 1.4693, + "ppl": 5.1202, + "step": 11107 + }, + { + "epoch": 0.06, + "global_step": 11108, + "learning_rate": 0.0004544741235392321, + "loss": 1.62, + "loss_base2": 2.3372, + "loss_pixel": 0.1629, + "loss_text": 1.457, + "ppl": 5.0531, + "step": 11108 + }, + { + "epoch": 0.06, + "global_step": 11109, + "learning_rate": 0.0004544699499165276, + "loss": 1.621, + "loss_base2": 2.3386, + "loss_pixel": 0.1646, + "loss_text": 1.4564, + "ppl": 5.0581, + "step": 11109 + }, + { + "epoch": 0.06, + "global_step": 11110, + "learning_rate": 0.0004544657762938231, + "loss": 1.6276, + "loss_base2": 2.3481, + "loss_pixel": 0.163, + "loss_text": 1.4646, + "ppl": 5.0916, + "step": 11110 + }, + { + "epoch": 0.06, + "global_step": 11111, + "learning_rate": 0.00045446160267111855, + "loss": 1.6198, + "loss_base2": 2.3369, + "loss_pixel": 0.1645, + "loss_text": 1.4553, + "ppl": 5.0521, + "step": 11111 + }, + { + "epoch": 0.06, + "global_step": 11112, + "learning_rate": 0.00045445742904841405, + "loss": 1.6086, + "loss_base2": 2.3207, + "loss_pixel": 0.1645, + "loss_text": 1.444, + "ppl": 4.9958, + "step": 11112 + }, + { + "epoch": 0.06, + "global_step": 11113, + "learning_rate": 0.0004544532554257095, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.1622, + "loss_text": 1.4643, + "ppl": 5.0855, + "step": 11113 + }, + { + "epoch": 0.06, + "global_step": 11114, + "learning_rate": 0.000454449081803005, + "loss": 1.6148, + "loss_base2": 2.3297, + "loss_pixel": 0.1629, + "loss_text": 1.4519, + "ppl": 5.0269, + "step": 11114 + }, + { + "epoch": 0.06, + "global_step": 11115, + "learning_rate": 0.00045444490818030047, + "loss": 1.6161, + "loss_base2": 2.3315, + "loss_pixel": 0.1633, + "loss_text": 1.4528, + "ppl": 5.0334, + "step": 11115 + }, + { + "epoch": 0.06, + "global_step": 11116, + "learning_rate": 0.000454440734557596, + "loss": 1.6331, + "loss_base2": 2.3561, + "loss_pixel": 0.1637, + "loss_text": 1.4694, + "ppl": 5.1197, + "step": 11116 + }, + { + "epoch": 0.06, + "global_step": 11117, + "learning_rate": 0.0004544365609348915, + "loss": 1.5753, + "loss_base2": 2.2727, + "loss_pixel": 0.1633, + "loss_text": 1.412, + "ppl": 4.8322, + "step": 11117 + }, + { + "epoch": 0.06, + "global_step": 11118, + "learning_rate": 0.000454432387312187, + "loss": 1.5949, + "loss_base2": 2.301, + "loss_pixel": 0.1644, + "loss_text": 1.4305, + "ppl": 4.9278, + "step": 11118 + }, + { + "epoch": 0.06, + "global_step": 11119, + "learning_rate": 0.0004544282136894825, + "loss": 1.5997, + "loss_base2": 2.3079, + "loss_pixel": 0.1634, + "loss_text": 1.4363, + "ppl": 4.9515, + "step": 11119 + }, + { + "epoch": 0.06, + "global_step": 11120, + "learning_rate": 0.00045442404006677795, + "loss": 1.6295, + "loss_base2": 2.3509, + "loss_pixel": 0.164, + "loss_text": 1.4655, + "ppl": 5.1013, + "step": 11120 + }, + { + "epoch": 0.06, + "global_step": 11121, + "learning_rate": 0.00045441986644407346, + "loss": 1.6318, + "loss_base2": 2.3542, + "loss_pixel": 0.1663, + "loss_text": 1.4656, + "ppl": 5.1131, + "step": 11121 + }, + { + "epoch": 0.06, + "global_step": 11122, + "learning_rate": 0.00045441569282136897, + "loss": 1.6085, + "loss_base2": 2.3206, + "loss_pixel": 0.1632, + "loss_text": 1.4453, + "ppl": 4.9953, + "step": 11122 + }, + { + "epoch": 0.06, + "global_step": 11123, + "learning_rate": 0.00045441151919866447, + "loss": 1.6164, + "loss_base2": 2.332, + "loss_pixel": 0.1638, + "loss_text": 1.4527, + "ppl": 5.0349, + "step": 11123 + }, + { + "epoch": 0.06, + "global_step": 11124, + "learning_rate": 0.0004544073455759599, + "loss": 1.6175, + "loss_base2": 2.3336, + "loss_pixel": 0.1646, + "loss_text": 1.4529, + "ppl": 5.0405, + "step": 11124 + }, + { + "epoch": 0.06, + "global_step": 11125, + "learning_rate": 0.00045440317195325543, + "loss": 1.6235, + "loss_base2": 2.3422, + "loss_pixel": 0.1621, + "loss_text": 1.4613, + "ppl": 5.0708, + "step": 11125 + }, + { + "epoch": 0.06, + "global_step": 11126, + "learning_rate": 0.00045439899833055094, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1627, + "loss_text": 1.461, + "ppl": 5.0718, + "step": 11126 + }, + { + "epoch": 0.06, + "global_step": 11127, + "learning_rate": 0.00045439482470784645, + "loss": 1.6217, + "loss_base2": 2.3396, + "loss_pixel": 0.1631, + "loss_text": 1.4585, + "ppl": 5.0617, + "step": 11127 + }, + { + "epoch": 0.06, + "global_step": 11128, + "learning_rate": 0.00045439065108514196, + "loss": 1.613, + "loss_base2": 2.3271, + "loss_pixel": 0.1652, + "loss_text": 1.4479, + "ppl": 5.0178, + "step": 11128 + }, + { + "epoch": 0.06, + "global_step": 11129, + "learning_rate": 0.0004543864774624374, + "loss": 1.6225, + "loss_base2": 2.3408, + "loss_pixel": 0.1637, + "loss_text": 1.4588, + "ppl": 5.0657, + "step": 11129 + }, + { + "epoch": 0.06, + "global_step": 11130, + "learning_rate": 0.0004543823038397329, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1644, + "loss_text": 1.4593, + "ppl": 5.0718, + "step": 11130 + }, + { + "epoch": 0.06, + "global_step": 11131, + "learning_rate": 0.0004543781302170284, + "loss": 1.64, + "loss_base2": 2.366, + "loss_pixel": 0.1643, + "loss_text": 1.4757, + "ppl": 5.1552, + "step": 11131 + }, + { + "epoch": 0.06, + "global_step": 11132, + "learning_rate": 0.0004543739565943239, + "loss": 1.6309, + "loss_base2": 2.3529, + "loss_pixel": 0.1654, + "loss_text": 1.4654, + "ppl": 5.1085, + "step": 11132 + }, + { + "epoch": 0.06, + "global_step": 11133, + "learning_rate": 0.00045436978297161933, + "loss": 1.631, + "loss_base2": 2.353, + "loss_pixel": 0.164, + "loss_text": 1.4671, + "ppl": 5.109, + "step": 11133 + }, + { + "epoch": 0.06, + "global_step": 11134, + "learning_rate": 0.00045436560934891484, + "loss": 1.6406, + "loss_base2": 2.3669, + "loss_pixel": 0.1638, + "loss_text": 1.4768, + "ppl": 5.1583, + "step": 11134 + }, + { + "epoch": 0.06, + "global_step": 11135, + "learning_rate": 0.00045436143572621034, + "loss": 1.6349, + "loss_base2": 2.3587, + "loss_pixel": 0.1647, + "loss_text": 1.4703, + "ppl": 5.1289, + "step": 11135 + }, + { + "epoch": 0.06, + "global_step": 11136, + "learning_rate": 0.00045435726210350585, + "loss": 1.6082, + "loss_base2": 2.3201, + "loss_pixel": 0.1634, + "loss_text": 1.4448, + "ppl": 4.9938, + "step": 11136 + }, + { + "epoch": 0.06, + "global_step": 11137, + "learning_rate": 0.00045435308848080136, + "loss": 1.6085, + "loss_base2": 2.3206, + "loss_pixel": 0.1643, + "loss_text": 1.4443, + "ppl": 4.9953, + "step": 11137 + }, + { + "epoch": 0.06, + "global_step": 11138, + "learning_rate": 0.0004543489148580968, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1628, + "loss_text": 1.4609, + "ppl": 5.0718, + "step": 11138 + }, + { + "epoch": 0.06, + "global_step": 11139, + "learning_rate": 0.0004543447412353923, + "loss": 1.621, + "loss_base2": 2.3386, + "loss_pixel": 0.163, + "loss_text": 1.4579, + "ppl": 5.0581, + "step": 11139 + }, + { + "epoch": 0.06, + "global_step": 11140, + "learning_rate": 0.0004543405676126878, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.1633, + "loss_text": 1.4462, + "ppl": 5.0003, + "step": 11140 + }, + { + "epoch": 0.06, + "global_step": 11141, + "learning_rate": 0.00045433639398998333, + "loss": 1.6368, + "loss_base2": 2.3614, + "loss_pixel": 0.1636, + "loss_text": 1.4732, + "ppl": 5.1387, + "step": 11141 + }, + { + "epoch": 0.06, + "global_step": 11142, + "learning_rate": 0.0004543322203672788, + "loss": 1.6161, + "loss_base2": 2.3315, + "loss_pixel": 0.1633, + "loss_text": 1.4528, + "ppl": 5.0334, + "step": 11142 + }, + { + "epoch": 0.06, + "global_step": 11143, + "learning_rate": 0.0004543280467445743, + "loss": 1.6234, + "loss_base2": 2.3421, + "loss_pixel": 0.1639, + "loss_text": 1.4595, + "ppl": 5.0703, + "step": 11143 + }, + { + "epoch": 0.06, + "global_step": 11144, + "learning_rate": 0.0004543238731218698, + "loss": 1.6265, + "loss_base2": 2.3465, + "loss_pixel": 0.1631, + "loss_text": 1.4634, + "ppl": 5.086, + "step": 11144 + }, + { + "epoch": 0.06, + "global_step": 11145, + "learning_rate": 0.0004543196994991653, + "loss": 1.5878, + "loss_base2": 2.2907, + "loss_pixel": 0.1638, + "loss_text": 1.424, + "ppl": 4.893, + "step": 11145 + }, + { + "epoch": 0.06, + "global_step": 11146, + "learning_rate": 0.0004543155258764608, + "loss": 1.621, + "loss_base2": 2.3386, + "loss_pixel": 0.1621, + "loss_text": 1.4589, + "ppl": 5.0581, + "step": 11146 + }, + { + "epoch": 0.06, + "global_step": 11147, + "learning_rate": 0.00045431135225375627, + "loss": 1.6126, + "loss_base2": 2.3265, + "loss_pixel": 0.163, + "loss_text": 1.4496, + "ppl": 5.0158, + "step": 11147 + }, + { + "epoch": 0.06, + "global_step": 11148, + "learning_rate": 0.0004543071786310518, + "loss": 1.6371, + "loss_base2": 2.3618, + "loss_pixel": 0.1633, + "loss_text": 1.4738, + "ppl": 5.1402, + "step": 11148 + }, + { + "epoch": 0.06, + "global_step": 11149, + "learning_rate": 0.0004543030050083473, + "loss": 1.6252, + "loss_base2": 2.3447, + "loss_pixel": 0.1642, + "loss_text": 1.461, + "ppl": 5.0794, + "step": 11149 + }, + { + "epoch": 0.06, + "global_step": 11150, + "learning_rate": 0.00045429883138564274, + "loss": 1.6166, + "loss_base2": 2.3323, + "loss_pixel": 0.163, + "loss_text": 1.4536, + "ppl": 5.0359, + "step": 11150 + }, + { + "epoch": 0.06, + "global_step": 11151, + "learning_rate": 0.0004542946577629382, + "loss": 1.6171, + "loss_base2": 2.333, + "loss_pixel": 0.1638, + "loss_text": 1.4533, + "ppl": 5.0385, + "step": 11151 + }, + { + "epoch": 0.06, + "global_step": 11152, + "learning_rate": 0.0004542904841402337, + "loss": 1.6152, + "loss_base2": 2.3302, + "loss_pixel": 0.1631, + "loss_text": 1.4521, + "ppl": 5.0289, + "step": 11152 + }, + { + "epoch": 0.06, + "global_step": 11153, + "learning_rate": 0.0004542863105175292, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1637, + "loss_text": 1.4623, + "ppl": 5.0835, + "step": 11153 + }, + { + "epoch": 0.06, + "global_step": 11154, + "learning_rate": 0.0004542821368948247, + "loss": 1.5984, + "loss_base2": 2.306, + "loss_pixel": 0.163, + "loss_text": 1.4354, + "ppl": 4.9451, + "step": 11154 + }, + { + "epoch": 0.06, + "global_step": 11155, + "learning_rate": 0.0004542779632721202, + "loss": 1.6348, + "loss_base2": 2.3585, + "loss_pixel": 0.164, + "loss_text": 1.4708, + "ppl": 5.1284, + "step": 11155 + }, + { + "epoch": 0.06, + "global_step": 11156, + "learning_rate": 0.00045427378964941567, + "loss": 1.6248, + "loss_base2": 2.3441, + "loss_pixel": 0.1638, + "loss_text": 1.461, + "ppl": 5.0774, + "step": 11156 + }, + { + "epoch": 0.06, + "global_step": 11157, + "learning_rate": 0.0004542696160267112, + "loss": 1.5998, + "loss_base2": 2.308, + "loss_pixel": 0.1639, + "loss_text": 1.436, + "ppl": 4.952, + "step": 11157 + }, + { + "epoch": 0.06, + "global_step": 11158, + "learning_rate": 0.0004542654424040067, + "loss": 1.614, + "loss_base2": 2.3285, + "loss_pixel": 0.1636, + "loss_text": 1.4505, + "ppl": 5.0229, + "step": 11158 + }, + { + "epoch": 0.06, + "global_step": 11159, + "learning_rate": 0.0004542612687813022, + "loss": 1.6105, + "loss_base2": 2.3235, + "loss_pixel": 0.1639, + "loss_text": 1.4466, + "ppl": 5.0053, + "step": 11159 + }, + { + "epoch": 0.06, + "global_step": 11160, + "learning_rate": 0.0004542570951585977, + "loss": 1.6301, + "loss_base2": 2.3517, + "loss_pixel": 0.164, + "loss_text": 1.4661, + "ppl": 5.1044, + "step": 11160 + }, + { + "epoch": 0.06, + "global_step": 11161, + "learning_rate": 0.00045425292153589315, + "loss": 1.6252, + "loss_base2": 2.3447, + "loss_pixel": 0.1633, + "loss_text": 1.4619, + "ppl": 5.0794, + "step": 11161 + }, + { + "epoch": 0.06, + "global_step": 11162, + "learning_rate": 0.00045424874791318866, + "loss": 1.6001, + "loss_base2": 2.3085, + "loss_pixel": 0.1631, + "loss_text": 1.4369, + "ppl": 4.9535, + "step": 11162 + }, + { + "epoch": 0.06, + "global_step": 11163, + "learning_rate": 0.00045424457429048417, + "loss": 1.3966, + "loss_base2": 2.0149, + "loss_pixel": 0.1628, + "loss_text": 1.2337, + "ppl": 4.0414, + "step": 11163 + }, + { + "epoch": 0.06, + "global_step": 11164, + "learning_rate": 0.0004542404006677797, + "loss": 1.4144, + "loss_base2": 2.0405, + "loss_pixel": 0.1632, + "loss_text": 1.2511, + "ppl": 4.114, + "step": 11164 + }, + { + "epoch": 0.06, + "global_step": 11165, + "learning_rate": 0.00045423622704507513, + "loss": 1.3881, + "loss_base2": 2.0026, + "loss_pixel": 0.1629, + "loss_text": 1.2252, + "ppl": 4.0072, + "step": 11165 + }, + { + "epoch": 0.06, + "global_step": 11166, + "learning_rate": 0.00045423205342237064, + "loss": 1.3807, + "loss_base2": 1.9919, + "loss_pixel": 0.1617, + "loss_text": 1.2189, + "ppl": 3.9777, + "step": 11166 + }, + { + "epoch": 0.06, + "global_step": 11167, + "learning_rate": 0.00045422787979966614, + "loss": 1.3936, + "loss_base2": 2.0105, + "loss_pixel": 0.1638, + "loss_text": 1.2298, + "ppl": 4.0293, + "step": 11167 + }, + { + "epoch": 0.06, + "global_step": 11168, + "learning_rate": 0.00045422370617696165, + "loss": 1.3755, + "loss_base2": 1.9844, + "loss_pixel": 0.164, + "loss_text": 1.2115, + "ppl": 3.9571, + "step": 11168 + }, + { + "epoch": 0.06, + "global_step": 11169, + "learning_rate": 0.0004542195325542571, + "loss": 1.38, + "loss_base2": 1.9909, + "loss_pixel": 0.1631, + "loss_text": 1.217, + "ppl": 3.9749, + "step": 11169 + }, + { + "epoch": 0.06, + "global_step": 11170, + "learning_rate": 0.00045421535893155256, + "loss": 1.3904, + "loss_base2": 2.0059, + "loss_pixel": 0.1624, + "loss_text": 1.2281, + "ppl": 4.0165, + "step": 11170 + }, + { + "epoch": 0.06, + "global_step": 11171, + "learning_rate": 0.00045421118530884807, + "loss": 1.396, + "loss_base2": 2.014, + "loss_pixel": 0.1624, + "loss_text": 1.2336, + "ppl": 4.039, + "step": 11171 + }, + { + "epoch": 0.06, + "global_step": 11172, + "learning_rate": 0.00045420701168614357, + "loss": 1.3901, + "loss_base2": 2.0055, + "loss_pixel": 0.1621, + "loss_text": 1.228, + "ppl": 4.0153, + "step": 11172 + }, + { + "epoch": 0.06, + "global_step": 11173, + "learning_rate": 0.0004542028380634391, + "loss": 1.3907, + "loss_base2": 2.0064, + "loss_pixel": 0.1627, + "loss_text": 1.228, + "ppl": 4.0177, + "step": 11173 + }, + { + "epoch": 0.06, + "global_step": 11174, + "learning_rate": 0.00045419866444073453, + "loss": 1.4027, + "loss_base2": 2.0237, + "loss_pixel": 0.1627, + "loss_text": 1.24, + "ppl": 4.0662, + "step": 11174 + }, + { + "epoch": 0.06, + "global_step": 11175, + "learning_rate": 0.00045419449081803004, + "loss": 1.383, + "loss_base2": 1.9952, + "loss_pixel": 0.1633, + "loss_text": 1.2197, + "ppl": 3.9868, + "step": 11175 + }, + { + "epoch": 0.06, + "global_step": 11176, + "learning_rate": 0.00045419031719532555, + "loss": 1.3811, + "loss_base2": 1.9925, + "loss_pixel": 0.1649, + "loss_text": 1.2162, + "ppl": 3.9793, + "step": 11176 + }, + { + "epoch": 0.06, + "global_step": 11177, + "learning_rate": 0.00045418614357262105, + "loss": 1.4081, + "loss_base2": 2.0315, + "loss_pixel": 0.1649, + "loss_text": 1.2431, + "ppl": 4.0882, + "step": 11177 + }, + { + "epoch": 0.06, + "global_step": 11178, + "learning_rate": 0.00045418196994991656, + "loss": 1.3845, + "loss_base2": 1.9974, + "loss_pixel": 0.1633, + "loss_text": 1.2212, + "ppl": 3.9928, + "step": 11178 + }, + { + "epoch": 0.06, + "global_step": 11179, + "learning_rate": 0.000454177796327212, + "loss": 1.4909, + "loss_base2": 2.1509, + "loss_pixel": 0.1646, + "loss_text": 1.3263, + "ppl": 4.4411, + "step": 11179 + }, + { + "epoch": 0.06, + "global_step": 11180, + "learning_rate": 0.0004541736227045075, + "loss": 1.6279, + "loss_base2": 2.3486, + "loss_pixel": 0.1639, + "loss_text": 1.464, + "ppl": 5.0932, + "step": 11180 + }, + { + "epoch": 0.06, + "global_step": 11181, + "learning_rate": 0.00045416944908180303, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.1628, + "loss_text": 1.4635, + "ppl": 5.0855, + "step": 11181 + }, + { + "epoch": 0.06, + "global_step": 11182, + "learning_rate": 0.00045416527545909854, + "loss": 1.6329, + "loss_base2": 2.3558, + "loss_pixel": 0.1634, + "loss_text": 1.4695, + "ppl": 5.1187, + "step": 11182 + }, + { + "epoch": 0.06, + "global_step": 11183, + "learning_rate": 0.000454161101836394, + "loss": 1.6093, + "loss_base2": 2.3217, + "loss_pixel": 0.1634, + "loss_text": 1.4459, + "ppl": 4.9993, + "step": 11183 + }, + { + "epoch": 0.06, + "global_step": 11184, + "learning_rate": 0.0004541569282136895, + "loss": 1.6141, + "loss_base2": 2.3287, + "loss_pixel": 0.1636, + "loss_text": 1.4505, + "ppl": 5.0234, + "step": 11184 + }, + { + "epoch": 0.06, + "global_step": 11185, + "learning_rate": 0.000454152754590985, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.1625, + "loss_text": 1.4639, + "ppl": 5.0855, + "step": 11185 + }, + { + "epoch": 0.06, + "global_step": 11186, + "learning_rate": 0.0004541485809682805, + "loss": 1.6212, + "loss_base2": 2.3389, + "loss_pixel": 0.1632, + "loss_text": 1.4581, + "ppl": 5.0592, + "step": 11186 + }, + { + "epoch": 0.06, + "global_step": 11187, + "learning_rate": 0.000454144407345576, + "loss": 1.6132, + "loss_base2": 2.3274, + "loss_pixel": 0.1639, + "loss_text": 1.4493, + "ppl": 5.0188, + "step": 11187 + }, + { + "epoch": 0.06, + "global_step": 11188, + "learning_rate": 0.0004541402337228714, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1624, + "loss_text": 1.4636, + "ppl": 5.0835, + "step": 11188 + }, + { + "epoch": 0.06, + "global_step": 11189, + "learning_rate": 0.0004541360601001669, + "loss": 1.6364, + "loss_base2": 2.3608, + "loss_pixel": 0.1634, + "loss_text": 1.473, + "ppl": 5.1366, + "step": 11189 + }, + { + "epoch": 0.06, + "global_step": 11190, + "learning_rate": 0.00045413188647746243, + "loss": 1.6157, + "loss_base2": 2.331, + "loss_pixel": 0.1626, + "loss_text": 1.4531, + "ppl": 5.0314, + "step": 11190 + }, + { + "epoch": 0.06, + "global_step": 11191, + "learning_rate": 0.00045412771285475794, + "loss": 1.6389, + "loss_base2": 2.3644, + "loss_pixel": 0.163, + "loss_text": 1.4759, + "ppl": 5.1495, + "step": 11191 + }, + { + "epoch": 0.06, + "global_step": 11192, + "learning_rate": 0.0004541235392320534, + "loss": 1.6111, + "loss_base2": 2.3243, + "loss_pixel": 0.1631, + "loss_text": 1.4481, + "ppl": 5.0083, + "step": 11192 + }, + { + "epoch": 0.06, + "global_step": 11193, + "learning_rate": 0.0004541193656093489, + "loss": 1.6155, + "loss_base2": 2.3307, + "loss_pixel": 0.1628, + "loss_text": 1.4527, + "ppl": 5.0304, + "step": 11193 + }, + { + "epoch": 0.06, + "global_step": 11194, + "learning_rate": 0.0004541151919866444, + "loss": 1.6238, + "loss_base2": 2.3426, + "loss_pixel": 0.163, + "loss_text": 1.4608, + "ppl": 5.0723, + "step": 11194 + }, + { + "epoch": 0.06, + "global_step": 11195, + "learning_rate": 0.0004541110183639399, + "loss": 1.6064, + "loss_base2": 2.3175, + "loss_pixel": 0.1621, + "loss_text": 1.4443, + "ppl": 4.9848, + "step": 11195 + }, + { + "epoch": 0.06, + "global_step": 11196, + "learning_rate": 0.0004541068447412354, + "loss": 1.6202, + "loss_base2": 2.3375, + "loss_pixel": 0.1644, + "loss_text": 1.4558, + "ppl": 5.0541, + "step": 11196 + }, + { + "epoch": 0.06, + "global_step": 11197, + "learning_rate": 0.0004541026711185309, + "loss": 1.6184, + "loss_base2": 2.3349, + "loss_pixel": 0.1628, + "loss_text": 1.4555, + "ppl": 5.045, + "step": 11197 + }, + { + "epoch": 0.06, + "global_step": 11198, + "learning_rate": 0.0004540984974958264, + "loss": 1.6156, + "loss_base2": 2.3308, + "loss_pixel": 0.1623, + "loss_text": 1.4533, + "ppl": 5.0309, + "step": 11198 + }, + { + "epoch": 0.06, + "global_step": 11199, + "learning_rate": 0.0004540943238731219, + "loss": 1.6176, + "loss_base2": 2.3337, + "loss_pixel": 0.1631, + "loss_text": 1.4545, + "ppl": 5.041, + "step": 11199 + }, + { + "epoch": 0.06, + "global_step": 11200, + "learning_rate": 0.0004540901502504174, + "loss": 1.6246, + "loss_base2": 2.3438, + "loss_pixel": 0.163, + "loss_text": 1.4615, + "ppl": 5.0764, + "step": 11200 + }, + { + "epoch": 0.06, + "global_step": 11201, + "learning_rate": 0.00045408597662771285, + "loss": 1.6033, + "loss_base2": 2.3131, + "loss_pixel": 0.1629, + "loss_text": 1.4404, + "ppl": 4.9694, + "step": 11201 + }, + { + "epoch": 0.06, + "global_step": 11202, + "learning_rate": 0.00045408180300500836, + "loss": 1.6213, + "loss_base2": 2.339, + "loss_pixel": 0.1655, + "loss_text": 1.4558, + "ppl": 5.0597, + "step": 11202 + }, + { + "epoch": 0.06, + "global_step": 11203, + "learning_rate": 0.00045407762938230387, + "loss": 1.5598, + "loss_base2": 2.2503, + "loss_pixel": 0.163, + "loss_text": 1.3967, + "ppl": 4.7579, + "step": 11203 + }, + { + "epoch": 0.06, + "global_step": 11204, + "learning_rate": 0.0004540734557595994, + "loss": 1.4351, + "loss_base2": 2.0704, + "loss_pixel": 0.163, + "loss_text": 1.272, + "ppl": 4.2001, + "step": 11204 + }, + { + "epoch": 0.06, + "global_step": 11205, + "learning_rate": 0.0004540692821368949, + "loss": 1.4084, + "loss_base2": 2.0319, + "loss_pixel": 0.1624, + "loss_text": 1.246, + "ppl": 4.0894, + "step": 11205 + }, + { + "epoch": 0.06, + "global_step": 11206, + "learning_rate": 0.0004540651085141903, + "loss": 1.3998, + "loss_base2": 2.0195, + "loss_pixel": 0.1632, + "loss_text": 1.2366, + "ppl": 4.0544, + "step": 11206 + }, + { + "epoch": 0.06, + "global_step": 11207, + "learning_rate": 0.0004540609348914858, + "loss": 1.388, + "loss_base2": 2.0025, + "loss_pixel": 0.1619, + "loss_text": 1.2261, + "ppl": 4.0068, + "step": 11207 + }, + { + "epoch": 0.06, + "global_step": 11208, + "learning_rate": 0.0004540567612687813, + "loss": 1.3968, + "loss_base2": 2.0152, + "loss_pixel": 0.1622, + "loss_text": 1.2346, + "ppl": 4.0422, + "step": 11208 + }, + { + "epoch": 0.06, + "global_step": 11209, + "learning_rate": 0.0004540525876460768, + "loss": 1.3956, + "loss_base2": 2.0134, + "loss_pixel": 0.1625, + "loss_text": 1.2332, + "ppl": 4.0374, + "step": 11209 + }, + { + "epoch": 0.06, + "global_step": 11210, + "learning_rate": 0.00045404841402337225, + "loss": 1.3941, + "loss_base2": 2.0113, + "loss_pixel": 0.1621, + "loss_text": 1.232, + "ppl": 4.0313, + "step": 11210 + }, + { + "epoch": 0.06, + "global_step": 11211, + "learning_rate": 0.00045404424040066776, + "loss": 1.3857, + "loss_base2": 1.9991, + "loss_pixel": 0.1623, + "loss_text": 1.2234, + "ppl": 3.9976, + "step": 11211 + }, + { + "epoch": 0.06, + "global_step": 11212, + "learning_rate": 0.00045404006677796327, + "loss": 1.5826, + "loss_base2": 2.2832, + "loss_pixel": 0.1636, + "loss_text": 1.419, + "ppl": 4.8676, + "step": 11212 + }, + { + "epoch": 0.06, + "global_step": 11213, + "learning_rate": 0.0004540358931552588, + "loss": 1.6397, + "loss_base2": 2.3656, + "loss_pixel": 0.1607, + "loss_text": 1.479, + "ppl": 5.1536, + "step": 11213 + }, + { + "epoch": 0.06, + "global_step": 11214, + "learning_rate": 0.0004540317195325543, + "loss": 1.6449, + "loss_base2": 2.3731, + "loss_pixel": 0.162, + "loss_text": 1.4829, + "ppl": 5.1805, + "step": 11214 + }, + { + "epoch": 0.06, + "global_step": 11215, + "learning_rate": 0.00045402754590984974, + "loss": 1.6348, + "loss_base2": 2.3585, + "loss_pixel": 0.1621, + "loss_text": 1.4727, + "ppl": 5.1284, + "step": 11215 + }, + { + "epoch": 0.06, + "global_step": 11216, + "learning_rate": 0.00045402337228714524, + "loss": 1.6301, + "loss_base2": 2.3517, + "loss_pixel": 0.1618, + "loss_text": 1.4683, + "ppl": 5.1044, + "step": 11216 + }, + { + "epoch": 0.06, + "global_step": 11217, + "learning_rate": 0.00045401919866444075, + "loss": 1.6338, + "loss_base2": 2.3571, + "loss_pixel": 0.1621, + "loss_text": 1.4717, + "ppl": 5.1233, + "step": 11217 + }, + { + "epoch": 0.06, + "global_step": 11218, + "learning_rate": 0.00045401502504173626, + "loss": 1.629, + "loss_base2": 2.3502, + "loss_pixel": 0.1621, + "loss_text": 1.4669, + "ppl": 5.0988, + "step": 11218 + }, + { + "epoch": 0.06, + "global_step": 11219, + "learning_rate": 0.00045401085141903177, + "loss": 1.6299, + "loss_base2": 2.3514, + "loss_pixel": 0.1623, + "loss_text": 1.4676, + "ppl": 5.1034, + "step": 11219 + }, + { + "epoch": 0.06, + "global_step": 11220, + "learning_rate": 0.0004540066777963272, + "loss": 1.6437, + "loss_base2": 2.3714, + "loss_pixel": 0.1627, + "loss_text": 1.4809, + "ppl": 5.1743, + "step": 11220 + }, + { + "epoch": 0.06, + "global_step": 11221, + "learning_rate": 0.0004540025041736227, + "loss": 1.6191, + "loss_base2": 2.3359, + "loss_pixel": 0.162, + "loss_text": 1.4571, + "ppl": 5.0485, + "step": 11221 + }, + { + "epoch": 0.06, + "global_step": 11222, + "learning_rate": 0.00045399833055091823, + "loss": 1.6311, + "loss_base2": 2.3532, + "loss_pixel": 0.1617, + "loss_text": 1.4694, + "ppl": 5.1095, + "step": 11222 + }, + { + "epoch": 0.06, + "global_step": 11223, + "learning_rate": 0.00045399415692821374, + "loss": 1.6298, + "loss_base2": 2.3513, + "loss_pixel": 0.1624, + "loss_text": 1.4675, + "ppl": 5.1029, + "step": 11223 + }, + { + "epoch": 0.06, + "global_step": 11224, + "learning_rate": 0.0004539899833055092, + "loss": 1.6042, + "loss_base2": 2.3144, + "loss_pixel": 0.161, + "loss_text": 1.4432, + "ppl": 4.9739, + "step": 11224 + }, + { + "epoch": 0.06, + "global_step": 11225, + "learning_rate": 0.00045398580968280465, + "loss": 1.6243, + "loss_base2": 2.3434, + "loss_pixel": 0.1619, + "loss_text": 1.4624, + "ppl": 5.0749, + "step": 11225 + }, + { + "epoch": 0.06, + "global_step": 11226, + "learning_rate": 0.00045398163606010015, + "loss": 1.6087, + "loss_base2": 2.3209, + "loss_pixel": 0.1605, + "loss_text": 1.4482, + "ppl": 4.9963, + "step": 11226 + }, + { + "epoch": 0.06, + "global_step": 11227, + "learning_rate": 0.00045397746243739566, + "loss": 1.627, + "loss_base2": 2.3473, + "loss_pixel": 0.1617, + "loss_text": 1.4654, + "ppl": 5.0886, + "step": 11227 + }, + { + "epoch": 0.06, + "global_step": 11228, + "learning_rate": 0.00045397328881469117, + "loss": 1.6035, + "loss_base2": 2.3134, + "loss_pixel": 0.1624, + "loss_text": 1.4411, + "ppl": 4.9704, + "step": 11228 + }, + { + "epoch": 0.06, + "global_step": 11229, + "learning_rate": 0.0004539691151919866, + "loss": 1.6229, + "loss_base2": 2.3413, + "loss_pixel": 0.162, + "loss_text": 1.4609, + "ppl": 5.0678, + "step": 11229 + }, + { + "epoch": 0.06, + "global_step": 11230, + "learning_rate": 0.00045396494156928213, + "loss": 1.6058, + "loss_base2": 2.3167, + "loss_pixel": 0.1619, + "loss_text": 1.444, + "ppl": 4.9818, + "step": 11230 + }, + { + "epoch": 0.06, + "global_step": 11231, + "learning_rate": 0.00045396076794657764, + "loss": 1.6107, + "loss_base2": 2.3237, + "loss_pixel": 0.1622, + "loss_text": 1.4485, + "ppl": 5.0063, + "step": 11231 + }, + { + "epoch": 0.06, + "global_step": 11232, + "learning_rate": 0.00045395659432387314, + "loss": 1.6195, + "loss_base2": 2.3364, + "loss_pixel": 0.1625, + "loss_text": 1.457, + "ppl": 5.0506, + "step": 11232 + }, + { + "epoch": 0.06, + "global_step": 11233, + "learning_rate": 0.0004539524207011686, + "loss": 1.6131, + "loss_base2": 2.3272, + "loss_pixel": 0.163, + "loss_text": 1.4501, + "ppl": 5.0183, + "step": 11233 + }, + { + "epoch": 0.06, + "global_step": 11234, + "learning_rate": 0.0004539482470784641, + "loss": 1.6306, + "loss_base2": 2.3525, + "loss_pixel": 0.1619, + "loss_text": 1.4687, + "ppl": 5.1069, + "step": 11234 + }, + { + "epoch": 0.06, + "global_step": 11235, + "learning_rate": 0.0004539440734557596, + "loss": 1.6027, + "loss_base2": 2.3122, + "loss_pixel": 0.1619, + "loss_text": 1.4408, + "ppl": 4.9664, + "step": 11235 + }, + { + "epoch": 0.06, + "global_step": 11236, + "learning_rate": 0.0004539398998330551, + "loss": 1.588, + "loss_base2": 2.291, + "loss_pixel": 0.1632, + "loss_text": 1.4247, + "ppl": 4.894, + "step": 11236 + }, + { + "epoch": 0.06, + "global_step": 11237, + "learning_rate": 0.0004539357262103506, + "loss": 1.5235, + "loss_base2": 2.1979, + "loss_pixel": 0.1627, + "loss_text": 1.3608, + "ppl": 4.5883, + "step": 11237 + }, + { + "epoch": 0.06, + "global_step": 11238, + "learning_rate": 0.0004539315525876461, + "loss": 1.4196, + "loss_base2": 2.048, + "loss_pixel": 0.1616, + "loss_text": 1.258, + "ppl": 4.1355, + "step": 11238 + }, + { + "epoch": 0.06, + "global_step": 11239, + "learning_rate": 0.0004539273789649416, + "loss": 1.3927, + "loss_base2": 2.0092, + "loss_pixel": 0.1612, + "loss_text": 1.2315, + "ppl": 4.0257, + "step": 11239 + }, + { + "epoch": 0.06, + "global_step": 11240, + "learning_rate": 0.0004539232053422371, + "loss": 1.4103, + "loss_base2": 2.0346, + "loss_pixel": 0.163, + "loss_text": 1.2473, + "ppl": 4.0972, + "step": 11240 + }, + { + "epoch": 0.06, + "global_step": 11241, + "learning_rate": 0.0004539190317195326, + "loss": 1.3996, + "loss_base2": 2.0192, + "loss_pixel": 0.1624, + "loss_text": 1.2372, + "ppl": 4.0536, + "step": 11241 + }, + { + "epoch": 0.06, + "global_step": 11242, + "learning_rate": 0.00045391485809682805, + "loss": 1.3856, + "loss_base2": 1.999, + "loss_pixel": 0.1626, + "loss_text": 1.223, + "ppl": 3.9972, + "step": 11242 + }, + { + "epoch": 0.06, + "global_step": 11243, + "learning_rate": 0.00045391068447412356, + "loss": 1.3869, + "loss_base2": 2.0009, + "loss_pixel": 0.162, + "loss_text": 1.2249, + "ppl": 4.0024, + "step": 11243 + }, + { + "epoch": 0.06, + "global_step": 11244, + "learning_rate": 0.000453906510851419, + "loss": 1.3848, + "loss_base2": 1.9978, + "loss_pixel": 0.162, + "loss_text": 1.2228, + "ppl": 3.994, + "step": 11244 + }, + { + "epoch": 0.06, + "global_step": 11245, + "learning_rate": 0.0004539023372287145, + "loss": 1.4067, + "loss_base2": 2.0294, + "loss_pixel": 0.1615, + "loss_text": 1.2452, + "ppl": 4.0825, + "step": 11245 + }, + { + "epoch": 0.06, + "global_step": 11246, + "learning_rate": 0.00045389816360601003, + "loss": 1.3933, + "loss_base2": 2.0101, + "loss_pixel": 0.163, + "loss_text": 1.2302, + "ppl": 4.0281, + "step": 11246 + }, + { + "epoch": 0.06, + "global_step": 11247, + "learning_rate": 0.0004538939899833055, + "loss": 1.3959, + "loss_base2": 2.0139, + "loss_pixel": 0.1611, + "loss_text": 1.2348, + "ppl": 4.0386, + "step": 11247 + }, + { + "epoch": 0.06, + "global_step": 11248, + "learning_rate": 0.000453889816360601, + "loss": 1.3866, + "loss_base2": 2.0004, + "loss_pixel": 0.1605, + "loss_text": 1.2261, + "ppl": 4.0012, + "step": 11248 + }, + { + "epoch": 0.06, + "global_step": 11249, + "learning_rate": 0.0004538856427378965, + "loss": 1.3766, + "loss_base2": 1.986, + "loss_pixel": 0.1603, + "loss_text": 1.2163, + "ppl": 3.9614, + "step": 11249 + }, + { + "epoch": 0.06, + "global_step": 11250, + "learning_rate": 0.000453881469115192, + "loss": 1.3803, + "loss_base2": 1.9914, + "loss_pixel": 0.1586, + "loss_text": 1.2217, + "ppl": 3.9761, + "step": 11250 + }, + { + "epoch": 0.06, + "global_step": 11251, + "learning_rate": 0.00045387729549248746, + "loss": 1.3783, + "loss_base2": 1.9885, + "loss_pixel": 0.1585, + "loss_text": 1.2198, + "ppl": 3.9682, + "step": 11251 + }, + { + "epoch": 0.06, + "global_step": 11252, + "learning_rate": 0.00045387312186978297, + "loss": 1.3681, + "loss_base2": 1.9738, + "loss_pixel": 0.1589, + "loss_text": 1.2092, + "ppl": 3.9279, + "step": 11252 + }, + { + "epoch": 0.06, + "global_step": 11253, + "learning_rate": 0.00045386894824707847, + "loss": 1.398, + "loss_base2": 2.0169, + "loss_pixel": 0.1569, + "loss_text": 1.2412, + "ppl": 4.0471, + "step": 11253 + }, + { + "epoch": 0.06, + "global_step": 11254, + "learning_rate": 0.000453864774624374, + "loss": 1.3787, + "loss_base2": 1.989, + "loss_pixel": 0.1567, + "loss_text": 1.222, + "ppl": 3.9697, + "step": 11254 + }, + { + "epoch": 0.06, + "global_step": 11255, + "learning_rate": 0.0004538606010016695, + "loss": 1.3673, + "loss_base2": 1.9726, + "loss_pixel": 0.1549, + "loss_text": 1.2125, + "ppl": 3.9247, + "step": 11255 + }, + { + "epoch": 0.06, + "global_step": 11256, + "learning_rate": 0.00045385642737896494, + "loss": 1.3971, + "loss_base2": 2.0156, + "loss_pixel": 0.1588, + "loss_text": 1.2382, + "ppl": 4.0435, + "step": 11256 + }, + { + "epoch": 0.06, + "global_step": 11257, + "learning_rate": 0.00045385225375626045, + "loss": 1.3861, + "loss_base2": 1.9997, + "loss_pixel": 0.1569, + "loss_text": 1.2291, + "ppl": 3.9992, + "step": 11257 + }, + { + "epoch": 0.06, + "global_step": 11258, + "learning_rate": 0.00045384808013355596, + "loss": 1.372, + "loss_base2": 1.9794, + "loss_pixel": 0.1562, + "loss_text": 1.2158, + "ppl": 3.9432, + "step": 11258 + }, + { + "epoch": 0.06, + "global_step": 11259, + "learning_rate": 0.00045384390651085146, + "loss": 1.3913, + "loss_base2": 2.0072, + "loss_pixel": 0.1582, + "loss_text": 1.2331, + "ppl": 4.0201, + "step": 11259 + }, + { + "epoch": 0.06, + "global_step": 11260, + "learning_rate": 0.0004538397328881469, + "loss": 1.3963, + "loss_base2": 2.0144, + "loss_pixel": 0.1587, + "loss_text": 1.2376, + "ppl": 4.0402, + "step": 11260 + }, + { + "epoch": 0.06, + "global_step": 11261, + "learning_rate": 0.0004538355592654424, + "loss": 1.3823, + "loss_base2": 1.9942, + "loss_pixel": 0.1561, + "loss_text": 1.2262, + "ppl": 3.9841, + "step": 11261 + }, + { + "epoch": 0.06, + "global_step": 11262, + "learning_rate": 0.00045383138564273793, + "loss": 1.3712, + "loss_base2": 1.9782, + "loss_pixel": 0.1558, + "loss_text": 1.2154, + "ppl": 3.9401, + "step": 11262 + }, + { + "epoch": 0.06, + "global_step": 11263, + "learning_rate": 0.0004538272120200334, + "loss": 1.3498, + "loss_base2": 1.9473, + "loss_pixel": 0.1567, + "loss_text": 1.1931, + "ppl": 3.8567, + "step": 11263 + }, + { + "epoch": 0.06, + "global_step": 11264, + "learning_rate": 0.0004538230383973289, + "loss": 1.3954, + "loss_base2": 2.0131, + "loss_pixel": 0.1557, + "loss_text": 1.2397, + "ppl": 4.0366, + "step": 11264 + }, + { + "epoch": 0.06, + "global_step": 11265, + "learning_rate": 0.00045381886477462434, + "loss": 1.3872, + "loss_base2": 2.0013, + "loss_pixel": 0.1568, + "loss_text": 1.2304, + "ppl": 4.0036, + "step": 11265 + }, + { + "epoch": 0.06, + "global_step": 11266, + "learning_rate": 0.00045381469115191985, + "loss": 1.3841, + "loss_base2": 1.9968, + "loss_pixel": 0.1555, + "loss_text": 1.2285, + "ppl": 3.9912, + "step": 11266 + }, + { + "epoch": 0.06, + "global_step": 11267, + "learning_rate": 0.00045381051752921536, + "loss": 1.3986, + "loss_base2": 2.0178, + "loss_pixel": 0.157, + "loss_text": 1.2417, + "ppl": 4.0495, + "step": 11267 + }, + { + "epoch": 0.06, + "global_step": 11268, + "learning_rate": 0.00045380634390651087, + "loss": 1.3828, + "loss_base2": 1.995, + "loss_pixel": 0.154, + "loss_text": 1.2288, + "ppl": 3.986, + "step": 11268 + }, + { + "epoch": 0.06, + "global_step": 11269, + "learning_rate": 0.0004538021702838063, + "loss": 1.5071, + "loss_base2": 2.1743, + "loss_pixel": 0.155, + "loss_text": 1.352, + "ppl": 4.5136, + "step": 11269 + }, + { + "epoch": 0.06, + "global_step": 11270, + "learning_rate": 0.0004537979966611018, + "loss": 1.6252, + "loss_base2": 2.3447, + "loss_pixel": 0.1555, + "loss_text": 1.4697, + "ppl": 5.0794, + "step": 11270 + }, + { + "epoch": 0.06, + "global_step": 11271, + "learning_rate": 0.00045379382303839733, + "loss": 1.6029, + "loss_base2": 2.3125, + "loss_pixel": 0.1526, + "loss_text": 1.4503, + "ppl": 4.9674, + "step": 11271 + }, + { + "epoch": 0.06, + "global_step": 11272, + "learning_rate": 0.00045378964941569284, + "loss": 1.6309, + "loss_base2": 2.3529, + "loss_pixel": 0.1523, + "loss_text": 1.4786, + "ppl": 5.1085, + "step": 11272 + }, + { + "epoch": 0.06, + "global_step": 11273, + "learning_rate": 0.00045378547579298835, + "loss": 1.623, + "loss_base2": 2.3415, + "loss_pixel": 0.1552, + "loss_text": 1.4679, + "ppl": 5.0683, + "step": 11273 + }, + { + "epoch": 0.06, + "global_step": 11274, + "learning_rate": 0.0004537813021702838, + "loss": 1.638, + "loss_base2": 2.3631, + "loss_pixel": 0.1554, + "loss_text": 1.4826, + "ppl": 5.1449, + "step": 11274 + }, + { + "epoch": 0.06, + "global_step": 11275, + "learning_rate": 0.0004537771285475793, + "loss": 1.6002, + "loss_base2": 2.3086, + "loss_pixel": 0.1534, + "loss_text": 1.4469, + "ppl": 4.954, + "step": 11275 + }, + { + "epoch": 0.06, + "global_step": 11276, + "learning_rate": 0.0004537729549248748, + "loss": 1.6204, + "loss_base2": 2.3377, + "loss_pixel": 0.1515, + "loss_text": 1.469, + "ppl": 5.0551, + "step": 11276 + }, + { + "epoch": 0.06, + "global_step": 11277, + "learning_rate": 0.0004537687813021703, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.1548, + "loss_text": 1.4632, + "ppl": 5.043, + "step": 11277 + }, + { + "epoch": 0.06, + "global_step": 11278, + "learning_rate": 0.00045376460767946583, + "loss": 1.6258, + "loss_base2": 2.3455, + "loss_pixel": 0.1554, + "loss_text": 1.4704, + "ppl": 5.0825, + "step": 11278 + }, + { + "epoch": 0.06, + "global_step": 11279, + "learning_rate": 0.0004537604340567613, + "loss": 1.6159, + "loss_base2": 2.3313, + "loss_pixel": 0.152, + "loss_text": 1.4639, + "ppl": 5.0324, + "step": 11279 + }, + { + "epoch": 0.06, + "global_step": 11280, + "learning_rate": 0.0004537562604340568, + "loss": 1.6129, + "loss_base2": 2.3269, + "loss_pixel": 0.1544, + "loss_text": 1.4585, + "ppl": 5.0173, + "step": 11280 + }, + { + "epoch": 0.06, + "global_step": 11281, + "learning_rate": 0.0004537520868113523, + "loss": 1.5967, + "loss_base2": 2.3036, + "loss_pixel": 0.153, + "loss_text": 1.4437, + "ppl": 4.9367, + "step": 11281 + }, + { + "epoch": 0.06, + "global_step": 11282, + "learning_rate": 0.00045374791318864775, + "loss": 1.6236, + "loss_base2": 2.3424, + "loss_pixel": 0.1536, + "loss_text": 1.4699, + "ppl": 5.0713, + "step": 11282 + }, + { + "epoch": 0.06, + "global_step": 11283, + "learning_rate": 0.0004537437395659432, + "loss": 1.6074, + "loss_base2": 2.319, + "loss_pixel": 0.1527, + "loss_text": 1.4547, + "ppl": 4.9898, + "step": 11283 + }, + { + "epoch": 0.06, + "global_step": 11284, + "learning_rate": 0.0004537395659432387, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1503, + "loss_text": 1.4666, + "ppl": 5.0374, + "step": 11284 + }, + { + "epoch": 0.06, + "global_step": 11285, + "learning_rate": 0.0004537353923205342, + "loss": 1.6064, + "loss_base2": 2.3175, + "loss_pixel": 0.1515, + "loss_text": 1.4548, + "ppl": 4.9848, + "step": 11285 + }, + { + "epoch": 0.06, + "global_step": 11286, + "learning_rate": 0.0004537312186978297, + "loss": 1.5994, + "loss_base2": 2.3074, + "loss_pixel": 0.1509, + "loss_text": 1.4485, + "ppl": 4.9501, + "step": 11286 + }, + { + "epoch": 0.06, + "global_step": 11287, + "learning_rate": 0.00045372704507512523, + "loss": 1.6225, + "loss_base2": 2.3408, + "loss_pixel": 0.1545, + "loss_text": 1.468, + "ppl": 5.0657, + "step": 11287 + }, + { + "epoch": 0.06, + "global_step": 11288, + "learning_rate": 0.0004537228714524207, + "loss": 1.5957, + "loss_base2": 2.3021, + "loss_pixel": 0.1538, + "loss_text": 1.4419, + "ppl": 4.9318, + "step": 11288 + }, + { + "epoch": 0.06, + "global_step": 11289, + "learning_rate": 0.0004537186978297162, + "loss": 1.6117, + "loss_base2": 2.3252, + "loss_pixel": 0.1518, + "loss_text": 1.4599, + "ppl": 5.0113, + "step": 11289 + }, + { + "epoch": 0.06, + "global_step": 11290, + "learning_rate": 0.0004537145242070117, + "loss": 1.575, + "loss_base2": 2.2722, + "loss_pixel": 0.1486, + "loss_text": 1.4264, + "ppl": 4.8307, + "step": 11290 + }, + { + "epoch": 0.06, + "global_step": 11291, + "learning_rate": 0.0004537103505843072, + "loss": 1.6185, + "loss_base2": 2.335, + "loss_pixel": 0.1508, + "loss_text": 1.4677, + "ppl": 5.0455, + "step": 11291 + }, + { + "epoch": 0.06, + "global_step": 11292, + "learning_rate": 0.00045370617696160266, + "loss": 1.5936, + "loss_base2": 2.2991, + "loss_pixel": 0.1515, + "loss_text": 1.4421, + "ppl": 4.9214, + "step": 11292 + }, + { + "epoch": 0.06, + "global_step": 11293, + "learning_rate": 0.00045370200333889817, + "loss": 1.5999, + "loss_base2": 2.3082, + "loss_pixel": 0.1509, + "loss_text": 1.449, + "ppl": 4.9525, + "step": 11293 + }, + { + "epoch": 0.06, + "global_step": 11294, + "learning_rate": 0.0004536978297161937, + "loss": 1.6203, + "loss_base2": 2.3376, + "loss_pixel": 0.152, + "loss_text": 1.4682, + "ppl": 5.0546, + "step": 11294 + }, + { + "epoch": 0.06, + "global_step": 11295, + "learning_rate": 0.0004536936560934892, + "loss": 1.5956, + "loss_base2": 2.302, + "loss_pixel": 0.1531, + "loss_text": 1.4425, + "ppl": 4.9313, + "step": 11295 + }, + { + "epoch": 0.06, + "global_step": 11296, + "learning_rate": 0.0004536894824707847, + "loss": 1.5913, + "loss_base2": 2.2958, + "loss_pixel": 0.151, + "loss_text": 1.4403, + "ppl": 4.9101, + "step": 11296 + }, + { + "epoch": 0.06, + "global_step": 11297, + "learning_rate": 0.00045368530884808014, + "loss": 1.6069, + "loss_base2": 2.3183, + "loss_pixel": 0.1516, + "loss_text": 1.4554, + "ppl": 4.9873, + "step": 11297 + }, + { + "epoch": 0.06, + "global_step": 11298, + "learning_rate": 0.00045368113522537565, + "loss": 1.615, + "loss_base2": 2.33, + "loss_pixel": 0.1546, + "loss_text": 1.4604, + "ppl": 5.0279, + "step": 11298 + }, + { + "epoch": 0.06, + "global_step": 11299, + "learning_rate": 0.00045367696160267116, + "loss": 1.5901, + "loss_base2": 2.294, + "loss_pixel": 0.1527, + "loss_text": 1.4374, + "ppl": 4.9042, + "step": 11299 + }, + { + "epoch": 0.06, + "global_step": 11300, + "learning_rate": 0.00045367278797996667, + "loss": 1.5797, + "loss_base2": 2.279, + "loss_pixel": 0.1502, + "loss_text": 1.4295, + "ppl": 4.8535, + "step": 11300 + }, + { + "epoch": 0.06, + "global_step": 11301, + "learning_rate": 0.00045366861435726206, + "loss": 1.5973, + "loss_base2": 2.3044, + "loss_pixel": 0.1508, + "loss_text": 1.4466, + "ppl": 4.9397, + "step": 11301 + }, + { + "epoch": 0.06, + "global_step": 11302, + "learning_rate": 0.00045366444073455757, + "loss": 1.6063, + "loss_base2": 2.3174, + "loss_pixel": 0.1526, + "loss_text": 1.4537, + "ppl": 4.9843, + "step": 11302 + }, + { + "epoch": 0.06, + "global_step": 11303, + "learning_rate": 0.0004536602671118531, + "loss": 1.6018, + "loss_base2": 2.3109, + "loss_pixel": 0.1513, + "loss_text": 1.4505, + "ppl": 4.962, + "step": 11303 + }, + { + "epoch": 0.06, + "global_step": 11304, + "learning_rate": 0.0004536560934891486, + "loss": 1.6199, + "loss_base2": 2.337, + "loss_pixel": 0.1512, + "loss_text": 1.4687, + "ppl": 5.0526, + "step": 11304 + }, + { + "epoch": 0.06, + "global_step": 11305, + "learning_rate": 0.0004536519198664441, + "loss": 1.6209, + "loss_base2": 2.3385, + "loss_pixel": 0.1518, + "loss_text": 1.4691, + "ppl": 5.0576, + "step": 11305 + }, + { + "epoch": 0.06, + "global_step": 11306, + "learning_rate": 0.00045364774624373955, + "loss": 1.6082, + "loss_base2": 2.3201, + "loss_pixel": 0.1518, + "loss_text": 1.4564, + "ppl": 4.9938, + "step": 11306 + }, + { + "epoch": 0.06, + "global_step": 11307, + "learning_rate": 0.00045364357262103505, + "loss": 1.6049, + "loss_base2": 2.3154, + "loss_pixel": 0.1495, + "loss_text": 1.4554, + "ppl": 4.9774, + "step": 11307 + }, + { + "epoch": 0.06, + "global_step": 11308, + "learning_rate": 0.00045363939899833056, + "loss": 1.6114, + "loss_base2": 2.3248, + "loss_pixel": 0.1492, + "loss_text": 1.4622, + "ppl": 5.0098, + "step": 11308 + }, + { + "epoch": 0.06, + "global_step": 11309, + "learning_rate": 0.00045363522537562607, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1508, + "loss_text": 1.4643, + "ppl": 5.0284, + "step": 11309 + }, + { + "epoch": 0.06, + "global_step": 11310, + "learning_rate": 0.0004536310517529215, + "loss": 1.6081, + "loss_base2": 2.32, + "loss_pixel": 0.154, + "loss_text": 1.4541, + "ppl": 4.9933, + "step": 11310 + }, + { + "epoch": 0.06, + "global_step": 11311, + "learning_rate": 0.00045362687813021703, + "loss": 1.5598, + "loss_base2": 2.2503, + "loss_pixel": 0.1494, + "loss_text": 1.4104, + "ppl": 4.7579, + "step": 11311 + }, + { + "epoch": 0.06, + "global_step": 11312, + "learning_rate": 0.00045362270450751254, + "loss": 1.5952, + "loss_base2": 2.3014, + "loss_pixel": 0.1522, + "loss_text": 1.443, + "ppl": 4.9293, + "step": 11312 + }, + { + "epoch": 0.06, + "global_step": 11313, + "learning_rate": 0.00045361853088480804, + "loss": 1.603, + "loss_base2": 2.3126, + "loss_pixel": 0.1502, + "loss_text": 1.4528, + "ppl": 4.9679, + "step": 11313 + }, + { + "epoch": 0.06, + "global_step": 11314, + "learning_rate": 0.00045361435726210355, + "loss": 1.619, + "loss_base2": 2.3357, + "loss_pixel": 0.1519, + "loss_text": 1.4671, + "ppl": 5.048, + "step": 11314 + }, + { + "epoch": 0.06, + "global_step": 11315, + "learning_rate": 0.000453610183639399, + "loss": 1.6129, + "loss_base2": 2.3269, + "loss_pixel": 0.1513, + "loss_text": 1.4616, + "ppl": 5.0173, + "step": 11315 + }, + { + "epoch": 0.06, + "global_step": 11316, + "learning_rate": 0.0004536060100166945, + "loss": 1.5257, + "loss_base2": 2.2011, + "loss_pixel": 0.1501, + "loss_text": 1.3756, + "ppl": 4.5984, + "step": 11316 + }, + { + "epoch": 0.06, + "global_step": 11317, + "learning_rate": 0.00045360183639399, + "loss": 1.3915, + "loss_base2": 2.0075, + "loss_pixel": 0.1504, + "loss_text": 1.2411, + "ppl": 4.0209, + "step": 11317 + }, + { + "epoch": 0.06, + "global_step": 11318, + "learning_rate": 0.0004535976627712855, + "loss": 1.3882, + "loss_base2": 2.0027, + "loss_pixel": 0.1483, + "loss_text": 1.2398, + "ppl": 4.0076, + "step": 11318 + }, + { + "epoch": 0.06, + "global_step": 11319, + "learning_rate": 0.0004535934891485809, + "loss": 1.3851, + "loss_base2": 1.9983, + "loss_pixel": 0.1514, + "loss_text": 1.2336, + "ppl": 3.9952, + "step": 11319 + }, + { + "epoch": 0.06, + "global_step": 11320, + "learning_rate": 0.00045358931552587643, + "loss": 1.371, + "loss_base2": 1.9779, + "loss_pixel": 0.1494, + "loss_text": 1.2216, + "ppl": 3.9393, + "step": 11320 + }, + { + "epoch": 0.06, + "global_step": 11321, + "learning_rate": 0.00045358514190317194, + "loss": 1.3678, + "loss_base2": 1.9733, + "loss_pixel": 0.1509, + "loss_text": 1.2169, + "ppl": 3.9267, + "step": 11321 + }, + { + "epoch": 0.06, + "global_step": 11322, + "learning_rate": 0.00045358096828046745, + "loss": 1.3745, + "loss_base2": 1.983, + "loss_pixel": 0.1504, + "loss_text": 1.2241, + "ppl": 3.9531, + "step": 11322 + }, + { + "epoch": 0.06, + "global_step": 11323, + "learning_rate": 0.00045357679465776295, + "loss": 1.3799, + "loss_base2": 1.9908, + "loss_pixel": 0.1511, + "loss_text": 1.2287, + "ppl": 3.9745, + "step": 11323 + }, + { + "epoch": 0.06, + "global_step": 11324, + "learning_rate": 0.0004535726210350584, + "loss": 1.3765, + "loss_base2": 1.9859, + "loss_pixel": 0.1484, + "loss_text": 1.2281, + "ppl": 3.961, + "step": 11324 + }, + { + "epoch": 0.06, + "global_step": 11325, + "learning_rate": 0.0004535684474123539, + "loss": 1.3634, + "loss_base2": 1.967, + "loss_pixel": 0.1538, + "loss_text": 1.2095, + "ppl": 3.9095, + "step": 11325 + }, + { + "epoch": 0.06, + "global_step": 11326, + "learning_rate": 0.0004535642737896494, + "loss": 1.3791, + "loss_base2": 1.9896, + "loss_pixel": 0.1488, + "loss_text": 1.2303, + "ppl": 3.9713, + "step": 11326 + }, + { + "epoch": 0.06, + "global_step": 11327, + "learning_rate": 0.00045356010016694493, + "loss": 1.3628, + "loss_base2": 1.9661, + "loss_pixel": 0.1495, + "loss_text": 1.2133, + "ppl": 3.9071, + "step": 11327 + }, + { + "epoch": 0.06, + "global_step": 11328, + "learning_rate": 0.0004535559265442404, + "loss": 1.3725, + "loss_base2": 1.9801, + "loss_pixel": 0.1521, + "loss_text": 1.2204, + "ppl": 3.9452, + "step": 11328 + }, + { + "epoch": 0.06, + "global_step": 11329, + "learning_rate": 0.0004535517529215359, + "loss": 1.3828, + "loss_base2": 1.995, + "loss_pixel": 0.15, + "loss_text": 1.2329, + "ppl": 3.986, + "step": 11329 + }, + { + "epoch": 0.06, + "global_step": 11330, + "learning_rate": 0.0004535475792988314, + "loss": 1.3586, + "loss_base2": 1.96, + "loss_pixel": 0.1493, + "loss_text": 1.2093, + "ppl": 3.8907, + "step": 11330 + }, + { + "epoch": 0.06, + "global_step": 11331, + "learning_rate": 0.0004535434056761269, + "loss": 1.3728, + "loss_base2": 1.9805, + "loss_pixel": 0.1504, + "loss_text": 1.2224, + "ppl": 3.9464, + "step": 11331 + }, + { + "epoch": 0.06, + "global_step": 11332, + "learning_rate": 0.0004535392320534224, + "loss": 1.3531, + "loss_base2": 1.9521, + "loss_pixel": 0.1493, + "loss_text": 1.2037, + "ppl": 3.8694, + "step": 11332 + }, + { + "epoch": 0.06, + "global_step": 11333, + "learning_rate": 0.00045353505843071787, + "loss": 1.36, + "loss_base2": 1.9621, + "loss_pixel": 0.151, + "loss_text": 1.2091, + "ppl": 3.8962, + "step": 11333 + }, + { + "epoch": 0.06, + "global_step": 11334, + "learning_rate": 0.00045353088480801337, + "loss": 1.3749, + "loss_base2": 1.9836, + "loss_pixel": 0.1523, + "loss_text": 1.2226, + "ppl": 3.9547, + "step": 11334 + }, + { + "epoch": 0.06, + "global_step": 11335, + "learning_rate": 0.0004535267111853089, + "loss": 1.3635, + "loss_base2": 1.9671, + "loss_pixel": 0.1512, + "loss_text": 1.2123, + "ppl": 3.9099, + "step": 11335 + }, + { + "epoch": 0.06, + "global_step": 11336, + "learning_rate": 0.0004535225375626044, + "loss": 1.3874, + "loss_base2": 2.0016, + "loss_pixel": 0.1494, + "loss_text": 1.238, + "ppl": 4.0044, + "step": 11336 + }, + { + "epoch": 0.06, + "global_step": 11337, + "learning_rate": 0.0004535183639398999, + "loss": 1.3759, + "loss_base2": 1.985, + "loss_pixel": 0.1524, + "loss_text": 1.2235, + "ppl": 3.9586, + "step": 11337 + }, + { + "epoch": 0.06, + "global_step": 11338, + "learning_rate": 0.0004535141903171953, + "loss": 1.3642, + "loss_base2": 1.9681, + "loss_pixel": 0.1508, + "loss_text": 1.2134, + "ppl": 3.9126, + "step": 11338 + }, + { + "epoch": 0.06, + "global_step": 11339, + "learning_rate": 0.0004535100166944908, + "loss": 1.3624, + "loss_base2": 1.9655, + "loss_pixel": 0.1493, + "loss_text": 1.213, + "ppl": 3.9056, + "step": 11339 + }, + { + "epoch": 0.06, + "global_step": 11340, + "learning_rate": 0.0004535058430717863, + "loss": 1.3766, + "loss_base2": 1.986, + "loss_pixel": 0.1491, + "loss_text": 1.2275, + "ppl": 3.9614, + "step": 11340 + }, + { + "epoch": 0.06, + "global_step": 11341, + "learning_rate": 0.0004535016694490818, + "loss": 1.3416, + "loss_base2": 1.9355, + "loss_pixel": 0.1505, + "loss_text": 1.1911, + "ppl": 3.8252, + "step": 11341 + }, + { + "epoch": 0.06, + "global_step": 11342, + "learning_rate": 0.00045349749582637727, + "loss": 1.6278, + "loss_base2": 2.3484, + "loss_pixel": 0.1493, + "loss_text": 1.4786, + "ppl": 5.0927, + "step": 11342 + }, + { + "epoch": 0.06, + "global_step": 11343, + "learning_rate": 0.0004534933222036728, + "loss": 1.6258, + "loss_base2": 2.3455, + "loss_pixel": 0.1528, + "loss_text": 1.473, + "ppl": 5.0825, + "step": 11343 + }, + { + "epoch": 0.06, + "global_step": 11344, + "learning_rate": 0.0004534891485809683, + "loss": 1.6324, + "loss_base2": 2.3551, + "loss_pixel": 0.151, + "loss_text": 1.4814, + "ppl": 5.1161, + "step": 11344 + }, + { + "epoch": 0.06, + "global_step": 11345, + "learning_rate": 0.0004534849749582638, + "loss": 1.6139, + "loss_base2": 2.3284, + "loss_pixel": 0.1498, + "loss_text": 1.4641, + "ppl": 5.0224, + "step": 11345 + }, + { + "epoch": 0.06, + "global_step": 11346, + "learning_rate": 0.0004534808013355593, + "loss": 1.6306, + "loss_base2": 2.3525, + "loss_pixel": 0.1506, + "loss_text": 1.4799, + "ppl": 5.1069, + "step": 11346 + }, + { + "epoch": 0.06, + "global_step": 11347, + "learning_rate": 0.00045347662771285475, + "loss": 1.5971, + "loss_base2": 2.3041, + "loss_pixel": 0.1493, + "loss_text": 1.4479, + "ppl": 4.9387, + "step": 11347 + }, + { + "epoch": 0.06, + "global_step": 11348, + "learning_rate": 0.00045347245409015026, + "loss": 1.6188, + "loss_base2": 2.3354, + "loss_pixel": 0.1491, + "loss_text": 1.4697, + "ppl": 5.047, + "step": 11348 + }, + { + "epoch": 0.06, + "global_step": 11349, + "learning_rate": 0.00045346828046744577, + "loss": 1.6147, + "loss_base2": 2.3295, + "loss_pixel": 0.1498, + "loss_text": 1.465, + "ppl": 5.0264, + "step": 11349 + }, + { + "epoch": 0.06, + "global_step": 11350, + "learning_rate": 0.0004534641068447413, + "loss": 1.6197, + "loss_base2": 2.3367, + "loss_pixel": 0.1498, + "loss_text": 1.4699, + "ppl": 5.0516, + "step": 11350 + }, + { + "epoch": 0.06, + "global_step": 11351, + "learning_rate": 0.0004534599332220367, + "loss": 1.6069, + "loss_base2": 2.3183, + "loss_pixel": 0.1491, + "loss_text": 1.4578, + "ppl": 4.9873, + "step": 11351 + }, + { + "epoch": 0.06, + "global_step": 11352, + "learning_rate": 0.00045345575959933223, + "loss": 1.643, + "loss_base2": 2.3703, + "loss_pixel": 0.1595, + "loss_text": 1.4835, + "ppl": 5.1707, + "step": 11352 + }, + { + "epoch": 0.06, + "global_step": 11353, + "learning_rate": 0.00045345158597662774, + "loss": 1.6296, + "loss_base2": 2.351, + "loss_pixel": 0.1627, + "loss_text": 1.4669, + "ppl": 5.1018, + "step": 11353 + }, + { + "epoch": 0.06, + "global_step": 11354, + "learning_rate": 0.00045344741235392325, + "loss": 1.6062, + "loss_base2": 2.3173, + "loss_pixel": 0.1643, + "loss_text": 1.4418, + "ppl": 4.9838, + "step": 11354 + }, + { + "epoch": 0.06, + "global_step": 11355, + "learning_rate": 0.00045344323873121876, + "loss": 1.6353, + "loss_base2": 2.3592, + "loss_pixel": 0.166, + "loss_text": 1.4694, + "ppl": 5.131, + "step": 11355 + }, + { + "epoch": 0.06, + "global_step": 11356, + "learning_rate": 0.0004534390651085142, + "loss": 1.6019, + "loss_base2": 2.3111, + "loss_pixel": 0.1649, + "loss_text": 1.437, + "ppl": 4.9625, + "step": 11356 + }, + { + "epoch": 0.06, + "global_step": 11357, + "learning_rate": 0.00045343489148580966, + "loss": 1.6331, + "loss_base2": 2.3561, + "loss_pixel": 0.1663, + "loss_text": 1.4668, + "ppl": 5.1197, + "step": 11357 + }, + { + "epoch": 0.06, + "global_step": 11358, + "learning_rate": 0.00045343071786310517, + "loss": 1.6449, + "loss_base2": 2.3731, + "loss_pixel": 0.1664, + "loss_text": 1.4784, + "ppl": 5.1805, + "step": 11358 + }, + { + "epoch": 0.06, + "global_step": 11359, + "learning_rate": 0.0004534265442404007, + "loss": 1.6251, + "loss_base2": 2.3445, + "loss_pixel": 0.1648, + "loss_text": 1.4603, + "ppl": 5.0789, + "step": 11359 + }, + { + "epoch": 0.06, + "global_step": 11360, + "learning_rate": 0.00045342237061769613, + "loss": 1.6115, + "loss_base2": 2.3249, + "loss_pixel": 0.1663, + "loss_text": 1.4452, + "ppl": 5.0103, + "step": 11360 + }, + { + "epoch": 0.06, + "global_step": 11361, + "learning_rate": 0.00045341819699499164, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.1655, + "loss_text": 1.4525, + "ppl": 5.043, + "step": 11361 + }, + { + "epoch": 0.06, + "global_step": 11362, + "learning_rate": 0.00045341402337228714, + "loss": 1.6197, + "loss_base2": 2.3367, + "loss_pixel": 0.1666, + "loss_text": 1.4532, + "ppl": 5.0516, + "step": 11362 + }, + { + "epoch": 0.06, + "global_step": 11363, + "learning_rate": 0.00045340984974958265, + "loss": 1.6058, + "loss_base2": 2.3167, + "loss_pixel": 0.1646, + "loss_text": 1.4413, + "ppl": 4.9818, + "step": 11363 + }, + { + "epoch": 0.06, + "global_step": 11364, + "learning_rate": 0.00045340567612687816, + "loss": 1.6194, + "loss_base2": 2.3363, + "loss_pixel": 0.165, + "loss_text": 1.4544, + "ppl": 5.0501, + "step": 11364 + }, + { + "epoch": 0.06, + "global_step": 11365, + "learning_rate": 0.0004534015025041736, + "loss": 1.6323, + "loss_base2": 2.3549, + "loss_pixel": 0.1648, + "loss_text": 1.4675, + "ppl": 5.1156, + "step": 11365 + }, + { + "epoch": 0.06, + "global_step": 11366, + "learning_rate": 0.0004533973288814691, + "loss": 1.6291, + "loss_base2": 2.3503, + "loss_pixel": 0.164, + "loss_text": 1.4651, + "ppl": 5.0993, + "step": 11366 + }, + { + "epoch": 0.06, + "global_step": 11367, + "learning_rate": 0.0004533931552587646, + "loss": 1.606, + "loss_base2": 2.317, + "loss_pixel": 0.1641, + "loss_text": 1.4419, + "ppl": 4.9828, + "step": 11367 + }, + { + "epoch": 0.06, + "global_step": 11368, + "learning_rate": 0.00045338898163606013, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1642, + "loss_text": 1.4527, + "ppl": 5.0374, + "step": 11368 + }, + { + "epoch": 0.06, + "global_step": 11369, + "learning_rate": 0.0004533848080133556, + "loss": 1.6136, + "loss_base2": 2.3279, + "loss_pixel": 0.1657, + "loss_text": 1.4479, + "ppl": 5.0209, + "step": 11369 + }, + { + "epoch": 0.06, + "global_step": 11370, + "learning_rate": 0.0004533806343906511, + "loss": 1.6309, + "loss_base2": 2.3529, + "loss_pixel": 0.1644, + "loss_text": 1.4666, + "ppl": 5.1085, + "step": 11370 + }, + { + "epoch": 0.06, + "global_step": 11371, + "learning_rate": 0.0004533764607679466, + "loss": 1.622, + "loss_base2": 2.3401, + "loss_pixel": 0.1627, + "loss_text": 1.4593, + "ppl": 5.0632, + "step": 11371 + }, + { + "epoch": 0.06, + "global_step": 11372, + "learning_rate": 0.0004533722871452421, + "loss": 1.6282, + "loss_base2": 2.349, + "loss_pixel": 0.1626, + "loss_text": 1.4656, + "ppl": 5.0947, + "step": 11372 + }, + { + "epoch": 0.06, + "global_step": 11373, + "learning_rate": 0.0004533681135225376, + "loss": 1.6226, + "loss_base2": 2.3409, + "loss_pixel": 0.1634, + "loss_text": 1.4593, + "ppl": 5.0662, + "step": 11373 + }, + { + "epoch": 0.06, + "global_step": 11374, + "learning_rate": 0.00045336393989983307, + "loss": 1.6285, + "loss_base2": 2.3494, + "loss_pixel": 0.1616, + "loss_text": 1.4669, + "ppl": 5.0962, + "step": 11374 + }, + { + "epoch": 0.06, + "global_step": 11375, + "learning_rate": 0.0004533597662771285, + "loss": 1.6002, + "loss_base2": 2.3086, + "loss_pixel": 0.1638, + "loss_text": 1.4364, + "ppl": 4.954, + "step": 11375 + }, + { + "epoch": 0.06, + "global_step": 11376, + "learning_rate": 0.00045335559265442403, + "loss": 1.6125, + "loss_base2": 2.3263, + "loss_pixel": 0.163, + "loss_text": 1.4495, + "ppl": 5.0153, + "step": 11376 + }, + { + "epoch": 0.06, + "global_step": 11377, + "learning_rate": 0.00045335141903171954, + "loss": 1.6158, + "loss_base2": 2.3311, + "loss_pixel": 0.1633, + "loss_text": 1.4525, + "ppl": 5.0319, + "step": 11377 + }, + { + "epoch": 0.06, + "global_step": 11378, + "learning_rate": 0.000453347245409015, + "loss": 1.607, + "loss_base2": 2.3184, + "loss_pixel": 0.162, + "loss_text": 1.4451, + "ppl": 4.9878, + "step": 11378 + }, + { + "epoch": 0.06, + "global_step": 11379, + "learning_rate": 0.0004533430717863105, + "loss": 1.602, + "loss_base2": 2.3112, + "loss_pixel": 0.1617, + "loss_text": 1.4403, + "ppl": 4.9629, + "step": 11379 + }, + { + "epoch": 0.06, + "global_step": 11380, + "learning_rate": 0.000453338898163606, + "loss": 1.6, + "loss_base2": 2.3083, + "loss_pixel": 0.163, + "loss_text": 1.437, + "ppl": 4.953, + "step": 11380 + }, + { + "epoch": 0.06, + "global_step": 11381, + "learning_rate": 0.0004533347245409015, + "loss": 1.6005, + "loss_base2": 2.309, + "loss_pixel": 0.1621, + "loss_text": 1.4384, + "ppl": 4.9555, + "step": 11381 + }, + { + "epoch": 0.06, + "global_step": 11382, + "learning_rate": 0.000453330550918197, + "loss": 1.6113, + "loss_base2": 2.3246, + "loss_pixel": 0.1625, + "loss_text": 1.4488, + "ppl": 5.0093, + "step": 11382 + }, + { + "epoch": 0.06, + "global_step": 11383, + "learning_rate": 0.00045332637729549247, + "loss": 1.6252, + "loss_base2": 2.3447, + "loss_pixel": 0.1608, + "loss_text": 1.4645, + "ppl": 5.0794, + "step": 11383 + }, + { + "epoch": 0.06, + "global_step": 11384, + "learning_rate": 0.000453322203672788, + "loss": 1.6001, + "loss_base2": 2.3085, + "loss_pixel": 0.1622, + "loss_text": 1.4378, + "ppl": 4.9535, + "step": 11384 + }, + { + "epoch": 0.06, + "global_step": 11385, + "learning_rate": 0.0004533180300500835, + "loss": 1.5716, + "loss_base2": 2.2673, + "loss_pixel": 0.1614, + "loss_text": 1.4102, + "ppl": 4.8143, + "step": 11385 + }, + { + "epoch": 0.06, + "global_step": 11386, + "learning_rate": 0.000453313856427379, + "loss": 1.3974, + "loss_base2": 2.016, + "loss_pixel": 0.1634, + "loss_text": 1.2341, + "ppl": 4.0447, + "step": 11386 + }, + { + "epoch": 0.06, + "global_step": 11387, + "learning_rate": 0.00045330968280467445, + "loss": 1.4082, + "loss_base2": 2.0316, + "loss_pixel": 0.1625, + "loss_text": 1.2457, + "ppl": 4.0886, + "step": 11387 + }, + { + "epoch": 0.06, + "global_step": 11388, + "learning_rate": 0.00045330550918196995, + "loss": 1.3926, + "loss_base2": 2.0091, + "loss_pixel": 0.1618, + "loss_text": 1.2308, + "ppl": 4.0253, + "step": 11388 + }, + { + "epoch": 0.06, + "global_step": 11389, + "learning_rate": 0.00045330133555926546, + "loss": 1.3737, + "loss_base2": 1.9818, + "loss_pixel": 0.1608, + "loss_text": 1.2129, + "ppl": 3.9499, + "step": 11389 + }, + { + "epoch": 0.06, + "global_step": 11390, + "learning_rate": 0.00045329716193656097, + "loss": 1.3839, + "loss_base2": 1.9965, + "loss_pixel": 0.1624, + "loss_text": 1.2215, + "ppl": 3.9904, + "step": 11390 + }, + { + "epoch": 0.06, + "global_step": 11391, + "learning_rate": 0.0004532929883138565, + "loss": 1.3769, + "loss_base2": 1.9864, + "loss_pixel": 0.161, + "loss_text": 1.2159, + "ppl": 3.9626, + "step": 11391 + }, + { + "epoch": 0.06, + "global_step": 11392, + "learning_rate": 0.00045328881469115193, + "loss": 1.3887, + "loss_base2": 2.0035, + "loss_pixel": 0.1617, + "loss_text": 1.227, + "ppl": 4.0096, + "step": 11392 + }, + { + "epoch": 0.06, + "global_step": 11393, + "learning_rate": 0.00045328464106844744, + "loss": 1.3881, + "loss_base2": 2.0026, + "loss_pixel": 0.1616, + "loss_text": 1.2265, + "ppl": 4.0072, + "step": 11393 + }, + { + "epoch": 0.06, + "global_step": 11394, + "learning_rate": 0.0004532804674457429, + "loss": 1.399, + "loss_base2": 2.0183, + "loss_pixel": 0.1634, + "loss_text": 1.2357, + "ppl": 4.0511, + "step": 11394 + }, + { + "epoch": 0.06, + "global_step": 11395, + "learning_rate": 0.0004532762938230384, + "loss": 1.3995, + "loss_base2": 2.0191, + "loss_pixel": 0.1614, + "loss_text": 1.2381, + "ppl": 4.0532, + "step": 11395 + }, + { + "epoch": 0.06, + "global_step": 11396, + "learning_rate": 0.0004532721202003339, + "loss": 1.3802, + "loss_base2": 1.9912, + "loss_pixel": 0.162, + "loss_text": 1.2182, + "ppl": 3.9757, + "step": 11396 + }, + { + "epoch": 0.06, + "global_step": 11397, + "learning_rate": 0.00045326794657762936, + "loss": 1.4023, + "loss_base2": 2.0231, + "loss_pixel": 0.166, + "loss_text": 1.2364, + "ppl": 4.0645, + "step": 11397 + }, + { + "epoch": 0.06, + "global_step": 11398, + "learning_rate": 0.00045326377295492487, + "loss": 1.3972, + "loss_base2": 2.0157, + "loss_pixel": 0.1616, + "loss_text": 1.2356, + "ppl": 4.0439, + "step": 11398 + }, + { + "epoch": 0.06, + "global_step": 11399, + "learning_rate": 0.00045325959933222037, + "loss": 1.3819, + "loss_base2": 1.9937, + "loss_pixel": 0.1632, + "loss_text": 1.2187, + "ppl": 3.9825, + "step": 11399 + }, + { + "epoch": 0.06, + "global_step": 11400, + "learning_rate": 0.0004532554257095159, + "loss": 1.3995, + "loss_base2": 2.0191, + "loss_pixel": 0.1608, + "loss_text": 1.2387, + "ppl": 4.0532, + "step": 11400 + }, + { + "epoch": 0.06, + "global_step": 11401, + "learning_rate": 0.00045325125208681133, + "loss": 1.3884, + "loss_base2": 2.003, + "loss_pixel": 0.1619, + "loss_text": 1.2265, + "ppl": 4.0084, + "step": 11401 + }, + { + "epoch": 0.06, + "global_step": 11402, + "learning_rate": 0.00045324707846410684, + "loss": 1.3891, + "loss_base2": 2.004, + "loss_pixel": 0.1619, + "loss_text": 1.2272, + "ppl": 4.0112, + "step": 11402 + }, + { + "epoch": 0.06, + "global_step": 11403, + "learning_rate": 0.00045324290484140235, + "loss": 1.3895, + "loss_base2": 2.0046, + "loss_pixel": 0.1624, + "loss_text": 1.227, + "ppl": 4.0128, + "step": 11403 + }, + { + "epoch": 0.06, + "global_step": 11404, + "learning_rate": 0.00045323873121869786, + "loss": 1.3847, + "loss_base2": 1.9977, + "loss_pixel": 0.163, + "loss_text": 1.2217, + "ppl": 3.9936, + "step": 11404 + }, + { + "epoch": 0.06, + "global_step": 11405, + "learning_rate": 0.00045323455759599336, + "loss": 1.3687, + "loss_base2": 1.9746, + "loss_pixel": 0.1612, + "loss_text": 1.2075, + "ppl": 3.9302, + "step": 11405 + }, + { + "epoch": 0.06, + "global_step": 11406, + "learning_rate": 0.0004532303839732888, + "loss": 1.41, + "loss_base2": 2.0342, + "loss_pixel": 0.1615, + "loss_text": 1.2485, + "ppl": 4.096, + "step": 11406 + }, + { + "epoch": 0.06, + "global_step": 11407, + "learning_rate": 0.0004532262103505843, + "loss": 1.3912, + "loss_base2": 2.0071, + "loss_pixel": 0.1652, + "loss_text": 1.226, + "ppl": 4.0197, + "step": 11407 + }, + { + "epoch": 0.06, + "global_step": 11408, + "learning_rate": 0.00045322203672787983, + "loss": 1.3934, + "loss_base2": 2.0103, + "loss_pixel": 0.1618, + "loss_text": 1.2316, + "ppl": 4.0285, + "step": 11408 + }, + { + "epoch": 0.06, + "global_step": 11409, + "learning_rate": 0.00045321786310517534, + "loss": 1.6131, + "loss_base2": 2.3272, + "loss_pixel": 0.1616, + "loss_text": 1.4515, + "ppl": 5.0183, + "step": 11409 + }, + { + "epoch": 0.06, + "global_step": 11410, + "learning_rate": 0.0004532136894824708, + "loss": 1.6482, + "loss_base2": 2.3778, + "loss_pixel": 0.1622, + "loss_text": 1.486, + "ppl": 5.1976, + "step": 11410 + }, + { + "epoch": 0.06, + "global_step": 11411, + "learning_rate": 0.0004532095158597663, + "loss": 1.6402, + "loss_base2": 2.3663, + "loss_pixel": 0.1618, + "loss_text": 1.4784, + "ppl": 5.1562, + "step": 11411 + }, + { + "epoch": 0.06, + "global_step": 11412, + "learning_rate": 0.0004532053422370618, + "loss": 1.6148, + "loss_base2": 2.3297, + "loss_pixel": 0.1623, + "loss_text": 1.4524, + "ppl": 5.0269, + "step": 11412 + }, + { + "epoch": 0.06, + "global_step": 11413, + "learning_rate": 0.00045320116861435726, + "loss": 1.6263, + "loss_base2": 2.3463, + "loss_pixel": 0.1605, + "loss_text": 1.4657, + "ppl": 5.085, + "step": 11413 + }, + { + "epoch": 0.06, + "global_step": 11414, + "learning_rate": 0.00045319699499165277, + "loss": 1.6352, + "loss_base2": 2.3591, + "loss_pixel": 0.162, + "loss_text": 1.4732, + "ppl": 5.1305, + "step": 11414 + }, + { + "epoch": 0.06, + "global_step": 11415, + "learning_rate": 0.0004531928213689482, + "loss": 1.6118, + "loss_base2": 2.3253, + "loss_pixel": 0.1612, + "loss_text": 1.4507, + "ppl": 5.0118, + "step": 11415 + }, + { + "epoch": 0.06, + "global_step": 11416, + "learning_rate": 0.0004531886477462437, + "loss": 1.6511, + "loss_base2": 2.382, + "loss_pixel": 0.1607, + "loss_text": 1.4905, + "ppl": 5.2127, + "step": 11416 + }, + { + "epoch": 0.06, + "global_step": 11417, + "learning_rate": 0.00045318447412353923, + "loss": 1.6204, + "loss_base2": 2.3377, + "loss_pixel": 0.1604, + "loss_text": 1.46, + "ppl": 5.0551, + "step": 11417 + }, + { + "epoch": 0.06, + "global_step": 11418, + "learning_rate": 0.00045318030050083474, + "loss": 1.6349, + "loss_base2": 2.3587, + "loss_pixel": 0.1628, + "loss_text": 1.4721, + "ppl": 5.1289, + "step": 11418 + }, + { + "epoch": 0.06, + "global_step": 11419, + "learning_rate": 0.0004531761268781302, + "loss": 1.6097, + "loss_base2": 2.3223, + "loss_pixel": 0.1616, + "loss_text": 1.4482, + "ppl": 5.0013, + "step": 11419 + }, + { + "epoch": 0.06, + "global_step": 11420, + "learning_rate": 0.0004531719532554257, + "loss": 1.6296, + "loss_base2": 2.351, + "loss_pixel": 0.1621, + "loss_text": 1.4675, + "ppl": 5.1018, + "step": 11420 + }, + { + "epoch": 0.06, + "global_step": 11421, + "learning_rate": 0.0004531677796327212, + "loss": 1.617, + "loss_base2": 2.3328, + "loss_pixel": 0.1616, + "loss_text": 1.4554, + "ppl": 5.038, + "step": 11421 + }, + { + "epoch": 0.06, + "global_step": 11422, + "learning_rate": 0.0004531636060100167, + "loss": 1.6142, + "loss_base2": 2.3288, + "loss_pixel": 0.1601, + "loss_text": 1.4542, + "ppl": 5.0239, + "step": 11422 + }, + { + "epoch": 0.06, + "global_step": 11423, + "learning_rate": 0.0004531594323873122, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1616, + "loss_text": 1.4535, + "ppl": 5.0284, + "step": 11423 + }, + { + "epoch": 0.06, + "global_step": 11424, + "learning_rate": 0.0004531552587646077, + "loss": 1.6236, + "loss_base2": 2.3424, + "loss_pixel": 0.1619, + "loss_text": 1.4617, + "ppl": 5.0713, + "step": 11424 + }, + { + "epoch": 0.06, + "global_step": 11425, + "learning_rate": 0.0004531510851419032, + "loss": 1.6066, + "loss_base2": 2.3178, + "loss_pixel": 0.1612, + "loss_text": 1.4454, + "ppl": 4.9858, + "step": 11425 + }, + { + "epoch": 0.06, + "global_step": 11426, + "learning_rate": 0.0004531469115191987, + "loss": 1.6177, + "loss_base2": 2.3338, + "loss_pixel": 0.1608, + "loss_text": 1.4569, + "ppl": 5.0415, + "step": 11426 + }, + { + "epoch": 0.06, + "global_step": 11427, + "learning_rate": 0.0004531427378964942, + "loss": 1.613, + "loss_base2": 2.3271, + "loss_pixel": 0.1621, + "loss_text": 1.4509, + "ppl": 5.0178, + "step": 11427 + }, + { + "epoch": 0.06, + "global_step": 11428, + "learning_rate": 0.00045313856427378965, + "loss": 1.6136, + "loss_base2": 2.3279, + "loss_pixel": 0.161, + "loss_text": 1.4526, + "ppl": 5.0209, + "step": 11428 + }, + { + "epoch": 0.06, + "global_step": 11429, + "learning_rate": 0.00045313439065108516, + "loss": 1.6243, + "loss_base2": 2.3434, + "loss_pixel": 0.1625, + "loss_text": 1.4618, + "ppl": 5.0749, + "step": 11429 + }, + { + "epoch": 0.06, + "global_step": 11430, + "learning_rate": 0.00045313021702838067, + "loss": 1.6234, + "loss_base2": 2.3421, + "loss_pixel": 0.1598, + "loss_text": 1.4637, + "ppl": 5.0703, + "step": 11430 + }, + { + "epoch": 0.06, + "global_step": 11431, + "learning_rate": 0.0004531260434056762, + "loss": 1.6178, + "loss_base2": 2.334, + "loss_pixel": 0.1613, + "loss_text": 1.4564, + "ppl": 5.042, + "step": 11431 + }, + { + "epoch": 0.06, + "global_step": 11432, + "learning_rate": 0.0004531218697829716, + "loss": 1.6133, + "loss_base2": 2.3275, + "loss_pixel": 0.1598, + "loss_text": 1.4535, + "ppl": 5.0193, + "step": 11432 + }, + { + "epoch": 0.06, + "global_step": 11433, + "learning_rate": 0.0004531176961602671, + "loss": 1.5691, + "loss_base2": 2.2637, + "loss_pixel": 0.1617, + "loss_text": 1.4073, + "ppl": 4.8023, + "step": 11433 + }, + { + "epoch": 0.06, + "global_step": 11434, + "learning_rate": 0.0004531135225375626, + "loss": 1.5674, + "loss_base2": 2.2613, + "loss_pixel": 0.1604, + "loss_text": 1.407, + "ppl": 4.7942, + "step": 11434 + }, + { + "epoch": 0.06, + "global_step": 11435, + "learning_rate": 0.0004531093489148581, + "loss": 1.6204, + "loss_base2": 2.3377, + "loss_pixel": 0.1615, + "loss_text": 1.4589, + "ppl": 5.0551, + "step": 11435 + }, + { + "epoch": 0.06, + "global_step": 11436, + "learning_rate": 0.0004531051752921536, + "loss": 1.5984, + "loss_base2": 2.306, + "loss_pixel": 0.1596, + "loss_text": 1.4388, + "ppl": 4.9451, + "step": 11436 + }, + { + "epoch": 0.06, + "global_step": 11437, + "learning_rate": 0.00045310100166944905, + "loss": 1.6035, + "loss_base2": 2.3134, + "loss_pixel": 0.1617, + "loss_text": 1.4418, + "ppl": 4.9704, + "step": 11437 + }, + { + "epoch": 0.06, + "global_step": 11438, + "learning_rate": 0.00045309682804674456, + "loss": 1.6031, + "loss_base2": 2.3128, + "loss_pixel": 0.1604, + "loss_text": 1.4428, + "ppl": 4.9684, + "step": 11438 + }, + { + "epoch": 0.06, + "global_step": 11439, + "learning_rate": 0.00045309265442404007, + "loss": 1.5996, + "loss_base2": 2.3077, + "loss_pixel": 0.1622, + "loss_text": 1.4374, + "ppl": 4.9511, + "step": 11439 + }, + { + "epoch": 0.06, + "global_step": 11440, + "learning_rate": 0.0004530884808013356, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.1627, + "loss_text": 1.4553, + "ppl": 5.043, + "step": 11440 + }, + { + "epoch": 0.06, + "global_step": 11441, + "learning_rate": 0.0004530843071786311, + "loss": 1.6114, + "loss_base2": 2.3248, + "loss_pixel": 0.1602, + "loss_text": 1.4512, + "ppl": 5.0098, + "step": 11441 + }, + { + "epoch": 0.06, + "global_step": 11442, + "learning_rate": 0.00045308013355592654, + "loss": 1.6075, + "loss_base2": 2.3191, + "loss_pixel": 0.1611, + "loss_text": 1.4464, + "ppl": 4.9903, + "step": 11442 + }, + { + "epoch": 0.06, + "global_step": 11443, + "learning_rate": 0.00045307595993322204, + "loss": 1.5958, + "loss_base2": 2.3023, + "loss_pixel": 0.1608, + "loss_text": 1.435, + "ppl": 4.9323, + "step": 11443 + }, + { + "epoch": 0.06, + "global_step": 11444, + "learning_rate": 0.00045307178631051755, + "loss": 1.6211, + "loss_base2": 2.3388, + "loss_pixel": 0.1608, + "loss_text": 1.4603, + "ppl": 5.0587, + "step": 11444 + }, + { + "epoch": 0.06, + "global_step": 11445, + "learning_rate": 0.00045306761268781306, + "loss": 1.6322, + "loss_base2": 2.3548, + "loss_pixel": 0.1627, + "loss_text": 1.4695, + "ppl": 5.1151, + "step": 11445 + }, + { + "epoch": 0.06, + "global_step": 11446, + "learning_rate": 0.00045306343906510857, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.1617, + "loss_text": 1.4563, + "ppl": 5.043, + "step": 11446 + }, + { + "epoch": 0.06, + "global_step": 11447, + "learning_rate": 0.000453059265442404, + "loss": 1.6297, + "loss_base2": 2.3512, + "loss_pixel": 0.1601, + "loss_text": 1.4697, + "ppl": 5.1023, + "step": 11447 + }, + { + "epoch": 0.06, + "global_step": 11448, + "learning_rate": 0.0004530550918196995, + "loss": 1.601, + "loss_base2": 2.3098, + "loss_pixel": 0.1598, + "loss_text": 1.4413, + "ppl": 4.958, + "step": 11448 + }, + { + "epoch": 0.06, + "global_step": 11449, + "learning_rate": 0.00045305091819699503, + "loss": 1.6157, + "loss_base2": 2.331, + "loss_pixel": 0.1606, + "loss_text": 1.4551, + "ppl": 5.0314, + "step": 11449 + }, + { + "epoch": 0.06, + "global_step": 11450, + "learning_rate": 0.00045304674457429054, + "loss": 1.6123, + "loss_base2": 2.3261, + "loss_pixel": 0.1604, + "loss_text": 1.4519, + "ppl": 5.0143, + "step": 11450 + }, + { + "epoch": 0.06, + "global_step": 11451, + "learning_rate": 0.00045304257095158594, + "loss": 1.6172, + "loss_base2": 2.3331, + "loss_pixel": 0.1646, + "loss_text": 1.4526, + "ppl": 5.039, + "step": 11451 + }, + { + "epoch": 0.06, + "global_step": 11452, + "learning_rate": 0.00045303839732888145, + "loss": 1.6058, + "loss_base2": 2.3167, + "loss_pixel": 0.1603, + "loss_text": 1.4454, + "ppl": 4.9818, + "step": 11452 + }, + { + "epoch": 0.06, + "global_step": 11453, + "learning_rate": 0.00045303422370617695, + "loss": 1.6092, + "loss_base2": 2.3216, + "loss_pixel": 0.1613, + "loss_text": 1.4479, + "ppl": 4.9988, + "step": 11453 + }, + { + "epoch": 0.06, + "global_step": 11454, + "learning_rate": 0.00045303005008347246, + "loss": 1.6229, + "loss_base2": 2.3413, + "loss_pixel": 0.16, + "loss_text": 1.4629, + "ppl": 5.0678, + "step": 11454 + }, + { + "epoch": 0.06, + "global_step": 11455, + "learning_rate": 0.00045302587646076797, + "loss": 1.6145, + "loss_base2": 2.3292, + "loss_pixel": 0.1613, + "loss_text": 1.4532, + "ppl": 5.0254, + "step": 11455 + }, + { + "epoch": 0.06, + "global_step": 11456, + "learning_rate": 0.0004530217028380634, + "loss": 1.6033, + "loss_base2": 2.3131, + "loss_pixel": 0.1621, + "loss_text": 1.4412, + "ppl": 4.9694, + "step": 11456 + }, + { + "epoch": 0.06, + "global_step": 11457, + "learning_rate": 0.00045301752921535893, + "loss": 1.6217, + "loss_base2": 2.3396, + "loss_pixel": 0.1614, + "loss_text": 1.4603, + "ppl": 5.0617, + "step": 11457 + }, + { + "epoch": 0.06, + "global_step": 11458, + "learning_rate": 0.00045301335559265444, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.1606, + "loss_text": 1.4573, + "ppl": 5.043, + "step": 11458 + }, + { + "epoch": 0.06, + "global_step": 11459, + "learning_rate": 0.00045300918196994994, + "loss": 1.4751, + "loss_base2": 2.1281, + "loss_pixel": 0.1625, + "loss_text": 1.3125, + "ppl": 4.3715, + "step": 11459 + }, + { + "epoch": 0.06, + "global_step": 11460, + "learning_rate": 0.0004530050083472454, + "loss": 1.3901, + "loss_base2": 2.0055, + "loss_pixel": 0.1597, + "loss_text": 1.2304, + "ppl": 4.0153, + "step": 11460 + }, + { + "epoch": 0.06, + "global_step": 11461, + "learning_rate": 0.0004530008347245409, + "loss": 1.3918, + "loss_base2": 2.0079, + "loss_pixel": 0.1601, + "loss_text": 1.2317, + "ppl": 4.0221, + "step": 11461 + }, + { + "epoch": 0.06, + "global_step": 11462, + "learning_rate": 0.0004529966611018364, + "loss": 1.3912, + "loss_base2": 2.0071, + "loss_pixel": 0.1618, + "loss_text": 1.2293, + "ppl": 4.0197, + "step": 11462 + }, + { + "epoch": 0.06, + "global_step": 11463, + "learning_rate": 0.0004529924874791319, + "loss": 1.3727, + "loss_base2": 1.9804, + "loss_pixel": 0.1596, + "loss_text": 1.2131, + "ppl": 3.946, + "step": 11463 + }, + { + "epoch": 0.06, + "global_step": 11464, + "learning_rate": 0.0004529883138564274, + "loss": 1.3931, + "loss_base2": 2.0098, + "loss_pixel": 0.16, + "loss_text": 1.2331, + "ppl": 4.0273, + "step": 11464 + }, + { + "epoch": 0.06, + "global_step": 11465, + "learning_rate": 0.0004529841402337229, + "loss": 1.3865, + "loss_base2": 2.0003, + "loss_pixel": 0.1611, + "loss_text": 1.2254, + "ppl": 4.0008, + "step": 11465 + }, + { + "epoch": 0.06, + "global_step": 11466, + "learning_rate": 0.0004529799666110184, + "loss": 1.379, + "loss_base2": 1.9895, + "loss_pixel": 0.1597, + "loss_text": 1.2193, + "ppl": 3.9709, + "step": 11466 + }, + { + "epoch": 0.06, + "global_step": 11467, + "learning_rate": 0.0004529757929883139, + "loss": 1.3749, + "loss_base2": 1.9836, + "loss_pixel": 0.1609, + "loss_text": 1.214, + "ppl": 3.9547, + "step": 11467 + }, + { + "epoch": 0.06, + "global_step": 11468, + "learning_rate": 0.0004529716193656094, + "loss": 1.5112, + "loss_base2": 2.1802, + "loss_pixel": 0.1618, + "loss_text": 1.3494, + "ppl": 4.5322, + "step": 11468 + }, + { + "epoch": 0.06, + "global_step": 11469, + "learning_rate": 0.0004529674457429048, + "loss": 1.6109, + "loss_base2": 2.324, + "loss_pixel": 0.159, + "loss_text": 1.4519, + "ppl": 5.0073, + "step": 11469 + }, + { + "epoch": 0.06, + "global_step": 11470, + "learning_rate": 0.0004529632721202003, + "loss": 1.6124, + "loss_base2": 2.3262, + "loss_pixel": 0.1596, + "loss_text": 1.4528, + "ppl": 5.0148, + "step": 11470 + }, + { + "epoch": 0.06, + "global_step": 11471, + "learning_rate": 0.0004529590984974958, + "loss": 1.6208, + "loss_base2": 2.3383, + "loss_pixel": 0.1617, + "loss_text": 1.4591, + "ppl": 5.0571, + "step": 11471 + }, + { + "epoch": 0.06, + "global_step": 11472, + "learning_rate": 0.0004529549248747913, + "loss": 1.6227, + "loss_base2": 2.3411, + "loss_pixel": 0.1602, + "loss_text": 1.4625, + "ppl": 5.0668, + "step": 11472 + }, + { + "epoch": 0.06, + "global_step": 11473, + "learning_rate": 0.00045295075125208683, + "loss": 1.6286, + "loss_base2": 2.3496, + "loss_pixel": 0.1593, + "loss_text": 1.4694, + "ppl": 5.0967, + "step": 11473 + }, + { + "epoch": 0.06, + "global_step": 11474, + "learning_rate": 0.0004529465776293823, + "loss": 1.6229, + "loss_base2": 2.3413, + "loss_pixel": 0.1612, + "loss_text": 1.4617, + "ppl": 5.0678, + "step": 11474 + }, + { + "epoch": 0.06, + "global_step": 11475, + "learning_rate": 0.0004529424040066778, + "loss": 1.6106, + "loss_base2": 2.3236, + "loss_pixel": 0.1607, + "loss_text": 1.4499, + "ppl": 5.0058, + "step": 11475 + }, + { + "epoch": 0.06, + "global_step": 11476, + "learning_rate": 0.0004529382303839733, + "loss": 1.5731, + "loss_base2": 2.2695, + "loss_pixel": 0.1598, + "loss_text": 1.4134, + "ppl": 4.8216, + "step": 11476 + }, + { + "epoch": 0.06, + "global_step": 11477, + "learning_rate": 0.0004529340567612688, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.1609, + "loss_text": 1.445, + "ppl": 4.9823, + "step": 11477 + }, + { + "epoch": 0.06, + "global_step": 11478, + "learning_rate": 0.00045292988313856426, + "loss": 1.6005, + "loss_base2": 2.309, + "loss_pixel": 0.1605, + "loss_text": 1.44, + "ppl": 4.9555, + "step": 11478 + }, + { + "epoch": 0.06, + "global_step": 11479, + "learning_rate": 0.00045292570951585977, + "loss": 1.6308, + "loss_base2": 2.3527, + "loss_pixel": 0.1599, + "loss_text": 1.4709, + "ppl": 5.108, + "step": 11479 + }, + { + "epoch": 0.06, + "global_step": 11480, + "learning_rate": 0.0004529215358931553, + "loss": 1.6127, + "loss_base2": 2.3266, + "loss_pixel": 0.1612, + "loss_text": 1.4515, + "ppl": 5.0163, + "step": 11480 + }, + { + "epoch": 0.06, + "global_step": 11481, + "learning_rate": 0.0004529173622704508, + "loss": 1.5964, + "loss_base2": 2.3031, + "loss_pixel": 0.1603, + "loss_text": 1.4361, + "ppl": 4.9352, + "step": 11481 + }, + { + "epoch": 0.06, + "global_step": 11482, + "learning_rate": 0.0004529131886477463, + "loss": 1.6102, + "loss_base2": 2.323, + "loss_pixel": 0.1608, + "loss_text": 1.4495, + "ppl": 5.0038, + "step": 11482 + }, + { + "epoch": 0.06, + "global_step": 11483, + "learning_rate": 0.00045290901502504174, + "loss": 1.6113, + "loss_base2": 2.3246, + "loss_pixel": 0.1567, + "loss_text": 1.4546, + "ppl": 5.0093, + "step": 11483 + }, + { + "epoch": 0.06, + "global_step": 11484, + "learning_rate": 0.00045290484140233725, + "loss": 1.6116, + "loss_base2": 2.325, + "loss_pixel": 0.1528, + "loss_text": 1.4588, + "ppl": 5.0108, + "step": 11484 + }, + { + "epoch": 0.06, + "global_step": 11485, + "learning_rate": 0.00045290066777963276, + "loss": 1.6131, + "loss_base2": 2.3272, + "loss_pixel": 0.1518, + "loss_text": 1.4613, + "ppl": 5.0183, + "step": 11485 + }, + { + "epoch": 0.06, + "global_step": 11486, + "learning_rate": 0.00045289649415692826, + "loss": 1.6038, + "loss_base2": 2.3138, + "loss_pixel": 0.1533, + "loss_text": 1.4505, + "ppl": 4.9719, + "step": 11486 + }, + { + "epoch": 0.06, + "global_step": 11487, + "learning_rate": 0.0004528923205342237, + "loss": 1.5961, + "loss_base2": 2.3027, + "loss_pixel": 0.1543, + "loss_text": 1.4418, + "ppl": 4.9338, + "step": 11487 + }, + { + "epoch": 0.06, + "global_step": 11488, + "learning_rate": 0.00045288814691151917, + "loss": 1.613, + "loss_base2": 2.3271, + "loss_pixel": 0.1548, + "loss_text": 1.4581, + "ppl": 5.0178, + "step": 11488 + }, + { + "epoch": 0.06, + "global_step": 11489, + "learning_rate": 0.0004528839732888147, + "loss": 1.5987, + "loss_base2": 2.3064, + "loss_pixel": 0.1536, + "loss_text": 1.445, + "ppl": 4.9466, + "step": 11489 + }, + { + "epoch": 0.06, + "global_step": 11490, + "learning_rate": 0.0004528797996661102, + "loss": 1.6062, + "loss_base2": 2.3173, + "loss_pixel": 0.1547, + "loss_text": 1.4514, + "ppl": 4.9838, + "step": 11490 + }, + { + "epoch": 0.06, + "global_step": 11491, + "learning_rate": 0.0004528756260434057, + "loss": 1.6021, + "loss_base2": 2.3113, + "loss_pixel": 0.1513, + "loss_text": 1.4508, + "ppl": 4.9634, + "step": 11491 + }, + { + "epoch": 0.06, + "global_step": 11492, + "learning_rate": 0.00045287145242070114, + "loss": 1.544, + "loss_base2": 2.2275, + "loss_pixel": 0.1551, + "loss_text": 1.389, + "ppl": 4.6833, + "step": 11492 + }, + { + "epoch": 0.06, + "global_step": 11493, + "learning_rate": 0.00045286727879799665, + "loss": 1.3929, + "loss_base2": 2.0095, + "loss_pixel": 0.1527, + "loss_text": 1.2402, + "ppl": 4.0265, + "step": 11493 + }, + { + "epoch": 0.06, + "global_step": 11494, + "learning_rate": 0.00045286310517529216, + "loss": 1.3737, + "loss_base2": 1.9818, + "loss_pixel": 0.1518, + "loss_text": 1.2219, + "ppl": 3.9499, + "step": 11494 + }, + { + "epoch": 0.06, + "global_step": 11495, + "learning_rate": 0.00045285893155258767, + "loss": 1.3915, + "loss_base2": 2.0075, + "loss_pixel": 0.1498, + "loss_text": 1.2417, + "ppl": 4.0209, + "step": 11495 + }, + { + "epoch": 0.06, + "global_step": 11496, + "learning_rate": 0.0004528547579298831, + "loss": 1.3633, + "loss_base2": 1.9668, + "loss_pixel": 0.149, + "loss_text": 1.2143, + "ppl": 3.9091, + "step": 11496 + }, + { + "epoch": 0.06, + "global_step": 11497, + "learning_rate": 0.0004528505843071786, + "loss": 1.3981, + "loss_base2": 2.017, + "loss_pixel": 0.1513, + "loss_text": 1.2468, + "ppl": 4.0475, + "step": 11497 + }, + { + "epoch": 0.06, + "global_step": 11498, + "learning_rate": 0.00045284641068447413, + "loss": 1.3732, + "loss_base2": 1.9811, + "loss_pixel": 0.1548, + "loss_text": 1.2184, + "ppl": 3.948, + "step": 11498 + }, + { + "epoch": 0.06, + "global_step": 11499, + "learning_rate": 0.00045284223706176964, + "loss": 1.3609, + "loss_base2": 1.9634, + "loss_pixel": 0.1516, + "loss_text": 1.2094, + "ppl": 3.8997, + "step": 11499 + }, + { + "epoch": 0.06, + "global_step": 11500, + "learning_rate": 0.00045283806343906515, + "loss": 1.3839, + "loss_base2": 1.9965, + "loss_pixel": 0.149, + "loss_text": 1.2349, + "ppl": 3.9904, + "step": 11500 + }, + { + "epoch": 0.06, + "global_step": 11501, + "learning_rate": 0.0004528338898163606, + "loss": 1.4725, + "loss_base2": 2.1244, + "loss_pixel": 0.1518, + "loss_text": 1.3207, + "ppl": 4.3601, + "step": 11501 + }, + { + "epoch": 0.06, + "global_step": 11502, + "learning_rate": 0.0004528297161936561, + "loss": 1.6292, + "loss_base2": 2.3504, + "loss_pixel": 0.1482, + "loss_text": 1.481, + "ppl": 5.0998, + "step": 11502 + }, + { + "epoch": 0.06, + "global_step": 11503, + "learning_rate": 0.0004528255425709516, + "loss": 1.6048, + "loss_base2": 2.3152, + "loss_pixel": 0.1493, + "loss_text": 1.4556, + "ppl": 4.9769, + "step": 11503 + }, + { + "epoch": 0.06, + "global_step": 11504, + "learning_rate": 0.0004528213689482471, + "loss": 1.6247, + "loss_base2": 2.3439, + "loss_pixel": 0.1516, + "loss_text": 1.4732, + "ppl": 5.0769, + "step": 11504 + }, + { + "epoch": 0.06, + "global_step": 11505, + "learning_rate": 0.00045281719532554263, + "loss": 1.6132, + "loss_base2": 2.3274, + "loss_pixel": 0.1507, + "loss_text": 1.4625, + "ppl": 5.0188, + "step": 11505 + }, + { + "epoch": 0.06, + "global_step": 11506, + "learning_rate": 0.0004528130217028381, + "loss": 1.5913, + "loss_base2": 2.2958, + "loss_pixel": 0.1501, + "loss_text": 1.4412, + "ppl": 4.9101, + "step": 11506 + }, + { + "epoch": 0.06, + "global_step": 11507, + "learning_rate": 0.00045280884808013354, + "loss": 1.6062, + "loss_base2": 2.3173, + "loss_pixel": 0.1488, + "loss_text": 1.4574, + "ppl": 4.9838, + "step": 11507 + }, + { + "epoch": 0.06, + "global_step": 11508, + "learning_rate": 0.00045280467445742904, + "loss": 1.6141, + "loss_base2": 2.3287, + "loss_pixel": 0.15, + "loss_text": 1.4641, + "ppl": 5.0234, + "step": 11508 + }, + { + "epoch": 0.06, + "global_step": 11509, + "learning_rate": 0.00045280050083472455, + "loss": 1.6056, + "loss_base2": 2.3164, + "loss_pixel": 0.15, + "loss_text": 1.4556, + "ppl": 4.9808, + "step": 11509 + }, + { + "epoch": 0.06, + "global_step": 11510, + "learning_rate": 0.00045279632721202, + "loss": 1.6085, + "loss_base2": 2.3206, + "loss_pixel": 0.1494, + "loss_text": 1.4591, + "ppl": 4.9953, + "step": 11510 + }, + { + "epoch": 0.06, + "global_step": 11511, + "learning_rate": 0.0004527921535893155, + "loss": 1.596, + "loss_base2": 2.3025, + "loss_pixel": 0.1508, + "loss_text": 1.4452, + "ppl": 4.9333, + "step": 11511 + }, + { + "epoch": 0.06, + "global_step": 11512, + "learning_rate": 0.000452787979966611, + "loss": 1.6026, + "loss_base2": 2.3121, + "loss_pixel": 0.1505, + "loss_text": 1.4522, + "ppl": 4.9659, + "step": 11512 + }, + { + "epoch": 0.06, + "global_step": 11513, + "learning_rate": 0.0004527838063439065, + "loss": 1.6074, + "loss_base2": 2.319, + "loss_pixel": 0.1515, + "loss_text": 1.4559, + "ppl": 4.9898, + "step": 11513 + }, + { + "epoch": 0.06, + "global_step": 11514, + "learning_rate": 0.00045277963272120203, + "loss": 1.6036, + "loss_base2": 2.3135, + "loss_pixel": 0.1513, + "loss_text": 1.4523, + "ppl": 4.9709, + "step": 11514 + }, + { + "epoch": 0.06, + "global_step": 11515, + "learning_rate": 0.0004527754590984975, + "loss": 1.594, + "loss_base2": 2.2997, + "loss_pixel": 0.1492, + "loss_text": 1.4448, + "ppl": 4.9234, + "step": 11515 + }, + { + "epoch": 0.06, + "global_step": 11516, + "learning_rate": 0.000452771285475793, + "loss": 1.6096, + "loss_base2": 2.3222, + "loss_pixel": 0.1544, + "loss_text": 1.4552, + "ppl": 5.0008, + "step": 11516 + }, + { + "epoch": 0.06, + "global_step": 11517, + "learning_rate": 0.0004527671118530885, + "loss": 1.6173, + "loss_base2": 2.3333, + "loss_pixel": 0.1677, + "loss_text": 1.4496, + "ppl": 5.0395, + "step": 11517 + }, + { + "epoch": 0.06, + "global_step": 11518, + "learning_rate": 0.000452762938230384, + "loss": 1.6278, + "loss_base2": 2.3484, + "loss_pixel": 0.1679, + "loss_text": 1.4599, + "ppl": 5.0927, + "step": 11518 + }, + { + "epoch": 0.06, + "global_step": 11519, + "learning_rate": 0.00045275876460767946, + "loss": 1.6265, + "loss_base2": 2.3465, + "loss_pixel": 0.1659, + "loss_text": 1.4607, + "ppl": 5.086, + "step": 11519 + }, + { + "epoch": 0.06, + "global_step": 11520, + "learning_rate": 0.00045275459098497497, + "loss": 1.6296, + "loss_base2": 2.351, + "loss_pixel": 0.1638, + "loss_text": 1.4657, + "ppl": 5.1018, + "step": 11520 + }, + { + "epoch": 0.06, + "global_step": 11521, + "learning_rate": 0.0004527504173622705, + "loss": 1.6072, + "loss_base2": 2.3187, + "loss_pixel": 0.1631, + "loss_text": 1.4441, + "ppl": 4.9888, + "step": 11521 + }, + { + "epoch": 0.06, + "global_step": 11522, + "learning_rate": 0.000452746243739566, + "loss": 1.6166, + "loss_base2": 2.3323, + "loss_pixel": 0.1622, + "loss_text": 1.4544, + "ppl": 5.0359, + "step": 11522 + }, + { + "epoch": 0.06, + "global_step": 11523, + "learning_rate": 0.0004527420701168615, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1623, + "loss_text": 1.4546, + "ppl": 5.0374, + "step": 11523 + }, + { + "epoch": 0.06, + "global_step": 11524, + "learning_rate": 0.00045273789649415694, + "loss": 1.6248, + "loss_base2": 2.3441, + "loss_pixel": 0.1619, + "loss_text": 1.4628, + "ppl": 5.0774, + "step": 11524 + }, + { + "epoch": 0.06, + "global_step": 11525, + "learning_rate": 0.00045273372287145245, + "loss": 1.5803, + "loss_base2": 2.2799, + "loss_pixel": 0.1612, + "loss_text": 1.4191, + "ppl": 4.8564, + "step": 11525 + }, + { + "epoch": 0.06, + "global_step": 11526, + "learning_rate": 0.0004527295492487479, + "loss": 1.509, + "loss_base2": 2.177, + "loss_pixel": 0.1604, + "loss_text": 1.3486, + "ppl": 4.5222, + "step": 11526 + }, + { + "epoch": 0.06, + "global_step": 11527, + "learning_rate": 0.0004527253756260434, + "loss": 1.4072, + "loss_base2": 2.0302, + "loss_pixel": 0.1642, + "loss_text": 1.243, + "ppl": 4.0845, + "step": 11527 + }, + { + "epoch": 0.06, + "global_step": 11528, + "learning_rate": 0.00045272120200333887, + "loss": 1.3856, + "loss_base2": 1.999, + "loss_pixel": 0.1614, + "loss_text": 1.2241, + "ppl": 3.9972, + "step": 11528 + }, + { + "epoch": 0.06, + "global_step": 11529, + "learning_rate": 0.00045271702838063437, + "loss": 1.411, + "loss_base2": 2.0356, + "loss_pixel": 0.163, + "loss_text": 1.248, + "ppl": 4.1001, + "step": 11529 + }, + { + "epoch": 0.06, + "global_step": 11530, + "learning_rate": 0.0004527128547579299, + "loss": 1.3931, + "loss_base2": 2.0098, + "loss_pixel": 0.1612, + "loss_text": 1.2319, + "ppl": 4.0273, + "step": 11530 + }, + { + "epoch": 0.06, + "global_step": 11531, + "learning_rate": 0.0004527086811352254, + "loss": 1.3646, + "loss_base2": 1.9687, + "loss_pixel": 0.1619, + "loss_text": 1.2027, + "ppl": 3.9142, + "step": 11531 + }, + { + "epoch": 0.06, + "global_step": 11532, + "learning_rate": 0.0004527045075125209, + "loss": 1.3914, + "loss_base2": 2.0074, + "loss_pixel": 0.1611, + "loss_text": 1.2303, + "ppl": 4.0205, + "step": 11532 + }, + { + "epoch": 0.06, + "global_step": 11533, + "learning_rate": 0.00045270033388981635, + "loss": 1.3655, + "loss_base2": 1.97, + "loss_pixel": 0.1614, + "loss_text": 1.2042, + "ppl": 3.9177, + "step": 11533 + }, + { + "epoch": 0.06, + "global_step": 11534, + "learning_rate": 0.00045269616026711185, + "loss": 1.4259, + "loss_base2": 2.0571, + "loss_pixel": 0.1619, + "loss_text": 1.264, + "ppl": 4.1616, + "step": 11534 + }, + { + "epoch": 0.06, + "global_step": 11535, + "learning_rate": 0.00045269198664440736, + "loss": 1.5416, + "loss_base2": 2.2241, + "loss_pixel": 0.1618, + "loss_text": 1.3798, + "ppl": 4.6721, + "step": 11535 + }, + { + "epoch": 0.06, + "global_step": 11536, + "learning_rate": 0.00045268781302170287, + "loss": 1.3817, + "loss_base2": 1.9934, + "loss_pixel": 0.1616, + "loss_text": 1.2201, + "ppl": 3.9817, + "step": 11536 + }, + { + "epoch": 0.06, + "global_step": 11537, + "learning_rate": 0.0004526836393989983, + "loss": 1.3956, + "loss_base2": 2.0134, + "loss_pixel": 0.1601, + "loss_text": 1.2354, + "ppl": 4.0374, + "step": 11537 + }, + { + "epoch": 0.06, + "global_step": 11538, + "learning_rate": 0.00045267946577629383, + "loss": 1.4108, + "loss_base2": 2.0354, + "loss_pixel": 0.1602, + "loss_text": 1.2506, + "ppl": 4.0992, + "step": 11538 + }, + { + "epoch": 0.06, + "global_step": 11539, + "learning_rate": 0.00045267529215358934, + "loss": 1.387, + "loss_base2": 2.001, + "loss_pixel": 0.1612, + "loss_text": 1.2258, + "ppl": 4.0028, + "step": 11539 + }, + { + "epoch": 0.06, + "global_step": 11540, + "learning_rate": 0.00045267111853088484, + "loss": 1.3863, + "loss_base2": 2.0, + "loss_pixel": 0.1603, + "loss_text": 1.226, + "ppl": 4.0, + "step": 11540 + }, + { + "epoch": 0.06, + "global_step": 11541, + "learning_rate": 0.00045266694490818035, + "loss": 1.3661, + "loss_base2": 1.9709, + "loss_pixel": 0.1615, + "loss_text": 1.2045, + "ppl": 3.92, + "step": 11541 + }, + { + "epoch": 0.06, + "global_step": 11542, + "learning_rate": 0.0004526627712854758, + "loss": 1.3856, + "loss_base2": 1.999, + "loss_pixel": 0.1611, + "loss_text": 1.2245, + "ppl": 3.9972, + "step": 11542 + }, + { + "epoch": 0.06, + "global_step": 11543, + "learning_rate": 0.0004526585976627713, + "loss": 1.3855, + "loss_base2": 1.9989, + "loss_pixel": 0.1602, + "loss_text": 1.2252, + "ppl": 3.9968, + "step": 11543 + }, + { + "epoch": 0.06, + "global_step": 11544, + "learning_rate": 0.00045265442404006677, + "loss": 1.3738, + "loss_base2": 1.982, + "loss_pixel": 0.162, + "loss_text": 1.2118, + "ppl": 3.9503, + "step": 11544 + }, + { + "epoch": 0.06, + "global_step": 11545, + "learning_rate": 0.00045265025041736227, + "loss": 1.4025, + "loss_base2": 2.0234, + "loss_pixel": 0.1596, + "loss_text": 1.2429, + "ppl": 4.0654, + "step": 11545 + }, + { + "epoch": 0.06, + "global_step": 11546, + "learning_rate": 0.0004526460767946577, + "loss": 1.3878, + "loss_base2": 2.0022, + "loss_pixel": 0.1601, + "loss_text": 1.2277, + "ppl": 4.006, + "step": 11546 + }, + { + "epoch": 0.06, + "global_step": 11547, + "learning_rate": 0.00045264190317195323, + "loss": 1.3843, + "loss_base2": 1.9971, + "loss_pixel": 0.1602, + "loss_text": 1.2241, + "ppl": 3.992, + "step": 11547 + }, + { + "epoch": 0.06, + "global_step": 11548, + "learning_rate": 0.00045263772954924874, + "loss": 1.3925, + "loss_base2": 2.009, + "loss_pixel": 0.1619, + "loss_text": 1.2305, + "ppl": 4.0249, + "step": 11548 + }, + { + "epoch": 0.06, + "global_step": 11549, + "learning_rate": 0.00045263355592654425, + "loss": 1.364, + "loss_base2": 1.9678, + "loss_pixel": 0.1597, + "loss_text": 1.2042, + "ppl": 3.9118, + "step": 11549 + }, + { + "epoch": 0.06, + "global_step": 11550, + "learning_rate": 0.00045262938230383976, + "loss": 1.3961, + "loss_base2": 2.0141, + "loss_pixel": 0.1601, + "loss_text": 1.2359, + "ppl": 4.0394, + "step": 11550 + }, + { + "epoch": 0.06, + "global_step": 11551, + "learning_rate": 0.0004526252086811352, + "loss": 1.573, + "loss_base2": 2.2694, + "loss_pixel": 0.1591, + "loss_text": 1.414, + "ppl": 4.8211, + "step": 11551 + }, + { + "epoch": 0.06, + "global_step": 11552, + "learning_rate": 0.0004526210350584307, + "loss": 1.6331, + "loss_base2": 2.3561, + "loss_pixel": 0.1598, + "loss_text": 1.4733, + "ppl": 5.1197, + "step": 11552 + }, + { + "epoch": 0.06, + "global_step": 11553, + "learning_rate": 0.0004526168614357262, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.16, + "loss_text": 1.458, + "ppl": 5.043, + "step": 11553 + }, + { + "epoch": 0.06, + "global_step": 11554, + "learning_rate": 0.00045261268781302173, + "loss": 1.6248, + "loss_base2": 2.3441, + "loss_pixel": 0.161, + "loss_text": 1.4637, + "ppl": 5.0774, + "step": 11554 + }, + { + "epoch": 0.06, + "global_step": 11555, + "learning_rate": 0.0004526085141903172, + "loss": 1.6002, + "loss_base2": 2.3086, + "loss_pixel": 0.1594, + "loss_text": 1.4408, + "ppl": 4.954, + "step": 11555 + }, + { + "epoch": 0.06, + "global_step": 11556, + "learning_rate": 0.0004526043405676127, + "loss": 1.6124, + "loss_base2": 2.3262, + "loss_pixel": 0.1604, + "loss_text": 1.452, + "ppl": 5.0148, + "step": 11556 + }, + { + "epoch": 0.06, + "global_step": 11557, + "learning_rate": 0.0004526001669449082, + "loss": 1.6286, + "loss_base2": 2.3496, + "loss_pixel": 0.1612, + "loss_text": 1.4674, + "ppl": 5.0967, + "step": 11557 + }, + { + "epoch": 0.06, + "global_step": 11558, + "learning_rate": 0.0004525959933222037, + "loss": 1.6235, + "loss_base2": 2.3422, + "loss_pixel": 0.1598, + "loss_text": 1.4638, + "ppl": 5.0708, + "step": 11558 + }, + { + "epoch": 0.06, + "global_step": 11559, + "learning_rate": 0.0004525918196994992, + "loss": 1.6244, + "loss_base2": 2.3435, + "loss_pixel": 0.1588, + "loss_text": 1.4656, + "ppl": 5.0754, + "step": 11559 + }, + { + "epoch": 0.06, + "global_step": 11560, + "learning_rate": 0.00045258764607679467, + "loss": 1.6149, + "loss_base2": 2.3298, + "loss_pixel": 0.1602, + "loss_text": 1.4548, + "ppl": 5.0274, + "step": 11560 + }, + { + "epoch": 0.06, + "global_step": 11561, + "learning_rate": 0.0004525834724540902, + "loss": 1.6093, + "loss_base2": 2.3217, + "loss_pixel": 0.1598, + "loss_text": 1.4495, + "ppl": 4.9993, + "step": 11561 + }, + { + "epoch": 0.06, + "global_step": 11562, + "learning_rate": 0.0004525792988313857, + "loss": 1.612, + "loss_base2": 2.3256, + "loss_pixel": 0.1594, + "loss_text": 1.4526, + "ppl": 5.0128, + "step": 11562 + }, + { + "epoch": 0.06, + "global_step": 11563, + "learning_rate": 0.00045257512520868113, + "loss": 1.6118, + "loss_base2": 2.3253, + "loss_pixel": 0.1609, + "loss_text": 1.4509, + "ppl": 5.0118, + "step": 11563 + }, + { + "epoch": 0.06, + "global_step": 11564, + "learning_rate": 0.00045257095158597664, + "loss": 1.6186, + "loss_base2": 2.3351, + "loss_pixel": 0.1596, + "loss_text": 1.459, + "ppl": 5.046, + "step": 11564 + }, + { + "epoch": 0.06, + "global_step": 11565, + "learning_rate": 0.0004525667779632721, + "loss": 1.6047, + "loss_base2": 2.3151, + "loss_pixel": 0.1606, + "loss_text": 1.4441, + "ppl": 4.9764, + "step": 11565 + }, + { + "epoch": 0.06, + "global_step": 11566, + "learning_rate": 0.0004525626043405676, + "loss": 1.6135, + "loss_base2": 2.3278, + "loss_pixel": 0.1611, + "loss_text": 1.4524, + "ppl": 5.0204, + "step": 11566 + }, + { + "epoch": 0.06, + "global_step": 11567, + "learning_rate": 0.0004525584307178631, + "loss": 1.6136, + "loss_base2": 2.3279, + "loss_pixel": 0.1588, + "loss_text": 1.4549, + "ppl": 5.0209, + "step": 11567 + }, + { + "epoch": 0.06, + "global_step": 11568, + "learning_rate": 0.0004525542570951586, + "loss": 1.6073, + "loss_base2": 2.3188, + "loss_pixel": 0.16, + "loss_text": 1.4473, + "ppl": 4.9893, + "step": 11568 + }, + { + "epoch": 0.06, + "global_step": 11569, + "learning_rate": 0.00045255008347245407, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.1606, + "loss_text": 1.4677, + "ppl": 5.0952, + "step": 11569 + }, + { + "epoch": 0.06, + "global_step": 11570, + "learning_rate": 0.0004525459098497496, + "loss": 1.6033, + "loss_base2": 2.3131, + "loss_pixel": 0.1606, + "loss_text": 1.4426, + "ppl": 4.9694, + "step": 11570 + }, + { + "epoch": 0.06, + "global_step": 11571, + "learning_rate": 0.0004525417362270451, + "loss": 1.5997, + "loss_base2": 2.3079, + "loss_pixel": 0.1605, + "loss_text": 1.4392, + "ppl": 4.9515, + "step": 11571 + }, + { + "epoch": 0.06, + "global_step": 11572, + "learning_rate": 0.0004525375626043406, + "loss": 1.6187, + "loss_base2": 2.3353, + "loss_pixel": 0.1589, + "loss_text": 1.4599, + "ppl": 5.0465, + "step": 11572 + }, + { + "epoch": 0.06, + "global_step": 11573, + "learning_rate": 0.0004525333889816361, + "loss": 1.6129, + "loss_base2": 2.3269, + "loss_pixel": 0.1603, + "loss_text": 1.4526, + "ppl": 5.0173, + "step": 11573 + }, + { + "epoch": 0.06, + "global_step": 11574, + "learning_rate": 0.00045252921535893155, + "loss": 1.6206, + "loss_base2": 2.338, + "loss_pixel": 0.16, + "loss_text": 1.4606, + "ppl": 5.0561, + "step": 11574 + }, + { + "epoch": 0.06, + "global_step": 11575, + "learning_rate": 0.00045252504173622706, + "loss": 1.6257, + "loss_base2": 2.3454, + "loss_pixel": 0.1589, + "loss_text": 1.4668, + "ppl": 5.082, + "step": 11575 + }, + { + "epoch": 0.06, + "global_step": 11576, + "learning_rate": 0.00045252086811352257, + "loss": 1.5989, + "loss_base2": 2.3067, + "loss_pixel": 0.1587, + "loss_text": 1.4402, + "ppl": 4.9476, + "step": 11576 + }, + { + "epoch": 0.06, + "global_step": 11577, + "learning_rate": 0.0004525166944908181, + "loss": 1.6074, + "loss_base2": 2.319, + "loss_pixel": 0.1608, + "loss_text": 1.4467, + "ppl": 4.9898, + "step": 11577 + }, + { + "epoch": 0.06, + "global_step": 11578, + "learning_rate": 0.0004525125208681135, + "loss": 1.6099, + "loss_base2": 2.3226, + "loss_pixel": 0.1594, + "loss_text": 1.4504, + "ppl": 5.0023, + "step": 11578 + }, + { + "epoch": 0.06, + "global_step": 11579, + "learning_rate": 0.00045250834724540903, + "loss": 1.6056, + "loss_base2": 2.3164, + "loss_pixel": 0.1602, + "loss_text": 1.4453, + "ppl": 4.9808, + "step": 11579 + }, + { + "epoch": 0.06, + "global_step": 11580, + "learning_rate": 0.00045250417362270454, + "loss": 1.5846, + "loss_base2": 2.2861, + "loss_pixel": 0.1615, + "loss_text": 1.4231, + "ppl": 4.8773, + "step": 11580 + }, + { + "epoch": 0.06, + "global_step": 11581, + "learning_rate": 0.00045250000000000005, + "loss": 1.5946, + "loss_base2": 2.3005, + "loss_pixel": 0.1601, + "loss_text": 1.4345, + "ppl": 4.9264, + "step": 11581 + }, + { + "epoch": 0.06, + "global_step": 11582, + "learning_rate": 0.0004524958263772955, + "loss": 1.6032, + "loss_base2": 2.3129, + "loss_pixel": 0.1594, + "loss_text": 1.4437, + "ppl": 4.9689, + "step": 11582 + }, + { + "epoch": 0.06, + "global_step": 11583, + "learning_rate": 0.00045249165275459095, + "loss": 1.6056, + "loss_base2": 2.3164, + "loss_pixel": 0.1589, + "loss_text": 1.4467, + "ppl": 4.9808, + "step": 11583 + }, + { + "epoch": 0.06, + "global_step": 11584, + "learning_rate": 0.00045248747913188646, + "loss": 1.6101, + "loss_base2": 2.3229, + "loss_pixel": 0.1602, + "loss_text": 1.4499, + "ppl": 5.0033, + "step": 11584 + }, + { + "epoch": 0.06, + "global_step": 11585, + "learning_rate": 0.00045248330550918197, + "loss": 1.6035, + "loss_base2": 2.3134, + "loss_pixel": 0.1616, + "loss_text": 1.442, + "ppl": 4.9704, + "step": 11585 + }, + { + "epoch": 0.06, + "global_step": 11586, + "learning_rate": 0.0004524791318864775, + "loss": 1.6156, + "loss_base2": 2.3308, + "loss_pixel": 0.1524, + "loss_text": 1.4632, + "ppl": 5.0309, + "step": 11586 + }, + { + "epoch": 0.06, + "global_step": 11587, + "learning_rate": 0.00045247495826377293, + "loss": 1.5941, + "loss_base2": 2.2998, + "loss_pixel": 0.1528, + "loss_text": 1.4413, + "ppl": 4.9239, + "step": 11587 + }, + { + "epoch": 0.06, + "global_step": 11588, + "learning_rate": 0.00045247078464106844, + "loss": 1.6083, + "loss_base2": 2.3203, + "loss_pixel": 0.1503, + "loss_text": 1.458, + "ppl": 4.9943, + "step": 11588 + }, + { + "epoch": 0.06, + "global_step": 11589, + "learning_rate": 0.00045246661101836394, + "loss": 1.5988, + "loss_base2": 2.3066, + "loss_pixel": 0.1537, + "loss_text": 1.4451, + "ppl": 4.9471, + "step": 11589 + }, + { + "epoch": 0.06, + "global_step": 11590, + "learning_rate": 0.00045246243739565945, + "loss": 1.6177, + "loss_base2": 2.3338, + "loss_pixel": 0.1521, + "loss_text": 1.4657, + "ppl": 5.0415, + "step": 11590 + }, + { + "epoch": 0.06, + "global_step": 11591, + "learning_rate": 0.00045245826377295496, + "loss": 1.6032, + "loss_base2": 2.3129, + "loss_pixel": 0.1534, + "loss_text": 1.4498, + "ppl": 4.9689, + "step": 11591 + }, + { + "epoch": 0.06, + "global_step": 11592, + "learning_rate": 0.0004524540901502504, + "loss": 1.5888, + "loss_base2": 2.2922, + "loss_pixel": 0.1506, + "loss_text": 1.4382, + "ppl": 4.8979, + "step": 11592 + }, + { + "epoch": 0.06, + "global_step": 11593, + "learning_rate": 0.0004524499165275459, + "loss": 1.603, + "loss_base2": 2.3126, + "loss_pixel": 0.1496, + "loss_text": 1.4534, + "ppl": 4.9679, + "step": 11593 + }, + { + "epoch": 0.06, + "global_step": 11594, + "learning_rate": 0.0004524457429048414, + "loss": 1.5972, + "loss_base2": 2.3043, + "loss_pixel": 0.1513, + "loss_text": 1.446, + "ppl": 4.9392, + "step": 11594 + }, + { + "epoch": 0.06, + "global_step": 11595, + "learning_rate": 0.00045244156928213693, + "loss": 1.6078, + "loss_base2": 2.3196, + "loss_pixel": 0.1513, + "loss_text": 1.4565, + "ppl": 4.9918, + "step": 11595 + }, + { + "epoch": 0.06, + "global_step": 11596, + "learning_rate": 0.0004524373956594324, + "loss": 1.5961, + "loss_base2": 2.3027, + "loss_pixel": 0.1506, + "loss_text": 1.4454, + "ppl": 4.9338, + "step": 11596 + }, + { + "epoch": 0.06, + "global_step": 11597, + "learning_rate": 0.0004524332220367279, + "loss": 1.5934, + "loss_base2": 2.2988, + "loss_pixel": 0.1507, + "loss_text": 1.4427, + "ppl": 4.9205, + "step": 11597 + }, + { + "epoch": 0.06, + "global_step": 11598, + "learning_rate": 0.0004524290484140234, + "loss": 1.6069, + "loss_base2": 2.3183, + "loss_pixel": 0.1505, + "loss_text": 1.4564, + "ppl": 4.9873, + "step": 11598 + }, + { + "epoch": 0.06, + "global_step": 11599, + "learning_rate": 0.0004524248747913189, + "loss": 1.5982, + "loss_base2": 2.3057, + "loss_pixel": 0.1489, + "loss_text": 1.4493, + "ppl": 4.9441, + "step": 11599 + }, + { + "epoch": 0.06, + "global_step": 11600, + "learning_rate": 0.0004524207011686144, + "loss": 1.6041, + "loss_base2": 2.3142, + "loss_pixel": 0.1491, + "loss_text": 1.455, + "ppl": 4.9734, + "step": 11600 + }, + { + "epoch": 0.06, + "global_step": 11601, + "learning_rate": 0.0004524165275459098, + "loss": 1.5982, + "loss_base2": 2.3057, + "loss_pixel": 0.1512, + "loss_text": 1.447, + "ppl": 4.9441, + "step": 11601 + }, + { + "epoch": 0.06, + "global_step": 11602, + "learning_rate": 0.0004524123539232053, + "loss": 1.5987, + "loss_base2": 2.3064, + "loss_pixel": 0.1487, + "loss_text": 1.45, + "ppl": 4.9466, + "step": 11602 + }, + { + "epoch": 0.06, + "global_step": 11603, + "learning_rate": 0.00045240818030050083, + "loss": 1.5938, + "loss_base2": 2.2994, + "loss_pixel": 0.1515, + "loss_text": 1.4423, + "ppl": 4.9224, + "step": 11603 + }, + { + "epoch": 0.06, + "global_step": 11604, + "learning_rate": 0.00045240400667779634, + "loss": 1.6072, + "loss_base2": 2.3187, + "loss_pixel": 0.1496, + "loss_text": 1.4576, + "ppl": 4.9888, + "step": 11604 + }, + { + "epoch": 0.06, + "global_step": 11605, + "learning_rate": 0.0004523998330550918, + "loss": 1.609, + "loss_base2": 2.3213, + "loss_pixel": 0.1497, + "loss_text": 1.4593, + "ppl": 4.9978, + "step": 11605 + }, + { + "epoch": 0.06, + "global_step": 11606, + "learning_rate": 0.0004523956594323873, + "loss": 1.6023, + "loss_base2": 2.3116, + "loss_pixel": 0.1492, + "loss_text": 1.4531, + "ppl": 4.9644, + "step": 11606 + }, + { + "epoch": 0.06, + "global_step": 11607, + "learning_rate": 0.0004523914858096828, + "loss": 1.5959, + "loss_base2": 2.3024, + "loss_pixel": 0.1489, + "loss_text": 1.447, + "ppl": 4.9328, + "step": 11607 + }, + { + "epoch": 0.06, + "global_step": 11608, + "learning_rate": 0.0004523873121869783, + "loss": 1.5937, + "loss_base2": 2.2992, + "loss_pixel": 0.1482, + "loss_text": 1.4455, + "ppl": 4.9219, + "step": 11608 + }, + { + "epoch": 0.06, + "global_step": 11609, + "learning_rate": 0.0004523831385642738, + "loss": 1.6086, + "loss_base2": 2.3207, + "loss_pixel": 0.1483, + "loss_text": 1.4602, + "ppl": 4.9958, + "step": 11609 + }, + { + "epoch": 0.06, + "global_step": 11610, + "learning_rate": 0.00045237896494156927, + "loss": 1.5877, + "loss_base2": 2.2906, + "loss_pixel": 0.1487, + "loss_text": 1.4391, + "ppl": 4.8925, + "step": 11610 + }, + { + "epoch": 0.06, + "global_step": 11611, + "learning_rate": 0.0004523747913188648, + "loss": 1.6111, + "loss_base2": 2.3243, + "loss_pixel": 0.1494, + "loss_text": 1.4617, + "ppl": 5.0083, + "step": 11611 + }, + { + "epoch": 0.06, + "global_step": 11612, + "learning_rate": 0.0004523706176961603, + "loss": 1.593, + "loss_base2": 2.2982, + "loss_pixel": 0.1496, + "loss_text": 1.4434, + "ppl": 4.9185, + "step": 11612 + }, + { + "epoch": 0.06, + "global_step": 11613, + "learning_rate": 0.0004523664440734558, + "loss": 1.5933, + "loss_base2": 2.2986, + "loss_pixel": 0.1464, + "loss_text": 1.4469, + "ppl": 4.92, + "step": 11613 + }, + { + "epoch": 0.06, + "global_step": 11614, + "learning_rate": 0.00045236227045075125, + "loss": 1.602, + "loss_base2": 2.3112, + "loss_pixel": 0.1494, + "loss_text": 1.4526, + "ppl": 4.9629, + "step": 11614 + }, + { + "epoch": 0.06, + "global_step": 11615, + "learning_rate": 0.00045235809682804676, + "loss": 1.5933, + "loss_base2": 2.2986, + "loss_pixel": 0.1473, + "loss_text": 1.446, + "ppl": 4.92, + "step": 11615 + }, + { + "epoch": 0.06, + "global_step": 11616, + "learning_rate": 0.00045235392320534226, + "loss": 1.5843, + "loss_base2": 2.2857, + "loss_pixel": 0.1489, + "loss_text": 1.4354, + "ppl": 4.8759, + "step": 11616 + }, + { + "epoch": 0.06, + "global_step": 11617, + "learning_rate": 0.00045234974958263777, + "loss": 1.5856, + "loss_base2": 2.2875, + "loss_pixel": 0.1509, + "loss_text": 1.4347, + "ppl": 4.8822, + "step": 11617 + }, + { + "epoch": 0.06, + "global_step": 11618, + "learning_rate": 0.0004523455759599333, + "loss": 1.5823, + "loss_base2": 2.2828, + "loss_pixel": 0.146, + "loss_text": 1.4363, + "ppl": 4.8661, + "step": 11618 + }, + { + "epoch": 0.06, + "global_step": 11619, + "learning_rate": 0.0004523414023372287, + "loss": 1.5928, + "loss_base2": 2.2979, + "loss_pixel": 0.1491, + "loss_text": 1.4437, + "ppl": 4.9175, + "step": 11619 + }, + { + "epoch": 0.06, + "global_step": 11620, + "learning_rate": 0.0004523372287145242, + "loss": 1.5927, + "loss_base2": 2.2978, + "loss_pixel": 0.1512, + "loss_text": 1.4415, + "ppl": 4.917, + "step": 11620 + }, + { + "epoch": 0.06, + "global_step": 11621, + "learning_rate": 0.0004523330550918197, + "loss": 1.6041, + "loss_base2": 2.3142, + "loss_pixel": 0.1621, + "loss_text": 1.442, + "ppl": 4.9734, + "step": 11621 + }, + { + "epoch": 0.06, + "global_step": 11622, + "learning_rate": 0.0004523288814691152, + "loss": 1.6088, + "loss_base2": 2.321, + "loss_pixel": 0.1617, + "loss_text": 1.4471, + "ppl": 4.9968, + "step": 11622 + }, + { + "epoch": 0.06, + "global_step": 11623, + "learning_rate": 0.0004523247078464107, + "loss": 1.624, + "loss_base2": 2.3429, + "loss_pixel": 0.1623, + "loss_text": 1.4617, + "ppl": 5.0733, + "step": 11623 + }, + { + "epoch": 0.06, + "global_step": 11624, + "learning_rate": 0.00045232053422370616, + "loss": 1.6044, + "loss_base2": 2.3147, + "loss_pixel": 0.1616, + "loss_text": 1.4428, + "ppl": 4.9749, + "step": 11624 + }, + { + "epoch": 0.06, + "global_step": 11625, + "learning_rate": 0.00045231636060100167, + "loss": 1.62, + "loss_base2": 2.3372, + "loss_pixel": 0.1611, + "loss_text": 1.459, + "ppl": 5.0531, + "step": 11625 + }, + { + "epoch": 0.06, + "global_step": 11626, + "learning_rate": 0.0004523121869782972, + "loss": 1.6005, + "loss_base2": 2.309, + "loss_pixel": 0.1601, + "loss_text": 1.4404, + "ppl": 4.9555, + "step": 11626 + }, + { + "epoch": 0.06, + "global_step": 11627, + "learning_rate": 0.0004523080133555927, + "loss": 1.6163, + "loss_base2": 2.3318, + "loss_pixel": 0.1614, + "loss_text": 1.4549, + "ppl": 5.0344, + "step": 11627 + }, + { + "epoch": 0.06, + "global_step": 11628, + "learning_rate": 0.00045230383973288813, + "loss": 1.6083, + "loss_base2": 2.3203, + "loss_pixel": 0.1607, + "loss_text": 1.4476, + "ppl": 4.9943, + "step": 11628 + }, + { + "epoch": 0.06, + "global_step": 11629, + "learning_rate": 0.00045229966611018364, + "loss": 1.63, + "loss_base2": 2.3516, + "loss_pixel": 0.1622, + "loss_text": 1.4678, + "ppl": 5.1039, + "step": 11629 + }, + { + "epoch": 0.06, + "global_step": 11630, + "learning_rate": 0.00045229549248747915, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1629, + "loss_text": 1.454, + "ppl": 5.0374, + "step": 11630 + }, + { + "epoch": 0.06, + "global_step": 11631, + "learning_rate": 0.00045229131886477466, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.1608, + "loss_text": 1.4675, + "ppl": 5.0952, + "step": 11631 + }, + { + "epoch": 0.06, + "global_step": 11632, + "learning_rate": 0.00045228714524207016, + "loss": 1.5996, + "loss_base2": 2.3077, + "loss_pixel": 0.1607, + "loss_text": 1.4389, + "ppl": 4.9511, + "step": 11632 + }, + { + "epoch": 0.06, + "global_step": 11633, + "learning_rate": 0.0004522829716193656, + "loss": 1.6181, + "loss_base2": 2.3344, + "loss_pixel": 0.1612, + "loss_text": 1.4569, + "ppl": 5.0435, + "step": 11633 + }, + { + "epoch": 0.06, + "global_step": 11634, + "learning_rate": 0.0004522787979966611, + "loss": 1.6033, + "loss_base2": 2.3131, + "loss_pixel": 0.1614, + "loss_text": 1.4419, + "ppl": 4.9694, + "step": 11634 + }, + { + "epoch": 0.06, + "global_step": 11635, + "learning_rate": 0.00045227462437395663, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1591, + "loss_text": 1.4578, + "ppl": 5.0374, + "step": 11635 + }, + { + "epoch": 0.06, + "global_step": 11636, + "learning_rate": 0.00045227045075125214, + "loss": 1.6194, + "loss_base2": 2.3363, + "loss_pixel": 0.1629, + "loss_text": 1.4566, + "ppl": 5.0501, + "step": 11636 + }, + { + "epoch": 0.06, + "global_step": 11637, + "learning_rate": 0.0004522662771285476, + "loss": 1.6173, + "loss_base2": 2.3333, + "loss_pixel": 0.1603, + "loss_text": 1.4571, + "ppl": 5.0395, + "step": 11637 + }, + { + "epoch": 0.06, + "global_step": 11638, + "learning_rate": 0.00045226210350584304, + "loss": 1.6159, + "loss_base2": 2.3313, + "loss_pixel": 0.1592, + "loss_text": 1.4567, + "ppl": 5.0324, + "step": 11638 + }, + { + "epoch": 0.06, + "global_step": 11639, + "learning_rate": 0.00045225792988313855, + "loss": 1.6039, + "loss_base2": 2.3139, + "loss_pixel": 0.1587, + "loss_text": 1.4452, + "ppl": 4.9724, + "step": 11639 + }, + { + "epoch": 0.06, + "global_step": 11640, + "learning_rate": 0.00045225375626043406, + "loss": 1.5949, + "loss_base2": 2.301, + "loss_pixel": 0.1593, + "loss_text": 1.4355, + "ppl": 4.9278, + "step": 11640 + }, + { + "epoch": 0.06, + "global_step": 11641, + "learning_rate": 0.00045224958263772957, + "loss": 1.5886, + "loss_base2": 2.2919, + "loss_pixel": 0.16, + "loss_text": 1.4286, + "ppl": 4.8969, + "step": 11641 + }, + { + "epoch": 0.06, + "global_step": 11642, + "learning_rate": 0.000452245409015025, + "loss": 1.6085, + "loss_base2": 2.3206, + "loss_pixel": 0.1589, + "loss_text": 1.4496, + "ppl": 4.9953, + "step": 11642 + }, + { + "epoch": 0.06, + "global_step": 11643, + "learning_rate": 0.0004522412353923205, + "loss": 1.5951, + "loss_base2": 2.3012, + "loss_pixel": 0.1612, + "loss_text": 1.4339, + "ppl": 4.9288, + "step": 11643 + }, + { + "epoch": 0.06, + "global_step": 11644, + "learning_rate": 0.00045223706176961603, + "loss": 1.5987, + "loss_base2": 2.3064, + "loss_pixel": 0.1602, + "loss_text": 1.4385, + "ppl": 4.9466, + "step": 11644 + }, + { + "epoch": 0.06, + "global_step": 11645, + "learning_rate": 0.00045223288814691154, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.159, + "loss_text": 1.4469, + "ppl": 4.9823, + "step": 11645 + }, + { + "epoch": 0.06, + "global_step": 11646, + "learning_rate": 0.000452228714524207, + "loss": 1.5937, + "loss_base2": 2.2992, + "loss_pixel": 0.1593, + "loss_text": 1.4343, + "ppl": 4.9219, + "step": 11646 + }, + { + "epoch": 0.06, + "global_step": 11647, + "learning_rate": 0.0004522245409015025, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1596, + "loss_text": 1.4427, + "ppl": 4.9649, + "step": 11647 + }, + { + "epoch": 0.06, + "global_step": 11648, + "learning_rate": 0.000452220367278798, + "loss": 1.6137, + "loss_base2": 2.3281, + "loss_pixel": 0.1578, + "loss_text": 1.4559, + "ppl": 5.0214, + "step": 11648 + }, + { + "epoch": 0.06, + "global_step": 11649, + "learning_rate": 0.0004522161936560935, + "loss": 1.6153, + "loss_base2": 2.3304, + "loss_pixel": 0.1593, + "loss_text": 1.456, + "ppl": 5.0294, + "step": 11649 + }, + { + "epoch": 0.06, + "global_step": 11650, + "learning_rate": 0.000452212020033389, + "loss": 1.6061, + "loss_base2": 2.3171, + "loss_pixel": 0.16, + "loss_text": 1.4461, + "ppl": 4.9833, + "step": 11650 + }, + { + "epoch": 0.06, + "global_step": 11651, + "learning_rate": 0.0004522078464106845, + "loss": 1.6242, + "loss_base2": 2.3432, + "loss_pixel": 0.1604, + "loss_text": 1.4638, + "ppl": 5.0744, + "step": 11651 + }, + { + "epoch": 0.06, + "global_step": 11652, + "learning_rate": 0.00045220367278798, + "loss": 1.5926, + "loss_base2": 2.2976, + "loss_pixel": 0.1608, + "loss_text": 1.4317, + "ppl": 4.9165, + "step": 11652 + }, + { + "epoch": 0.06, + "global_step": 11653, + "learning_rate": 0.0004521994991652755, + "loss": 1.5925, + "loss_base2": 2.2975, + "loss_pixel": 0.1608, + "loss_text": 1.4318, + "ppl": 4.916, + "step": 11653 + }, + { + "epoch": 0.06, + "global_step": 11654, + "learning_rate": 0.000452195325542571, + "loss": 1.593, + "loss_base2": 2.2982, + "loss_pixel": 0.1614, + "loss_text": 1.4316, + "ppl": 4.9185, + "step": 11654 + }, + { + "epoch": 0.06, + "global_step": 11655, + "learning_rate": 0.00045219115191986645, + "loss": 1.601, + "loss_base2": 2.3098, + "loss_pixel": 0.1641, + "loss_text": 1.4369, + "ppl": 4.958, + "step": 11655 + }, + { + "epoch": 0.06, + "global_step": 11656, + "learning_rate": 0.00045218697829716196, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1683, + "loss_text": 1.4468, + "ppl": 5.0284, + "step": 11656 + }, + { + "epoch": 0.06, + "global_step": 11657, + "learning_rate": 0.0004521828046744574, + "loss": 1.6284, + "loss_base2": 2.3493, + "loss_pixel": 0.186, + "loss_text": 1.4425, + "ppl": 5.0957, + "step": 11657 + }, + { + "epoch": 0.06, + "global_step": 11658, + "learning_rate": 0.0004521786310517529, + "loss": 1.6332, + "loss_base2": 2.3562, + "loss_pixel": 0.192, + "loss_text": 1.4412, + "ppl": 5.1202, + "step": 11658 + }, + { + "epoch": 0.06, + "global_step": 11659, + "learning_rate": 0.0004521744574290484, + "loss": 1.6324, + "loss_base2": 2.3551, + "loss_pixel": 0.1867, + "loss_text": 1.4457, + "ppl": 5.1161, + "step": 11659 + }, + { + "epoch": 0.06, + "global_step": 11660, + "learning_rate": 0.0004521702838063439, + "loss": 1.6412, + "loss_base2": 2.3678, + "loss_pixel": 0.1852, + "loss_text": 1.456, + "ppl": 5.1614, + "step": 11660 + }, + { + "epoch": 0.06, + "global_step": 11661, + "learning_rate": 0.0004521661101836394, + "loss": 1.6217, + "loss_base2": 2.3396, + "loss_pixel": 0.1806, + "loss_text": 1.4411, + "ppl": 5.0617, + "step": 11661 + }, + { + "epoch": 0.06, + "global_step": 11662, + "learning_rate": 0.0004521619365609349, + "loss": 1.6268, + "loss_base2": 2.347, + "loss_pixel": 0.1793, + "loss_text": 1.4475, + "ppl": 5.0876, + "step": 11662 + }, + { + "epoch": 0.06, + "global_step": 11663, + "learning_rate": 0.0004521577629382304, + "loss": 1.6305, + "loss_base2": 2.3523, + "loss_pixel": 0.1781, + "loss_text": 1.4524, + "ppl": 5.1064, + "step": 11663 + }, + { + "epoch": 0.06, + "global_step": 11664, + "learning_rate": 0.00045215358931552585, + "loss": 1.6325, + "loss_base2": 2.3552, + "loss_pixel": 0.1764, + "loss_text": 1.4561, + "ppl": 5.1167, + "step": 11664 + }, + { + "epoch": 0.06, + "global_step": 11665, + "learning_rate": 0.00045214941569282136, + "loss": 1.6032, + "loss_base2": 2.3129, + "loss_pixel": 0.1745, + "loss_text": 1.4287, + "ppl": 4.9689, + "step": 11665 + }, + { + "epoch": 0.06, + "global_step": 11666, + "learning_rate": 0.00045214524207011687, + "loss": 1.5214, + "loss_base2": 2.1949, + "loss_pixel": 0.1743, + "loss_text": 1.3471, + "ppl": 4.5786, + "step": 11666 + }, + { + "epoch": 0.06, + "global_step": 11667, + "learning_rate": 0.0004521410684474124, + "loss": 1.4115, + "loss_base2": 2.0364, + "loss_pixel": 0.1715, + "loss_text": 1.24, + "ppl": 4.1021, + "step": 11667 + }, + { + "epoch": 0.06, + "global_step": 11668, + "learning_rate": 0.0004521368948247079, + "loss": 1.4207, + "loss_base2": 2.0496, + "loss_pixel": 0.1712, + "loss_text": 1.2494, + "ppl": 4.14, + "step": 11668 + }, + { + "epoch": 0.06, + "global_step": 11669, + "learning_rate": 0.00045213272120200334, + "loss": 1.401, + "loss_base2": 2.0212, + "loss_pixel": 0.1718, + "loss_text": 1.2292, + "ppl": 4.0593, + "step": 11669 + }, + { + "epoch": 0.06, + "global_step": 11670, + "learning_rate": 0.00045212854757929884, + "loss": 1.4084, + "loss_base2": 2.0319, + "loss_pixel": 0.1697, + "loss_text": 1.2387, + "ppl": 4.0894, + "step": 11670 + }, + { + "epoch": 0.06, + "global_step": 11671, + "learning_rate": 0.00045212437395659435, + "loss": 1.3966, + "loss_base2": 2.0149, + "loss_pixel": 0.1685, + "loss_text": 1.2281, + "ppl": 4.0414, + "step": 11671 + }, + { + "epoch": 0.06, + "global_step": 11672, + "learning_rate": 0.00045212020033388986, + "loss": 1.3916, + "loss_base2": 2.0077, + "loss_pixel": 0.1689, + "loss_text": 1.2228, + "ppl": 4.0213, + "step": 11672 + }, + { + "epoch": 0.06, + "global_step": 11673, + "learning_rate": 0.0004521160267111853, + "loss": 1.4061, + "loss_base2": 2.0286, + "loss_pixel": 0.1674, + "loss_text": 1.2386, + "ppl": 4.08, + "step": 11673 + }, + { + "epoch": 0.06, + "global_step": 11674, + "learning_rate": 0.0004521118530884808, + "loss": 1.3831, + "loss_base2": 1.9954, + "loss_pixel": 0.1681, + "loss_text": 1.215, + "ppl": 3.9872, + "step": 11674 + }, + { + "epoch": 0.06, + "global_step": 11675, + "learning_rate": 0.0004521076794657763, + "loss": 1.3943, + "loss_base2": 2.0115, + "loss_pixel": 0.1662, + "loss_text": 1.2281, + "ppl": 4.0322, + "step": 11675 + }, + { + "epoch": 0.06, + "global_step": 11676, + "learning_rate": 0.0004521035058430718, + "loss": 1.3982, + "loss_base2": 2.0172, + "loss_pixel": 0.1677, + "loss_text": 1.2304, + "ppl": 4.0479, + "step": 11676 + }, + { + "epoch": 0.06, + "global_step": 11677, + "learning_rate": 0.0004520993322203673, + "loss": 1.4026, + "loss_base2": 2.0235, + "loss_pixel": 0.1662, + "loss_text": 1.2364, + "ppl": 4.0658, + "step": 11677 + }, + { + "epoch": 0.06, + "global_step": 11678, + "learning_rate": 0.00045209515859766274, + "loss": 1.3909, + "loss_base2": 2.0066, + "loss_pixel": 0.1663, + "loss_text": 1.2246, + "ppl": 4.0185, + "step": 11678 + }, + { + "epoch": 0.06, + "global_step": 11679, + "learning_rate": 0.00045209098497495825, + "loss": 1.3929, + "loss_base2": 2.0095, + "loss_pixel": 0.1648, + "loss_text": 1.2282, + "ppl": 4.0265, + "step": 11679 + }, + { + "epoch": 0.06, + "global_step": 11680, + "learning_rate": 0.00045208681135225376, + "loss": 1.4074, + "loss_base2": 2.0304, + "loss_pixel": 0.1652, + "loss_text": 1.2422, + "ppl": 4.0853, + "step": 11680 + }, + { + "epoch": 0.06, + "global_step": 11681, + "learning_rate": 0.00045208263772954926, + "loss": 1.3723, + "loss_base2": 1.9798, + "loss_pixel": 0.1656, + "loss_text": 1.2067, + "ppl": 3.9444, + "step": 11681 + }, + { + "epoch": 0.06, + "global_step": 11682, + "learning_rate": 0.00045207846410684477, + "loss": 1.4054, + "loss_base2": 2.0276, + "loss_pixel": 0.1705, + "loss_text": 1.2349, + "ppl": 4.0772, + "step": 11682 + }, + { + "epoch": 0.06, + "global_step": 11683, + "learning_rate": 0.0004520742904841402, + "loss": 1.3953, + "loss_base2": 2.013, + "loss_pixel": 0.1695, + "loss_text": 1.2258, + "ppl": 4.0362, + "step": 11683 + }, + { + "epoch": 0.06, + "global_step": 11684, + "learning_rate": 0.00045207011686143573, + "loss": 1.516, + "loss_base2": 2.1871, + "loss_pixel": 0.1653, + "loss_text": 1.3507, + "ppl": 4.554, + "step": 11684 + }, + { + "epoch": 0.06, + "global_step": 11685, + "learning_rate": 0.00045206594323873124, + "loss": 1.6361, + "loss_base2": 2.3604, + "loss_pixel": 0.163, + "loss_text": 1.473, + "ppl": 5.1351, + "step": 11685 + }, + { + "epoch": 0.06, + "global_step": 11686, + "learning_rate": 0.00045206176961602674, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1628, + "loss_text": 1.4632, + "ppl": 5.0835, + "step": 11686 + }, + { + "epoch": 0.06, + "global_step": 11687, + "learning_rate": 0.0004520575959933222, + "loss": 1.6138, + "loss_base2": 2.3282, + "loss_pixel": 0.1631, + "loss_text": 1.4507, + "ppl": 5.0219, + "step": 11687 + }, + { + "epoch": 0.06, + "global_step": 11688, + "learning_rate": 0.0004520534223706177, + "loss": 1.6079, + "loss_base2": 2.3197, + "loss_pixel": 0.1636, + "loss_text": 1.4443, + "ppl": 4.9923, + "step": 11688 + }, + { + "epoch": 0.06, + "global_step": 11689, + "learning_rate": 0.0004520492487479132, + "loss": 1.6111, + "loss_base2": 2.3243, + "loss_pixel": 0.1617, + "loss_text": 1.4495, + "ppl": 5.0083, + "step": 11689 + }, + { + "epoch": 0.06, + "global_step": 11690, + "learning_rate": 0.0004520450751252087, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.1618, + "loss_text": 1.4646, + "ppl": 5.0855, + "step": 11690 + }, + { + "epoch": 0.06, + "global_step": 11691, + "learning_rate": 0.00045204090150250423, + "loss": 1.6305, + "loss_base2": 2.3523, + "loss_pixel": 0.1633, + "loss_text": 1.4672, + "ppl": 5.1064, + "step": 11691 + }, + { + "epoch": 0.06, + "global_step": 11692, + "learning_rate": 0.0004520367278797997, + "loss": 1.6029, + "loss_base2": 2.3125, + "loss_pixel": 0.1615, + "loss_text": 1.4414, + "ppl": 4.9674, + "step": 11692 + }, + { + "epoch": 0.06, + "global_step": 11693, + "learning_rate": 0.0004520325542570952, + "loss": 1.6194, + "loss_base2": 2.3363, + "loss_pixel": 0.1598, + "loss_text": 1.4596, + "ppl": 5.0501, + "step": 11693 + }, + { + "epoch": 0.06, + "global_step": 11694, + "learning_rate": 0.0004520283806343907, + "loss": 1.6322, + "loss_base2": 2.3548, + "loss_pixel": 0.1623, + "loss_text": 1.4699, + "ppl": 5.1151, + "step": 11694 + }, + { + "epoch": 0.06, + "global_step": 11695, + "learning_rate": 0.00045202420701168615, + "loss": 1.6144, + "loss_base2": 2.3291, + "loss_pixel": 0.1623, + "loss_text": 1.4521, + "ppl": 5.0249, + "step": 11695 + }, + { + "epoch": 0.06, + "global_step": 11696, + "learning_rate": 0.0004520200333889816, + "loss": 1.5968, + "loss_base2": 2.3037, + "loss_pixel": 0.1607, + "loss_text": 1.4361, + "ppl": 4.9372, + "step": 11696 + }, + { + "epoch": 0.06, + "global_step": 11697, + "learning_rate": 0.0004520158597662771, + "loss": 1.6263, + "loss_base2": 2.3463, + "loss_pixel": 0.1619, + "loss_text": 1.4645, + "ppl": 5.085, + "step": 11697 + }, + { + "epoch": 0.06, + "global_step": 11698, + "learning_rate": 0.0004520116861435726, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.1616, + "loss_text": 1.4479, + "ppl": 5.0003, + "step": 11698 + }, + { + "epoch": 0.06, + "global_step": 11699, + "learning_rate": 0.0004520075125208681, + "loss": 1.6164, + "loss_base2": 2.332, + "loss_pixel": 0.1613, + "loss_text": 1.4552, + "ppl": 5.0349, + "step": 11699 + }, + { + "epoch": 0.06, + "global_step": 11700, + "learning_rate": 0.00045200333889816363, + "loss": 1.5929, + "loss_base2": 2.2981, + "loss_pixel": 0.1601, + "loss_text": 1.4328, + "ppl": 4.918, + "step": 11700 + }, + { + "epoch": 0.06, + "global_step": 11701, + "learning_rate": 0.0004519991652754591, + "loss": 1.625, + "loss_base2": 2.3444, + "loss_pixel": 0.162, + "loss_text": 1.463, + "ppl": 5.0784, + "step": 11701 + }, + { + "epoch": 0.06, + "global_step": 11702, + "learning_rate": 0.0004519949916527546, + "loss": 1.6042, + "loss_base2": 2.3144, + "loss_pixel": 0.1611, + "loss_text": 1.4431, + "ppl": 4.9739, + "step": 11702 + }, + { + "epoch": 0.06, + "global_step": 11703, + "learning_rate": 0.0004519908180300501, + "loss": 1.6146, + "loss_base2": 2.3294, + "loss_pixel": 0.1634, + "loss_text": 1.4512, + "ppl": 5.0259, + "step": 11703 + }, + { + "epoch": 0.06, + "global_step": 11704, + "learning_rate": 0.0004519866444073456, + "loss": 1.6181, + "loss_base2": 2.3344, + "loss_pixel": 0.1606, + "loss_text": 1.4575, + "ppl": 5.0435, + "step": 11704 + }, + { + "epoch": 0.06, + "global_step": 11705, + "learning_rate": 0.00045198247078464106, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1621, + "loss_text": 1.4639, + "ppl": 5.0835, + "step": 11705 + }, + { + "epoch": 0.06, + "global_step": 11706, + "learning_rate": 0.00045197829716193657, + "loss": 1.6243, + "loss_base2": 2.3434, + "loss_pixel": 0.1618, + "loss_text": 1.4624, + "ppl": 5.0749, + "step": 11706 + }, + { + "epoch": 0.06, + "global_step": 11707, + "learning_rate": 0.0004519741235392321, + "loss": 1.6162, + "loss_base2": 2.3317, + "loss_pixel": 0.1625, + "loss_text": 1.4537, + "ppl": 5.0339, + "step": 11707 + }, + { + "epoch": 0.06, + "global_step": 11708, + "learning_rate": 0.0004519699499165276, + "loss": 1.4455, + "loss_base2": 2.0854, + "loss_pixel": 0.1604, + "loss_text": 1.2851, + "ppl": 4.244, + "step": 11708 + }, + { + "epoch": 0.06, + "global_step": 11709, + "learning_rate": 0.0004519657762938231, + "loss": 1.3977, + "loss_base2": 2.0165, + "loss_pixel": 0.1611, + "loss_text": 1.2366, + "ppl": 4.0459, + "step": 11709 + }, + { + "epoch": 0.06, + "global_step": 11710, + "learning_rate": 0.00045196160267111854, + "loss": 1.3992, + "loss_base2": 2.0186, + "loss_pixel": 0.1605, + "loss_text": 1.2387, + "ppl": 4.052, + "step": 11710 + }, + { + "epoch": 0.06, + "global_step": 11711, + "learning_rate": 0.00045195742904841405, + "loss": 1.3854, + "loss_base2": 1.9987, + "loss_pixel": 0.1615, + "loss_text": 1.2239, + "ppl": 3.9964, + "step": 11711 + }, + { + "epoch": 0.06, + "global_step": 11712, + "learning_rate": 0.00045195325542570956, + "loss": 1.4026, + "loss_base2": 2.0235, + "loss_pixel": 0.1587, + "loss_text": 1.244, + "ppl": 4.0658, + "step": 11712 + }, + { + "epoch": 0.06, + "global_step": 11713, + "learning_rate": 0.000451949081803005, + "loss": 1.3921, + "loss_base2": 2.0084, + "loss_pixel": 0.1631, + "loss_text": 1.229, + "ppl": 4.0233, + "step": 11713 + }, + { + "epoch": 0.06, + "global_step": 11714, + "learning_rate": 0.00045194490818030046, + "loss": 1.3881, + "loss_base2": 2.0026, + "loss_pixel": 0.1606, + "loss_text": 1.2275, + "ppl": 4.0072, + "step": 11714 + }, + { + "epoch": 0.06, + "global_step": 11715, + "learning_rate": 0.00045194073455759597, + "loss": 1.3949, + "loss_base2": 2.0124, + "loss_pixel": 0.162, + "loss_text": 1.2329, + "ppl": 4.0346, + "step": 11715 + }, + { + "epoch": 0.06, + "global_step": 11716, + "learning_rate": 0.0004519365609348915, + "loss": 1.3864, + "loss_base2": 2.0002, + "loss_pixel": 0.16, + "loss_text": 1.2264, + "ppl": 4.0004, + "step": 11716 + }, + { + "epoch": 0.06, + "global_step": 11717, + "learning_rate": 0.000451932387312187, + "loss": 1.3892, + "loss_base2": 2.0042, + "loss_pixel": 0.1595, + "loss_text": 1.2296, + "ppl": 4.0116, + "step": 11717 + }, + { + "epoch": 0.06, + "global_step": 11718, + "learning_rate": 0.0004519282136894825, + "loss": 1.3879, + "loss_base2": 2.0023, + "loss_pixel": 0.1594, + "loss_text": 1.2285, + "ppl": 4.0064, + "step": 11718 + }, + { + "epoch": 0.06, + "global_step": 11719, + "learning_rate": 0.00045192404006677794, + "loss": 1.3934, + "loss_base2": 2.0103, + "loss_pixel": 0.1611, + "loss_text": 1.2323, + "ppl": 4.0285, + "step": 11719 + }, + { + "epoch": 0.06, + "global_step": 11720, + "learning_rate": 0.00045191986644407345, + "loss": 1.397, + "loss_base2": 2.0154, + "loss_pixel": 0.1612, + "loss_text": 1.2358, + "ppl": 4.0431, + "step": 11720 + }, + { + "epoch": 0.06, + "global_step": 11721, + "learning_rate": 0.00045191569282136896, + "loss": 1.3726, + "loss_base2": 1.9802, + "loss_pixel": 0.1603, + "loss_text": 1.2123, + "ppl": 3.9456, + "step": 11721 + }, + { + "epoch": 0.06, + "global_step": 11722, + "learning_rate": 0.00045191151919866447, + "loss": 1.385, + "loss_base2": 1.9981, + "loss_pixel": 0.1598, + "loss_text": 1.2252, + "ppl": 3.9948, + "step": 11722 + }, + { + "epoch": 0.06, + "global_step": 11723, + "learning_rate": 0.0004519073455759599, + "loss": 1.3963, + "loss_base2": 2.0144, + "loss_pixel": 0.1603, + "loss_text": 1.236, + "ppl": 4.0402, + "step": 11723 + }, + { + "epoch": 0.06, + "global_step": 11724, + "learning_rate": 0.0004519031719532554, + "loss": 1.3895, + "loss_base2": 2.0046, + "loss_pixel": 0.1605, + "loss_text": 1.229, + "ppl": 4.0128, + "step": 11724 + }, + { + "epoch": 0.06, + "global_step": 11725, + "learning_rate": 0.00045189899833055093, + "loss": 1.5484, + "loss_base2": 2.2339, + "loss_pixel": 0.1609, + "loss_text": 1.3875, + "ppl": 4.7039, + "step": 11725 + }, + { + "epoch": 0.06, + "global_step": 11726, + "learning_rate": 0.00045189482470784644, + "loss": 1.6357, + "loss_base2": 2.3598, + "loss_pixel": 0.1604, + "loss_text": 1.4753, + "ppl": 5.133, + "step": 11726 + }, + { + "epoch": 0.06, + "global_step": 11727, + "learning_rate": 0.00045189065108514195, + "loss": 1.6128, + "loss_base2": 2.3268, + "loss_pixel": 0.1607, + "loss_text": 1.4521, + "ppl": 5.0168, + "step": 11727 + }, + { + "epoch": 0.06, + "global_step": 11728, + "learning_rate": 0.0004518864774624374, + "loss": 1.6266, + "loss_base2": 2.3467, + "loss_pixel": 0.161, + "loss_text": 1.4656, + "ppl": 5.0866, + "step": 11728 + }, + { + "epoch": 0.06, + "global_step": 11729, + "learning_rate": 0.0004518823038397329, + "loss": 1.6344, + "loss_base2": 2.3579, + "loss_pixel": 0.1607, + "loss_text": 1.4737, + "ppl": 5.1264, + "step": 11729 + }, + { + "epoch": 0.06, + "global_step": 11730, + "learning_rate": 0.0004518781302170284, + "loss": 1.6287, + "loss_base2": 2.3497, + "loss_pixel": 0.1607, + "loss_text": 1.468, + "ppl": 5.0972, + "step": 11730 + }, + { + "epoch": 0.06, + "global_step": 11731, + "learning_rate": 0.0004518739565943239, + "loss": 1.633, + "loss_base2": 2.3559, + "loss_pixel": 0.1618, + "loss_text": 1.4711, + "ppl": 5.1192, + "step": 11731 + }, + { + "epoch": 0.06, + "global_step": 11732, + "learning_rate": 0.0004518697829716193, + "loss": 1.6189, + "loss_base2": 2.3356, + "loss_pixel": 0.1589, + "loss_text": 1.4601, + "ppl": 5.0475, + "step": 11732 + }, + { + "epoch": 0.06, + "global_step": 11733, + "learning_rate": 0.00045186560934891483, + "loss": 1.6061, + "loss_base2": 2.3171, + "loss_pixel": 0.1601, + "loss_text": 1.4461, + "ppl": 4.9833, + "step": 11733 + }, + { + "epoch": 0.06, + "global_step": 11734, + "learning_rate": 0.00045186143572621034, + "loss": 1.5985, + "loss_base2": 2.3061, + "loss_pixel": 0.1599, + "loss_text": 1.4386, + "ppl": 4.9456, + "step": 11734 + }, + { + "epoch": 0.06, + "global_step": 11735, + "learning_rate": 0.00045185726210350584, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.1604, + "loss_text": 1.4455, + "ppl": 4.9823, + "step": 11735 + }, + { + "epoch": 0.06, + "global_step": 11736, + "learning_rate": 0.00045185308848080135, + "loss": 1.6003, + "loss_base2": 2.3087, + "loss_pixel": 0.1605, + "loss_text": 1.4397, + "ppl": 4.9545, + "step": 11736 + }, + { + "epoch": 0.06, + "global_step": 11737, + "learning_rate": 0.0004518489148580968, + "loss": 1.6133, + "loss_base2": 2.3275, + "loss_pixel": 0.1594, + "loss_text": 1.4539, + "ppl": 5.0193, + "step": 11737 + }, + { + "epoch": 0.06, + "global_step": 11738, + "learning_rate": 0.0004518447412353923, + "loss": 1.6162, + "loss_base2": 2.3317, + "loss_pixel": 0.1598, + "loss_text": 1.4564, + "ppl": 5.0339, + "step": 11738 + }, + { + "epoch": 0.06, + "global_step": 11739, + "learning_rate": 0.0004518405676126878, + "loss": 1.597, + "loss_base2": 2.304, + "loss_pixel": 0.1596, + "loss_text": 1.4375, + "ppl": 4.9382, + "step": 11739 + }, + { + "epoch": 0.06, + "global_step": 11740, + "learning_rate": 0.0004518363939899833, + "loss": 1.5831, + "loss_base2": 2.2839, + "loss_pixel": 0.1592, + "loss_text": 1.4239, + "ppl": 4.87, + "step": 11740 + }, + { + "epoch": 0.06, + "global_step": 11741, + "learning_rate": 0.00045183222036727883, + "loss": 1.615, + "loss_base2": 2.33, + "loss_pixel": 0.1607, + "loss_text": 1.4542, + "ppl": 5.0279, + "step": 11741 + }, + { + "epoch": 0.06, + "global_step": 11742, + "learning_rate": 0.0004518280467445743, + "loss": 1.5859, + "loss_base2": 2.288, + "loss_pixel": 0.1604, + "loss_text": 1.4255, + "ppl": 4.8837, + "step": 11742 + }, + { + "epoch": 0.06, + "global_step": 11743, + "learning_rate": 0.0004518238731218698, + "loss": 1.6031, + "loss_base2": 2.3128, + "loss_pixel": 0.1548, + "loss_text": 1.4483, + "ppl": 4.9684, + "step": 11743 + }, + { + "epoch": 0.06, + "global_step": 11744, + "learning_rate": 0.0004518196994991653, + "loss": 1.5926, + "loss_base2": 2.2976, + "loss_pixel": 0.1517, + "loss_text": 1.4409, + "ppl": 4.9165, + "step": 11744 + }, + { + "epoch": 0.06, + "global_step": 11745, + "learning_rate": 0.0004518155258764608, + "loss": 1.5936, + "loss_base2": 2.2991, + "loss_pixel": 0.1497, + "loss_text": 1.4439, + "ppl": 4.9214, + "step": 11745 + }, + { + "epoch": 0.06, + "global_step": 11746, + "learning_rate": 0.00045181135225375626, + "loss": 1.6053, + "loss_base2": 2.316, + "loss_pixel": 0.15, + "loss_text": 1.4553, + "ppl": 4.9794, + "step": 11746 + }, + { + "epoch": 0.06, + "global_step": 11747, + "learning_rate": 0.00045180717863105177, + "loss": 1.4905, + "loss_base2": 2.1503, + "loss_pixel": 0.152, + "loss_text": 1.3385, + "ppl": 4.4393, + "step": 11747 + }, + { + "epoch": 0.06, + "global_step": 11748, + "learning_rate": 0.0004518030050083473, + "loss": 1.4096, + "loss_base2": 2.0336, + "loss_pixel": 0.1519, + "loss_text": 1.2576, + "ppl": 4.0943, + "step": 11748 + }, + { + "epoch": 0.06, + "global_step": 11749, + "learning_rate": 0.0004517988313856428, + "loss": 1.401, + "loss_base2": 2.0212, + "loss_pixel": 0.1528, + "loss_text": 1.2482, + "ppl": 4.0593, + "step": 11749 + }, + { + "epoch": 0.06, + "global_step": 11750, + "learning_rate": 0.0004517946577629383, + "loss": 1.3775, + "loss_base2": 1.9873, + "loss_pixel": 0.1516, + "loss_text": 1.2259, + "ppl": 3.965, + "step": 11750 + }, + { + "epoch": 0.06, + "global_step": 11751, + "learning_rate": 0.0004517904841402337, + "loss": 1.3879, + "loss_base2": 2.0023, + "loss_pixel": 0.1515, + "loss_text": 1.2364, + "ppl": 4.0064, + "step": 11751 + }, + { + "epoch": 0.06, + "global_step": 11752, + "learning_rate": 0.0004517863105175292, + "loss": 1.3744, + "loss_base2": 1.9828, + "loss_pixel": 0.1514, + "loss_text": 1.223, + "ppl": 3.9527, + "step": 11752 + }, + { + "epoch": 0.06, + "global_step": 11753, + "learning_rate": 0.0004517821368948247, + "loss": 1.3854, + "loss_base2": 1.9987, + "loss_pixel": 0.1491, + "loss_text": 1.2363, + "ppl": 3.9964, + "step": 11753 + }, + { + "epoch": 0.06, + "global_step": 11754, + "learning_rate": 0.0004517779632721202, + "loss": 1.3627, + "loss_base2": 1.966, + "loss_pixel": 0.1499, + "loss_text": 1.2128, + "ppl": 3.9067, + "step": 11754 + }, + { + "epoch": 0.06, + "global_step": 11755, + "learning_rate": 0.00045177378964941567, + "loss": 1.3693, + "loss_base2": 1.9755, + "loss_pixel": 0.1487, + "loss_text": 1.2206, + "ppl": 3.9326, + "step": 11755 + }, + { + "epoch": 0.06, + "global_step": 11756, + "learning_rate": 0.0004517696160267112, + "loss": 1.3783, + "loss_base2": 1.9885, + "loss_pixel": 0.1507, + "loss_text": 1.2276, + "ppl": 3.9682, + "step": 11756 + }, + { + "epoch": 0.06, + "global_step": 11757, + "learning_rate": 0.0004517654424040067, + "loss": 1.373, + "loss_base2": 1.9808, + "loss_pixel": 0.1481, + "loss_text": 1.225, + "ppl": 3.9472, + "step": 11757 + }, + { + "epoch": 0.06, + "global_step": 11758, + "learning_rate": 0.0004517612687813022, + "loss": 1.365, + "loss_base2": 1.9693, + "loss_pixel": 0.1497, + "loss_text": 1.2152, + "ppl": 3.9157, + "step": 11758 + }, + { + "epoch": 0.06, + "global_step": 11759, + "learning_rate": 0.0004517570951585977, + "loss": 1.3493, + "loss_base2": 1.9466, + "loss_pixel": 0.1497, + "loss_text": 1.1996, + "ppl": 3.8547, + "step": 11759 + }, + { + "epoch": 0.06, + "global_step": 11760, + "learning_rate": 0.00045175292153589315, + "loss": 1.3711, + "loss_base2": 1.9781, + "loss_pixel": 0.1525, + "loss_text": 1.2186, + "ppl": 3.9397, + "step": 11760 + }, + { + "epoch": 0.06, + "global_step": 11761, + "learning_rate": 0.00045174874791318866, + "loss": 1.3853, + "loss_base2": 1.9986, + "loss_pixel": 0.1532, + "loss_text": 1.2322, + "ppl": 3.996, + "step": 11761 + }, + { + "epoch": 0.06, + "global_step": 11762, + "learning_rate": 0.00045174457429048416, + "loss": 1.4448, + "loss_base2": 2.0844, + "loss_pixel": 0.1623, + "loss_text": 1.2824, + "ppl": 4.241, + "step": 11762 + }, + { + "epoch": 0.06, + "global_step": 11763, + "learning_rate": 0.00045174040066777967, + "loss": 1.6272, + "loss_base2": 2.3476, + "loss_pixel": 0.1607, + "loss_text": 1.4665, + "ppl": 5.0896, + "step": 11763 + }, + { + "epoch": 0.06, + "global_step": 11764, + "learning_rate": 0.0004517362270450751, + "loss": 1.6265, + "loss_base2": 2.3465, + "loss_pixel": 0.1613, + "loss_text": 1.4652, + "ppl": 5.086, + "step": 11764 + }, + { + "epoch": 0.06, + "global_step": 11765, + "learning_rate": 0.00045173205342237063, + "loss": 1.6344, + "loss_base2": 2.3579, + "loss_pixel": 0.1609, + "loss_text": 1.4735, + "ppl": 5.1264, + "step": 11765 + }, + { + "epoch": 0.06, + "global_step": 11766, + "learning_rate": 0.00045172787979966614, + "loss": 1.6181, + "loss_base2": 2.3344, + "loss_pixel": 0.161, + "loss_text": 1.4571, + "ppl": 5.0435, + "step": 11766 + }, + { + "epoch": 0.06, + "global_step": 11767, + "learning_rate": 0.00045172370617696165, + "loss": 1.6172, + "loss_base2": 2.3331, + "loss_pixel": 0.1604, + "loss_text": 1.4568, + "ppl": 5.039, + "step": 11767 + }, + { + "epoch": 0.06, + "global_step": 11768, + "learning_rate": 0.00045171953255425715, + "loss": 1.6194, + "loss_base2": 2.3363, + "loss_pixel": 0.1615, + "loss_text": 1.4579, + "ppl": 5.0501, + "step": 11768 + }, + { + "epoch": 0.06, + "global_step": 11769, + "learning_rate": 0.00045171535893155255, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1611, + "loss_text": 1.4626, + "ppl": 5.0718, + "step": 11769 + }, + { + "epoch": 0.06, + "global_step": 11770, + "learning_rate": 0.00045171118530884806, + "loss": 1.6168, + "loss_base2": 2.3325, + "loss_pixel": 0.1599, + "loss_text": 1.4569, + "ppl": 5.0369, + "step": 11770 + }, + { + "epoch": 0.06, + "global_step": 11771, + "learning_rate": 0.00045170701168614357, + "loss": 1.6149, + "loss_base2": 2.3298, + "loss_pixel": 0.1611, + "loss_text": 1.4538, + "ppl": 5.0274, + "step": 11771 + }, + { + "epoch": 0.06, + "global_step": 11772, + "learning_rate": 0.0004517028380634391, + "loss": 1.6129, + "loss_base2": 2.3269, + "loss_pixel": 0.1597, + "loss_text": 1.4532, + "ppl": 5.0173, + "step": 11772 + }, + { + "epoch": 0.06, + "global_step": 11773, + "learning_rate": 0.0004516986644407345, + "loss": 1.608, + "loss_base2": 2.3199, + "loss_pixel": 0.1602, + "loss_text": 1.4478, + "ppl": 4.9928, + "step": 11773 + }, + { + "epoch": 0.06, + "global_step": 11774, + "learning_rate": 0.00045169449081803003, + "loss": 1.6092, + "loss_base2": 2.3216, + "loss_pixel": 0.1604, + "loss_text": 1.4488, + "ppl": 4.9988, + "step": 11774 + }, + { + "epoch": 0.06, + "global_step": 11775, + "learning_rate": 0.00045169031719532554, + "loss": 1.602, + "loss_base2": 2.3112, + "loss_pixel": 0.1588, + "loss_text": 1.4433, + "ppl": 4.9629, + "step": 11775 + }, + { + "epoch": 0.06, + "global_step": 11776, + "learning_rate": 0.00045168614357262105, + "loss": 1.6156, + "loss_base2": 2.3308, + "loss_pixel": 0.1596, + "loss_text": 1.456, + "ppl": 5.0309, + "step": 11776 + }, + { + "epoch": 0.06, + "global_step": 11777, + "learning_rate": 0.00045168196994991656, + "loss": 1.5932, + "loss_base2": 2.2985, + "loss_pixel": 0.1596, + "loss_text": 1.4336, + "ppl": 4.9195, + "step": 11777 + }, + { + "epoch": 0.06, + "global_step": 11778, + "learning_rate": 0.000451677796327212, + "loss": 1.6131, + "loss_base2": 2.3272, + "loss_pixel": 0.1601, + "loss_text": 1.453, + "ppl": 5.0183, + "step": 11778 + }, + { + "epoch": 0.06, + "global_step": 11779, + "learning_rate": 0.0004516736227045075, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1598, + "loss_text": 1.4426, + "ppl": 4.9649, + "step": 11779 + }, + { + "epoch": 0.06, + "global_step": 11780, + "learning_rate": 0.000451669449081803, + "loss": 1.5925, + "loss_base2": 2.2975, + "loss_pixel": 0.158, + "loss_text": 1.4345, + "ppl": 4.916, + "step": 11780 + }, + { + "epoch": 0.06, + "global_step": 11781, + "learning_rate": 0.00045166527545909853, + "loss": 1.6058, + "loss_base2": 2.3167, + "loss_pixel": 0.1599, + "loss_text": 1.446, + "ppl": 4.9818, + "step": 11781 + }, + { + "epoch": 0.06, + "global_step": 11782, + "learning_rate": 0.000451661101836394, + "loss": 1.5997, + "loss_base2": 2.3079, + "loss_pixel": 0.1602, + "loss_text": 1.4395, + "ppl": 4.9515, + "step": 11782 + }, + { + "epoch": 0.06, + "global_step": 11783, + "learning_rate": 0.0004516569282136895, + "loss": 1.6163, + "loss_base2": 2.3318, + "loss_pixel": 0.1615, + "loss_text": 1.4547, + "ppl": 5.0344, + "step": 11783 + }, + { + "epoch": 0.06, + "global_step": 11784, + "learning_rate": 0.000451652754590985, + "loss": 1.5821, + "loss_base2": 2.2825, + "loss_pixel": 0.1585, + "loss_text": 1.4236, + "ppl": 4.8652, + "step": 11784 + }, + { + "epoch": 0.06, + "global_step": 11785, + "learning_rate": 0.0004516485809682805, + "loss": 1.62, + "loss_base2": 2.3372, + "loss_pixel": 0.1596, + "loss_text": 1.4604, + "ppl": 5.0531, + "step": 11785 + }, + { + "epoch": 0.06, + "global_step": 11786, + "learning_rate": 0.000451644407345576, + "loss": 1.5903, + "loss_base2": 2.2943, + "loss_pixel": 0.1581, + "loss_text": 1.4321, + "ppl": 4.9052, + "step": 11786 + }, + { + "epoch": 0.06, + "global_step": 11787, + "learning_rate": 0.00045164023372287147, + "loss": 1.5869, + "loss_base2": 2.2894, + "loss_pixel": 0.159, + "loss_text": 1.4279, + "ppl": 4.8886, + "step": 11787 + }, + { + "epoch": 0.06, + "global_step": 11788, + "learning_rate": 0.0004516360601001669, + "loss": 1.621, + "loss_base2": 2.3386, + "loss_pixel": 0.16, + "loss_text": 1.461, + "ppl": 5.0581, + "step": 11788 + }, + { + "epoch": 0.06, + "global_step": 11789, + "learning_rate": 0.0004516318864774624, + "loss": 1.6198, + "loss_base2": 2.3369, + "loss_pixel": 0.1608, + "loss_text": 1.459, + "ppl": 5.0521, + "step": 11789 + }, + { + "epoch": 0.06, + "global_step": 11790, + "learning_rate": 0.00045162771285475793, + "loss": 1.6071, + "loss_base2": 2.3186, + "loss_pixel": 0.16, + "loss_text": 1.4471, + "ppl": 4.9883, + "step": 11790 + }, + { + "epoch": 0.06, + "global_step": 11791, + "learning_rate": 0.0004516235392320534, + "loss": 1.6131, + "loss_base2": 2.3272, + "loss_pixel": 0.1598, + "loss_text": 1.4533, + "ppl": 5.0183, + "step": 11791 + }, + { + "epoch": 0.06, + "global_step": 11792, + "learning_rate": 0.0004516193656093489, + "loss": 1.609, + "loss_base2": 2.3213, + "loss_pixel": 0.1573, + "loss_text": 1.4518, + "ppl": 4.9978, + "step": 11792 + }, + { + "epoch": 0.06, + "global_step": 11793, + "learning_rate": 0.0004516151919866444, + "loss": 1.5927, + "loss_base2": 2.2978, + "loss_pixel": 0.1597, + "loss_text": 1.433, + "ppl": 4.917, + "step": 11793 + }, + { + "epoch": 0.06, + "global_step": 11794, + "learning_rate": 0.0004516110183639399, + "loss": 1.6122, + "loss_base2": 2.3259, + "loss_pixel": 0.1594, + "loss_text": 1.4529, + "ppl": 5.0138, + "step": 11794 + }, + { + "epoch": 0.06, + "global_step": 11795, + "learning_rate": 0.0004516068447412354, + "loss": 1.612, + "loss_base2": 2.3256, + "loss_pixel": 0.1608, + "loss_text": 1.4512, + "ppl": 5.0128, + "step": 11795 + }, + { + "epoch": 0.06, + "global_step": 11796, + "learning_rate": 0.00045160267111853087, + "loss": 1.6115, + "loss_base2": 2.3249, + "loss_pixel": 0.1603, + "loss_text": 1.4513, + "ppl": 5.0103, + "step": 11796 + }, + { + "epoch": 0.06, + "global_step": 11797, + "learning_rate": 0.0004515984974958264, + "loss": 1.615, + "loss_base2": 2.33, + "loss_pixel": 0.1597, + "loss_text": 1.4553, + "ppl": 5.0279, + "step": 11797 + }, + { + "epoch": 0.06, + "global_step": 11798, + "learning_rate": 0.0004515943238731219, + "loss": 1.5965, + "loss_base2": 2.3033, + "loss_pixel": 0.1584, + "loss_text": 1.4381, + "ppl": 4.9357, + "step": 11798 + }, + { + "epoch": 0.06, + "global_step": 11799, + "learning_rate": 0.0004515901502504174, + "loss": 1.625, + "loss_base2": 2.3444, + "loss_pixel": 0.1595, + "loss_text": 1.4655, + "ppl": 5.0784, + "step": 11799 + }, + { + "epoch": 0.06, + "global_step": 11800, + "learning_rate": 0.0004515859766277129, + "loss": 1.6015, + "loss_base2": 2.3105, + "loss_pixel": 0.1589, + "loss_text": 1.4426, + "ppl": 4.9605, + "step": 11800 + }, + { + "epoch": 0.06, + "global_step": 11801, + "learning_rate": 0.00045158180300500835, + "loss": 1.6118, + "loss_base2": 2.3253, + "loss_pixel": 0.1588, + "loss_text": 1.453, + "ppl": 5.0118, + "step": 11801 + }, + { + "epoch": 0.06, + "global_step": 11802, + "learning_rate": 0.00045157762938230386, + "loss": 1.6191, + "loss_base2": 2.3359, + "loss_pixel": 0.1592, + "loss_text": 1.4599, + "ppl": 5.0485, + "step": 11802 + }, + { + "epoch": 0.06, + "global_step": 11803, + "learning_rate": 0.00045157345575959937, + "loss": 1.6172, + "loss_base2": 2.3331, + "loss_pixel": 0.1587, + "loss_text": 1.4585, + "ppl": 5.039, + "step": 11803 + }, + { + "epoch": 0.06, + "global_step": 11804, + "learning_rate": 0.0004515692821368949, + "loss": 1.6113, + "loss_base2": 2.3246, + "loss_pixel": 0.1593, + "loss_text": 1.452, + "ppl": 5.0093, + "step": 11804 + }, + { + "epoch": 0.06, + "global_step": 11805, + "learning_rate": 0.0004515651085141903, + "loss": 1.6155, + "loss_base2": 2.3307, + "loss_pixel": 0.1595, + "loss_text": 1.456, + "ppl": 5.0304, + "step": 11805 + }, + { + "epoch": 0.06, + "global_step": 11806, + "learning_rate": 0.00045156093489148583, + "loss": 1.5766, + "loss_base2": 2.2746, + "loss_pixel": 0.1589, + "loss_text": 1.4177, + "ppl": 4.8385, + "step": 11806 + }, + { + "epoch": 0.06, + "global_step": 11807, + "learning_rate": 0.0004515567612687813, + "loss": 1.443, + "loss_base2": 2.0818, + "loss_pixel": 0.1596, + "loss_text": 1.2834, + "ppl": 4.2334, + "step": 11807 + }, + { + "epoch": 0.06, + "global_step": 11808, + "learning_rate": 0.0004515525876460768, + "loss": 1.3913, + "loss_base2": 2.0072, + "loss_pixel": 0.1592, + "loss_text": 1.232, + "ppl": 4.0201, + "step": 11808 + }, + { + "epoch": 0.06, + "global_step": 11809, + "learning_rate": 0.0004515484140233723, + "loss": 1.387, + "loss_base2": 2.001, + "loss_pixel": 0.1566, + "loss_text": 1.2304, + "ppl": 4.0028, + "step": 11809 + }, + { + "epoch": 0.06, + "global_step": 11810, + "learning_rate": 0.00045154424040066775, + "loss": 1.3753, + "loss_base2": 1.9841, + "loss_pixel": 0.1587, + "loss_text": 1.2166, + "ppl": 3.9563, + "step": 11810 + }, + { + "epoch": 0.06, + "global_step": 11811, + "learning_rate": 0.00045154006677796326, + "loss": 1.4034, + "loss_base2": 2.0247, + "loss_pixel": 0.1605, + "loss_text": 1.2429, + "ppl": 4.069, + "step": 11811 + }, + { + "epoch": 0.06, + "global_step": 11812, + "learning_rate": 0.00045153589315525877, + "loss": 1.3815, + "loss_base2": 1.9931, + "loss_pixel": 0.1587, + "loss_text": 1.2227, + "ppl": 3.9809, + "step": 11812 + }, + { + "epoch": 0.06, + "global_step": 11813, + "learning_rate": 0.0004515317195325543, + "loss": 1.3806, + "loss_base2": 1.9918, + "loss_pixel": 0.1599, + "loss_text": 1.2207, + "ppl": 3.9773, + "step": 11813 + }, + { + "epoch": 0.06, + "global_step": 11814, + "learning_rate": 0.00045152754590984973, + "loss": 1.3846, + "loss_base2": 1.9976, + "loss_pixel": 0.1587, + "loss_text": 1.2259, + "ppl": 3.9932, + "step": 11814 + }, + { + "epoch": 0.06, + "global_step": 11815, + "learning_rate": 0.00045152337228714524, + "loss": 1.4908, + "loss_base2": 2.1508, + "loss_pixel": 0.1589, + "loss_text": 1.3319, + "ppl": 4.4406, + "step": 11815 + }, + { + "epoch": 0.06, + "global_step": 11816, + "learning_rate": 0.00045151919866444074, + "loss": 1.5219, + "loss_base2": 2.1956, + "loss_pixel": 0.1594, + "loss_text": 1.3625, + "ppl": 4.5809, + "step": 11816 + }, + { + "epoch": 0.06, + "global_step": 11817, + "learning_rate": 0.00045151502504173625, + "loss": 1.601, + "loss_base2": 2.3098, + "loss_pixel": 0.1601, + "loss_text": 1.4409, + "ppl": 4.958, + "step": 11817 + }, + { + "epoch": 0.06, + "global_step": 11818, + "learning_rate": 0.00045151085141903176, + "loss": 1.6152, + "loss_base2": 2.3302, + "loss_pixel": 0.1585, + "loss_text": 1.4567, + "ppl": 5.0289, + "step": 11818 + }, + { + "epoch": 0.06, + "global_step": 11819, + "learning_rate": 0.0004515066777963272, + "loss": 1.6236, + "loss_base2": 2.3424, + "loss_pixel": 0.1608, + "loss_text": 1.4627, + "ppl": 5.0713, + "step": 11819 + }, + { + "epoch": 0.06, + "global_step": 11820, + "learning_rate": 0.0004515025041736227, + "loss": 1.6031, + "loss_base2": 2.3128, + "loss_pixel": 0.1607, + "loss_text": 1.4424, + "ppl": 4.9684, + "step": 11820 + }, + { + "epoch": 0.06, + "global_step": 11821, + "learning_rate": 0.0004514983305509182, + "loss": 1.6306, + "loss_base2": 2.3525, + "loss_pixel": 0.1603, + "loss_text": 1.4702, + "ppl": 5.1069, + "step": 11821 + }, + { + "epoch": 0.06, + "global_step": 11822, + "learning_rate": 0.00045149415692821373, + "loss": 1.6063, + "loss_base2": 2.3174, + "loss_pixel": 0.1532, + "loss_text": 1.4531, + "ppl": 4.9843, + "step": 11822 + }, + { + "epoch": 0.06, + "global_step": 11823, + "learning_rate": 0.0004514899833055092, + "loss": 1.6109, + "loss_base2": 2.324, + "loss_pixel": 0.1509, + "loss_text": 1.46, + "ppl": 5.0073, + "step": 11823 + }, + { + "epoch": 0.06, + "global_step": 11824, + "learning_rate": 0.0004514858096828047, + "loss": 1.6012, + "loss_base2": 2.31, + "loss_pixel": 0.1515, + "loss_text": 1.4497, + "ppl": 4.959, + "step": 11824 + }, + { + "epoch": 0.06, + "global_step": 11825, + "learning_rate": 0.0004514816360601002, + "loss": 1.6161, + "loss_base2": 2.3315, + "loss_pixel": 0.1494, + "loss_text": 1.4666, + "ppl": 5.0334, + "step": 11825 + }, + { + "epoch": 0.06, + "global_step": 11826, + "learning_rate": 0.00045147746243739566, + "loss": 1.5975, + "loss_base2": 2.3047, + "loss_pixel": 0.153, + "loss_text": 1.4445, + "ppl": 4.9407, + "step": 11826 + }, + { + "epoch": 0.06, + "global_step": 11827, + "learning_rate": 0.00045147328881469116, + "loss": 1.5989, + "loss_base2": 2.3067, + "loss_pixel": 0.1496, + "loss_text": 1.4493, + "ppl": 4.9476, + "step": 11827 + }, + { + "epoch": 0.06, + "global_step": 11828, + "learning_rate": 0.0004514691151919866, + "loss": 1.6047, + "loss_base2": 2.3151, + "loss_pixel": 0.1505, + "loss_text": 1.4543, + "ppl": 4.9764, + "step": 11828 + }, + { + "epoch": 0.06, + "global_step": 11829, + "learning_rate": 0.0004514649415692821, + "loss": 1.5987, + "loss_base2": 2.3064, + "loss_pixel": 0.1495, + "loss_text": 1.4492, + "ppl": 4.9466, + "step": 11829 + }, + { + "epoch": 0.06, + "global_step": 11830, + "learning_rate": 0.00045146076794657763, + "loss": 1.5997, + "loss_base2": 2.3079, + "loss_pixel": 0.1483, + "loss_text": 1.4514, + "ppl": 4.9515, + "step": 11830 + }, + { + "epoch": 0.06, + "global_step": 11831, + "learning_rate": 0.00045145659432387314, + "loss": 1.5879, + "loss_base2": 2.2909, + "loss_pixel": 0.1497, + "loss_text": 1.4382, + "ppl": 4.8935, + "step": 11831 + }, + { + "epoch": 0.06, + "global_step": 11832, + "learning_rate": 0.0004514524207011686, + "loss": 1.5996, + "loss_base2": 2.3077, + "loss_pixel": 0.1485, + "loss_text": 1.4511, + "ppl": 4.9511, + "step": 11832 + }, + { + "epoch": 0.06, + "global_step": 11833, + "learning_rate": 0.0004514482470784641, + "loss": 1.594, + "loss_base2": 2.2997, + "loss_pixel": 0.1508, + "loss_text": 1.4431, + "ppl": 4.9234, + "step": 11833 + }, + { + "epoch": 0.06, + "global_step": 11834, + "learning_rate": 0.0004514440734557596, + "loss": 1.6016, + "loss_base2": 2.3106, + "loss_pixel": 0.1492, + "loss_text": 1.4524, + "ppl": 4.961, + "step": 11834 + }, + { + "epoch": 0.06, + "global_step": 11835, + "learning_rate": 0.0004514398998330551, + "loss": 1.6035, + "loss_base2": 2.3134, + "loss_pixel": 0.1502, + "loss_text": 1.4534, + "ppl": 4.9704, + "step": 11835 + }, + { + "epoch": 0.06, + "global_step": 11836, + "learning_rate": 0.0004514357262103506, + "loss": 1.6001, + "loss_base2": 2.3085, + "loss_pixel": 0.1497, + "loss_text": 1.4504, + "ppl": 4.9535, + "step": 11836 + }, + { + "epoch": 0.06, + "global_step": 11837, + "learning_rate": 0.0004514315525876461, + "loss": 1.5869, + "loss_base2": 2.2894, + "loss_pixel": 0.1472, + "loss_text": 1.4396, + "ppl": 4.8886, + "step": 11837 + }, + { + "epoch": 0.06, + "global_step": 11838, + "learning_rate": 0.0004514273789649416, + "loss": 1.5993, + "loss_base2": 2.3073, + "loss_pixel": 0.1504, + "loss_text": 1.4489, + "ppl": 4.9496, + "step": 11838 + }, + { + "epoch": 0.06, + "global_step": 11839, + "learning_rate": 0.0004514232053422371, + "loss": 1.596, + "loss_base2": 2.3025, + "loss_pixel": 0.1475, + "loss_text": 1.4485, + "ppl": 4.9333, + "step": 11839 + }, + { + "epoch": 0.06, + "global_step": 11840, + "learning_rate": 0.0004514190317195326, + "loss": 1.6007, + "loss_base2": 2.3093, + "loss_pixel": 0.1497, + "loss_text": 1.451, + "ppl": 4.9565, + "step": 11840 + }, + { + "epoch": 0.06, + "global_step": 11841, + "learning_rate": 0.00045141485809682805, + "loss": 1.6121, + "loss_base2": 2.3258, + "loss_pixel": 0.1607, + "loss_text": 1.4513, + "ppl": 5.0133, + "step": 11841 + }, + { + "epoch": 0.06, + "global_step": 11842, + "learning_rate": 0.00045141068447412356, + "loss": 1.602, + "loss_base2": 2.3112, + "loss_pixel": 0.1603, + "loss_text": 1.4417, + "ppl": 4.9629, + "step": 11842 + }, + { + "epoch": 0.06, + "global_step": 11843, + "learning_rate": 0.00045140651085141906, + "loss": 1.6184, + "loss_base2": 2.3349, + "loss_pixel": 0.1612, + "loss_text": 1.4572, + "ppl": 5.045, + "step": 11843 + }, + { + "epoch": 0.06, + "global_step": 11844, + "learning_rate": 0.00045140233722871457, + "loss": 1.617, + "loss_base2": 2.3328, + "loss_pixel": 0.161, + "loss_text": 1.456, + "ppl": 5.038, + "step": 11844 + }, + { + "epoch": 0.06, + "global_step": 11845, + "learning_rate": 0.00045139816360601, + "loss": 1.6128, + "loss_base2": 2.3268, + "loss_pixel": 0.1596, + "loss_text": 1.4532, + "ppl": 5.0168, + "step": 11845 + }, + { + "epoch": 0.06, + "global_step": 11846, + "learning_rate": 0.0004513939899833055, + "loss": 1.5847, + "loss_base2": 2.2862, + "loss_pixel": 0.1594, + "loss_text": 1.4252, + "ppl": 4.8778, + "step": 11846 + }, + { + "epoch": 0.06, + "global_step": 11847, + "learning_rate": 0.000451389816360601, + "loss": 1.6116, + "loss_base2": 2.325, + "loss_pixel": 0.1602, + "loss_text": 1.4514, + "ppl": 5.0108, + "step": 11847 + }, + { + "epoch": 0.06, + "global_step": 11848, + "learning_rate": 0.0004513856427378965, + "loss": 1.5969, + "loss_base2": 2.3038, + "loss_pixel": 0.1607, + "loss_text": 1.4362, + "ppl": 4.9377, + "step": 11848 + }, + { + "epoch": 0.06, + "global_step": 11849, + "learning_rate": 0.000451381469115192, + "loss": 1.6067, + "loss_base2": 2.318, + "loss_pixel": 0.1601, + "loss_text": 1.4465, + "ppl": 4.9863, + "step": 11849 + }, + { + "epoch": 0.06, + "global_step": 11850, + "learning_rate": 0.00045137729549248745, + "loss": 1.5984, + "loss_base2": 2.306, + "loss_pixel": 0.1596, + "loss_text": 1.4388, + "ppl": 4.9451, + "step": 11850 + }, + { + "epoch": 0.06, + "global_step": 11851, + "learning_rate": 0.00045137312186978296, + "loss": 1.6134, + "loss_base2": 2.3276, + "loss_pixel": 0.1599, + "loss_text": 1.4534, + "ppl": 5.0198, + "step": 11851 + }, + { + "epoch": 0.06, + "global_step": 11852, + "learning_rate": 0.00045136894824707847, + "loss": 1.5964, + "loss_base2": 2.3031, + "loss_pixel": 0.1601, + "loss_text": 1.4363, + "ppl": 4.9352, + "step": 11852 + }, + { + "epoch": 0.06, + "global_step": 11853, + "learning_rate": 0.000451364774624374, + "loss": 1.6, + "loss_base2": 2.3083, + "loss_pixel": 0.1596, + "loss_text": 1.4404, + "ppl": 4.953, + "step": 11853 + }, + { + "epoch": 0.06, + "global_step": 11854, + "learning_rate": 0.0004513606010016695, + "loss": 1.5992, + "loss_base2": 2.3072, + "loss_pixel": 0.1603, + "loss_text": 1.4389, + "ppl": 4.9491, + "step": 11854 + }, + { + "epoch": 0.06, + "global_step": 11855, + "learning_rate": 0.00045135642737896493, + "loss": 1.6168, + "loss_base2": 2.3325, + "loss_pixel": 0.1588, + "loss_text": 1.458, + "ppl": 5.0369, + "step": 11855 + }, + { + "epoch": 0.06, + "global_step": 11856, + "learning_rate": 0.00045135225375626044, + "loss": 1.6041, + "loss_base2": 2.3142, + "loss_pixel": 0.1581, + "loss_text": 1.446, + "ppl": 4.9734, + "step": 11856 + }, + { + "epoch": 0.06, + "global_step": 11857, + "learning_rate": 0.00045134808013355595, + "loss": 1.6088, + "loss_base2": 2.321, + "loss_pixel": 0.1588, + "loss_text": 1.45, + "ppl": 4.9968, + "step": 11857 + }, + { + "epoch": 0.06, + "global_step": 11858, + "learning_rate": 0.00045134390651085146, + "loss": 1.5885, + "loss_base2": 2.2917, + "loss_pixel": 0.1587, + "loss_text": 1.4298, + "ppl": 4.8964, + "step": 11858 + }, + { + "epoch": 0.06, + "global_step": 11859, + "learning_rate": 0.00045133973288814696, + "loss": 1.6104, + "loss_base2": 2.3233, + "loss_pixel": 0.1591, + "loss_text": 1.4512, + "ppl": 5.0048, + "step": 11859 + }, + { + "epoch": 0.06, + "global_step": 11860, + "learning_rate": 0.0004513355592654424, + "loss": 1.6096, + "loss_base2": 2.3222, + "loss_pixel": 0.1592, + "loss_text": 1.4505, + "ppl": 5.0008, + "step": 11860 + }, + { + "epoch": 0.06, + "global_step": 11861, + "learning_rate": 0.0004513313856427379, + "loss": 1.5732, + "loss_base2": 2.2696, + "loss_pixel": 0.16, + "loss_text": 1.4133, + "ppl": 4.8221, + "step": 11861 + }, + { + "epoch": 0.06, + "global_step": 11862, + "learning_rate": 0.00045132721202003343, + "loss": 1.4604, + "loss_base2": 2.1069, + "loss_pixel": 0.1591, + "loss_text": 1.3013, + "ppl": 4.3077, + "step": 11862 + }, + { + "epoch": 0.06, + "global_step": 11863, + "learning_rate": 0.00045132303839732894, + "loss": 1.3764, + "loss_base2": 1.9857, + "loss_pixel": 0.1579, + "loss_text": 1.2184, + "ppl": 3.9606, + "step": 11863 + }, + { + "epoch": 0.06, + "global_step": 11864, + "learning_rate": 0.00045131886477462434, + "loss": 1.3719, + "loss_base2": 1.9792, + "loss_pixel": 0.1596, + "loss_text": 1.2124, + "ppl": 3.9428, + "step": 11864 + }, + { + "epoch": 0.06, + "global_step": 11865, + "learning_rate": 0.00045131469115191984, + "loss": 1.3913, + "loss_base2": 2.0072, + "loss_pixel": 0.1589, + "loss_text": 1.2324, + "ppl": 4.0201, + "step": 11865 + }, + { + "epoch": 0.06, + "global_step": 11866, + "learning_rate": 0.00045131051752921535, + "loss": 1.3887, + "loss_base2": 2.0035, + "loss_pixel": 0.1592, + "loss_text": 1.2296, + "ppl": 4.0096, + "step": 11866 + }, + { + "epoch": 0.06, + "global_step": 11867, + "learning_rate": 0.00045130634390651086, + "loss": 1.3519, + "loss_base2": 1.9504, + "loss_pixel": 0.1597, + "loss_text": 1.1921, + "ppl": 3.8648, + "step": 11867 + }, + { + "epoch": 0.06, + "global_step": 11868, + "learning_rate": 0.00045130217028380637, + "loss": 1.3992, + "loss_base2": 2.0186, + "loss_pixel": 0.1599, + "loss_text": 1.2393, + "ppl": 4.052, + "step": 11868 + }, + { + "epoch": 0.06, + "global_step": 11869, + "learning_rate": 0.0004512979966611018, + "loss": 1.3783, + "loss_base2": 1.9885, + "loss_pixel": 0.1597, + "loss_text": 1.2187, + "ppl": 3.9682, + "step": 11869 + }, + { + "epoch": 0.06, + "global_step": 11870, + "learning_rate": 0.0004512938230383973, + "loss": 1.37, + "loss_base2": 1.9765, + "loss_pixel": 0.1607, + "loss_text": 1.2093, + "ppl": 3.9354, + "step": 11870 + }, + { + "epoch": 0.06, + "global_step": 11871, + "learning_rate": 0.00045128964941569283, + "loss": 1.3853, + "loss_base2": 1.9986, + "loss_pixel": 0.1598, + "loss_text": 1.2255, + "ppl": 3.996, + "step": 11871 + }, + { + "epoch": 0.06, + "global_step": 11872, + "learning_rate": 0.00045128547579298834, + "loss": 1.3982, + "loss_base2": 2.0172, + "loss_pixel": 0.1593, + "loss_text": 1.2388, + "ppl": 4.0479, + "step": 11872 + }, + { + "epoch": 0.06, + "global_step": 11873, + "learning_rate": 0.0004512813021702838, + "loss": 1.3696, + "loss_base2": 1.9759, + "loss_pixel": 0.1606, + "loss_text": 1.209, + "ppl": 3.9338, + "step": 11873 + }, + { + "epoch": 0.06, + "global_step": 11874, + "learning_rate": 0.0004512771285475793, + "loss": 1.3691, + "loss_base2": 1.9752, + "loss_pixel": 0.1604, + "loss_text": 1.2086, + "ppl": 3.9318, + "step": 11874 + }, + { + "epoch": 0.06, + "global_step": 11875, + "learning_rate": 0.0004512729549248748, + "loss": 1.3802, + "loss_base2": 1.9912, + "loss_pixel": 0.16, + "loss_text": 1.2202, + "ppl": 3.9757, + "step": 11875 + }, + { + "epoch": 0.06, + "global_step": 11876, + "learning_rate": 0.0004512687813021703, + "loss": 1.4134, + "loss_base2": 2.0391, + "loss_pixel": 0.1614, + "loss_text": 1.252, + "ppl": 4.1099, + "step": 11876 + }, + { + "epoch": 0.06, + "global_step": 11877, + "learning_rate": 0.0004512646076794658, + "loss": 1.3849, + "loss_base2": 1.998, + "loss_pixel": 0.1594, + "loss_text": 1.2255, + "ppl": 3.9944, + "step": 11877 + }, + { + "epoch": 0.06, + "global_step": 11878, + "learning_rate": 0.0004512604340567613, + "loss": 1.4921, + "loss_base2": 2.1526, + "loss_pixel": 0.1581, + "loss_text": 1.3339, + "ppl": 4.4464, + "step": 11878 + }, + { + "epoch": 0.06, + "global_step": 11879, + "learning_rate": 0.0004512562604340568, + "loss": 1.633, + "loss_base2": 2.3559, + "loss_pixel": 0.1601, + "loss_text": 1.4729, + "ppl": 5.1192, + "step": 11879 + }, + { + "epoch": 0.06, + "global_step": 11880, + "learning_rate": 0.0004512520868113523, + "loss": 1.6432, + "loss_base2": 2.3706, + "loss_pixel": 0.1618, + "loss_text": 1.4813, + "ppl": 5.1717, + "step": 11880 + }, + { + "epoch": 0.06, + "global_step": 11881, + "learning_rate": 0.0004512479131886478, + "loss": 1.6195, + "loss_base2": 2.3364, + "loss_pixel": 0.163, + "loss_text": 1.4565, + "ppl": 5.0506, + "step": 11881 + }, + { + "epoch": 0.06, + "global_step": 11882, + "learning_rate": 0.0004512437395659432, + "loss": 1.6126, + "loss_base2": 2.3265, + "loss_pixel": 0.1616, + "loss_text": 1.451, + "ppl": 5.0158, + "step": 11882 + }, + { + "epoch": 0.06, + "global_step": 11883, + "learning_rate": 0.0004512395659432387, + "loss": 1.6152, + "loss_base2": 2.3302, + "loss_pixel": 0.1623, + "loss_text": 1.4529, + "ppl": 5.0289, + "step": 11883 + }, + { + "epoch": 0.06, + "global_step": 11884, + "learning_rate": 0.0004512353923205342, + "loss": 1.611, + "loss_base2": 2.3242, + "loss_pixel": 0.1615, + "loss_text": 1.4495, + "ppl": 5.0078, + "step": 11884 + }, + { + "epoch": 0.06, + "global_step": 11885, + "learning_rate": 0.0004512312186978297, + "loss": 1.605, + "loss_base2": 2.3155, + "loss_pixel": 0.1634, + "loss_text": 1.4416, + "ppl": 4.9779, + "step": 11885 + }, + { + "epoch": 0.06, + "global_step": 11886, + "learning_rate": 0.0004512270450751252, + "loss": 1.6296, + "loss_base2": 2.351, + "loss_pixel": 0.1633, + "loss_text": 1.4662, + "ppl": 5.1018, + "step": 11886 + }, + { + "epoch": 0.06, + "global_step": 11887, + "learning_rate": 0.0004512228714524207, + "loss": 1.6186, + "loss_base2": 2.3351, + "loss_pixel": 0.1617, + "loss_text": 1.4569, + "ppl": 5.046, + "step": 11887 + }, + { + "epoch": 0.06, + "global_step": 11888, + "learning_rate": 0.0004512186978297162, + "loss": 1.6083, + "loss_base2": 2.3203, + "loss_pixel": 0.1627, + "loss_text": 1.4456, + "ppl": 4.9943, + "step": 11888 + }, + { + "epoch": 0.06, + "global_step": 11889, + "learning_rate": 0.0004512145242070117, + "loss": 1.6023, + "loss_base2": 2.3116, + "loss_pixel": 0.1612, + "loss_text": 1.4411, + "ppl": 4.9644, + "step": 11889 + }, + { + "epoch": 0.06, + "global_step": 11890, + "learning_rate": 0.0004512103505843072, + "loss": 1.6223, + "loss_base2": 2.3405, + "loss_pixel": 0.1613, + "loss_text": 1.461, + "ppl": 5.0647, + "step": 11890 + }, + { + "epoch": 0.06, + "global_step": 11891, + "learning_rate": 0.00045120617696160266, + "loss": 1.6114, + "loss_base2": 2.3248, + "loss_pixel": 0.1603, + "loss_text": 1.4512, + "ppl": 5.0098, + "step": 11891 + }, + { + "epoch": 0.06, + "global_step": 11892, + "learning_rate": 0.00045120200333889816, + "loss": 1.6139, + "loss_base2": 2.3284, + "loss_pixel": 0.1608, + "loss_text": 1.4531, + "ppl": 5.0224, + "step": 11892 + }, + { + "epoch": 0.06, + "global_step": 11893, + "learning_rate": 0.00045119782971619367, + "loss": 1.5974, + "loss_base2": 2.3046, + "loss_pixel": 0.1605, + "loss_text": 1.4369, + "ppl": 4.9402, + "step": 11893 + }, + { + "epoch": 0.06, + "global_step": 11894, + "learning_rate": 0.0004511936560934892, + "loss": 1.6045, + "loss_base2": 2.3148, + "loss_pixel": 0.1599, + "loss_text": 1.4445, + "ppl": 4.9754, + "step": 11894 + }, + { + "epoch": 0.06, + "global_step": 11895, + "learning_rate": 0.0004511894824707847, + "loss": 1.6012, + "loss_base2": 2.31, + "loss_pixel": 0.1597, + "loss_text": 1.4415, + "ppl": 4.959, + "step": 11895 + }, + { + "epoch": 0.06, + "global_step": 11896, + "learning_rate": 0.00045118530884808014, + "loss": 1.6091, + "loss_base2": 2.3214, + "loss_pixel": 0.1601, + "loss_text": 1.449, + "ppl": 4.9983, + "step": 11896 + }, + { + "epoch": 0.06, + "global_step": 11897, + "learning_rate": 0.00045118113522537564, + "loss": 1.6131, + "loss_base2": 2.3272, + "loss_pixel": 0.1596, + "loss_text": 1.4535, + "ppl": 5.0183, + "step": 11897 + }, + { + "epoch": 0.06, + "global_step": 11898, + "learning_rate": 0.00045117696160267115, + "loss": 1.6108, + "loss_base2": 2.3239, + "loss_pixel": 0.1605, + "loss_text": 1.4503, + "ppl": 5.0068, + "step": 11898 + }, + { + "epoch": 0.06, + "global_step": 11899, + "learning_rate": 0.00045117278797996666, + "loss": 1.6252, + "loss_base2": 2.3447, + "loss_pixel": 0.16, + "loss_text": 1.4652, + "ppl": 5.0794, + "step": 11899 + }, + { + "epoch": 0.06, + "global_step": 11900, + "learning_rate": 0.0004511686143572621, + "loss": 1.5953, + "loss_base2": 2.3015, + "loss_pixel": 0.1593, + "loss_text": 1.436, + "ppl": 4.9298, + "step": 11900 + }, + { + "epoch": 0.06, + "global_step": 11901, + "learning_rate": 0.00045116444073455757, + "loss": 1.546, + "loss_base2": 2.2304, + "loss_pixel": 0.1612, + "loss_text": 1.3849, + "ppl": 4.6927, + "step": 11901 + }, + { + "epoch": 0.06, + "global_step": 11902, + "learning_rate": 0.0004511602671118531, + "loss": 1.426, + "loss_base2": 2.0573, + "loss_pixel": 0.1595, + "loss_text": 1.2665, + "ppl": 4.162, + "step": 11902 + }, + { + "epoch": 0.06, + "global_step": 11903, + "learning_rate": 0.0004511560934891486, + "loss": 1.3844, + "loss_base2": 1.9973, + "loss_pixel": 0.1601, + "loss_text": 1.2243, + "ppl": 3.9924, + "step": 11903 + }, + { + "epoch": 0.06, + "global_step": 11904, + "learning_rate": 0.0004511519198664441, + "loss": 1.3822, + "loss_base2": 1.9941, + "loss_pixel": 0.1597, + "loss_text": 1.2225, + "ppl": 3.9837, + "step": 11904 + }, + { + "epoch": 0.06, + "global_step": 11905, + "learning_rate": 0.00045114774624373954, + "loss": 1.3749, + "loss_base2": 1.9836, + "loss_pixel": 0.1596, + "loss_text": 1.2153, + "ppl": 3.9547, + "step": 11905 + }, + { + "epoch": 0.06, + "global_step": 11906, + "learning_rate": 0.00045114357262103505, + "loss": 1.3822, + "loss_base2": 1.9941, + "loss_pixel": 0.1584, + "loss_text": 1.2238, + "ppl": 3.9837, + "step": 11906 + }, + { + "epoch": 0.06, + "global_step": 11907, + "learning_rate": 0.00045113939899833056, + "loss": 1.3731, + "loss_base2": 1.981, + "loss_pixel": 0.1598, + "loss_text": 1.2133, + "ppl": 3.9476, + "step": 11907 + }, + { + "epoch": 0.06, + "global_step": 11908, + "learning_rate": 0.00045113522537562606, + "loss": 1.3676, + "loss_base2": 1.973, + "loss_pixel": 0.158, + "loss_text": 1.2096, + "ppl": 3.9259, + "step": 11908 + }, + { + "epoch": 0.06, + "global_step": 11909, + "learning_rate": 0.00045113105175292157, + "loss": 1.383, + "loss_base2": 1.9952, + "loss_pixel": 0.1501, + "loss_text": 1.2328, + "ppl": 3.9868, + "step": 11909 + }, + { + "epoch": 0.06, + "global_step": 11910, + "learning_rate": 0.000451126878130217, + "loss": 1.3744, + "loss_base2": 1.9828, + "loss_pixel": 0.1494, + "loss_text": 1.225, + "ppl": 3.9527, + "step": 11910 + }, + { + "epoch": 0.06, + "global_step": 11911, + "learning_rate": 0.00045112270450751253, + "loss": 1.631, + "loss_base2": 2.353, + "loss_pixel": 0.1532, + "loss_text": 1.4777, + "ppl": 5.109, + "step": 11911 + }, + { + "epoch": 0.06, + "global_step": 11912, + "learning_rate": 0.00045111853088480804, + "loss": 1.6029, + "loss_base2": 2.3125, + "loss_pixel": 0.1504, + "loss_text": 1.4525, + "ppl": 4.9674, + "step": 11912 + }, + { + "epoch": 0.06, + "global_step": 11913, + "learning_rate": 0.00045111435726210355, + "loss": 1.6093, + "loss_base2": 2.3217, + "loss_pixel": 0.1496, + "loss_text": 1.4597, + "ppl": 4.9993, + "step": 11913 + }, + { + "epoch": 0.06, + "global_step": 11914, + "learning_rate": 0.000451110183639399, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1497, + "loss_text": 1.4527, + "ppl": 4.9649, + "step": 11914 + }, + { + "epoch": 0.06, + "global_step": 11915, + "learning_rate": 0.0004511060100166945, + "loss": 1.5982, + "loss_base2": 2.3057, + "loss_pixel": 0.1499, + "loss_text": 1.4483, + "ppl": 4.9441, + "step": 11915 + }, + { + "epoch": 0.06, + "global_step": 11916, + "learning_rate": 0.00045110183639399, + "loss": 1.5986, + "loss_base2": 2.3063, + "loss_pixel": 0.1495, + "loss_text": 1.4492, + "ppl": 4.9461, + "step": 11916 + }, + { + "epoch": 0.06, + "global_step": 11917, + "learning_rate": 0.0004510976627712855, + "loss": 1.6087, + "loss_base2": 2.3209, + "loss_pixel": 0.1482, + "loss_text": 1.4605, + "ppl": 4.9963, + "step": 11917 + }, + { + "epoch": 0.06, + "global_step": 11918, + "learning_rate": 0.00045109348914858103, + "loss": 1.6136, + "loss_base2": 2.3279, + "loss_pixel": 0.1501, + "loss_text": 1.4635, + "ppl": 5.0209, + "step": 11918 + }, + { + "epoch": 0.06, + "global_step": 11919, + "learning_rate": 0.0004510893155258765, + "loss": 1.6086, + "loss_base2": 2.3207, + "loss_pixel": 0.1495, + "loss_text": 1.459, + "ppl": 4.9958, + "step": 11919 + }, + { + "epoch": 0.06, + "global_step": 11920, + "learning_rate": 0.00045108514190317193, + "loss": 1.6315, + "loss_base2": 2.3538, + "loss_pixel": 0.1496, + "loss_text": 1.482, + "ppl": 5.1115, + "step": 11920 + }, + { + "epoch": 0.06, + "global_step": 11921, + "learning_rate": 0.00045108096828046744, + "loss": 1.6014, + "loss_base2": 2.3103, + "loss_pixel": 0.1492, + "loss_text": 1.4522, + "ppl": 4.96, + "step": 11921 + }, + { + "epoch": 0.06, + "global_step": 11922, + "learning_rate": 0.00045107679465776295, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.1485, + "loss_text": 1.4695, + "ppl": 5.043, + "step": 11922 + }, + { + "epoch": 0.06, + "global_step": 11923, + "learning_rate": 0.0004510726210350584, + "loss": 1.6117, + "loss_base2": 2.3252, + "loss_pixel": 0.1499, + "loss_text": 1.4618, + "ppl": 5.0113, + "step": 11923 + }, + { + "epoch": 0.06, + "global_step": 11924, + "learning_rate": 0.0004510684474123539, + "loss": 1.5962, + "loss_base2": 2.3028, + "loss_pixel": 0.1467, + "loss_text": 1.4495, + "ppl": 4.9342, + "step": 11924 + }, + { + "epoch": 0.06, + "global_step": 11925, + "learning_rate": 0.0004510642737896494, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1483, + "loss_text": 1.454, + "ppl": 4.9649, + "step": 11925 + }, + { + "epoch": 0.06, + "global_step": 11926, + "learning_rate": 0.0004510601001669449, + "loss": 1.6231, + "loss_base2": 2.3416, + "loss_pixel": 0.1582, + "loss_text": 1.4649, + "ppl": 5.0688, + "step": 11926 + }, + { + "epoch": 0.06, + "global_step": 11927, + "learning_rate": 0.00045105592654424043, + "loss": 1.609, + "loss_base2": 2.3213, + "loss_pixel": 0.1653, + "loss_text": 1.4437, + "ppl": 4.9978, + "step": 11927 + }, + { + "epoch": 0.06, + "global_step": 11928, + "learning_rate": 0.0004510517529215359, + "loss": 1.6336, + "loss_base2": 2.3568, + "loss_pixel": 0.1635, + "loss_text": 1.47, + "ppl": 5.1223, + "step": 11928 + }, + { + "epoch": 0.06, + "global_step": 11929, + "learning_rate": 0.0004510475792988314, + "loss": 1.6187, + "loss_base2": 2.3353, + "loss_pixel": 0.1518, + "loss_text": 1.4669, + "ppl": 5.0465, + "step": 11929 + }, + { + "epoch": 0.06, + "global_step": 11930, + "learning_rate": 0.0004510434056761269, + "loss": 1.5833, + "loss_base2": 2.2842, + "loss_pixel": 0.1517, + "loss_text": 1.4315, + "ppl": 4.871, + "step": 11930 + }, + { + "epoch": 0.06, + "global_step": 11931, + "learning_rate": 0.0004510392320534224, + "loss": 1.6093, + "loss_base2": 2.3217, + "loss_pixel": 0.1476, + "loss_text": 1.4617, + "ppl": 4.9993, + "step": 11931 + }, + { + "epoch": 0.06, + "global_step": 11932, + "learning_rate": 0.00045103505843071786, + "loss": 1.5978, + "loss_base2": 2.3051, + "loss_pixel": 0.1491, + "loss_text": 1.4487, + "ppl": 4.9421, + "step": 11932 + }, + { + "epoch": 0.06, + "global_step": 11933, + "learning_rate": 0.00045103088480801337, + "loss": 1.5962, + "loss_base2": 2.3028, + "loss_pixel": 0.147, + "loss_text": 1.4492, + "ppl": 4.9342, + "step": 11933 + }, + { + "epoch": 0.06, + "global_step": 11934, + "learning_rate": 0.0004510267111853089, + "loss": 1.5961, + "loss_base2": 2.3027, + "loss_pixel": 0.1489, + "loss_text": 1.4471, + "ppl": 4.9338, + "step": 11934 + }, + { + "epoch": 0.06, + "global_step": 11935, + "learning_rate": 0.0004510225375626044, + "loss": 1.599, + "loss_base2": 2.3069, + "loss_pixel": 0.1492, + "loss_text": 1.4498, + "ppl": 4.9481, + "step": 11935 + }, + { + "epoch": 0.06, + "global_step": 11936, + "learning_rate": 0.0004510183639398999, + "loss": 1.598, + "loss_base2": 2.3054, + "loss_pixel": 0.1508, + "loss_text": 1.4472, + "ppl": 4.9431, + "step": 11936 + }, + { + "epoch": 0.06, + "global_step": 11937, + "learning_rate": 0.00045101419031719534, + "loss": 1.6123, + "loss_base2": 2.3261, + "loss_pixel": 0.1477, + "loss_text": 1.4647, + "ppl": 5.0143, + "step": 11937 + }, + { + "epoch": 0.06, + "global_step": 11938, + "learning_rate": 0.0004510100166944908, + "loss": 1.5897, + "loss_base2": 2.2935, + "loss_pixel": 0.1497, + "loss_text": 1.44, + "ppl": 4.9023, + "step": 11938 + }, + { + "epoch": 0.06, + "global_step": 11939, + "learning_rate": 0.0004510058430717863, + "loss": 1.5922, + "loss_base2": 2.2971, + "loss_pixel": 0.1484, + "loss_text": 1.4438, + "ppl": 4.9145, + "step": 11939 + }, + { + "epoch": 0.06, + "global_step": 11940, + "learning_rate": 0.0004510016694490818, + "loss": 1.5965, + "loss_base2": 2.3033, + "loss_pixel": 0.1487, + "loss_text": 1.4478, + "ppl": 4.9357, + "step": 11940 + }, + { + "epoch": 0.06, + "global_step": 11941, + "learning_rate": 0.00045099749582637726, + "loss": 1.5864, + "loss_base2": 2.2887, + "loss_pixel": 0.1494, + "loss_text": 1.437, + "ppl": 4.8861, + "step": 11941 + }, + { + "epoch": 0.06, + "global_step": 11942, + "learning_rate": 0.00045099332220367277, + "loss": 1.5992, + "loss_base2": 2.3072, + "loss_pixel": 0.1486, + "loss_text": 1.4505, + "ppl": 4.9491, + "step": 11942 + }, + { + "epoch": 0.06, + "global_step": 11943, + "learning_rate": 0.0004509891485809683, + "loss": 1.5746, + "loss_base2": 2.2717, + "loss_pixel": 0.1474, + "loss_text": 1.4272, + "ppl": 4.8288, + "step": 11943 + }, + { + "epoch": 0.06, + "global_step": 11944, + "learning_rate": 0.0004509849749582638, + "loss": 1.5821, + "loss_base2": 2.2825, + "loss_pixel": 0.1466, + "loss_text": 1.4356, + "ppl": 4.8652, + "step": 11944 + }, + { + "epoch": 0.06, + "global_step": 11945, + "learning_rate": 0.0004509808013355593, + "loss": 1.5953, + "loss_base2": 2.3015, + "loss_pixel": 0.1483, + "loss_text": 1.447, + "ppl": 4.9298, + "step": 11945 + }, + { + "epoch": 0.06, + "global_step": 11946, + "learning_rate": 0.00045097662771285474, + "loss": 1.6043, + "loss_base2": 2.3145, + "loss_pixel": 0.1451, + "loss_text": 1.4592, + "ppl": 4.9744, + "step": 11946 + }, + { + "epoch": 0.06, + "global_step": 11947, + "learning_rate": 0.00045097245409015025, + "loss": 1.6053, + "loss_base2": 2.316, + "loss_pixel": 0.1473, + "loss_text": 1.458, + "ppl": 4.9794, + "step": 11947 + }, + { + "epoch": 0.06, + "global_step": 11948, + "learning_rate": 0.00045096828046744576, + "loss": 1.6057, + "loss_base2": 2.3165, + "loss_pixel": 0.1477, + "loss_text": 1.458, + "ppl": 4.9813, + "step": 11948 + }, + { + "epoch": 0.06, + "global_step": 11949, + "learning_rate": 0.00045096410684474127, + "loss": 1.5991, + "loss_base2": 2.307, + "loss_pixel": 0.1468, + "loss_text": 1.4523, + "ppl": 4.9486, + "step": 11949 + }, + { + "epoch": 0.06, + "global_step": 11950, + "learning_rate": 0.0004509599332220367, + "loss": 1.5755, + "loss_base2": 2.273, + "loss_pixel": 0.1481, + "loss_text": 1.4273, + "ppl": 4.8332, + "step": 11950 + }, + { + "epoch": 0.06, + "global_step": 11951, + "learning_rate": 0.0004509557595993322, + "loss": 1.5759, + "loss_base2": 2.2735, + "loss_pixel": 0.1467, + "loss_text": 1.4291, + "ppl": 4.8351, + "step": 11951 + }, + { + "epoch": 0.06, + "global_step": 11952, + "learning_rate": 0.00045095158597662773, + "loss": 1.5872, + "loss_base2": 2.2898, + "loss_pixel": 0.1468, + "loss_text": 1.4405, + "ppl": 4.89, + "step": 11952 + }, + { + "epoch": 0.06, + "global_step": 11953, + "learning_rate": 0.00045094741235392324, + "loss": 1.6038, + "loss_base2": 2.3138, + "loss_pixel": 0.1511, + "loss_text": 1.4527, + "ppl": 4.9719, + "step": 11953 + }, + { + "epoch": 0.06, + "global_step": 11954, + "learning_rate": 0.00045094323873121875, + "loss": 1.6054, + "loss_base2": 2.3161, + "loss_pixel": 0.1497, + "loss_text": 1.4557, + "ppl": 4.9799, + "step": 11954 + }, + { + "epoch": 0.06, + "global_step": 11955, + "learning_rate": 0.0004509390651085142, + "loss": 1.5994, + "loss_base2": 2.3074, + "loss_pixel": 0.1472, + "loss_text": 1.4522, + "ppl": 4.9501, + "step": 11955 + }, + { + "epoch": 0.06, + "global_step": 11956, + "learning_rate": 0.0004509348914858097, + "loss": 1.5898, + "loss_base2": 2.2936, + "loss_pixel": 0.1459, + "loss_text": 1.4438, + "ppl": 4.9028, + "step": 11956 + }, + { + "epoch": 0.06, + "global_step": 11957, + "learning_rate": 0.00045093071786310516, + "loss": 1.6036, + "loss_base2": 2.3135, + "loss_pixel": 0.1485, + "loss_text": 1.4551, + "ppl": 4.9709, + "step": 11957 + }, + { + "epoch": 0.06, + "global_step": 11958, + "learning_rate": 0.00045092654424040067, + "loss": 1.5615, + "loss_base2": 2.2528, + "loss_pixel": 0.1454, + "loss_text": 1.4161, + "ppl": 4.766, + "step": 11958 + }, + { + "epoch": 0.06, + "global_step": 11959, + "learning_rate": 0.0004509223706176961, + "loss": 1.3839, + "loss_base2": 1.9965, + "loss_pixel": 0.1479, + "loss_text": 1.2359, + "ppl": 3.9904, + "step": 11959 + }, + { + "epoch": 0.06, + "global_step": 11960, + "learning_rate": 0.00045091819699499163, + "loss": 1.3919, + "loss_base2": 2.0081, + "loss_pixel": 0.1467, + "loss_text": 1.2452, + "ppl": 4.0225, + "step": 11960 + }, + { + "epoch": 0.06, + "global_step": 11961, + "learning_rate": 0.00045091402337228714, + "loss": 1.368, + "loss_base2": 1.9736, + "loss_pixel": 0.1484, + "loss_text": 1.2196, + "ppl": 3.9275, + "step": 11961 + }, + { + "epoch": 0.06, + "global_step": 11962, + "learning_rate": 0.00045090984974958264, + "loss": 1.3727, + "loss_base2": 1.9804, + "loss_pixel": 0.1475, + "loss_text": 1.2252, + "ppl": 3.946, + "step": 11962 + }, + { + "epoch": 0.06, + "global_step": 11963, + "learning_rate": 0.00045090567612687815, + "loss": 1.3708, + "loss_base2": 1.9776, + "loss_pixel": 0.1449, + "loss_text": 1.2259, + "ppl": 3.9385, + "step": 11963 + }, + { + "epoch": 0.06, + "global_step": 11964, + "learning_rate": 0.0004509015025041736, + "loss": 1.3627, + "loss_base2": 1.966, + "loss_pixel": 0.1439, + "loss_text": 1.2188, + "ppl": 3.9067, + "step": 11964 + }, + { + "epoch": 0.06, + "global_step": 11965, + "learning_rate": 0.0004508973288814691, + "loss": 1.3657, + "loss_base2": 1.9703, + "loss_pixel": 0.1532, + "loss_text": 1.2125, + "ppl": 3.9185, + "step": 11965 + }, + { + "epoch": 0.06, + "global_step": 11966, + "learning_rate": 0.0004508931552587646, + "loss": 1.4137, + "loss_base2": 2.0395, + "loss_pixel": 0.1606, + "loss_text": 1.253, + "ppl": 4.1111, + "step": 11966 + }, + { + "epoch": 0.06, + "global_step": 11967, + "learning_rate": 0.00045088898163606013, + "loss": 1.5648, + "loss_base2": 2.2575, + "loss_pixel": 0.1608, + "loss_text": 1.404, + "ppl": 4.7817, + "step": 11967 + }, + { + "epoch": 0.06, + "global_step": 11968, + "learning_rate": 0.00045088480801335563, + "loss": 1.6066, + "loss_base2": 2.3178, + "loss_pixel": 0.1612, + "loss_text": 1.4454, + "ppl": 4.9858, + "step": 11968 + }, + { + "epoch": 0.06, + "global_step": 11969, + "learning_rate": 0.0004508806343906511, + "loss": 1.6261, + "loss_base2": 2.346, + "loss_pixel": 0.1602, + "loss_text": 1.4659, + "ppl": 5.084, + "step": 11969 + }, + { + "epoch": 0.06, + "global_step": 11970, + "learning_rate": 0.0004508764607679466, + "loss": 1.6187, + "loss_base2": 2.3353, + "loss_pixel": 0.161, + "loss_text": 1.4577, + "ppl": 5.0465, + "step": 11970 + }, + { + "epoch": 0.06, + "global_step": 11971, + "learning_rate": 0.0004508722871452421, + "loss": 1.5939, + "loss_base2": 2.2995, + "loss_pixel": 0.1605, + "loss_text": 1.4333, + "ppl": 4.9229, + "step": 11971 + }, + { + "epoch": 0.06, + "global_step": 11972, + "learning_rate": 0.0004508681135225376, + "loss": 1.6193, + "loss_base2": 2.3362, + "loss_pixel": 0.1589, + "loss_text": 1.4604, + "ppl": 5.0496, + "step": 11972 + }, + { + "epoch": 0.06, + "global_step": 11973, + "learning_rate": 0.00045086393989983306, + "loss": 1.6163, + "loss_base2": 2.3318, + "loss_pixel": 0.1594, + "loss_text": 1.4569, + "ppl": 5.0344, + "step": 11973 + }, + { + "epoch": 0.06, + "global_step": 11974, + "learning_rate": 0.00045085976627712857, + "loss": 1.6075, + "loss_base2": 2.3191, + "loss_pixel": 0.1606, + "loss_text": 1.4469, + "ppl": 4.9903, + "step": 11974 + }, + { + "epoch": 0.06, + "global_step": 11975, + "learning_rate": 0.0004508555926544241, + "loss": 1.6098, + "loss_base2": 2.3225, + "loss_pixel": 0.1594, + "loss_text": 1.4504, + "ppl": 5.0018, + "step": 11975 + }, + { + "epoch": 0.06, + "global_step": 11976, + "learning_rate": 0.00045085141903171953, + "loss": 1.6078, + "loss_base2": 2.3196, + "loss_pixel": 0.1598, + "loss_text": 1.448, + "ppl": 4.9918, + "step": 11976 + }, + { + "epoch": 0.06, + "global_step": 11977, + "learning_rate": 0.00045084724540901504, + "loss": 1.603, + "loss_base2": 2.3126, + "loss_pixel": 0.1589, + "loss_text": 1.4441, + "ppl": 4.9679, + "step": 11977 + }, + { + "epoch": 0.06, + "global_step": 11978, + "learning_rate": 0.0004508430717863105, + "loss": 1.6274, + "loss_base2": 2.3478, + "loss_pixel": 0.1607, + "loss_text": 1.4668, + "ppl": 5.0906, + "step": 11978 + }, + { + "epoch": 0.06, + "global_step": 11979, + "learning_rate": 0.000450838898163606, + "loss": 1.6041, + "loss_base2": 2.3142, + "loss_pixel": 0.1596, + "loss_text": 1.4445, + "ppl": 4.9734, + "step": 11979 + }, + { + "epoch": 0.06, + "global_step": 11980, + "learning_rate": 0.0004508347245409015, + "loss": 1.6065, + "loss_base2": 2.3177, + "loss_pixel": 0.1585, + "loss_text": 1.4479, + "ppl": 4.9853, + "step": 11980 + }, + { + "epoch": 0.06, + "global_step": 11981, + "learning_rate": 0.000450830550918197, + "loss": 1.6039, + "loss_base2": 2.3139, + "loss_pixel": 0.1584, + "loss_text": 1.4455, + "ppl": 4.9724, + "step": 11981 + }, + { + "epoch": 0.06, + "global_step": 11982, + "learning_rate": 0.00045082637729549247, + "loss": 1.6008, + "loss_base2": 2.3095, + "loss_pixel": 0.1595, + "loss_text": 1.4412, + "ppl": 4.957, + "step": 11982 + }, + { + "epoch": 0.06, + "global_step": 11983, + "learning_rate": 0.000450822203672788, + "loss": 1.6194, + "loss_base2": 2.3363, + "loss_pixel": 0.1594, + "loss_text": 1.4601, + "ppl": 5.0501, + "step": 11983 + }, + { + "epoch": 0.06, + "global_step": 11984, + "learning_rate": 0.0004508180300500835, + "loss": 1.5974, + "loss_base2": 2.3046, + "loss_pixel": 0.1579, + "loss_text": 1.4396, + "ppl": 4.9402, + "step": 11984 + }, + { + "epoch": 0.06, + "global_step": 11985, + "learning_rate": 0.000450813856427379, + "loss": 1.6114, + "loss_base2": 2.3248, + "loss_pixel": 0.1592, + "loss_text": 1.4523, + "ppl": 5.0098, + "step": 11985 + }, + { + "epoch": 0.06, + "global_step": 11986, + "learning_rate": 0.0004508096828046745, + "loss": 1.6046, + "loss_base2": 2.3149, + "loss_pixel": 0.1584, + "loss_text": 1.4462, + "ppl": 4.9759, + "step": 11986 + }, + { + "epoch": 0.06, + "global_step": 11987, + "learning_rate": 0.00045080550918196995, + "loss": 1.5959, + "loss_base2": 2.3024, + "loss_pixel": 0.1593, + "loss_text": 1.4366, + "ppl": 4.9328, + "step": 11987 + }, + { + "epoch": 0.06, + "global_step": 11988, + "learning_rate": 0.00045080133555926546, + "loss": 1.601, + "loss_base2": 2.3098, + "loss_pixel": 0.1613, + "loss_text": 1.4397, + "ppl": 4.958, + "step": 11988 + }, + { + "epoch": 0.06, + "global_step": 11989, + "learning_rate": 0.00045079716193656096, + "loss": 1.6119, + "loss_base2": 2.3255, + "loss_pixel": 0.1594, + "loss_text": 1.4525, + "ppl": 5.0123, + "step": 11989 + }, + { + "epoch": 0.06, + "global_step": 11990, + "learning_rate": 0.00045079298831385647, + "loss": 1.6106, + "loss_base2": 2.3236, + "loss_pixel": 0.158, + "loss_text": 1.4526, + "ppl": 5.0058, + "step": 11990 + }, + { + "epoch": 0.06, + "global_step": 11991, + "learning_rate": 0.0004507888146911519, + "loss": 1.6003, + "loss_base2": 2.3087, + "loss_pixel": 0.158, + "loss_text": 1.4423, + "ppl": 4.9545, + "step": 11991 + }, + { + "epoch": 0.06, + "global_step": 11992, + "learning_rate": 0.00045078464106844743, + "loss": 1.6008, + "loss_base2": 2.3095, + "loss_pixel": 0.1583, + "loss_text": 1.4425, + "ppl": 4.957, + "step": 11992 + }, + { + "epoch": 0.06, + "global_step": 11993, + "learning_rate": 0.00045078046744574294, + "loss": 1.6057, + "loss_base2": 2.3165, + "loss_pixel": 0.1596, + "loss_text": 1.4461, + "ppl": 4.9813, + "step": 11993 + }, + { + "epoch": 0.06, + "global_step": 11994, + "learning_rate": 0.00045077629382303845, + "loss": 1.6177, + "loss_base2": 2.3338, + "loss_pixel": 0.1589, + "loss_text": 1.4589, + "ppl": 5.0415, + "step": 11994 + }, + { + "epoch": 0.06, + "global_step": 11995, + "learning_rate": 0.0004507721202003339, + "loss": 1.609, + "loss_base2": 2.3213, + "loss_pixel": 0.1583, + "loss_text": 1.4506, + "ppl": 4.9978, + "step": 11995 + }, + { + "epoch": 0.06, + "global_step": 11996, + "learning_rate": 0.00045076794657762935, + "loss": 1.6112, + "loss_base2": 2.3245, + "loss_pixel": 0.1594, + "loss_text": 1.4518, + "ppl": 5.0088, + "step": 11996 + }, + { + "epoch": 0.06, + "global_step": 11997, + "learning_rate": 0.00045076377295492486, + "loss": 1.6016, + "loss_base2": 2.3106, + "loss_pixel": 0.1582, + "loss_text": 1.4434, + "ppl": 4.961, + "step": 11997 + }, + { + "epoch": 0.06, + "global_step": 11998, + "learning_rate": 0.00045075959933222037, + "loss": 1.5946, + "loss_base2": 2.3005, + "loss_pixel": 0.1584, + "loss_text": 1.4362, + "ppl": 4.9264, + "step": 11998 + }, + { + "epoch": 0.06, + "global_step": 11999, + "learning_rate": 0.0004507554257095159, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.1596, + "loss_text": 1.4499, + "ppl": 5.0003, + "step": 11999 + }, + { + "epoch": 0.06, + "global_step": 12000, + "learning_rate": 0.0004507512520868113, + "loss": 1.6029, + "loss_base2": 2.3125, + "loss_pixel": 0.1579, + "loss_text": 1.4451, + "ppl": 4.9674, + "step": 12000 + }, + { + "epoch": 0.06, + "global_step": 12001, + "learning_rate": 0.00045074707846410683, + "loss": 1.6158, + "loss_base2": 2.3311, + "loss_pixel": 0.158, + "loss_text": 1.4578, + "ppl": 5.0319, + "step": 12001 + }, + { + "epoch": 0.06, + "global_step": 12002, + "learning_rate": 0.00045074290484140234, + "loss": 1.6038, + "loss_base2": 2.3138, + "loss_pixel": 0.1584, + "loss_text": 1.4454, + "ppl": 4.9719, + "step": 12002 + }, + { + "epoch": 0.06, + "global_step": 12003, + "learning_rate": 0.00045073873121869785, + "loss": 1.6, + "loss_base2": 2.3083, + "loss_pixel": 0.1594, + "loss_text": 1.4407, + "ppl": 4.953, + "step": 12003 + }, + { + "epoch": 0.06, + "global_step": 12004, + "learning_rate": 0.00045073455759599336, + "loss": 1.6084, + "loss_base2": 2.3204, + "loss_pixel": 0.1582, + "loss_text": 1.4502, + "ppl": 4.9948, + "step": 12004 + }, + { + "epoch": 0.06, + "global_step": 12005, + "learning_rate": 0.0004507303839732888, + "loss": 1.5944, + "loss_base2": 2.3002, + "loss_pixel": 0.1572, + "loss_text": 1.4372, + "ppl": 4.9254, + "step": 12005 + }, + { + "epoch": 0.06, + "global_step": 12006, + "learning_rate": 0.0004507262103505843, + "loss": 1.5802, + "loss_base2": 2.2797, + "loss_pixel": 0.1574, + "loss_text": 1.4228, + "ppl": 4.8559, + "step": 12006 + }, + { + "epoch": 0.06, + "global_step": 12007, + "learning_rate": 0.0004507220367278798, + "loss": 1.6036, + "loss_base2": 2.3135, + "loss_pixel": 0.1597, + "loss_text": 1.444, + "ppl": 4.9709, + "step": 12007 + }, + { + "epoch": 0.06, + "global_step": 12008, + "learning_rate": 0.00045071786310517533, + "loss": 1.6085, + "loss_base2": 2.3206, + "loss_pixel": 0.1594, + "loss_text": 1.4491, + "ppl": 4.9953, + "step": 12008 + }, + { + "epoch": 0.06, + "global_step": 12009, + "learning_rate": 0.0004507136894824708, + "loss": 1.5945, + "loss_base2": 2.3004, + "loss_pixel": 0.159, + "loss_text": 1.4356, + "ppl": 4.9259, + "step": 12009 + }, + { + "epoch": 0.06, + "global_step": 12010, + "learning_rate": 0.0004507095158597663, + "loss": 1.606, + "loss_base2": 2.317, + "loss_pixel": 0.1583, + "loss_text": 1.4477, + "ppl": 4.9828, + "step": 12010 + }, + { + "epoch": 0.06, + "global_step": 12011, + "learning_rate": 0.0004507053422370618, + "loss": 1.4536, + "loss_base2": 2.0971, + "loss_pixel": 0.1589, + "loss_text": 1.2947, + "ppl": 4.2785, + "step": 12011 + }, + { + "epoch": 0.06, + "global_step": 12012, + "learning_rate": 0.0004507011686143573, + "loss": 1.3762, + "loss_base2": 1.9854, + "loss_pixel": 0.1568, + "loss_text": 1.2193, + "ppl": 3.9598, + "step": 12012 + }, + { + "epoch": 0.06, + "global_step": 12013, + "learning_rate": 0.0004506969949916528, + "loss": 1.4089, + "loss_base2": 2.0326, + "loss_pixel": 0.1589, + "loss_text": 1.25, + "ppl": 4.0915, + "step": 12013 + }, + { + "epoch": 0.06, + "global_step": 12014, + "learning_rate": 0.0004506928213689482, + "loss": 1.3778, + "loss_base2": 1.9877, + "loss_pixel": 0.1587, + "loss_text": 1.2191, + "ppl": 3.9662, + "step": 12014 + }, + { + "epoch": 0.06, + "global_step": 12015, + "learning_rate": 0.0004506886477462437, + "loss": 1.3748, + "loss_base2": 1.9834, + "loss_pixel": 0.158, + "loss_text": 1.2168, + "ppl": 3.9543, + "step": 12015 + }, + { + "epoch": 0.06, + "global_step": 12016, + "learning_rate": 0.0004506844741235392, + "loss": 1.3857, + "loss_base2": 1.9991, + "loss_pixel": 0.1579, + "loss_text": 1.2278, + "ppl": 3.9976, + "step": 12016 + }, + { + "epoch": 0.06, + "global_step": 12017, + "learning_rate": 0.00045068030050083473, + "loss": 1.3653, + "loss_base2": 1.9697, + "loss_pixel": 0.1592, + "loss_text": 1.2062, + "ppl": 3.9169, + "step": 12017 + }, + { + "epoch": 0.06, + "global_step": 12018, + "learning_rate": 0.0004506761268781302, + "loss": 1.3815, + "loss_base2": 1.9931, + "loss_pixel": 0.1594, + "loss_text": 1.2221, + "ppl": 3.9809, + "step": 12018 + }, + { + "epoch": 0.06, + "global_step": 12019, + "learning_rate": 0.0004506719532554257, + "loss": 1.424, + "loss_base2": 2.0544, + "loss_pixel": 0.1613, + "loss_text": 1.2627, + "ppl": 4.1537, + "step": 12019 + }, + { + "epoch": 0.06, + "global_step": 12020, + "learning_rate": 0.0004506677796327212, + "loss": 1.6218, + "loss_base2": 2.3398, + "loss_pixel": 0.1591, + "loss_text": 1.4628, + "ppl": 5.0622, + "step": 12020 + }, + { + "epoch": 0.06, + "global_step": 12021, + "learning_rate": 0.0004506636060100167, + "loss": 1.6218, + "loss_base2": 2.3398, + "loss_pixel": 0.1588, + "loss_text": 1.463, + "ppl": 5.0622, + "step": 12021 + }, + { + "epoch": 0.06, + "global_step": 12022, + "learning_rate": 0.0004506594323873122, + "loss": 1.6347, + "loss_base2": 2.3584, + "loss_pixel": 0.1592, + "loss_text": 1.4755, + "ppl": 5.1279, + "step": 12022 + }, + { + "epoch": 0.06, + "global_step": 12023, + "learning_rate": 0.00045065525876460767, + "loss": 1.6161, + "loss_base2": 2.3315, + "loss_pixel": 0.1581, + "loss_text": 1.4579, + "ppl": 5.0334, + "step": 12023 + }, + { + "epoch": 0.06, + "global_step": 12024, + "learning_rate": 0.0004506510851419032, + "loss": 1.6225, + "loss_base2": 2.3408, + "loss_pixel": 0.1594, + "loss_text": 1.4631, + "ppl": 5.0657, + "step": 12024 + }, + { + "epoch": 0.06, + "global_step": 12025, + "learning_rate": 0.0004506469115191987, + "loss": 1.5957, + "loss_base2": 2.3021, + "loss_pixel": 0.1581, + "loss_text": 1.4376, + "ppl": 4.9318, + "step": 12025 + }, + { + "epoch": 0.06, + "global_step": 12026, + "learning_rate": 0.0004506427378964942, + "loss": 1.604, + "loss_base2": 2.3141, + "loss_pixel": 0.1591, + "loss_text": 1.4449, + "ppl": 4.9729, + "step": 12026 + }, + { + "epoch": 0.06, + "global_step": 12027, + "learning_rate": 0.0004506385642737897, + "loss": 1.6115, + "loss_base2": 2.3249, + "loss_pixel": 0.1587, + "loss_text": 1.4528, + "ppl": 5.0103, + "step": 12027 + }, + { + "epoch": 0.06, + "global_step": 12028, + "learning_rate": 0.00045063439065108515, + "loss": 1.6253, + "loss_base2": 2.3448, + "loss_pixel": 0.1601, + "loss_text": 1.4652, + "ppl": 5.0799, + "step": 12028 + }, + { + "epoch": 0.06, + "global_step": 12029, + "learning_rate": 0.00045063021702838066, + "loss": 1.6041, + "loss_base2": 2.3142, + "loss_pixel": 0.1591, + "loss_text": 1.445, + "ppl": 4.9734, + "step": 12029 + }, + { + "epoch": 0.06, + "global_step": 12030, + "learning_rate": 0.00045062604340567617, + "loss": 1.613, + "loss_base2": 2.3271, + "loss_pixel": 0.1587, + "loss_text": 1.4543, + "ppl": 5.0178, + "step": 12030 + }, + { + "epoch": 0.06, + "global_step": 12031, + "learning_rate": 0.0004506218697829717, + "loss": 1.6125, + "loss_base2": 2.3263, + "loss_pixel": 0.1587, + "loss_text": 1.4538, + "ppl": 5.0153, + "step": 12031 + }, + { + "epoch": 0.06, + "global_step": 12032, + "learning_rate": 0.0004506176961602671, + "loss": 1.6012, + "loss_base2": 2.31, + "loss_pixel": 0.1607, + "loss_text": 1.4406, + "ppl": 4.959, + "step": 12032 + }, + { + "epoch": 0.06, + "global_step": 12033, + "learning_rate": 0.0004506135225375626, + "loss": 1.6188, + "loss_base2": 2.3354, + "loss_pixel": 0.1592, + "loss_text": 1.4596, + "ppl": 5.047, + "step": 12033 + }, + { + "epoch": 0.06, + "global_step": 12034, + "learning_rate": 0.0004506093489148581, + "loss": 1.6063, + "loss_base2": 2.3174, + "loss_pixel": 0.1535, + "loss_text": 1.4529, + "ppl": 4.9843, + "step": 12034 + }, + { + "epoch": 0.06, + "global_step": 12035, + "learning_rate": 0.0004506051752921536, + "loss": 1.5904, + "loss_base2": 2.2945, + "loss_pixel": 0.1508, + "loss_text": 1.4397, + "ppl": 4.9057, + "step": 12035 + }, + { + "epoch": 0.06, + "global_step": 12036, + "learning_rate": 0.0004506010016694491, + "loss": 1.5967, + "loss_base2": 2.3036, + "loss_pixel": 0.1494, + "loss_text": 1.4472, + "ppl": 4.9367, + "step": 12036 + }, + { + "epoch": 0.06, + "global_step": 12037, + "learning_rate": 0.00045059682804674456, + "loss": 1.5964, + "loss_base2": 2.3031, + "loss_pixel": 0.151, + "loss_text": 1.4453, + "ppl": 4.9352, + "step": 12037 + }, + { + "epoch": 0.06, + "global_step": 12038, + "learning_rate": 0.00045059265442404006, + "loss": 1.5803, + "loss_base2": 2.2799, + "loss_pixel": 0.1476, + "loss_text": 1.4327, + "ppl": 4.8564, + "step": 12038 + }, + { + "epoch": 0.06, + "global_step": 12039, + "learning_rate": 0.00045058848080133557, + "loss": 1.5946, + "loss_base2": 2.3005, + "loss_pixel": 0.1491, + "loss_text": 1.4454, + "ppl": 4.9264, + "step": 12039 + }, + { + "epoch": 0.06, + "global_step": 12040, + "learning_rate": 0.0004505843071786311, + "loss": 1.5768, + "loss_base2": 2.2748, + "loss_pixel": 0.1467, + "loss_text": 1.4301, + "ppl": 4.8394, + "step": 12040 + }, + { + "epoch": 0.06, + "global_step": 12041, + "learning_rate": 0.00045058013355592653, + "loss": 1.6118, + "loss_base2": 2.3253, + "loss_pixel": 0.147, + "loss_text": 1.4648, + "ppl": 5.0118, + "step": 12041 + }, + { + "epoch": 0.06, + "global_step": 12042, + "learning_rate": 0.00045057595993322204, + "loss": 1.584, + "loss_base2": 2.2852, + "loss_pixel": 0.1502, + "loss_text": 1.4339, + "ppl": 4.8744, + "step": 12042 + }, + { + "epoch": 0.06, + "global_step": 12043, + "learning_rate": 0.00045057178631051755, + "loss": 1.585, + "loss_base2": 2.2867, + "loss_pixel": 0.1495, + "loss_text": 1.4355, + "ppl": 4.8793, + "step": 12043 + }, + { + "epoch": 0.06, + "global_step": 12044, + "learning_rate": 0.00045056761268781305, + "loss": 1.6005, + "loss_base2": 2.309, + "loss_pixel": 0.1483, + "loss_text": 1.4523, + "ppl": 4.9555, + "step": 12044 + }, + { + "epoch": 0.06, + "global_step": 12045, + "learning_rate": 0.00045056343906510856, + "loss": 1.5896, + "loss_base2": 2.2933, + "loss_pixel": 0.1474, + "loss_text": 1.4422, + "ppl": 4.9018, + "step": 12045 + }, + { + "epoch": 0.06, + "global_step": 12046, + "learning_rate": 0.000450559265442404, + "loss": 1.6039, + "loss_base2": 2.3139, + "loss_pixel": 0.1446, + "loss_text": 1.4593, + "ppl": 4.9724, + "step": 12046 + }, + { + "epoch": 0.06, + "global_step": 12047, + "learning_rate": 0.0004505550918196995, + "loss": 1.5884, + "loss_base2": 2.2916, + "loss_pixel": 0.1456, + "loss_text": 1.4429, + "ppl": 4.8959, + "step": 12047 + }, + { + "epoch": 0.06, + "global_step": 12048, + "learning_rate": 0.00045055091819699503, + "loss": 1.5765, + "loss_base2": 2.2744, + "loss_pixel": 0.1464, + "loss_text": 1.4301, + "ppl": 4.838, + "step": 12048 + }, + { + "epoch": 0.06, + "global_step": 12049, + "learning_rate": 0.00045054674457429053, + "loss": 1.5896, + "loss_base2": 2.2933, + "loss_pixel": 0.148, + "loss_text": 1.4415, + "ppl": 4.9018, + "step": 12049 + }, + { + "epoch": 0.06, + "global_step": 12050, + "learning_rate": 0.000450542570951586, + "loss": 1.5581, + "loss_base2": 2.2479, + "loss_pixel": 0.1473, + "loss_text": 1.4107, + "ppl": 4.7498, + "step": 12050 + }, + { + "epoch": 0.06, + "global_step": 12051, + "learning_rate": 0.00045053839732888144, + "loss": 1.5882, + "loss_base2": 2.2913, + "loss_pixel": 0.1453, + "loss_text": 1.4429, + "ppl": 4.8949, + "step": 12051 + }, + { + "epoch": 0.06, + "global_step": 12052, + "learning_rate": 0.00045053422370617695, + "loss": 1.5975, + "loss_base2": 2.3047, + "loss_pixel": 0.1494, + "loss_text": 1.4481, + "ppl": 4.9407, + "step": 12052 + }, + { + "epoch": 0.06, + "global_step": 12053, + "learning_rate": 0.00045053005008347246, + "loss": 1.6073, + "loss_base2": 2.3188, + "loss_pixel": 0.1467, + "loss_text": 1.4606, + "ppl": 4.9893, + "step": 12053 + }, + { + "epoch": 0.06, + "global_step": 12054, + "learning_rate": 0.00045052587646076796, + "loss": 1.5955, + "loss_base2": 2.3018, + "loss_pixel": 0.1473, + "loss_text": 1.4482, + "ppl": 4.9308, + "step": 12054 + }, + { + "epoch": 0.06, + "global_step": 12055, + "learning_rate": 0.0004505217028380634, + "loss": 1.5843, + "loss_base2": 2.2857, + "loss_pixel": 0.146, + "loss_text": 1.4383, + "ppl": 4.8759, + "step": 12055 + }, + { + "epoch": 0.06, + "global_step": 12056, + "learning_rate": 0.0004505175292153589, + "loss": 1.5887, + "loss_base2": 2.292, + "loss_pixel": 0.1459, + "loss_text": 1.4428, + "ppl": 4.8974, + "step": 12056 + }, + { + "epoch": 0.06, + "global_step": 12057, + "learning_rate": 0.00045051335559265443, + "loss": 1.5919, + "loss_base2": 2.2966, + "loss_pixel": 0.1474, + "loss_text": 1.4446, + "ppl": 4.9131, + "step": 12057 + }, + { + "epoch": 0.06, + "global_step": 12058, + "learning_rate": 0.00045050918196994994, + "loss": 1.5998, + "loss_base2": 2.308, + "loss_pixel": 0.1463, + "loss_text": 1.4535, + "ppl": 4.952, + "step": 12058 + }, + { + "epoch": 0.06, + "global_step": 12059, + "learning_rate": 0.0004505050083472454, + "loss": 1.584, + "loss_base2": 2.2852, + "loss_pixel": 0.1486, + "loss_text": 1.4354, + "ppl": 4.8744, + "step": 12059 + }, + { + "epoch": 0.06, + "global_step": 12060, + "learning_rate": 0.0004505008347245409, + "loss": 1.5904, + "loss_base2": 2.2945, + "loss_pixel": 0.147, + "loss_text": 1.4434, + "ppl": 4.9057, + "step": 12060 + }, + { + "epoch": 0.06, + "global_step": 12061, + "learning_rate": 0.0004504966611018364, + "loss": 1.5872, + "loss_base2": 2.2898, + "loss_pixel": 0.1457, + "loss_text": 1.4415, + "ppl": 4.89, + "step": 12061 + }, + { + "epoch": 0.06, + "global_step": 12062, + "learning_rate": 0.0004504924874791319, + "loss": 1.5912, + "loss_base2": 2.2956, + "loss_pixel": 0.1466, + "loss_text": 1.4446, + "ppl": 4.9096, + "step": 12062 + }, + { + "epoch": 0.06, + "global_step": 12063, + "learning_rate": 0.0004504883138564274, + "loss": 1.572, + "loss_base2": 2.2679, + "loss_pixel": 0.1448, + "loss_text": 1.4273, + "ppl": 4.8163, + "step": 12063 + }, + { + "epoch": 0.06, + "global_step": 12064, + "learning_rate": 0.0004504841402337229, + "loss": 1.5811, + "loss_base2": 2.281, + "loss_pixel": 0.1443, + "loss_text": 1.4368, + "ppl": 4.8603, + "step": 12064 + }, + { + "epoch": 0.06, + "global_step": 12065, + "learning_rate": 0.0004504799666110184, + "loss": 1.6094, + "loss_base2": 2.3219, + "loss_pixel": 0.1465, + "loss_text": 1.4629, + "ppl": 4.9998, + "step": 12065 + }, + { + "epoch": 0.06, + "global_step": 12066, + "learning_rate": 0.0004504757929883139, + "loss": 1.5926, + "loss_base2": 2.2976, + "loss_pixel": 0.1469, + "loss_text": 1.4457, + "ppl": 4.9165, + "step": 12066 + }, + { + "epoch": 0.06, + "global_step": 12067, + "learning_rate": 0.0004504716193656094, + "loss": 1.5732, + "loss_base2": 2.2696, + "loss_pixel": 0.1482, + "loss_text": 1.4249, + "ppl": 4.8221, + "step": 12067 + }, + { + "epoch": 0.06, + "global_step": 12068, + "learning_rate": 0.00045046744574290485, + "loss": 1.5925, + "loss_base2": 2.2975, + "loss_pixel": 0.1465, + "loss_text": 1.446, + "ppl": 4.916, + "step": 12068 + }, + { + "epoch": 0.06, + "global_step": 12069, + "learning_rate": 0.00045046327212020036, + "loss": 1.576, + "loss_base2": 2.2737, + "loss_pixel": 0.1444, + "loss_text": 1.4316, + "ppl": 4.8356, + "step": 12069 + }, + { + "epoch": 0.06, + "global_step": 12070, + "learning_rate": 0.0004504590984974958, + "loss": 1.5859, + "loss_base2": 2.288, + "loss_pixel": 0.1476, + "loss_text": 1.4383, + "ppl": 4.8837, + "step": 12070 + }, + { + "epoch": 0.06, + "global_step": 12071, + "learning_rate": 0.0004504549248747913, + "loss": 1.5979, + "loss_base2": 2.3053, + "loss_pixel": 0.1606, + "loss_text": 1.4373, + "ppl": 4.9426, + "step": 12071 + }, + { + "epoch": 0.06, + "global_step": 12072, + "learning_rate": 0.0004504507512520868, + "loss": 1.6055, + "loss_base2": 2.3162, + "loss_pixel": 0.1593, + "loss_text": 1.4463, + "ppl": 4.9803, + "step": 12072 + }, + { + "epoch": 0.06, + "global_step": 12073, + "learning_rate": 0.0004504465776293823, + "loss": 1.6168, + "loss_base2": 2.3325, + "loss_pixel": 0.1596, + "loss_text": 1.4573, + "ppl": 5.0369, + "step": 12073 + }, + { + "epoch": 0.06, + "global_step": 12074, + "learning_rate": 0.0004504424040066778, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1598, + "loss_text": 1.4571, + "ppl": 5.0374, + "step": 12074 + }, + { + "epoch": 0.06, + "global_step": 12075, + "learning_rate": 0.0004504382303839733, + "loss": 1.6096, + "loss_base2": 2.3222, + "loss_pixel": 0.1588, + "loss_text": 1.4508, + "ppl": 5.0008, + "step": 12075 + }, + { + "epoch": 0.06, + "global_step": 12076, + "learning_rate": 0.0004504340567612688, + "loss": 1.5964, + "loss_base2": 2.3031, + "loss_pixel": 0.1581, + "loss_text": 1.4382, + "ppl": 4.9352, + "step": 12076 + }, + { + "epoch": 0.06, + "global_step": 12077, + "learning_rate": 0.00045042988313856425, + "loss": 1.6149, + "loss_base2": 2.3298, + "loss_pixel": 0.1598, + "loss_text": 1.4551, + "ppl": 5.0274, + "step": 12077 + }, + { + "epoch": 0.06, + "global_step": 12078, + "learning_rate": 0.00045042570951585976, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1587, + "loss_text": 1.4437, + "ppl": 4.9649, + "step": 12078 + }, + { + "epoch": 0.06, + "global_step": 12079, + "learning_rate": 0.00045042153589315527, + "loss": 1.5896, + "loss_base2": 2.2933, + "loss_pixel": 0.1589, + "loss_text": 1.4307, + "ppl": 4.9018, + "step": 12079 + }, + { + "epoch": 0.06, + "global_step": 12080, + "learning_rate": 0.0004504173622704508, + "loss": 1.5862, + "loss_base2": 2.2884, + "loss_pixel": 0.1585, + "loss_text": 1.4277, + "ppl": 4.8852, + "step": 12080 + }, + { + "epoch": 0.06, + "global_step": 12081, + "learning_rate": 0.0004504131886477463, + "loss": 1.6071, + "loss_base2": 2.3186, + "loss_pixel": 0.1583, + "loss_text": 1.4488, + "ppl": 4.9883, + "step": 12081 + }, + { + "epoch": 0.06, + "global_step": 12082, + "learning_rate": 0.00045040901502504173, + "loss": 1.6074, + "loss_base2": 2.319, + "loss_pixel": 0.1594, + "loss_text": 1.448, + "ppl": 4.9898, + "step": 12082 + }, + { + "epoch": 0.06, + "global_step": 12083, + "learning_rate": 0.00045040484140233724, + "loss": 1.6071, + "loss_base2": 2.3186, + "loss_pixel": 0.1576, + "loss_text": 1.4494, + "ppl": 4.9883, + "step": 12083 + }, + { + "epoch": 0.06, + "global_step": 12084, + "learning_rate": 0.00045040066777963275, + "loss": 1.5974, + "loss_base2": 2.3046, + "loss_pixel": 0.1578, + "loss_text": 1.4397, + "ppl": 4.9402, + "step": 12084 + }, + { + "epoch": 0.06, + "global_step": 12085, + "learning_rate": 0.00045039649415692826, + "loss": 1.58, + "loss_base2": 2.2795, + "loss_pixel": 0.1589, + "loss_text": 1.4211, + "ppl": 4.855, + "step": 12085 + }, + { + "epoch": 0.06, + "global_step": 12086, + "learning_rate": 0.00045039232053422376, + "loss": 1.6082, + "loss_base2": 2.3201, + "loss_pixel": 0.1588, + "loss_text": 1.4495, + "ppl": 4.9938, + "step": 12086 + }, + { + "epoch": 0.06, + "global_step": 12087, + "learning_rate": 0.0004503881469115192, + "loss": 1.6115, + "loss_base2": 2.3249, + "loss_pixel": 0.1602, + "loss_text": 1.4513, + "ppl": 5.0103, + "step": 12087 + }, + { + "epoch": 0.06, + "global_step": 12088, + "learning_rate": 0.0004503839732888147, + "loss": 1.6052, + "loss_base2": 2.3158, + "loss_pixel": 0.16, + "loss_text": 1.4451, + "ppl": 4.9789, + "step": 12088 + }, + { + "epoch": 0.06, + "global_step": 12089, + "learning_rate": 0.0004503797996661102, + "loss": 1.6089, + "loss_base2": 2.3212, + "loss_pixel": 0.1587, + "loss_text": 1.4502, + "ppl": 4.9973, + "step": 12089 + }, + { + "epoch": 0.06, + "global_step": 12090, + "learning_rate": 0.0004503756260434057, + "loss": 1.6006, + "loss_base2": 2.3092, + "loss_pixel": 0.1587, + "loss_text": 1.4419, + "ppl": 4.956, + "step": 12090 + }, + { + "epoch": 0.06, + "global_step": 12091, + "learning_rate": 0.00045037145242070114, + "loss": 1.4156, + "loss_base2": 2.0423, + "loss_pixel": 0.1592, + "loss_text": 1.2564, + "ppl": 4.119, + "step": 12091 + }, + { + "epoch": 0.06, + "global_step": 12092, + "learning_rate": 0.00045036727879799664, + "loss": 1.3834, + "loss_base2": 1.9958, + "loss_pixel": 0.16, + "loss_text": 1.2234, + "ppl": 3.9884, + "step": 12092 + }, + { + "epoch": 0.06, + "global_step": 12093, + "learning_rate": 0.00045036310517529215, + "loss": 1.3786, + "loss_base2": 1.9889, + "loss_pixel": 0.1577, + "loss_text": 1.2209, + "ppl": 3.9693, + "step": 12093 + }, + { + "epoch": 0.06, + "global_step": 12094, + "learning_rate": 0.00045035893155258766, + "loss": 1.4058, + "loss_base2": 2.0281, + "loss_pixel": 0.1585, + "loss_text": 1.2474, + "ppl": 4.0788, + "step": 12094 + }, + { + "epoch": 0.06, + "global_step": 12095, + "learning_rate": 0.00045035475792988317, + "loss": 1.3878, + "loss_base2": 2.0022, + "loss_pixel": 0.1571, + "loss_text": 1.2307, + "ppl": 4.006, + "step": 12095 + }, + { + "epoch": 0.06, + "global_step": 12096, + "learning_rate": 0.0004503505843071786, + "loss": 1.3805, + "loss_base2": 1.9916, + "loss_pixel": 0.1586, + "loss_text": 1.2219, + "ppl": 3.9769, + "step": 12096 + }, + { + "epoch": 0.06, + "global_step": 12097, + "learning_rate": 0.0004503464106844741, + "loss": 1.3899, + "loss_base2": 2.0052, + "loss_pixel": 0.1596, + "loss_text": 1.2303, + "ppl": 4.0144, + "step": 12097 + }, + { + "epoch": 0.06, + "global_step": 12098, + "learning_rate": 0.00045034223706176963, + "loss": 1.3767, + "loss_base2": 1.9862, + "loss_pixel": 0.1583, + "loss_text": 1.2185, + "ppl": 3.9618, + "step": 12098 + }, + { + "epoch": 0.06, + "global_step": 12099, + "learning_rate": 0.00045033806343906514, + "loss": 1.3817, + "loss_base2": 1.9934, + "loss_pixel": 0.1591, + "loss_text": 1.2226, + "ppl": 3.9817, + "step": 12099 + }, + { + "epoch": 0.06, + "global_step": 12100, + "learning_rate": 0.0004503338898163606, + "loss": 1.3823, + "loss_base2": 1.9942, + "loss_pixel": 0.1594, + "loss_text": 1.2229, + "ppl": 3.9841, + "step": 12100 + }, + { + "epoch": 0.06, + "global_step": 12101, + "learning_rate": 0.0004503297161936561, + "loss": 1.3839, + "loss_base2": 1.9965, + "loss_pixel": 0.1605, + "loss_text": 1.2234, + "ppl": 3.9904, + "step": 12101 + }, + { + "epoch": 0.06, + "global_step": 12102, + "learning_rate": 0.0004503255425709516, + "loss": 1.3883, + "loss_base2": 2.0029, + "loss_pixel": 0.1602, + "loss_text": 1.2281, + "ppl": 4.008, + "step": 12102 + }, + { + "epoch": 0.06, + "global_step": 12103, + "learning_rate": 0.0004503213689482471, + "loss": 1.3756, + "loss_base2": 1.9846, + "loss_pixel": 0.1584, + "loss_text": 1.2172, + "ppl": 3.9575, + "step": 12103 + }, + { + "epoch": 0.06, + "global_step": 12104, + "learning_rate": 0.0004503171953255426, + "loss": 1.3863, + "loss_base2": 2.0, + "loss_pixel": 0.1589, + "loss_text": 1.2274, + "ppl": 4.0, + "step": 12104 + }, + { + "epoch": 0.06, + "global_step": 12105, + "learning_rate": 0.0004503130217028381, + "loss": 1.3844, + "loss_base2": 1.9973, + "loss_pixel": 0.1591, + "loss_text": 1.2253, + "ppl": 3.9924, + "step": 12105 + }, + { + "epoch": 0.06, + "global_step": 12106, + "learning_rate": 0.0004503088480801336, + "loss": 1.3688, + "loss_base2": 1.9748, + "loss_pixel": 0.16, + "loss_text": 1.2088, + "ppl": 3.9306, + "step": 12106 + }, + { + "epoch": 0.06, + "global_step": 12107, + "learning_rate": 0.00045030467445742904, + "loss": 1.4931, + "loss_base2": 2.1541, + "loss_pixel": 0.1587, + "loss_text": 1.3344, + "ppl": 4.4509, + "step": 12107 + }, + { + "epoch": 0.06, + "global_step": 12108, + "learning_rate": 0.00045030050083472454, + "loss": 1.6246, + "loss_base2": 2.3438, + "loss_pixel": 0.1585, + "loss_text": 1.4661, + "ppl": 5.0764, + "step": 12108 + }, + { + "epoch": 0.06, + "global_step": 12109, + "learning_rate": 0.00045029632721202, + "loss": 1.6122, + "loss_base2": 2.3259, + "loss_pixel": 0.1586, + "loss_text": 1.4535, + "ppl": 5.0138, + "step": 12109 + }, + { + "epoch": 0.06, + "global_step": 12110, + "learning_rate": 0.0004502921535893155, + "loss": 1.6096, + "loss_base2": 2.3222, + "loss_pixel": 0.158, + "loss_text": 1.4517, + "ppl": 5.0008, + "step": 12110 + }, + { + "epoch": 0.06, + "global_step": 12111, + "learning_rate": 0.000450287979966611, + "loss": 1.6216, + "loss_base2": 2.3395, + "loss_pixel": 0.1605, + "loss_text": 1.4611, + "ppl": 5.0612, + "step": 12111 + }, + { + "epoch": 0.06, + "global_step": 12112, + "learning_rate": 0.0004502838063439065, + "loss": 1.6019, + "loss_base2": 2.3111, + "loss_pixel": 0.1589, + "loss_text": 1.443, + "ppl": 4.9625, + "step": 12112 + }, + { + "epoch": 0.06, + "global_step": 12113, + "learning_rate": 0.00045027963272120203, + "loss": 1.6257, + "loss_base2": 2.3454, + "loss_pixel": 0.1586, + "loss_text": 1.4671, + "ppl": 5.082, + "step": 12113 + }, + { + "epoch": 0.06, + "global_step": 12114, + "learning_rate": 0.0004502754590984975, + "loss": 1.5889, + "loss_base2": 2.2923, + "loss_pixel": 0.1598, + "loss_text": 1.4291, + "ppl": 4.8984, + "step": 12114 + }, + { + "epoch": 0.06, + "global_step": 12115, + "learning_rate": 0.000450271285475793, + "loss": 1.5818, + "loss_base2": 2.2821, + "loss_pixel": 0.1585, + "loss_text": 1.4233, + "ppl": 4.8637, + "step": 12115 + }, + { + "epoch": 0.06, + "global_step": 12116, + "learning_rate": 0.0004502671118530885, + "loss": 1.6153, + "loss_base2": 2.3304, + "loss_pixel": 0.1587, + "loss_text": 1.4567, + "ppl": 5.0294, + "step": 12116 + }, + { + "epoch": 0.06, + "global_step": 12117, + "learning_rate": 0.000450262938230384, + "loss": 1.606, + "loss_base2": 2.317, + "loss_pixel": 0.1584, + "loss_text": 1.4476, + "ppl": 4.9828, + "step": 12117 + }, + { + "epoch": 0.06, + "global_step": 12118, + "learning_rate": 0.00045025876460767946, + "loss": 1.5963, + "loss_base2": 2.303, + "loss_pixel": 0.1584, + "loss_text": 1.4379, + "ppl": 4.9347, + "step": 12118 + }, + { + "epoch": 0.06, + "global_step": 12119, + "learning_rate": 0.00045025459098497496, + "loss": 1.6102, + "loss_base2": 2.323, + "loss_pixel": 0.1593, + "loss_text": 1.4509, + "ppl": 5.0038, + "step": 12119 + }, + { + "epoch": 0.06, + "global_step": 12120, + "learning_rate": 0.00045025041736227047, + "loss": 1.588, + "loss_base2": 2.291, + "loss_pixel": 0.1579, + "loss_text": 1.4301, + "ppl": 4.894, + "step": 12120 + }, + { + "epoch": 0.06, + "global_step": 12121, + "learning_rate": 0.000450246243739566, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1583, + "loss_text": 1.4441, + "ppl": 4.9649, + "step": 12121 + }, + { + "epoch": 0.06, + "global_step": 12122, + "learning_rate": 0.0004502420701168615, + "loss": 1.5968, + "loss_base2": 2.3037, + "loss_pixel": 0.1576, + "loss_text": 1.4391, + "ppl": 4.9372, + "step": 12122 + }, + { + "epoch": 0.06, + "global_step": 12123, + "learning_rate": 0.00045023789649415694, + "loss": 1.5995, + "loss_base2": 2.3076, + "loss_pixel": 0.1597, + "loss_text": 1.4398, + "ppl": 4.9506, + "step": 12123 + }, + { + "epoch": 0.06, + "global_step": 12124, + "learning_rate": 0.00045023372287145245, + "loss": 1.5957, + "loss_base2": 2.3021, + "loss_pixel": 0.1607, + "loss_text": 1.435, + "ppl": 4.9318, + "step": 12124 + }, + { + "epoch": 0.06, + "global_step": 12125, + "learning_rate": 0.00045022954924874795, + "loss": 1.5932, + "loss_base2": 2.2985, + "loss_pixel": 0.1579, + "loss_text": 1.4353, + "ppl": 4.9195, + "step": 12125 + }, + { + "epoch": 0.06, + "global_step": 12126, + "learning_rate": 0.0004502253756260434, + "loss": 1.5981, + "loss_base2": 2.3056, + "loss_pixel": 0.1575, + "loss_text": 1.4407, + "ppl": 4.9436, + "step": 12126 + }, + { + "epoch": 0.06, + "global_step": 12127, + "learning_rate": 0.00045022120200333886, + "loss": 1.6093, + "loss_base2": 2.3217, + "loss_pixel": 0.1586, + "loss_text": 1.4507, + "ppl": 4.9993, + "step": 12127 + }, + { + "epoch": 0.06, + "global_step": 12128, + "learning_rate": 0.00045021702838063437, + "loss": 1.5687, + "loss_base2": 2.2632, + "loss_pixel": 0.159, + "loss_text": 1.4097, + "ppl": 4.8004, + "step": 12128 + }, + { + "epoch": 0.06, + "global_step": 12129, + "learning_rate": 0.0004502128547579299, + "loss": 1.3971, + "loss_base2": 2.0156, + "loss_pixel": 0.1589, + "loss_text": 1.2382, + "ppl": 4.0435, + "step": 12129 + }, + { + "epoch": 0.06, + "global_step": 12130, + "learning_rate": 0.0004502086811352254, + "loss": 1.4019, + "loss_base2": 2.0225, + "loss_pixel": 0.1577, + "loss_text": 1.2442, + "ppl": 4.0629, + "step": 12130 + }, + { + "epoch": 0.06, + "global_step": 12131, + "learning_rate": 0.0004502045075125209, + "loss": 1.3734, + "loss_base2": 1.9814, + "loss_pixel": 0.1572, + "loss_text": 1.2162, + "ppl": 3.9488, + "step": 12131 + }, + { + "epoch": 0.06, + "global_step": 12132, + "learning_rate": 0.00045020033388981634, + "loss": 1.3901, + "loss_base2": 2.0055, + "loss_pixel": 0.1577, + "loss_text": 1.2325, + "ppl": 4.0153, + "step": 12132 + }, + { + "epoch": 0.06, + "global_step": 12133, + "learning_rate": 0.00045019616026711185, + "loss": 1.3626, + "loss_base2": 1.9658, + "loss_pixel": 0.1581, + "loss_text": 1.2045, + "ppl": 3.9063, + "step": 12133 + }, + { + "epoch": 0.06, + "global_step": 12134, + "learning_rate": 0.00045019198664440736, + "loss": 1.3835, + "loss_base2": 1.996, + "loss_pixel": 0.158, + "loss_text": 1.2255, + "ppl": 3.9888, + "step": 12134 + }, + { + "epoch": 0.06, + "global_step": 12135, + "learning_rate": 0.00045018781302170286, + "loss": 1.3774, + "loss_base2": 1.9872, + "loss_pixel": 0.157, + "loss_text": 1.2204, + "ppl": 3.9646, + "step": 12135 + }, + { + "epoch": 0.06, + "global_step": 12136, + "learning_rate": 0.0004501836393989983, + "loss": 1.3764, + "loss_base2": 1.9857, + "loss_pixel": 0.1589, + "loss_text": 1.2175, + "ppl": 3.9606, + "step": 12136 + }, + { + "epoch": 0.06, + "global_step": 12137, + "learning_rate": 0.0004501794657762938, + "loss": 1.3829, + "loss_base2": 1.9951, + "loss_pixel": 0.1577, + "loss_text": 1.2252, + "ppl": 3.9864, + "step": 12137 + }, + { + "epoch": 0.06, + "global_step": 12138, + "learning_rate": 0.00045017529215358933, + "loss": 1.4047, + "loss_base2": 2.0266, + "loss_pixel": 0.156, + "loss_text": 1.2487, + "ppl": 4.0743, + "step": 12138 + }, + { + "epoch": 0.06, + "global_step": 12139, + "learning_rate": 0.00045017111853088484, + "loss": 1.3653, + "loss_base2": 1.9697, + "loss_pixel": 0.1471, + "loss_text": 1.2182, + "ppl": 3.9169, + "step": 12139 + }, + { + "epoch": 0.06, + "global_step": 12140, + "learning_rate": 0.00045016694490818035, + "loss": 1.3875, + "loss_base2": 2.0017, + "loss_pixel": 0.1499, + "loss_text": 1.2376, + "ppl": 4.0048, + "step": 12140 + }, + { + "epoch": 0.06, + "global_step": 12141, + "learning_rate": 0.0004501627712854758, + "loss": 1.3562, + "loss_base2": 1.9566, + "loss_pixel": 0.1467, + "loss_text": 1.2096, + "ppl": 3.8814, + "step": 12141 + }, + { + "epoch": 0.06, + "global_step": 12142, + "learning_rate": 0.0004501585976627713, + "loss": 1.37, + "loss_base2": 1.9765, + "loss_pixel": 0.1482, + "loss_text": 1.2218, + "ppl": 3.9354, + "step": 12142 + }, + { + "epoch": 0.06, + "global_step": 12143, + "learning_rate": 0.0004501544240400668, + "loss": 1.3658, + "loss_base2": 1.9704, + "loss_pixel": 0.1489, + "loss_text": 1.2169, + "ppl": 3.9189, + "step": 12143 + }, + { + "epoch": 0.06, + "global_step": 12144, + "learning_rate": 0.0004501502504173623, + "loss": 1.3767, + "loss_base2": 1.9862, + "loss_pixel": 0.1481, + "loss_text": 1.2286, + "ppl": 3.9618, + "step": 12144 + }, + { + "epoch": 0.06, + "global_step": 12145, + "learning_rate": 0.0004501460767946578, + "loss": 1.3622, + "loss_base2": 1.9652, + "loss_pixel": 0.1467, + "loss_text": 1.2155, + "ppl": 3.9048, + "step": 12145 + }, + { + "epoch": 0.06, + "global_step": 12146, + "learning_rate": 0.0004501419031719532, + "loss": 1.373, + "loss_base2": 1.9808, + "loss_pixel": 0.147, + "loss_text": 1.226, + "ppl": 3.9472, + "step": 12146 + }, + { + "epoch": 0.06, + "global_step": 12147, + "learning_rate": 0.00045013772954924873, + "loss": 1.3911, + "loss_base2": 2.0069, + "loss_pixel": 0.1492, + "loss_text": 1.2419, + "ppl": 4.0193, + "step": 12147 + }, + { + "epoch": 0.06, + "global_step": 12148, + "learning_rate": 0.00045013355592654424, + "loss": 1.365, + "loss_base2": 1.9693, + "loss_pixel": 0.1449, + "loss_text": 1.2201, + "ppl": 3.9157, + "step": 12148 + }, + { + "epoch": 0.06, + "global_step": 12149, + "learning_rate": 0.00045012938230383975, + "loss": 1.36, + "loss_base2": 1.9621, + "loss_pixel": 0.1488, + "loss_text": 1.2112, + "ppl": 3.8962, + "step": 12149 + }, + { + "epoch": 0.06, + "global_step": 12150, + "learning_rate": 0.0004501252086811352, + "loss": 1.3814, + "loss_base2": 1.9929, + "loss_pixel": 0.1456, + "loss_text": 1.2358, + "ppl": 3.9805, + "step": 12150 + }, + { + "epoch": 0.06, + "global_step": 12151, + "learning_rate": 0.0004501210350584307, + "loss": 1.3671, + "loss_base2": 1.9723, + "loss_pixel": 0.1455, + "loss_text": 1.2216, + "ppl": 3.924, + "step": 12151 + }, + { + "epoch": 0.06, + "global_step": 12152, + "learning_rate": 0.0004501168614357262, + "loss": 1.3521, + "loss_base2": 1.9507, + "loss_pixel": 0.1468, + "loss_text": 1.2053, + "ppl": 3.8655, + "step": 12152 + }, + { + "epoch": 0.06, + "global_step": 12153, + "learning_rate": 0.0004501126878130217, + "loss": 1.3701, + "loss_base2": 1.9766, + "loss_pixel": 0.1449, + "loss_text": 1.2252, + "ppl": 3.9357, + "step": 12153 + }, + { + "epoch": 0.06, + "global_step": 12154, + "learning_rate": 0.00045010851419031723, + "loss": 1.4279, + "loss_base2": 2.06, + "loss_pixel": 0.1534, + "loss_text": 1.2745, + "ppl": 4.1699, + "step": 12154 + }, + { + "epoch": 0.06, + "global_step": 12155, + "learning_rate": 0.0004501043405676127, + "loss": 1.6313, + "loss_base2": 2.3535, + "loss_pixel": 0.1595, + "loss_text": 1.4718, + "ppl": 5.1105, + "step": 12155 + }, + { + "epoch": 0.06, + "global_step": 12156, + "learning_rate": 0.0004501001669449082, + "loss": 1.6127, + "loss_base2": 2.3266, + "loss_pixel": 0.1597, + "loss_text": 1.453, + "ppl": 5.0163, + "step": 12156 + }, + { + "epoch": 0.06, + "global_step": 12157, + "learning_rate": 0.0004500959933222037, + "loss": 1.6457, + "loss_base2": 2.3742, + "loss_pixel": 0.1574, + "loss_text": 1.4883, + "ppl": 5.1846, + "step": 12157 + }, + { + "epoch": 0.06, + "global_step": 12158, + "learning_rate": 0.0004500918196994992, + "loss": 1.6286, + "loss_base2": 2.3496, + "loss_pixel": 0.1593, + "loss_text": 1.4694, + "ppl": 5.0967, + "step": 12158 + }, + { + "epoch": 0.06, + "global_step": 12159, + "learning_rate": 0.00045008764607679466, + "loss": 1.6057, + "loss_base2": 2.3165, + "loss_pixel": 0.1584, + "loss_text": 1.4473, + "ppl": 4.9813, + "step": 12159 + }, + { + "epoch": 0.06, + "global_step": 12160, + "learning_rate": 0.00045008347245409017, + "loss": 1.6255, + "loss_base2": 2.3451, + "loss_pixel": 0.159, + "loss_text": 1.4665, + "ppl": 5.081, + "step": 12160 + }, + { + "epoch": 0.06, + "global_step": 12161, + "learning_rate": 0.0004500792988313857, + "loss": 1.6235, + "loss_base2": 2.3422, + "loss_pixel": 0.1599, + "loss_text": 1.4635, + "ppl": 5.0708, + "step": 12161 + }, + { + "epoch": 0.06, + "global_step": 12162, + "learning_rate": 0.0004500751252086812, + "loss": 1.6058, + "loss_base2": 2.3167, + "loss_pixel": 0.1591, + "loss_text": 1.4468, + "ppl": 4.9818, + "step": 12162 + }, + { + "epoch": 0.06, + "global_step": 12163, + "learning_rate": 0.0004500709515859767, + "loss": 1.6155, + "loss_base2": 2.3307, + "loss_pixel": 0.157, + "loss_text": 1.4585, + "ppl": 5.0304, + "step": 12163 + }, + { + "epoch": 0.06, + "global_step": 12164, + "learning_rate": 0.0004500667779632721, + "loss": 1.595, + "loss_base2": 2.3011, + "loss_pixel": 0.1589, + "loss_text": 1.4361, + "ppl": 4.9283, + "step": 12164 + }, + { + "epoch": 0.06, + "global_step": 12165, + "learning_rate": 0.0004500626043405676, + "loss": 1.6154, + "loss_base2": 2.3305, + "loss_pixel": 0.1579, + "loss_text": 1.4576, + "ppl": 5.0299, + "step": 12165 + }, + { + "epoch": 0.06, + "global_step": 12166, + "learning_rate": 0.0004500584307178631, + "loss": 1.6369, + "loss_base2": 2.3615, + "loss_pixel": 0.1592, + "loss_text": 1.4778, + "ppl": 5.1392, + "step": 12166 + }, + { + "epoch": 0.06, + "global_step": 12167, + "learning_rate": 0.0004500542570951586, + "loss": 1.6057, + "loss_base2": 2.3165, + "loss_pixel": 0.1574, + "loss_text": 1.4483, + "ppl": 4.9813, + "step": 12167 + }, + { + "epoch": 0.06, + "global_step": 12168, + "learning_rate": 0.00045005008347245406, + "loss": 1.591, + "loss_base2": 2.2953, + "loss_pixel": 0.1591, + "loss_text": 1.4319, + "ppl": 4.9087, + "step": 12168 + }, + { + "epoch": 0.06, + "global_step": 12169, + "learning_rate": 0.00045004590984974957, + "loss": 1.5965, + "loss_base2": 2.3033, + "loss_pixel": 0.1583, + "loss_text": 1.4382, + "ppl": 4.9357, + "step": 12169 + }, + { + "epoch": 0.06, + "global_step": 12170, + "learning_rate": 0.0004500417362270451, + "loss": 1.6157, + "loss_base2": 2.331, + "loss_pixel": 0.1583, + "loss_text": 1.4574, + "ppl": 5.0314, + "step": 12170 + }, + { + "epoch": 0.06, + "global_step": 12171, + "learning_rate": 0.0004500375626043406, + "loss": 1.6173, + "loss_base2": 2.3333, + "loss_pixel": 0.1603, + "loss_text": 1.457, + "ppl": 5.0395, + "step": 12171 + }, + { + "epoch": 0.06, + "global_step": 12172, + "learning_rate": 0.0004500333889816361, + "loss": 1.6117, + "loss_base2": 2.3252, + "loss_pixel": 0.158, + "loss_text": 1.4537, + "ppl": 5.0113, + "step": 12172 + }, + { + "epoch": 0.06, + "global_step": 12173, + "learning_rate": 0.00045002921535893154, + "loss": 1.6046, + "loss_base2": 2.3149, + "loss_pixel": 0.1588, + "loss_text": 1.4458, + "ppl": 4.9759, + "step": 12173 + }, + { + "epoch": 0.06, + "global_step": 12174, + "learning_rate": 0.00045002504173622705, + "loss": 1.5996, + "loss_base2": 2.3077, + "loss_pixel": 0.1576, + "loss_text": 1.442, + "ppl": 4.9511, + "step": 12174 + }, + { + "epoch": 0.06, + "global_step": 12175, + "learning_rate": 0.00045002086811352256, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.1595, + "loss_text": 1.45, + "ppl": 5.0003, + "step": 12175 + }, + { + "epoch": 0.06, + "global_step": 12176, + "learning_rate": 0.00045001669449081807, + "loss": 1.5844, + "loss_base2": 2.2858, + "loss_pixel": 0.1579, + "loss_text": 1.4265, + "ppl": 4.8764, + "step": 12176 + }, + { + "epoch": 0.06, + "global_step": 12177, + "learning_rate": 0.0004500125208681135, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1585, + "loss_text": 1.4566, + "ppl": 5.0284, + "step": 12177 + }, + { + "epoch": 0.06, + "global_step": 12178, + "learning_rate": 0.00045000834724540903, + "loss": 1.5992, + "loss_base2": 2.3072, + "loss_pixel": 0.1584, + "loss_text": 1.4408, + "ppl": 4.9491, + "step": 12178 + }, + { + "epoch": 0.06, + "global_step": 12179, + "learning_rate": 0.00045000417362270453, + "loss": 1.5955, + "loss_base2": 2.3018, + "loss_pixel": 0.1588, + "loss_text": 1.4367, + "ppl": 4.9308, + "step": 12179 + }, + { + "epoch": 0.06, + "global_step": 12180, + "learning_rate": 0.00045000000000000004, + "loss": 1.4017, + "loss_base2": 2.0222, + "loss_pixel": 0.1582, + "loss_text": 1.2435, + "ppl": 4.0621, + "step": 12180 + }, + { + "epoch": 0.06, + "global_step": 12181, + "learning_rate": 0.00044999582637729555, + "loss": 1.4024, + "loss_base2": 2.0232, + "loss_pixel": 0.1572, + "loss_text": 1.2452, + "ppl": 4.0649, + "step": 12181 + }, + { + "epoch": 0.06, + "global_step": 12182, + "learning_rate": 0.00044999165275459095, + "loss": 1.3863, + "loss_base2": 2.0, + "loss_pixel": 0.1583, + "loss_text": 1.228, + "ppl": 4.0, + "step": 12182 + }, + { + "epoch": 0.06, + "global_step": 12183, + "learning_rate": 0.00044998747913188646, + "loss": 1.4, + "loss_base2": 2.0198, + "loss_pixel": 0.1589, + "loss_text": 1.2411, + "ppl": 4.0552, + "step": 12183 + }, + { + "epoch": 0.06, + "global_step": 12184, + "learning_rate": 0.00044998330550918196, + "loss": 1.393, + "loss_base2": 2.0097, + "loss_pixel": 0.1587, + "loss_text": 1.2343, + "ppl": 4.0269, + "step": 12184 + }, + { + "epoch": 0.06, + "global_step": 12185, + "learning_rate": 0.00044997913188647747, + "loss": 1.3859, + "loss_base2": 1.9994, + "loss_pixel": 0.1587, + "loss_text": 1.2273, + "ppl": 3.9984, + "step": 12185 + }, + { + "epoch": 0.06, + "global_step": 12186, + "learning_rate": 0.0004499749582637729, + "loss": 1.3737, + "loss_base2": 1.9818, + "loss_pixel": 0.1581, + "loss_text": 1.2155, + "ppl": 3.9499, + "step": 12186 + }, + { + "epoch": 0.06, + "global_step": 12187, + "learning_rate": 0.00044997078464106843, + "loss": 1.3696, + "loss_base2": 1.9759, + "loss_pixel": 0.1596, + "loss_text": 1.21, + "ppl": 3.9338, + "step": 12187 + }, + { + "epoch": 0.06, + "global_step": 12188, + "learning_rate": 0.00044996661101836394, + "loss": 1.3749, + "loss_base2": 1.9836, + "loss_pixel": 0.1572, + "loss_text": 1.2177, + "ppl": 3.9547, + "step": 12188 + }, + { + "epoch": 0.06, + "global_step": 12189, + "learning_rate": 0.00044996243739565945, + "loss": 1.378, + "loss_base2": 1.988, + "loss_pixel": 0.159, + "loss_text": 1.219, + "ppl": 3.967, + "step": 12189 + }, + { + "epoch": 0.06, + "global_step": 12190, + "learning_rate": 0.00044995826377295495, + "loss": 1.3799, + "loss_base2": 1.9908, + "loss_pixel": 0.1571, + "loss_text": 1.2228, + "ppl": 3.9745, + "step": 12190 + }, + { + "epoch": 0.06, + "global_step": 12191, + "learning_rate": 0.0004499540901502504, + "loss": 1.3666, + "loss_base2": 1.9716, + "loss_pixel": 0.1577, + "loss_text": 1.2089, + "ppl": 3.922, + "step": 12191 + }, + { + "epoch": 0.06, + "global_step": 12192, + "learning_rate": 0.0004499499165275459, + "loss": 1.3829, + "loss_base2": 1.9951, + "loss_pixel": 0.1577, + "loss_text": 1.2252, + "ppl": 3.9864, + "step": 12192 + }, + { + "epoch": 0.06, + "global_step": 12193, + "learning_rate": 0.0004499457429048414, + "loss": 1.3772, + "loss_base2": 1.9869, + "loss_pixel": 0.1578, + "loss_text": 1.2194, + "ppl": 3.9638, + "step": 12193 + }, + { + "epoch": 0.06, + "global_step": 12194, + "learning_rate": 0.00044994156928213693, + "loss": 1.3613, + "loss_base2": 1.9639, + "loss_pixel": 0.1575, + "loss_text": 1.2038, + "ppl": 3.9013, + "step": 12194 + }, + { + "epoch": 0.06, + "global_step": 12195, + "learning_rate": 0.0004499373956594324, + "loss": 1.3788, + "loss_base2": 1.9892, + "loss_pixel": 0.1574, + "loss_text": 1.2214, + "ppl": 3.9701, + "step": 12195 + }, + { + "epoch": 0.06, + "global_step": 12196, + "learning_rate": 0.0004499332220367279, + "loss": 1.3778, + "loss_base2": 1.9877, + "loss_pixel": 0.1577, + "loss_text": 1.2201, + "ppl": 3.9662, + "step": 12196 + }, + { + "epoch": 0.06, + "global_step": 12197, + "learning_rate": 0.0004499290484140234, + "loss": 1.4982, + "loss_base2": 2.1614, + "loss_pixel": 0.1588, + "loss_text": 1.3395, + "ppl": 4.4736, + "step": 12197 + }, + { + "epoch": 0.06, + "global_step": 12198, + "learning_rate": 0.0004499248747913189, + "loss": 1.6338, + "loss_base2": 2.3571, + "loss_pixel": 0.1588, + "loss_text": 1.4751, + "ppl": 5.1233, + "step": 12198 + }, + { + "epoch": 0.06, + "global_step": 12199, + "learning_rate": 0.0004499207011686144, + "loss": 1.6266, + "loss_base2": 2.3467, + "loss_pixel": 0.1569, + "loss_text": 1.4696, + "ppl": 5.0866, + "step": 12199 + }, + { + "epoch": 0.06, + "global_step": 12200, + "learning_rate": 0.00044991652754590986, + "loss": 1.6356, + "loss_base2": 2.3597, + "loss_pixel": 0.1581, + "loss_text": 1.4775, + "ppl": 5.1325, + "step": 12200 + }, + { + "epoch": 0.06, + "global_step": 12201, + "learning_rate": 0.0004499123539232053, + "loss": 1.615, + "loss_base2": 2.33, + "loss_pixel": 0.1581, + "loss_text": 1.4568, + "ppl": 5.0279, + "step": 12201 + }, + { + "epoch": 0.06, + "global_step": 12202, + "learning_rate": 0.0004499081803005008, + "loss": 1.6096, + "loss_base2": 2.3222, + "loss_pixel": 0.1578, + "loss_text": 1.4518, + "ppl": 5.0008, + "step": 12202 + }, + { + "epoch": 0.06, + "global_step": 12203, + "learning_rate": 0.00044990400667779633, + "loss": 1.5984, + "loss_base2": 2.306, + "loss_pixel": 0.1588, + "loss_text": 1.4396, + "ppl": 4.9451, + "step": 12203 + }, + { + "epoch": 0.06, + "global_step": 12204, + "learning_rate": 0.00044989983305509184, + "loss": 1.613, + "loss_base2": 2.3271, + "loss_pixel": 0.1584, + "loss_text": 1.4546, + "ppl": 5.0178, + "step": 12204 + }, + { + "epoch": 0.06, + "global_step": 12205, + "learning_rate": 0.0004498956594323873, + "loss": 1.6313, + "loss_base2": 2.3535, + "loss_pixel": 0.1582, + "loss_text": 1.473, + "ppl": 5.1105, + "step": 12205 + }, + { + "epoch": 0.06, + "global_step": 12206, + "learning_rate": 0.0004498914858096828, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.1593, + "loss_text": 1.469, + "ppl": 5.0952, + "step": 12206 + }, + { + "epoch": 0.06, + "global_step": 12207, + "learning_rate": 0.0004498873121869783, + "loss": 1.6045, + "loss_base2": 2.3148, + "loss_pixel": 0.1571, + "loss_text": 1.4474, + "ppl": 4.9754, + "step": 12207 + }, + { + "epoch": 0.06, + "global_step": 12208, + "learning_rate": 0.0004498831385642738, + "loss": 1.6222, + "loss_base2": 2.3403, + "loss_pixel": 0.1587, + "loss_text": 1.4635, + "ppl": 5.0642, + "step": 12208 + }, + { + "epoch": 0.06, + "global_step": 12209, + "learning_rate": 0.00044987896494156927, + "loss": 1.6101, + "loss_base2": 2.3229, + "loss_pixel": 0.1572, + "loss_text": 1.4529, + "ppl": 5.0033, + "step": 12209 + }, + { + "epoch": 0.06, + "global_step": 12210, + "learning_rate": 0.0004498747913188648, + "loss": 1.6073, + "loss_base2": 2.3188, + "loss_pixel": 0.1571, + "loss_text": 1.4502, + "ppl": 4.9893, + "step": 12210 + }, + { + "epoch": 0.06, + "global_step": 12211, + "learning_rate": 0.0004498706176961603, + "loss": 1.614, + "loss_base2": 2.3285, + "loss_pixel": 0.1597, + "loss_text": 1.4544, + "ppl": 5.0229, + "step": 12211 + }, + { + "epoch": 0.06, + "global_step": 12212, + "learning_rate": 0.0004498664440734558, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.1588, + "loss_text": 1.4507, + "ppl": 5.0003, + "step": 12212 + }, + { + "epoch": 0.06, + "global_step": 12213, + "learning_rate": 0.0004498622704507513, + "loss": 1.6086, + "loss_base2": 2.3207, + "loss_pixel": 0.1588, + "loss_text": 1.4499, + "ppl": 4.9958, + "step": 12213 + }, + { + "epoch": 0.06, + "global_step": 12214, + "learning_rate": 0.00044985809682804675, + "loss": 1.5906, + "loss_base2": 2.2948, + "loss_pixel": 0.1563, + "loss_text": 1.4343, + "ppl": 4.9067, + "step": 12214 + }, + { + "epoch": 0.06, + "global_step": 12215, + "learning_rate": 0.00044985392320534226, + "loss": 1.6027, + "loss_base2": 2.3122, + "loss_pixel": 0.1487, + "loss_text": 1.4541, + "ppl": 4.9664, + "step": 12215 + }, + { + "epoch": 0.06, + "global_step": 12216, + "learning_rate": 0.00044984974958263776, + "loss": 1.5926, + "loss_base2": 2.2976, + "loss_pixel": 0.1472, + "loss_text": 1.4454, + "ppl": 4.9165, + "step": 12216 + }, + { + "epoch": 0.06, + "global_step": 12217, + "learning_rate": 0.00044984557595993327, + "loss": 1.6035, + "loss_base2": 2.3134, + "loss_pixel": 0.1489, + "loss_text": 1.4546, + "ppl": 4.9704, + "step": 12217 + }, + { + "epoch": 0.06, + "global_step": 12218, + "learning_rate": 0.0004498414023372287, + "loss": 1.5964, + "loss_base2": 2.3031, + "loss_pixel": 0.1476, + "loss_text": 1.4488, + "ppl": 4.9352, + "step": 12218 + }, + { + "epoch": 0.06, + "global_step": 12219, + "learning_rate": 0.00044983722871452423, + "loss": 1.6075, + "loss_base2": 2.3191, + "loss_pixel": 0.1474, + "loss_text": 1.4601, + "ppl": 4.9903, + "step": 12219 + }, + { + "epoch": 0.06, + "global_step": 12220, + "learning_rate": 0.0004498330550918197, + "loss": 1.574, + "loss_base2": 2.2708, + "loss_pixel": 0.1481, + "loss_text": 1.4259, + "ppl": 4.8259, + "step": 12220 + }, + { + "epoch": 0.06, + "global_step": 12221, + "learning_rate": 0.0004498288814691152, + "loss": 1.6028, + "loss_base2": 2.3124, + "loss_pixel": 0.1468, + "loss_text": 1.456, + "ppl": 4.9669, + "step": 12221 + }, + { + "epoch": 0.06, + "global_step": 12222, + "learning_rate": 0.0004498247078464107, + "loss": 1.4101, + "loss_base2": 2.0343, + "loss_pixel": 0.1468, + "loss_text": 1.2633, + "ppl": 4.0964, + "step": 12222 + }, + { + "epoch": 0.06, + "global_step": 12223, + "learning_rate": 0.00044982053422370615, + "loss": 1.3841, + "loss_base2": 1.9968, + "loss_pixel": 0.1455, + "loss_text": 1.2386, + "ppl": 3.9912, + "step": 12223 + }, + { + "epoch": 0.06, + "global_step": 12224, + "learning_rate": 0.00044981636060100166, + "loss": 1.3727, + "loss_base2": 1.9804, + "loss_pixel": 0.1467, + "loss_text": 1.226, + "ppl": 3.946, + "step": 12224 + }, + { + "epoch": 0.06, + "global_step": 12225, + "learning_rate": 0.00044981218697829717, + "loss": 1.3611, + "loss_base2": 1.9637, + "loss_pixel": 0.1456, + "loss_text": 1.2155, + "ppl": 3.9005, + "step": 12225 + }, + { + "epoch": 0.06, + "global_step": 12226, + "learning_rate": 0.0004498080133555927, + "loss": 1.3688, + "loss_base2": 1.9748, + "loss_pixel": 0.146, + "loss_text": 1.2228, + "ppl": 3.9306, + "step": 12226 + }, + { + "epoch": 0.06, + "global_step": 12227, + "learning_rate": 0.0004498038397328881, + "loss": 1.3728, + "loss_base2": 1.9805, + "loss_pixel": 0.1468, + "loss_text": 1.226, + "ppl": 3.9464, + "step": 12227 + }, + { + "epoch": 0.06, + "global_step": 12228, + "learning_rate": 0.00044979966611018363, + "loss": 1.3864, + "loss_base2": 2.0002, + "loss_pixel": 0.145, + "loss_text": 1.2414, + "ppl": 4.0004, + "step": 12228 + }, + { + "epoch": 0.06, + "global_step": 12229, + "learning_rate": 0.00044979549248747914, + "loss": 1.3674, + "loss_base2": 1.9727, + "loss_pixel": 0.1489, + "loss_text": 1.2185, + "ppl": 3.9251, + "step": 12229 + }, + { + "epoch": 0.06, + "global_step": 12230, + "learning_rate": 0.00044979131886477465, + "loss": 1.5351, + "loss_base2": 2.2147, + "loss_pixel": 0.1454, + "loss_text": 1.3897, + "ppl": 4.6418, + "step": 12230 + }, + { + "epoch": 0.06, + "global_step": 12231, + "learning_rate": 0.00044978714524207016, + "loss": 1.6043, + "loss_base2": 2.3145, + "loss_pixel": 0.147, + "loss_text": 1.4574, + "ppl": 4.9744, + "step": 12231 + }, + { + "epoch": 0.06, + "global_step": 12232, + "learning_rate": 0.0004497829716193656, + "loss": 1.6185, + "loss_base2": 2.335, + "loss_pixel": 0.1587, + "loss_text": 1.4598, + "ppl": 5.0455, + "step": 12232 + }, + { + "epoch": 0.06, + "global_step": 12233, + "learning_rate": 0.0004497787979966611, + "loss": 1.6101, + "loss_base2": 2.3229, + "loss_pixel": 0.1595, + "loss_text": 1.4506, + "ppl": 5.0033, + "step": 12233 + }, + { + "epoch": 0.06, + "global_step": 12234, + "learning_rate": 0.0004497746243739566, + "loss": 1.6054, + "loss_base2": 2.3161, + "loss_pixel": 0.1595, + "loss_text": 1.4459, + "ppl": 4.9799, + "step": 12234 + }, + { + "epoch": 0.06, + "global_step": 12235, + "learning_rate": 0.00044977045075125213, + "loss": 1.6185, + "loss_base2": 2.335, + "loss_pixel": 0.1579, + "loss_text": 1.4606, + "ppl": 5.0455, + "step": 12235 + }, + { + "epoch": 0.06, + "global_step": 12236, + "learning_rate": 0.0004497662771285476, + "loss": 1.6116, + "loss_base2": 2.325, + "loss_pixel": 0.1573, + "loss_text": 1.4542, + "ppl": 5.0108, + "step": 12236 + }, + { + "epoch": 0.06, + "global_step": 12237, + "learning_rate": 0.0004497621035058431, + "loss": 1.6, + "loss_base2": 2.3083, + "loss_pixel": 0.158, + "loss_text": 1.442, + "ppl": 4.953, + "step": 12237 + }, + { + "epoch": 0.06, + "global_step": 12238, + "learning_rate": 0.0004497579298831386, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.16, + "loss_text": 1.4494, + "ppl": 5.0003, + "step": 12238 + }, + { + "epoch": 0.06, + "global_step": 12239, + "learning_rate": 0.00044975375626043405, + "loss": 1.6257, + "loss_base2": 2.3454, + "loss_pixel": 0.1598, + "loss_text": 1.4659, + "ppl": 5.082, + "step": 12239 + }, + { + "epoch": 0.06, + "global_step": 12240, + "learning_rate": 0.00044974958263772956, + "loss": 1.6026, + "loss_base2": 2.3121, + "loss_pixel": 0.1589, + "loss_text": 1.4437, + "ppl": 4.9659, + "step": 12240 + }, + { + "epoch": 0.06, + "global_step": 12241, + "learning_rate": 0.000449745409015025, + "loss": 1.6078, + "loss_base2": 2.3196, + "loss_pixel": 0.1573, + "loss_text": 1.4505, + "ppl": 4.9918, + "step": 12241 + }, + { + "epoch": 0.06, + "global_step": 12242, + "learning_rate": 0.0004497412353923205, + "loss": 1.6046, + "loss_base2": 2.3149, + "loss_pixel": 0.1585, + "loss_text": 1.4461, + "ppl": 4.9759, + "step": 12242 + }, + { + "epoch": 0.06, + "global_step": 12243, + "learning_rate": 0.00044973706176961603, + "loss": 1.6266, + "loss_base2": 2.3467, + "loss_pixel": 0.1582, + "loss_text": 1.4684, + "ppl": 5.0866, + "step": 12243 + }, + { + "epoch": 0.06, + "global_step": 12244, + "learning_rate": 0.00044973288814691153, + "loss": 1.6112, + "loss_base2": 2.3245, + "loss_pixel": 0.1589, + "loss_text": 1.4523, + "ppl": 5.0088, + "step": 12244 + }, + { + "epoch": 0.06, + "global_step": 12245, + "learning_rate": 0.000449728714524207, + "loss": 1.6204, + "loss_base2": 2.3377, + "loss_pixel": 0.1568, + "loss_text": 1.4637, + "ppl": 5.0551, + "step": 12245 + }, + { + "epoch": 0.06, + "global_step": 12246, + "learning_rate": 0.0004497245409015025, + "loss": 1.6076, + "loss_base2": 2.3193, + "loss_pixel": 0.1573, + "loss_text": 1.4504, + "ppl": 4.9908, + "step": 12246 + }, + { + "epoch": 0.06, + "global_step": 12247, + "learning_rate": 0.000449720367278798, + "loss": 1.5961, + "loss_base2": 2.3027, + "loss_pixel": 0.1584, + "loss_text": 1.4376, + "ppl": 4.9338, + "step": 12247 + }, + { + "epoch": 0.06, + "global_step": 12248, + "learning_rate": 0.0004497161936560935, + "loss": 1.6111, + "loss_base2": 2.3243, + "loss_pixel": 0.1577, + "loss_text": 1.4535, + "ppl": 5.0083, + "step": 12248 + }, + { + "epoch": 0.06, + "global_step": 12249, + "learning_rate": 0.000449712020033389, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1576, + "loss_text": 1.4576, + "ppl": 5.0284, + "step": 12249 + }, + { + "epoch": 0.06, + "global_step": 12250, + "learning_rate": 0.00044970784641068447, + "loss": 1.6013, + "loss_base2": 2.3102, + "loss_pixel": 0.1576, + "loss_text": 1.4437, + "ppl": 4.9595, + "step": 12250 + }, + { + "epoch": 0.06, + "global_step": 12251, + "learning_rate": 0.00044970367278798, + "loss": 1.4746, + "loss_base2": 2.1274, + "loss_pixel": 0.1566, + "loss_text": 1.3179, + "ppl": 4.3693, + "step": 12251 + }, + { + "epoch": 0.06, + "global_step": 12252, + "learning_rate": 0.0004496994991652755, + "loss": 1.3698, + "loss_base2": 1.9762, + "loss_pixel": 0.1592, + "loss_text": 1.2105, + "ppl": 3.9346, + "step": 12252 + }, + { + "epoch": 0.06, + "global_step": 12253, + "learning_rate": 0.000449695325542571, + "loss": 1.3741, + "loss_base2": 1.9824, + "loss_pixel": 0.1582, + "loss_text": 1.2159, + "ppl": 3.9515, + "step": 12253 + }, + { + "epoch": 0.06, + "global_step": 12254, + "learning_rate": 0.00044969115191986645, + "loss": 1.3877, + "loss_base2": 2.002, + "loss_pixel": 0.1588, + "loss_text": 1.2289, + "ppl": 4.0056, + "step": 12254 + }, + { + "epoch": 0.06, + "global_step": 12255, + "learning_rate": 0.00044968697829716195, + "loss": 1.3836, + "loss_base2": 1.9961, + "loss_pixel": 0.1591, + "loss_text": 1.2245, + "ppl": 3.9892, + "step": 12255 + }, + { + "epoch": 0.06, + "global_step": 12256, + "learning_rate": 0.00044968280467445746, + "loss": 1.3924, + "loss_base2": 2.0088, + "loss_pixel": 0.1589, + "loss_text": 1.2335, + "ppl": 4.0245, + "step": 12256 + }, + { + "epoch": 0.06, + "global_step": 12257, + "learning_rate": 0.00044967863105175297, + "loss": 1.3926, + "loss_base2": 2.0091, + "loss_pixel": 0.1593, + "loss_text": 1.2333, + "ppl": 4.0253, + "step": 12257 + }, + { + "epoch": 0.06, + "global_step": 12258, + "learning_rate": 0.0004496744574290484, + "loss": 1.3755, + "loss_base2": 1.9844, + "loss_pixel": 0.1571, + "loss_text": 1.2185, + "ppl": 3.9571, + "step": 12258 + }, + { + "epoch": 0.06, + "global_step": 12259, + "learning_rate": 0.0004496702838063439, + "loss": 1.3787, + "loss_base2": 1.989, + "loss_pixel": 0.1572, + "loss_text": 1.2215, + "ppl": 3.9697, + "step": 12259 + }, + { + "epoch": 0.06, + "global_step": 12260, + "learning_rate": 0.0004496661101836394, + "loss": 1.373, + "loss_base2": 1.9808, + "loss_pixel": 0.1606, + "loss_text": 1.2124, + "ppl": 3.9472, + "step": 12260 + }, + { + "epoch": 0.06, + "global_step": 12261, + "learning_rate": 0.0004496619365609349, + "loss": 1.3705, + "loss_base2": 1.9772, + "loss_pixel": 0.1577, + "loss_text": 1.2128, + "ppl": 3.9373, + "step": 12261 + }, + { + "epoch": 0.06, + "global_step": 12262, + "learning_rate": 0.0004496577629382304, + "loss": 1.3809, + "loss_base2": 1.9922, + "loss_pixel": 0.1594, + "loss_text": 1.2215, + "ppl": 3.9785, + "step": 12262 + }, + { + "epoch": 0.06, + "global_step": 12263, + "learning_rate": 0.0004496535893155259, + "loss": 1.3935, + "loss_base2": 2.0104, + "loss_pixel": 0.1576, + "loss_text": 1.236, + "ppl": 4.0289, + "step": 12263 + }, + { + "epoch": 0.06, + "global_step": 12264, + "learning_rate": 0.00044964941569282136, + "loss": 1.377, + "loss_base2": 1.9866, + "loss_pixel": 0.1595, + "loss_text": 1.2176, + "ppl": 3.963, + "step": 12264 + }, + { + "epoch": 0.06, + "global_step": 12265, + "learning_rate": 0.00044964524207011686, + "loss": 1.3957, + "loss_base2": 2.0136, + "loss_pixel": 0.1584, + "loss_text": 1.2373, + "ppl": 4.0378, + "step": 12265 + }, + { + "epoch": 0.06, + "global_step": 12266, + "learning_rate": 0.00044964106844741237, + "loss": 1.3772, + "loss_base2": 1.9869, + "loss_pixel": 0.1579, + "loss_text": 1.2193, + "ppl": 3.9638, + "step": 12266 + }, + { + "epoch": 0.06, + "global_step": 12267, + "learning_rate": 0.0004496368948247079, + "loss": 1.3766, + "loss_base2": 1.986, + "loss_pixel": 0.1582, + "loss_text": 1.2184, + "ppl": 3.9614, + "step": 12267 + }, + { + "epoch": 0.06, + "global_step": 12268, + "learning_rate": 0.00044963272120200333, + "loss": 1.3599, + "loss_base2": 1.9619, + "loss_pixel": 0.1577, + "loss_text": 1.2022, + "ppl": 3.8958, + "step": 12268 + }, + { + "epoch": 0.06, + "global_step": 12269, + "learning_rate": 0.00044962854757929884, + "loss": 1.3756, + "loss_base2": 1.9846, + "loss_pixel": 0.1581, + "loss_text": 1.2174, + "ppl": 3.9575, + "step": 12269 + }, + { + "epoch": 0.06, + "global_step": 12270, + "learning_rate": 0.00044962437395659435, + "loss": 1.3708, + "loss_base2": 1.9776, + "loss_pixel": 0.1586, + "loss_text": 1.2122, + "ppl": 3.9385, + "step": 12270 + }, + { + "epoch": 0.06, + "global_step": 12271, + "learning_rate": 0.00044962020033388985, + "loss": 1.4148, + "loss_base2": 2.0411, + "loss_pixel": 0.1572, + "loss_text": 1.2576, + "ppl": 4.1157, + "step": 12271 + }, + { + "epoch": 0.06, + "global_step": 12272, + "learning_rate": 0.00044961602671118536, + "loss": 1.3734, + "loss_base2": 1.9814, + "loss_pixel": 0.1588, + "loss_text": 1.2146, + "ppl": 3.9488, + "step": 12272 + }, + { + "epoch": 0.06, + "global_step": 12273, + "learning_rate": 0.0004496118530884808, + "loss": 1.367, + "loss_base2": 1.9722, + "loss_pixel": 0.1577, + "loss_text": 1.2093, + "ppl": 3.9236, + "step": 12273 + }, + { + "epoch": 0.06, + "global_step": 12274, + "learning_rate": 0.0004496076794657763, + "loss": 1.3752, + "loss_base2": 1.984, + "loss_pixel": 0.1586, + "loss_text": 1.2165, + "ppl": 3.9559, + "step": 12274 + }, + { + "epoch": 0.06, + "global_step": 12275, + "learning_rate": 0.00044960350584307183, + "loss": 1.5428, + "loss_base2": 2.2258, + "loss_pixel": 0.1591, + "loss_text": 1.3837, + "ppl": 4.6777, + "step": 12275 + }, + { + "epoch": 0.06, + "global_step": 12276, + "learning_rate": 0.0004495993322203673, + "loss": 1.6309, + "loss_base2": 2.3529, + "loss_pixel": 0.1621, + "loss_text": 1.4688, + "ppl": 5.1085, + "step": 12276 + }, + { + "epoch": 0.06, + "global_step": 12277, + "learning_rate": 0.00044959515859766273, + "loss": 1.6272, + "loss_base2": 2.3476, + "loss_pixel": 0.1612, + "loss_text": 1.466, + "ppl": 5.0896, + "step": 12277 + }, + { + "epoch": 0.06, + "global_step": 12278, + "learning_rate": 0.00044959098497495824, + "loss": 1.6141, + "loss_base2": 2.3287, + "loss_pixel": 0.1611, + "loss_text": 1.4531, + "ppl": 5.0234, + "step": 12278 + }, + { + "epoch": 0.06, + "global_step": 12279, + "learning_rate": 0.00044958681135225375, + "loss": 1.607, + "loss_base2": 2.3184, + "loss_pixel": 0.1613, + "loss_text": 1.4457, + "ppl": 4.9878, + "step": 12279 + }, + { + "epoch": 0.06, + "global_step": 12280, + "learning_rate": 0.00044958263772954926, + "loss": 1.6061, + "loss_base2": 2.3171, + "loss_pixel": 0.1613, + "loss_text": 1.4449, + "ppl": 4.9833, + "step": 12280 + }, + { + "epoch": 0.06, + "global_step": 12281, + "learning_rate": 0.00044957846410684476, + "loss": 1.5975, + "loss_base2": 2.3047, + "loss_pixel": 0.1606, + "loss_text": 1.4369, + "ppl": 4.9407, + "step": 12281 + }, + { + "epoch": 0.06, + "global_step": 12282, + "learning_rate": 0.0004495742904841402, + "loss": 1.6175, + "loss_base2": 2.3336, + "loss_pixel": 0.1598, + "loss_text": 1.4577, + "ppl": 5.0405, + "step": 12282 + }, + { + "epoch": 0.06, + "global_step": 12283, + "learning_rate": 0.0004495701168614357, + "loss": 1.6107, + "loss_base2": 2.3237, + "loss_pixel": 0.1593, + "loss_text": 1.4514, + "ppl": 5.0063, + "step": 12283 + }, + { + "epoch": 0.06, + "global_step": 12284, + "learning_rate": 0.00044956594323873123, + "loss": 1.6004, + "loss_base2": 2.3089, + "loss_pixel": 0.1598, + "loss_text": 1.4406, + "ppl": 4.955, + "step": 12284 + }, + { + "epoch": 0.06, + "global_step": 12285, + "learning_rate": 0.00044956176961602674, + "loss": 1.5976, + "loss_base2": 2.3048, + "loss_pixel": 0.1611, + "loss_text": 1.4365, + "ppl": 4.9412, + "step": 12285 + }, + { + "epoch": 0.06, + "global_step": 12286, + "learning_rate": 0.0004495575959933222, + "loss": 1.5971, + "loss_base2": 2.3041, + "loss_pixel": 0.1596, + "loss_text": 1.4375, + "ppl": 4.9387, + "step": 12286 + }, + { + "epoch": 0.06, + "global_step": 12287, + "learning_rate": 0.0004495534223706177, + "loss": 1.6125, + "loss_base2": 2.3263, + "loss_pixel": 0.162, + "loss_text": 1.4505, + "ppl": 5.0153, + "step": 12287 + }, + { + "epoch": 0.06, + "global_step": 12288, + "learning_rate": 0.0004495492487479132, + "loss": 1.6034, + "loss_base2": 2.3132, + "loss_pixel": 0.1603, + "loss_text": 1.4431, + "ppl": 4.9699, + "step": 12288 + }, + { + "epoch": 0.06, + "global_step": 12289, + "learning_rate": 0.0004495450751252087, + "loss": 1.6156, + "loss_base2": 2.3308, + "loss_pixel": 0.1587, + "loss_text": 1.4569, + "ppl": 5.0309, + "step": 12289 + }, + { + "epoch": 0.06, + "global_step": 12290, + "learning_rate": 0.0004495409015025042, + "loss": 1.6152, + "loss_base2": 2.3302, + "loss_pixel": 0.161, + "loss_text": 1.4543, + "ppl": 5.0289, + "step": 12290 + }, + { + "epoch": 0.06, + "global_step": 12291, + "learning_rate": 0.0004495367278797997, + "loss": 1.6405, + "loss_base2": 2.3667, + "loss_pixel": 0.1588, + "loss_text": 1.4817, + "ppl": 5.1577, + "step": 12291 + }, + { + "epoch": 0.06, + "global_step": 12292, + "learning_rate": 0.0004495325542570952, + "loss": 1.6071, + "loss_base2": 2.3186, + "loss_pixel": 0.1616, + "loss_text": 1.4455, + "ppl": 4.9883, + "step": 12292 + }, + { + "epoch": 0.06, + "global_step": 12293, + "learning_rate": 0.0004495283806343907, + "loss": 1.5985, + "loss_base2": 2.3061, + "loss_pixel": 0.1589, + "loss_text": 1.4396, + "ppl": 4.9456, + "step": 12293 + }, + { + "epoch": 0.06, + "global_step": 12294, + "learning_rate": 0.0004495242070116862, + "loss": 1.6155, + "loss_base2": 2.3307, + "loss_pixel": 0.1598, + "loss_text": 1.4557, + "ppl": 5.0304, + "step": 12294 + }, + { + "epoch": 0.06, + "global_step": 12295, + "learning_rate": 0.0004495200333889816, + "loss": 1.5948, + "loss_base2": 2.3008, + "loss_pixel": 0.1595, + "loss_text": 1.4353, + "ppl": 4.9273, + "step": 12295 + }, + { + "epoch": 0.06, + "global_step": 12296, + "learning_rate": 0.0004495158597662771, + "loss": 1.5959, + "loss_base2": 2.3024, + "loss_pixel": 0.1587, + "loss_text": 1.4372, + "ppl": 4.9328, + "step": 12296 + }, + { + "epoch": 0.06, + "global_step": 12297, + "learning_rate": 0.0004495116861435726, + "loss": 1.5171, + "loss_base2": 2.1887, + "loss_pixel": 0.1588, + "loss_text": 1.3583, + "ppl": 4.559, + "step": 12297 + }, + { + "epoch": 0.06, + "global_step": 12298, + "learning_rate": 0.0004495075125208681, + "loss": 1.3933, + "loss_base2": 2.0101, + "loss_pixel": 0.159, + "loss_text": 1.2343, + "ppl": 4.0281, + "step": 12298 + }, + { + "epoch": 0.06, + "global_step": 12299, + "learning_rate": 0.0004495033388981636, + "loss": 1.3913, + "loss_base2": 2.0072, + "loss_pixel": 0.1602, + "loss_text": 1.2311, + "ppl": 4.0201, + "step": 12299 + }, + { + "epoch": 0.06, + "global_step": 12300, + "learning_rate": 0.0004494991652754591, + "loss": 1.3989, + "loss_base2": 2.0182, + "loss_pixel": 0.1581, + "loss_text": 1.2407, + "ppl": 4.0507, + "step": 12300 + }, + { + "epoch": 0.06, + "global_step": 12301, + "learning_rate": 0.0004494949916527546, + "loss": 1.3655, + "loss_base2": 1.97, + "loss_pixel": 0.1584, + "loss_text": 1.2072, + "ppl": 3.9177, + "step": 12301 + }, + { + "epoch": 0.06, + "global_step": 12302, + "learning_rate": 0.0004494908180300501, + "loss": 1.3828, + "loss_base2": 1.995, + "loss_pixel": 0.1595, + "loss_text": 1.2233, + "ppl": 3.986, + "step": 12302 + }, + { + "epoch": 0.06, + "global_step": 12303, + "learning_rate": 0.0004494866444073456, + "loss": 1.3988, + "loss_base2": 2.018, + "loss_pixel": 0.1592, + "loss_text": 1.2396, + "ppl": 4.0503, + "step": 12303 + }, + { + "epoch": 0.06, + "global_step": 12304, + "learning_rate": 0.00044948247078464105, + "loss": 1.3935, + "loss_base2": 2.0104, + "loss_pixel": 0.1585, + "loss_text": 1.2349, + "ppl": 4.0289, + "step": 12304 + }, + { + "epoch": 0.06, + "global_step": 12305, + "learning_rate": 0.00044947829716193656, + "loss": 1.3852, + "loss_base2": 1.9984, + "loss_pixel": 0.1586, + "loss_text": 1.2266, + "ppl": 3.9956, + "step": 12305 + }, + { + "epoch": 0.06, + "global_step": 12306, + "learning_rate": 0.00044947412353923207, + "loss": 1.3904, + "loss_base2": 2.0059, + "loss_pixel": 0.1583, + "loss_text": 1.2321, + "ppl": 4.0165, + "step": 12306 + }, + { + "epoch": 0.06, + "global_step": 12307, + "learning_rate": 0.0004494699499165276, + "loss": 1.3982, + "loss_base2": 2.0172, + "loss_pixel": 0.1576, + "loss_text": 1.2406, + "ppl": 4.0479, + "step": 12307 + }, + { + "epoch": 0.06, + "global_step": 12308, + "learning_rate": 0.0004494657762938231, + "loss": 1.3696, + "loss_base2": 1.9759, + "loss_pixel": 0.1569, + "loss_text": 1.2127, + "ppl": 3.9338, + "step": 12308 + }, + { + "epoch": 0.06, + "global_step": 12309, + "learning_rate": 0.00044946160267111853, + "loss": 1.37, + "loss_base2": 1.9765, + "loss_pixel": 0.157, + "loss_text": 1.213, + "ppl": 3.9354, + "step": 12309 + }, + { + "epoch": 0.06, + "global_step": 12310, + "learning_rate": 0.00044945742904841404, + "loss": 1.3679, + "loss_base2": 1.9735, + "loss_pixel": 0.1575, + "loss_text": 1.2104, + "ppl": 3.9271, + "step": 12310 + }, + { + "epoch": 0.06, + "global_step": 12311, + "learning_rate": 0.00044945325542570955, + "loss": 1.3711, + "loss_base2": 1.9781, + "loss_pixel": 0.1586, + "loss_text": 1.2125, + "ppl": 3.9397, + "step": 12311 + }, + { + "epoch": 0.06, + "global_step": 12312, + "learning_rate": 0.00044944908180300506, + "loss": 1.3785, + "loss_base2": 1.9888, + "loss_pixel": 0.157, + "loss_text": 1.2215, + "ppl": 3.9689, + "step": 12312 + }, + { + "epoch": 0.06, + "global_step": 12313, + "learning_rate": 0.00044944490818030056, + "loss": 1.3697, + "loss_base2": 1.9761, + "loss_pixel": 0.1559, + "loss_text": 1.2138, + "ppl": 3.9342, + "step": 12313 + }, + { + "epoch": 0.06, + "global_step": 12314, + "learning_rate": 0.00044944073455759596, + "loss": 1.3834, + "loss_base2": 1.9958, + "loss_pixel": 0.1573, + "loss_text": 1.2262, + "ppl": 3.9884, + "step": 12314 + }, + { + "epoch": 0.06, + "global_step": 12315, + "learning_rate": 0.00044943656093489147, + "loss": 1.5107, + "loss_base2": 2.1795, + "loss_pixel": 0.158, + "loss_text": 1.3527, + "ppl": 4.5299, + "step": 12315 + }, + { + "epoch": 0.06, + "global_step": 12316, + "learning_rate": 0.000449432387312187, + "loss": 1.4141, + "loss_base2": 2.0401, + "loss_pixel": 0.1585, + "loss_text": 1.2555, + "ppl": 4.1128, + "step": 12316 + }, + { + "epoch": 0.06, + "global_step": 12317, + "learning_rate": 0.0004494282136894825, + "loss": 1.3718, + "loss_base2": 1.9791, + "loss_pixel": 0.1577, + "loss_text": 1.2141, + "ppl": 3.9424, + "step": 12317 + }, + { + "epoch": 0.06, + "global_step": 12318, + "learning_rate": 0.00044942404006677794, + "loss": 1.3763, + "loss_base2": 1.9856, + "loss_pixel": 0.1568, + "loss_text": 1.2196, + "ppl": 3.9602, + "step": 12318 + }, + { + "epoch": 0.06, + "global_step": 12319, + "learning_rate": 0.00044941986644407344, + "loss": 1.3671, + "loss_base2": 1.9723, + "loss_pixel": 0.1556, + "loss_text": 1.2115, + "ppl": 3.924, + "step": 12319 + }, + { + "epoch": 0.06, + "global_step": 12320, + "learning_rate": 0.00044941569282136895, + "loss": 1.3752, + "loss_base2": 1.984, + "loss_pixel": 0.1585, + "loss_text": 1.2167, + "ppl": 3.9559, + "step": 12320 + }, + { + "epoch": 0.06, + "global_step": 12321, + "learning_rate": 0.00044941151919866446, + "loss": 1.3657, + "loss_base2": 1.9703, + "loss_pixel": 0.1584, + "loss_text": 1.2074, + "ppl": 3.9185, + "step": 12321 + }, + { + "epoch": 0.06, + "global_step": 12322, + "learning_rate": 0.00044940734557595997, + "loss": 1.3794, + "loss_base2": 1.9901, + "loss_pixel": 0.1578, + "loss_text": 1.2216, + "ppl": 3.9725, + "step": 12322 + }, + { + "epoch": 0.06, + "global_step": 12323, + "learning_rate": 0.0004494031719532554, + "loss": 1.3944, + "loss_base2": 2.0117, + "loss_pixel": 0.1596, + "loss_text": 1.2348, + "ppl": 4.0326, + "step": 12323 + }, + { + "epoch": 0.06, + "global_step": 12324, + "learning_rate": 0.00044939899833055093, + "loss": 1.3881, + "loss_base2": 2.0026, + "loss_pixel": 0.1578, + "loss_text": 1.2303, + "ppl": 4.0072, + "step": 12324 + }, + { + "epoch": 0.06, + "global_step": 12325, + "learning_rate": 0.00044939482470784643, + "loss": 1.5738, + "loss_base2": 2.2705, + "loss_pixel": 0.1574, + "loss_text": 1.4164, + "ppl": 4.8249, + "step": 12325 + }, + { + "epoch": 0.06, + "global_step": 12326, + "learning_rate": 0.00044939065108514194, + "loss": 1.3719, + "loss_base2": 1.9792, + "loss_pixel": 0.157, + "loss_text": 1.2149, + "ppl": 3.9428, + "step": 12326 + }, + { + "epoch": 0.06, + "global_step": 12327, + "learning_rate": 0.0004493864774624374, + "loss": 1.378, + "loss_base2": 1.988, + "loss_pixel": 0.1572, + "loss_text": 1.2208, + "ppl": 3.967, + "step": 12327 + }, + { + "epoch": 0.06, + "global_step": 12328, + "learning_rate": 0.0004493823038397329, + "loss": 1.3887, + "loss_base2": 2.0035, + "loss_pixel": 0.1581, + "loss_text": 1.2306, + "ppl": 4.0096, + "step": 12328 + }, + { + "epoch": 0.06, + "global_step": 12329, + "learning_rate": 0.0004493781302170284, + "loss": 1.39, + "loss_base2": 2.0053, + "loss_pixel": 0.1568, + "loss_text": 1.2332, + "ppl": 4.0149, + "step": 12329 + }, + { + "epoch": 0.06, + "global_step": 12330, + "learning_rate": 0.0004493739565943239, + "loss": 1.384, + "loss_base2": 1.9967, + "loss_pixel": 0.1578, + "loss_text": 1.2262, + "ppl": 3.9908, + "step": 12330 + }, + { + "epoch": 0.06, + "global_step": 12331, + "learning_rate": 0.0004493697829716194, + "loss": 1.3911, + "loss_base2": 2.0069, + "loss_pixel": 0.1581, + "loss_text": 1.233, + "ppl": 4.0193, + "step": 12331 + }, + { + "epoch": 0.06, + "global_step": 12332, + "learning_rate": 0.0004493656093489148, + "loss": 1.369, + "loss_base2": 1.975, + "loss_pixel": 0.1577, + "loss_text": 1.2112, + "ppl": 3.9314, + "step": 12332 + }, + { + "epoch": 0.06, + "global_step": 12333, + "learning_rate": 0.00044936143572621033, + "loss": 1.378, + "loss_base2": 1.988, + "loss_pixel": 0.1612, + "loss_text": 1.2168, + "ppl": 3.967, + "step": 12333 + }, + { + "epoch": 0.06, + "global_step": 12334, + "learning_rate": 0.00044935726210350584, + "loss": 1.3715, + "loss_base2": 1.9787, + "loss_pixel": 0.1587, + "loss_text": 1.2129, + "ppl": 3.9413, + "step": 12334 + }, + { + "epoch": 0.06, + "global_step": 12335, + "learning_rate": 0.00044935308848080135, + "loss": 1.3764, + "loss_base2": 1.9857, + "loss_pixel": 0.1581, + "loss_text": 1.2182, + "ppl": 3.9606, + "step": 12335 + }, + { + "epoch": 0.06, + "global_step": 12336, + "learning_rate": 0.0004493489148580968, + "loss": 1.3765, + "loss_base2": 1.9859, + "loss_pixel": 0.1584, + "loss_text": 1.2181, + "ppl": 3.961, + "step": 12336 + }, + { + "epoch": 0.06, + "global_step": 12337, + "learning_rate": 0.0004493447412353923, + "loss": 1.3614, + "loss_base2": 1.9641, + "loss_pixel": 0.1596, + "loss_text": 1.2018, + "ppl": 3.9017, + "step": 12337 + }, + { + "epoch": 0.06, + "global_step": 12338, + "learning_rate": 0.0004493405676126878, + "loss": 1.3671, + "loss_base2": 1.9723, + "loss_pixel": 0.1591, + "loss_text": 1.208, + "ppl": 3.924, + "step": 12338 + }, + { + "epoch": 0.06, + "global_step": 12339, + "learning_rate": 0.0004493363939899833, + "loss": 1.3623, + "loss_base2": 1.9654, + "loss_pixel": 0.159, + "loss_text": 1.2033, + "ppl": 3.9052, + "step": 12339 + }, + { + "epoch": 0.06, + "global_step": 12340, + "learning_rate": 0.00044933222036727883, + "loss": 1.3836, + "loss_base2": 1.9961, + "loss_pixel": 0.1579, + "loss_text": 1.2257, + "ppl": 3.9892, + "step": 12340 + }, + { + "epoch": 0.06, + "global_step": 12341, + "learning_rate": 0.0004493280467445743, + "loss": 1.362, + "loss_base2": 1.965, + "loss_pixel": 0.1585, + "loss_text": 1.2035, + "ppl": 3.904, + "step": 12341 + }, + { + "epoch": 0.06, + "global_step": 12342, + "learning_rate": 0.0004493238731218698, + "loss": 1.3802, + "loss_base2": 1.9912, + "loss_pixel": 0.157, + "loss_text": 1.2232, + "ppl": 3.9757, + "step": 12342 + }, + { + "epoch": 0.06, + "global_step": 12343, + "learning_rate": 0.0004493196994991653, + "loss": 1.3666, + "loss_base2": 1.9716, + "loss_pixel": 0.159, + "loss_text": 1.2077, + "ppl": 3.922, + "step": 12343 + }, + { + "epoch": 0.06, + "global_step": 12344, + "learning_rate": 0.0004493155258764608, + "loss": 1.3711, + "loss_base2": 1.9781, + "loss_pixel": 0.1588, + "loss_text": 1.2124, + "ppl": 3.9397, + "step": 12344 + }, + { + "epoch": 0.06, + "global_step": 12345, + "learning_rate": 0.00044931135225375626, + "loss": 1.3832, + "loss_base2": 1.9955, + "loss_pixel": 0.1589, + "loss_text": 1.2243, + "ppl": 3.9876, + "step": 12345 + }, + { + "epoch": 0.06, + "global_step": 12346, + "learning_rate": 0.00044930717863105176, + "loss": 1.3663, + "loss_base2": 1.9712, + "loss_pixel": 0.1563, + "loss_text": 1.21, + "ppl": 3.9208, + "step": 12346 + }, + { + "epoch": 0.06, + "global_step": 12347, + "learning_rate": 0.00044930300500834727, + "loss": 1.3728, + "loss_base2": 1.9805, + "loss_pixel": 0.157, + "loss_text": 1.2158, + "ppl": 3.9464, + "step": 12347 + }, + { + "epoch": 0.06, + "global_step": 12348, + "learning_rate": 0.0004492988313856428, + "loss": 1.3682, + "loss_base2": 1.9739, + "loss_pixel": 0.1591, + "loss_text": 1.2091, + "ppl": 3.9283, + "step": 12348 + }, + { + "epoch": 0.06, + "global_step": 12349, + "learning_rate": 0.0004492946577629383, + "loss": 1.3695, + "loss_base2": 1.9758, + "loss_pixel": 0.1601, + "loss_text": 1.2095, + "ppl": 3.9334, + "step": 12349 + }, + { + "epoch": 0.06, + "global_step": 12350, + "learning_rate": 0.00044929048414023374, + "loss": 1.3774, + "loss_base2": 1.9872, + "loss_pixel": 0.1566, + "loss_text": 1.2208, + "ppl": 3.9646, + "step": 12350 + }, + { + "epoch": 0.06, + "global_step": 12351, + "learning_rate": 0.0004492863105175292, + "loss": 1.5585, + "loss_base2": 2.2484, + "loss_pixel": 0.1583, + "loss_text": 1.4002, + "ppl": 4.7517, + "step": 12351 + }, + { + "epoch": 0.06, + "global_step": 12352, + "learning_rate": 0.0004492821368948247, + "loss": 1.6514, + "loss_base2": 2.3825, + "loss_pixel": 0.1581, + "loss_text": 1.4933, + "ppl": 5.2143, + "step": 12352 + }, + { + "epoch": 0.06, + "global_step": 12353, + "learning_rate": 0.0004492779632721202, + "loss": 1.6275, + "loss_base2": 2.348, + "loss_pixel": 0.1592, + "loss_text": 1.4683, + "ppl": 5.0911, + "step": 12353 + }, + { + "epoch": 0.06, + "global_step": 12354, + "learning_rate": 0.00044927378964941566, + "loss": 1.6408, + "loss_base2": 2.3672, + "loss_pixel": 0.1572, + "loss_text": 1.4836, + "ppl": 5.1593, + "step": 12354 + }, + { + "epoch": 0.06, + "global_step": 12355, + "learning_rate": 0.00044926961602671117, + "loss": 1.6208, + "loss_base2": 2.3383, + "loss_pixel": 0.1565, + "loss_text": 1.4644, + "ppl": 5.0571, + "step": 12355 + }, + { + "epoch": 0.06, + "global_step": 12356, + "learning_rate": 0.0004492654424040067, + "loss": 1.6183, + "loss_base2": 2.3347, + "loss_pixel": 0.1576, + "loss_text": 1.4606, + "ppl": 5.0445, + "step": 12356 + }, + { + "epoch": 0.06, + "global_step": 12357, + "learning_rate": 0.0004492612687813022, + "loss": 1.6345, + "loss_base2": 2.3581, + "loss_pixel": 0.157, + "loss_text": 1.4774, + "ppl": 5.1269, + "step": 12357 + }, + { + "epoch": 0.06, + "global_step": 12358, + "learning_rate": 0.0004492570951585977, + "loss": 1.6221, + "loss_base2": 2.3402, + "loss_pixel": 0.1578, + "loss_text": 1.4643, + "ppl": 5.0637, + "step": 12358 + }, + { + "epoch": 0.06, + "global_step": 12359, + "learning_rate": 0.00044925292153589314, + "loss": 1.6257, + "loss_base2": 2.3454, + "loss_pixel": 0.1567, + "loss_text": 1.469, + "ppl": 5.082, + "step": 12359 + }, + { + "epoch": 0.06, + "global_step": 12360, + "learning_rate": 0.00044924874791318865, + "loss": 1.626, + "loss_base2": 2.3458, + "loss_pixel": 0.1578, + "loss_text": 1.4683, + "ppl": 5.0835, + "step": 12360 + }, + { + "epoch": 0.06, + "global_step": 12361, + "learning_rate": 0.00044924457429048416, + "loss": 1.6236, + "loss_base2": 2.3424, + "loss_pixel": 0.1583, + "loss_text": 1.4653, + "ppl": 5.0713, + "step": 12361 + }, + { + "epoch": 0.06, + "global_step": 12362, + "learning_rate": 0.00044924040066777966, + "loss": 1.6306, + "loss_base2": 2.3525, + "loss_pixel": 0.1586, + "loss_text": 1.472, + "ppl": 5.1069, + "step": 12362 + }, + { + "epoch": 0.06, + "global_step": 12363, + "learning_rate": 0.0004492362270450751, + "loss": 1.6161, + "loss_base2": 2.3315, + "loss_pixel": 0.1573, + "loss_text": 1.4589, + "ppl": 5.0334, + "step": 12363 + }, + { + "epoch": 0.06, + "global_step": 12364, + "learning_rate": 0.0004492320534223706, + "loss": 1.6061, + "loss_base2": 2.3171, + "loss_pixel": 0.1575, + "loss_text": 1.4486, + "ppl": 4.9833, + "step": 12364 + }, + { + "epoch": 0.06, + "global_step": 12365, + "learning_rate": 0.00044922787979966613, + "loss": 1.6242, + "loss_base2": 2.3432, + "loss_pixel": 0.1569, + "loss_text": 1.4673, + "ppl": 5.0744, + "step": 12365 + }, + { + "epoch": 0.06, + "global_step": 12366, + "learning_rate": 0.00044922370617696164, + "loss": 1.6303, + "loss_base2": 2.352, + "loss_pixel": 0.157, + "loss_text": 1.4733, + "ppl": 5.1054, + "step": 12366 + }, + { + "epoch": 0.06, + "global_step": 12367, + "learning_rate": 0.00044921953255425715, + "loss": 1.6077, + "loss_base2": 2.3194, + "loss_pixel": 0.1566, + "loss_text": 1.4511, + "ppl": 4.9913, + "step": 12367 + }, + { + "epoch": 0.06, + "global_step": 12368, + "learning_rate": 0.0004492153589315526, + "loss": 1.6298, + "loss_base2": 2.3513, + "loss_pixel": 0.1572, + "loss_text": 1.4726, + "ppl": 5.1029, + "step": 12368 + }, + { + "epoch": 0.06, + "global_step": 12369, + "learning_rate": 0.0004492111853088481, + "loss": 1.6351, + "loss_base2": 2.359, + "loss_pixel": 0.1585, + "loss_text": 1.4766, + "ppl": 5.13, + "step": 12369 + }, + { + "epoch": 0.06, + "global_step": 12370, + "learning_rate": 0.00044920701168614356, + "loss": 1.6183, + "loss_base2": 2.3347, + "loss_pixel": 0.1569, + "loss_text": 1.4615, + "ppl": 5.0445, + "step": 12370 + }, + { + "epoch": 0.06, + "global_step": 12371, + "learning_rate": 0.00044920283806343907, + "loss": 1.6054, + "loss_base2": 2.3161, + "loss_pixel": 0.1579, + "loss_text": 1.4475, + "ppl": 4.9799, + "step": 12371 + }, + { + "epoch": 0.06, + "global_step": 12372, + "learning_rate": 0.0004491986644407346, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.1579, + "loss_text": 1.4516, + "ppl": 5.0003, + "step": 12372 + }, + { + "epoch": 0.06, + "global_step": 12373, + "learning_rate": 0.00044919449081803, + "loss": 1.6086, + "loss_base2": 2.3207, + "loss_pixel": 0.1568, + "loss_text": 1.4518, + "ppl": 4.9958, + "step": 12373 + }, + { + "epoch": 0.06, + "global_step": 12374, + "learning_rate": 0.00044919031719532553, + "loss": 1.597, + "loss_base2": 2.304, + "loss_pixel": 0.1571, + "loss_text": 1.4399, + "ppl": 4.9382, + "step": 12374 + }, + { + "epoch": 0.06, + "global_step": 12375, + "learning_rate": 0.00044918614357262104, + "loss": 1.6171, + "loss_base2": 2.333, + "loss_pixel": 0.1563, + "loss_text": 1.4608, + "ppl": 5.0385, + "step": 12375 + }, + { + "epoch": 0.06, + "global_step": 12376, + "learning_rate": 0.00044918196994991655, + "loss": 1.6111, + "loss_base2": 2.3243, + "loss_pixel": 0.1574, + "loss_text": 1.4537, + "ppl": 5.0083, + "step": 12376 + }, + { + "epoch": 0.06, + "global_step": 12377, + "learning_rate": 0.000449177796327212, + "loss": 1.6061, + "loss_base2": 2.3171, + "loss_pixel": 0.1614, + "loss_text": 1.4447, + "ppl": 4.9833, + "step": 12377 + }, + { + "epoch": 0.06, + "global_step": 12378, + "learning_rate": 0.0004491736227045075, + "loss": 1.581, + "loss_base2": 2.2809, + "loss_pixel": 0.1574, + "loss_text": 1.4236, + "ppl": 4.8598, + "step": 12378 + }, + { + "epoch": 0.06, + "global_step": 12379, + "learning_rate": 0.000449169449081803, + "loss": 1.6116, + "loss_base2": 2.325, + "loss_pixel": 0.1584, + "loss_text": 1.4532, + "ppl": 5.0108, + "step": 12379 + }, + { + "epoch": 0.06, + "global_step": 12380, + "learning_rate": 0.0004491652754590985, + "loss": 1.6047, + "loss_base2": 2.3151, + "loss_pixel": 0.1566, + "loss_text": 1.4482, + "ppl": 4.9764, + "step": 12380 + }, + { + "epoch": 0.06, + "global_step": 12381, + "learning_rate": 0.00044916110183639403, + "loss": 1.6089, + "loss_base2": 2.3212, + "loss_pixel": 0.1595, + "loss_text": 1.4494, + "ppl": 4.9973, + "step": 12381 + }, + { + "epoch": 0.06, + "global_step": 12382, + "learning_rate": 0.0004491569282136895, + "loss": 1.6044, + "loss_base2": 2.3147, + "loss_pixel": 0.158, + "loss_text": 1.4464, + "ppl": 4.9749, + "step": 12382 + }, + { + "epoch": 0.06, + "global_step": 12383, + "learning_rate": 0.000449152754590985, + "loss": 1.6037, + "loss_base2": 2.3137, + "loss_pixel": 0.1558, + "loss_text": 1.4479, + "ppl": 4.9714, + "step": 12383 + }, + { + "epoch": 0.06, + "global_step": 12384, + "learning_rate": 0.0004491485809682805, + "loss": 1.6119, + "loss_base2": 2.3255, + "loss_pixel": 0.1552, + "loss_text": 1.4567, + "ppl": 5.0123, + "step": 12384 + }, + { + "epoch": 0.06, + "global_step": 12385, + "learning_rate": 0.000449144407345576, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1574, + "loss_text": 1.4578, + "ppl": 5.0284, + "step": 12385 + }, + { + "epoch": 0.06, + "global_step": 12386, + "learning_rate": 0.00044914023372287146, + "loss": 1.5994, + "loss_base2": 2.3074, + "loss_pixel": 0.1571, + "loss_text": 1.4423, + "ppl": 4.9501, + "step": 12386 + }, + { + "epoch": 0.06, + "global_step": 12387, + "learning_rate": 0.00044913606010016697, + "loss": 1.6114, + "loss_base2": 2.3248, + "loss_pixel": 0.1571, + "loss_text": 1.4543, + "ppl": 5.0098, + "step": 12387 + }, + { + "epoch": 0.06, + "global_step": 12388, + "learning_rate": 0.0004491318864774625, + "loss": 1.592, + "loss_base2": 2.2968, + "loss_pixel": 0.1573, + "loss_text": 1.4347, + "ppl": 4.9136, + "step": 12388 + }, + { + "epoch": 0.06, + "global_step": 12389, + "learning_rate": 0.00044912771285475793, + "loss": 1.6176, + "loss_base2": 2.3337, + "loss_pixel": 0.1579, + "loss_text": 1.4597, + "ppl": 5.041, + "step": 12389 + }, + { + "epoch": 0.06, + "global_step": 12390, + "learning_rate": 0.00044912353923205343, + "loss": 1.6044, + "loss_base2": 2.3147, + "loss_pixel": 0.1594, + "loss_text": 1.4449, + "ppl": 4.9749, + "step": 12390 + }, + { + "epoch": 0.06, + "global_step": 12391, + "learning_rate": 0.0004491193656093489, + "loss": 1.6155, + "loss_base2": 2.3307, + "loss_pixel": 0.1565, + "loss_text": 1.459, + "ppl": 5.0304, + "step": 12391 + }, + { + "epoch": 0.06, + "global_step": 12392, + "learning_rate": 0.0004491151919866444, + "loss": 1.6088, + "loss_base2": 2.321, + "loss_pixel": 0.1571, + "loss_text": 1.4517, + "ppl": 4.9968, + "step": 12392 + }, + { + "epoch": 0.06, + "global_step": 12393, + "learning_rate": 0.0004491110183639399, + "loss": 1.6072, + "loss_base2": 2.3187, + "loss_pixel": 0.1566, + "loss_text": 1.4506, + "ppl": 4.9888, + "step": 12393 + }, + { + "epoch": 0.06, + "global_step": 12394, + "learning_rate": 0.0004491068447412354, + "loss": 1.5904, + "loss_base2": 2.2945, + "loss_pixel": 0.1564, + "loss_text": 1.4341, + "ppl": 4.9057, + "step": 12394 + }, + { + "epoch": 0.06, + "global_step": 12395, + "learning_rate": 0.00044910267111853086, + "loss": 1.6122, + "loss_base2": 2.3259, + "loss_pixel": 0.158, + "loss_text": 1.4542, + "ppl": 5.0138, + "step": 12395 + }, + { + "epoch": 0.06, + "global_step": 12396, + "learning_rate": 0.00044909849749582637, + "loss": 1.6084, + "loss_base2": 2.3204, + "loss_pixel": 0.1574, + "loss_text": 1.451, + "ppl": 4.9948, + "step": 12396 + }, + { + "epoch": 0.06, + "global_step": 12397, + "learning_rate": 0.0004490943238731219, + "loss": 1.6051, + "loss_base2": 2.3157, + "loss_pixel": 0.1588, + "loss_text": 1.4463, + "ppl": 4.9784, + "step": 12397 + }, + { + "epoch": 0.06, + "global_step": 12398, + "learning_rate": 0.0004490901502504174, + "loss": 1.6088, + "loss_base2": 2.321, + "loss_pixel": 0.1576, + "loss_text": 1.4512, + "ppl": 4.9968, + "step": 12398 + }, + { + "epoch": 0.06, + "global_step": 12399, + "learning_rate": 0.0004490859766277129, + "loss": 1.5934, + "loss_base2": 2.2988, + "loss_pixel": 0.1576, + "loss_text": 1.4358, + "ppl": 4.9205, + "step": 12399 + }, + { + "epoch": 0.06, + "global_step": 12400, + "learning_rate": 0.00044908180300500835, + "loss": 1.5902, + "loss_base2": 2.2942, + "loss_pixel": 0.1564, + "loss_text": 1.4337, + "ppl": 4.9047, + "step": 12400 + }, + { + "epoch": 0.06, + "global_step": 12401, + "learning_rate": 0.00044907762938230385, + "loss": 1.6039, + "loss_base2": 2.3139, + "loss_pixel": 0.1559, + "loss_text": 1.4479, + "ppl": 4.9724, + "step": 12401 + }, + { + "epoch": 0.06, + "global_step": 12402, + "learning_rate": 0.00044907345575959936, + "loss": 1.579, + "loss_base2": 2.278, + "loss_pixel": 0.1573, + "loss_text": 1.4217, + "ppl": 4.8501, + "step": 12402 + }, + { + "epoch": 0.06, + "global_step": 12403, + "learning_rate": 0.00044906928213689487, + "loss": 1.6104, + "loss_base2": 2.3233, + "loss_pixel": 0.1564, + "loss_text": 1.454, + "ppl": 5.0048, + "step": 12403 + }, + { + "epoch": 0.06, + "global_step": 12404, + "learning_rate": 0.0004490651085141903, + "loss": 1.6009, + "loss_base2": 2.3096, + "loss_pixel": 0.1568, + "loss_text": 1.4441, + "ppl": 4.9575, + "step": 12404 + }, + { + "epoch": 0.06, + "global_step": 12405, + "learning_rate": 0.00044906093489148583, + "loss": 1.5986, + "loss_base2": 2.3063, + "loss_pixel": 0.1582, + "loss_text": 1.4404, + "ppl": 4.9461, + "step": 12405 + }, + { + "epoch": 0.06, + "global_step": 12406, + "learning_rate": 0.00044905676126878133, + "loss": 1.5867, + "loss_base2": 2.2891, + "loss_pixel": 0.1581, + "loss_text": 1.4287, + "ppl": 4.8876, + "step": 12406 + }, + { + "epoch": 0.06, + "global_step": 12407, + "learning_rate": 0.00044905258764607684, + "loss": 1.6121, + "loss_base2": 2.3258, + "loss_pixel": 0.1566, + "loss_text": 1.4555, + "ppl": 5.0133, + "step": 12407 + }, + { + "epoch": 0.06, + "global_step": 12408, + "learning_rate": 0.0004490484140233723, + "loss": 1.6055, + "loss_base2": 2.3162, + "loss_pixel": 0.1579, + "loss_text": 1.4476, + "ppl": 4.9803, + "step": 12408 + }, + { + "epoch": 0.06, + "global_step": 12409, + "learning_rate": 0.00044904424040066775, + "loss": 1.6015, + "loss_base2": 2.3105, + "loss_pixel": 0.156, + "loss_text": 1.4455, + "ppl": 4.9605, + "step": 12409 + }, + { + "epoch": 0.06, + "global_step": 12410, + "learning_rate": 0.00044904006677796326, + "loss": 1.5959, + "loss_base2": 2.3024, + "loss_pixel": 0.1563, + "loss_text": 1.4396, + "ppl": 4.9328, + "step": 12410 + }, + { + "epoch": 0.06, + "global_step": 12411, + "learning_rate": 0.00044903589315525876, + "loss": 1.6066, + "loss_base2": 2.3178, + "loss_pixel": 0.1576, + "loss_text": 1.449, + "ppl": 4.9858, + "step": 12411 + }, + { + "epoch": 0.06, + "global_step": 12412, + "learning_rate": 0.00044903171953255427, + "loss": 1.614, + "loss_base2": 2.3285, + "loss_pixel": 0.1568, + "loss_text": 1.4572, + "ppl": 5.0229, + "step": 12412 + }, + { + "epoch": 0.06, + "global_step": 12413, + "learning_rate": 0.0004490275459098497, + "loss": 1.5921, + "loss_base2": 2.2969, + "loss_pixel": 0.158, + "loss_text": 1.4341, + "ppl": 4.9141, + "step": 12413 + }, + { + "epoch": 0.06, + "global_step": 12414, + "learning_rate": 0.00044902337228714523, + "loss": 1.6133, + "loss_base2": 2.3275, + "loss_pixel": 0.1575, + "loss_text": 1.4558, + "ppl": 5.0193, + "step": 12414 + }, + { + "epoch": 0.06, + "global_step": 12415, + "learning_rate": 0.00044901919866444074, + "loss": 1.6054, + "loss_base2": 2.3161, + "loss_pixel": 0.1567, + "loss_text": 1.4487, + "ppl": 4.9799, + "step": 12415 + }, + { + "epoch": 0.06, + "global_step": 12416, + "learning_rate": 0.00044901502504173625, + "loss": 1.5894, + "loss_base2": 2.293, + "loss_pixel": 0.1587, + "loss_text": 1.4307, + "ppl": 4.9008, + "step": 12416 + }, + { + "epoch": 0.06, + "global_step": 12417, + "learning_rate": 0.00044901085141903175, + "loss": 1.5844, + "loss_base2": 2.2858, + "loss_pixel": 0.1581, + "loss_text": 1.4263, + "ppl": 4.8764, + "step": 12417 + }, + { + "epoch": 0.06, + "global_step": 12418, + "learning_rate": 0.0004490066777963272, + "loss": 1.3899, + "loss_base2": 2.0052, + "loss_pixel": 0.1579, + "loss_text": 1.2321, + "ppl": 4.0144, + "step": 12418 + }, + { + "epoch": 0.06, + "global_step": 12419, + "learning_rate": 0.0004490025041736227, + "loss": 1.3861, + "loss_base2": 1.9997, + "loss_pixel": 0.1576, + "loss_text": 1.2284, + "ppl": 3.9992, + "step": 12419 + }, + { + "epoch": 0.06, + "global_step": 12420, + "learning_rate": 0.0004489983305509182, + "loss": 1.3868, + "loss_base2": 2.0007, + "loss_pixel": 0.1577, + "loss_text": 1.2291, + "ppl": 4.002, + "step": 12420 + }, + { + "epoch": 0.06, + "global_step": 12421, + "learning_rate": 0.00044899415692821373, + "loss": 1.3825, + "loss_base2": 1.9945, + "loss_pixel": 0.1574, + "loss_text": 1.2251, + "ppl": 3.9849, + "step": 12421 + }, + { + "epoch": 0.06, + "global_step": 12422, + "learning_rate": 0.0004489899833055092, + "loss": 1.3789, + "loss_base2": 1.9893, + "loss_pixel": 0.1573, + "loss_text": 1.2215, + "ppl": 3.9705, + "step": 12422 + }, + { + "epoch": 0.06, + "global_step": 12423, + "learning_rate": 0.0004489858096828047, + "loss": 1.389, + "loss_base2": 2.0039, + "loss_pixel": 0.157, + "loss_text": 1.232, + "ppl": 4.0108, + "step": 12423 + }, + { + "epoch": 0.06, + "global_step": 12424, + "learning_rate": 0.0004489816360601002, + "loss": 1.3679, + "loss_base2": 1.9735, + "loss_pixel": 0.1589, + "loss_text": 1.209, + "ppl": 3.9271, + "step": 12424 + }, + { + "epoch": 0.06, + "global_step": 12425, + "learning_rate": 0.0004489774624373957, + "loss": 1.3701, + "loss_base2": 1.9766, + "loss_pixel": 0.1576, + "loss_text": 1.2125, + "ppl": 3.9357, + "step": 12425 + }, + { + "epoch": 0.06, + "global_step": 12426, + "learning_rate": 0.0004489732888146912, + "loss": 1.3608, + "loss_base2": 1.9632, + "loss_pixel": 0.1549, + "loss_text": 1.2059, + "ppl": 3.8993, + "step": 12426 + }, + { + "epoch": 0.06, + "global_step": 12427, + "learning_rate": 0.0004489691151919866, + "loss": 1.3555, + "loss_base2": 1.9556, + "loss_pixel": 0.1569, + "loss_text": 1.1987, + "ppl": 3.8787, + "step": 12427 + }, + { + "epoch": 0.06, + "global_step": 12428, + "learning_rate": 0.0004489649415692821, + "loss": 1.3733, + "loss_base2": 1.9813, + "loss_pixel": 0.1582, + "loss_text": 1.2151, + "ppl": 3.9484, + "step": 12428 + }, + { + "epoch": 0.06, + "global_step": 12429, + "learning_rate": 0.0004489607679465776, + "loss": 1.3699, + "loss_base2": 1.9763, + "loss_pixel": 0.157, + "loss_text": 1.2129, + "ppl": 3.935, + "step": 12429 + }, + { + "epoch": 0.06, + "global_step": 12430, + "learning_rate": 0.00044895659432387313, + "loss": 1.3654, + "loss_base2": 1.9699, + "loss_pixel": 0.1562, + "loss_text": 1.2092, + "ppl": 3.9173, + "step": 12430 + }, + { + "epoch": 0.06, + "global_step": 12431, + "learning_rate": 0.00044895242070116864, + "loss": 1.373, + "loss_base2": 1.9808, + "loss_pixel": 0.1544, + "loss_text": 1.2186, + "ppl": 3.9472, + "step": 12431 + }, + { + "epoch": 0.06, + "global_step": 12432, + "learning_rate": 0.0004489482470784641, + "loss": 1.3744, + "loss_base2": 1.9828, + "loss_pixel": 0.1571, + "loss_text": 1.2173, + "ppl": 3.9527, + "step": 12432 + }, + { + "epoch": 0.06, + "global_step": 12433, + "learning_rate": 0.0004489440734557596, + "loss": 1.5606, + "loss_base2": 2.2515, + "loss_pixel": 0.1576, + "loss_text": 1.4029, + "ppl": 4.7617, + "step": 12433 + }, + { + "epoch": 0.06, + "global_step": 12434, + "learning_rate": 0.0004489398998330551, + "loss": 1.6347, + "loss_base2": 2.3584, + "loss_pixel": 0.1566, + "loss_text": 1.4781, + "ppl": 5.1279, + "step": 12434 + }, + { + "epoch": 0.06, + "global_step": 12435, + "learning_rate": 0.0004489357262103506, + "loss": 1.6317, + "loss_base2": 2.354, + "loss_pixel": 0.1583, + "loss_text": 1.4734, + "ppl": 5.1126, + "step": 12435 + }, + { + "epoch": 0.06, + "global_step": 12436, + "learning_rate": 0.00044893155258764607, + "loss": 1.5954, + "loss_base2": 2.3017, + "loss_pixel": 0.1583, + "loss_text": 1.437, + "ppl": 4.9303, + "step": 12436 + }, + { + "epoch": 0.06, + "global_step": 12437, + "learning_rate": 0.0004489273789649416, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1565, + "loss_text": 1.4585, + "ppl": 5.0284, + "step": 12437 + }, + { + "epoch": 0.06, + "global_step": 12438, + "learning_rate": 0.0004489232053422371, + "loss": 1.6133, + "loss_base2": 2.3275, + "loss_pixel": 0.1567, + "loss_text": 1.4566, + "ppl": 5.0193, + "step": 12438 + }, + { + "epoch": 0.06, + "global_step": 12439, + "learning_rate": 0.0004489190317195326, + "loss": 1.6152, + "loss_base2": 2.3302, + "loss_pixel": 0.1581, + "loss_text": 1.4571, + "ppl": 5.0289, + "step": 12439 + }, + { + "epoch": 0.06, + "global_step": 12440, + "learning_rate": 0.0004489148580968281, + "loss": 1.6178, + "loss_base2": 2.334, + "loss_pixel": 0.1572, + "loss_text": 1.4606, + "ppl": 5.042, + "step": 12440 + }, + { + "epoch": 0.06, + "global_step": 12441, + "learning_rate": 0.00044891068447412355, + "loss": 1.6093, + "loss_base2": 2.3217, + "loss_pixel": 0.1575, + "loss_text": 1.4518, + "ppl": 4.9993, + "step": 12441 + }, + { + "epoch": 0.06, + "global_step": 12442, + "learning_rate": 0.00044890651085141906, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.1575, + "loss_text": 1.4484, + "ppl": 4.9823, + "step": 12442 + }, + { + "epoch": 0.06, + "global_step": 12443, + "learning_rate": 0.00044890233722871456, + "loss": 1.5999, + "loss_base2": 2.3082, + "loss_pixel": 0.157, + "loss_text": 1.4429, + "ppl": 4.9525, + "step": 12443 + }, + { + "epoch": 0.06, + "global_step": 12444, + "learning_rate": 0.00044889816360601007, + "loss": 1.5986, + "loss_base2": 2.3063, + "loss_pixel": 0.1548, + "loss_text": 1.4438, + "ppl": 4.9461, + "step": 12444 + }, + { + "epoch": 0.06, + "global_step": 12445, + "learning_rate": 0.00044889398998330547, + "loss": 1.6234, + "loss_base2": 2.3421, + "loss_pixel": 0.157, + "loss_text": 1.4664, + "ppl": 5.0703, + "step": 12445 + }, + { + "epoch": 0.06, + "global_step": 12446, + "learning_rate": 0.000448889816360601, + "loss": 1.5929, + "loss_base2": 2.2981, + "loss_pixel": 0.1575, + "loss_text": 1.4354, + "ppl": 4.918, + "step": 12446 + }, + { + "epoch": 0.06, + "global_step": 12447, + "learning_rate": 0.0004488856427378965, + "loss": 1.6016, + "loss_base2": 2.3106, + "loss_pixel": 0.1584, + "loss_text": 1.4432, + "ppl": 4.961, + "step": 12447 + }, + { + "epoch": 0.06, + "global_step": 12448, + "learning_rate": 0.000448881469115192, + "loss": 1.6064, + "loss_base2": 2.3175, + "loss_pixel": 0.1562, + "loss_text": 1.4502, + "ppl": 4.9848, + "step": 12448 + }, + { + "epoch": 0.06, + "global_step": 12449, + "learning_rate": 0.0004488772954924875, + "loss": 1.6102, + "loss_base2": 2.323, + "loss_pixel": 0.1561, + "loss_text": 1.4541, + "ppl": 5.0038, + "step": 12449 + }, + { + "epoch": 0.06, + "global_step": 12450, + "learning_rate": 0.00044887312186978295, + "loss": 1.597, + "loss_base2": 2.304, + "loss_pixel": 0.1566, + "loss_text": 1.4404, + "ppl": 4.9382, + "step": 12450 + }, + { + "epoch": 0.06, + "global_step": 12451, + "learning_rate": 0.00044886894824707846, + "loss": 1.6087, + "loss_base2": 2.3209, + "loss_pixel": 0.1564, + "loss_text": 1.4523, + "ppl": 4.9963, + "step": 12451 + }, + { + "epoch": 0.06, + "global_step": 12452, + "learning_rate": 0.00044886477462437397, + "loss": 1.6082, + "loss_base2": 2.3201, + "loss_pixel": 0.1573, + "loss_text": 1.451, + "ppl": 4.9938, + "step": 12452 + }, + { + "epoch": 0.06, + "global_step": 12453, + "learning_rate": 0.0004488606010016695, + "loss": 1.5983, + "loss_base2": 2.3059, + "loss_pixel": 0.1557, + "loss_text": 1.4426, + "ppl": 4.9446, + "step": 12453 + }, + { + "epoch": 0.06, + "global_step": 12454, + "learning_rate": 0.00044885642737896493, + "loss": 1.6158, + "loss_base2": 2.3311, + "loss_pixel": 0.1568, + "loss_text": 1.459, + "ppl": 5.0319, + "step": 12454 + }, + { + "epoch": 0.06, + "global_step": 12455, + "learning_rate": 0.00044885225375626043, + "loss": 1.5986, + "loss_base2": 2.3063, + "loss_pixel": 0.1561, + "loss_text": 1.4425, + "ppl": 4.9461, + "step": 12455 + }, + { + "epoch": 0.06, + "global_step": 12456, + "learning_rate": 0.00044884808013355594, + "loss": 1.614, + "loss_base2": 2.3285, + "loss_pixel": 0.1565, + "loss_text": 1.4575, + "ppl": 5.0229, + "step": 12456 + }, + { + "epoch": 0.06, + "global_step": 12457, + "learning_rate": 0.00044884390651085145, + "loss": 1.5304, + "loss_base2": 2.2079, + "loss_pixel": 0.1573, + "loss_text": 1.3731, + "ppl": 4.62, + "step": 12457 + }, + { + "epoch": 0.06, + "global_step": 12458, + "learning_rate": 0.00044883973288814696, + "loss": 1.3809, + "loss_base2": 1.9922, + "loss_pixel": 0.156, + "loss_text": 1.2249, + "ppl": 3.9785, + "step": 12458 + }, + { + "epoch": 0.06, + "global_step": 12459, + "learning_rate": 0.0004488355592654424, + "loss": 1.3857, + "loss_base2": 1.9991, + "loss_pixel": 0.156, + "loss_text": 1.2297, + "ppl": 3.9976, + "step": 12459 + }, + { + "epoch": 0.06, + "global_step": 12460, + "learning_rate": 0.0004488313856427379, + "loss": 1.372, + "loss_base2": 1.9794, + "loss_pixel": 0.1578, + "loss_text": 1.2143, + "ppl": 3.9432, + "step": 12460 + }, + { + "epoch": 0.06, + "global_step": 12461, + "learning_rate": 0.0004488272120200334, + "loss": 1.3561, + "loss_base2": 1.9564, + "loss_pixel": 0.1565, + "loss_text": 1.1996, + "ppl": 3.881, + "step": 12461 + }, + { + "epoch": 0.06, + "global_step": 12462, + "learning_rate": 0.00044882303839732893, + "loss": 1.3905, + "loss_base2": 2.0061, + "loss_pixel": 0.1559, + "loss_text": 1.2345, + "ppl": 4.0169, + "step": 12462 + }, + { + "epoch": 0.06, + "global_step": 12463, + "learning_rate": 0.0004488188647746244, + "loss": 1.3841, + "loss_base2": 1.9968, + "loss_pixel": 0.1571, + "loss_text": 1.227, + "ppl": 3.9912, + "step": 12463 + }, + { + "epoch": 0.06, + "global_step": 12464, + "learning_rate": 0.00044881469115191984, + "loss": 1.3894, + "loss_base2": 2.0045, + "loss_pixel": 0.1572, + "loss_text": 1.2322, + "ppl": 4.0124, + "step": 12464 + }, + { + "epoch": 0.06, + "global_step": 12465, + "learning_rate": 0.00044881051752921535, + "loss": 1.5052, + "loss_base2": 2.1715, + "loss_pixel": 0.1576, + "loss_text": 1.3476, + "ppl": 4.5051, + "step": 12465 + }, + { + "epoch": 0.06, + "global_step": 12466, + "learning_rate": 0.00044880634390651085, + "loss": 1.5295, + "loss_base2": 2.2066, + "loss_pixel": 0.1571, + "loss_text": 1.3724, + "ppl": 4.6159, + "step": 12466 + }, + { + "epoch": 0.06, + "global_step": 12467, + "learning_rate": 0.00044880217028380636, + "loss": 1.5187, + "loss_base2": 2.191, + "loss_pixel": 0.1571, + "loss_text": 1.3616, + "ppl": 4.5663, + "step": 12467 + }, + { + "epoch": 0.06, + "global_step": 12468, + "learning_rate": 0.0004487979966611018, + "loss": 1.5177, + "loss_base2": 2.1896, + "loss_pixel": 0.157, + "loss_text": 1.3608, + "ppl": 4.5617, + "step": 12468 + }, + { + "epoch": 0.06, + "global_step": 12469, + "learning_rate": 0.0004487938230383973, + "loss": 1.5954, + "loss_base2": 2.3017, + "loss_pixel": 0.1582, + "loss_text": 1.4371, + "ppl": 4.9303, + "step": 12469 + }, + { + "epoch": 0.06, + "global_step": 12470, + "learning_rate": 0.00044878964941569283, + "loss": 1.6076, + "loss_base2": 2.3193, + "loss_pixel": 0.1574, + "loss_text": 1.4503, + "ppl": 4.9908, + "step": 12470 + }, + { + "epoch": 0.06, + "global_step": 12471, + "learning_rate": 0.00044878547579298833, + "loss": 1.6203, + "loss_base2": 2.3376, + "loss_pixel": 0.1571, + "loss_text": 1.4632, + "ppl": 5.0546, + "step": 12471 + }, + { + "epoch": 0.06, + "global_step": 12472, + "learning_rate": 0.0004487813021702838, + "loss": 1.6139, + "loss_base2": 2.3284, + "loss_pixel": 0.1568, + "loss_text": 1.4571, + "ppl": 5.0224, + "step": 12472 + }, + { + "epoch": 0.06, + "global_step": 12473, + "learning_rate": 0.0004487771285475793, + "loss": 1.612, + "loss_base2": 2.3256, + "loss_pixel": 0.1564, + "loss_text": 1.4556, + "ppl": 5.0128, + "step": 12473 + }, + { + "epoch": 0.06, + "global_step": 12474, + "learning_rate": 0.0004487729549248748, + "loss": 1.5994, + "loss_base2": 2.3074, + "loss_pixel": 0.1573, + "loss_text": 1.4421, + "ppl": 4.9501, + "step": 12474 + }, + { + "epoch": 0.06, + "global_step": 12475, + "learning_rate": 0.0004487687813021703, + "loss": 1.6079, + "loss_base2": 2.3197, + "loss_pixel": 0.1568, + "loss_text": 1.4511, + "ppl": 4.9923, + "step": 12475 + }, + { + "epoch": 0.06, + "global_step": 12476, + "learning_rate": 0.0004487646076794658, + "loss": 1.6105, + "loss_base2": 2.3235, + "loss_pixel": 0.1562, + "loss_text": 1.4543, + "ppl": 5.0053, + "step": 12476 + }, + { + "epoch": 0.06, + "global_step": 12477, + "learning_rate": 0.00044876043405676127, + "loss": 1.6211, + "loss_base2": 2.3388, + "loss_pixel": 0.1561, + "loss_text": 1.465, + "ppl": 5.0587, + "step": 12477 + }, + { + "epoch": 0.06, + "global_step": 12478, + "learning_rate": 0.0004487562604340568, + "loss": 1.6103, + "loss_base2": 2.3232, + "loss_pixel": 0.1569, + "loss_text": 1.4535, + "ppl": 5.0043, + "step": 12478 + }, + { + "epoch": 0.06, + "global_step": 12479, + "learning_rate": 0.0004487520868113523, + "loss": 1.6145, + "loss_base2": 2.3292, + "loss_pixel": 0.1567, + "loss_text": 1.4578, + "ppl": 5.0254, + "step": 12479 + }, + { + "epoch": 0.06, + "global_step": 12480, + "learning_rate": 0.0004487479131886478, + "loss": 1.6065, + "loss_base2": 2.3177, + "loss_pixel": 0.1565, + "loss_text": 1.45, + "ppl": 4.9853, + "step": 12480 + }, + { + "epoch": 0.06, + "global_step": 12481, + "learning_rate": 0.00044874373956594325, + "loss": 1.605, + "loss_base2": 2.3155, + "loss_pixel": 0.1564, + "loss_text": 1.4487, + "ppl": 4.9779, + "step": 12481 + }, + { + "epoch": 0.06, + "global_step": 12482, + "learning_rate": 0.00044873956594323875, + "loss": 1.5944, + "loss_base2": 2.3002, + "loss_pixel": 0.1569, + "loss_text": 1.4374, + "ppl": 4.9254, + "step": 12482 + }, + { + "epoch": 0.06, + "global_step": 12483, + "learning_rate": 0.0004487353923205342, + "loss": 1.6004, + "loss_base2": 2.3089, + "loss_pixel": 0.1566, + "loss_text": 1.4437, + "ppl": 4.955, + "step": 12483 + }, + { + "epoch": 0.06, + "global_step": 12484, + "learning_rate": 0.0004487312186978297, + "loss": 1.6015, + "loss_base2": 2.3105, + "loss_pixel": 0.1566, + "loss_text": 1.4449, + "ppl": 4.9605, + "step": 12484 + }, + { + "epoch": 0.06, + "global_step": 12485, + "learning_rate": 0.0004487270450751252, + "loss": 1.5975, + "loss_base2": 2.3047, + "loss_pixel": 0.1579, + "loss_text": 1.4397, + "ppl": 4.9407, + "step": 12485 + }, + { + "epoch": 0.06, + "global_step": 12486, + "learning_rate": 0.0004487228714524207, + "loss": 1.5932, + "loss_base2": 2.2985, + "loss_pixel": 0.157, + "loss_text": 1.4362, + "ppl": 4.9195, + "step": 12486 + }, + { + "epoch": 0.06, + "global_step": 12487, + "learning_rate": 0.0004487186978297162, + "loss": 1.6208, + "loss_base2": 2.3383, + "loss_pixel": 0.1571, + "loss_text": 1.4637, + "ppl": 5.0571, + "step": 12487 + }, + { + "epoch": 0.06, + "global_step": 12488, + "learning_rate": 0.0004487145242070117, + "loss": 1.5979, + "loss_base2": 2.3053, + "loss_pixel": 0.1562, + "loss_text": 1.4417, + "ppl": 4.9426, + "step": 12488 + }, + { + "epoch": 0.06, + "global_step": 12489, + "learning_rate": 0.0004487103505843072, + "loss": 1.6027, + "loss_base2": 2.3122, + "loss_pixel": 0.1548, + "loss_text": 1.4479, + "ppl": 4.9664, + "step": 12489 + }, + { + "epoch": 0.06, + "global_step": 12490, + "learning_rate": 0.0004487061769616027, + "loss": 1.569, + "loss_base2": 2.2636, + "loss_pixel": 0.1482, + "loss_text": 1.4209, + "ppl": 4.8018, + "step": 12490 + }, + { + "epoch": 0.06, + "global_step": 12491, + "learning_rate": 0.00044870200333889816, + "loss": 1.596, + "loss_base2": 2.3025, + "loss_pixel": 0.1495, + "loss_text": 1.4465, + "ppl": 4.9333, + "step": 12491 + }, + { + "epoch": 0.06, + "global_step": 12492, + "learning_rate": 0.00044869782971619366, + "loss": 1.5613, + "loss_base2": 2.2525, + "loss_pixel": 0.1487, + "loss_text": 1.4126, + "ppl": 4.765, + "step": 12492 + }, + { + "epoch": 0.06, + "global_step": 12493, + "learning_rate": 0.00044869365609348917, + "loss": 1.4832, + "loss_base2": 2.1398, + "loss_pixel": 0.1506, + "loss_text": 1.3326, + "ppl": 4.407, + "step": 12493 + }, + { + "epoch": 0.06, + "global_step": 12494, + "learning_rate": 0.0004486894824707847, + "loss": 1.3721, + "loss_base2": 1.9795, + "loss_pixel": 0.1514, + "loss_text": 1.2207, + "ppl": 3.9436, + "step": 12494 + }, + { + "epoch": 0.06, + "global_step": 12495, + "learning_rate": 0.00044868530884808013, + "loss": 1.3722, + "loss_base2": 1.9797, + "loss_pixel": 0.1477, + "loss_text": 1.2245, + "ppl": 3.944, + "step": 12495 + }, + { + "epoch": 0.06, + "global_step": 12496, + "learning_rate": 0.00044868113522537564, + "loss": 1.3587, + "loss_base2": 1.9602, + "loss_pixel": 0.1484, + "loss_text": 1.2103, + "ppl": 3.8911, + "step": 12496 + }, + { + "epoch": 0.06, + "global_step": 12497, + "learning_rate": 0.00044867696160267115, + "loss": 1.3726, + "loss_base2": 1.9802, + "loss_pixel": 0.1457, + "loss_text": 1.2269, + "ppl": 3.9456, + "step": 12497 + }, + { + "epoch": 0.06, + "global_step": 12498, + "learning_rate": 0.00044867278797996665, + "loss": 1.3695, + "loss_base2": 1.9758, + "loss_pixel": 0.146, + "loss_text": 1.2235, + "ppl": 3.9334, + "step": 12498 + }, + { + "epoch": 0.06, + "global_step": 12499, + "learning_rate": 0.00044866861435726216, + "loss": 1.3657, + "loss_base2": 1.9703, + "loss_pixel": 0.1469, + "loss_text": 1.2189, + "ppl": 3.9185, + "step": 12499 + }, + { + "epoch": 0.06, + "global_step": 12500, + "learning_rate": 0.0004486644407345576, + "loss": 1.3438, + "loss_base2": 1.9387, + "loss_pixel": 0.1462, + "loss_text": 1.1975, + "ppl": 3.8336, + "step": 12500 + }, + { + "epoch": 0.06, + "global_step": 12501, + "learning_rate": 0.00044866026711185307, + "loss": 1.3932, + "loss_base2": 2.01, + "loss_pixel": 0.1484, + "loss_text": 1.2449, + "ppl": 4.0277, + "step": 12501 + }, + { + "epoch": 0.06, + "global_step": 12502, + "learning_rate": 0.0004486560934891486, + "loss": 1.3694, + "loss_base2": 1.9756, + "loss_pixel": 0.1458, + "loss_text": 1.2237, + "ppl": 3.933, + "step": 12502 + }, + { + "epoch": 0.06, + "global_step": 12503, + "learning_rate": 0.0004486519198664441, + "loss": 1.344, + "loss_base2": 1.939, + "loss_pixel": 0.1469, + "loss_text": 1.1971, + "ppl": 3.8344, + "step": 12503 + }, + { + "epoch": 0.06, + "global_step": 12504, + "learning_rate": 0.00044864774624373953, + "loss": 1.3703, + "loss_base2": 1.9769, + "loss_pixel": 0.1463, + "loss_text": 1.224, + "ppl": 3.9365, + "step": 12504 + }, + { + "epoch": 0.06, + "global_step": 12505, + "learning_rate": 0.00044864357262103504, + "loss": 1.3606, + "loss_base2": 1.9629, + "loss_pixel": 0.1455, + "loss_text": 1.2152, + "ppl": 3.8985, + "step": 12505 + }, + { + "epoch": 0.06, + "global_step": 12506, + "learning_rate": 0.00044863939899833055, + "loss": 1.3684, + "loss_base2": 1.9742, + "loss_pixel": 0.1454, + "loss_text": 1.2229, + "ppl": 3.9291, + "step": 12506 + }, + { + "epoch": 0.06, + "global_step": 12507, + "learning_rate": 0.00044863522537562606, + "loss": 1.3617, + "loss_base2": 1.9645, + "loss_pixel": 0.1514, + "loss_text": 1.2102, + "ppl": 3.9028, + "step": 12507 + }, + { + "epoch": 0.06, + "global_step": 12508, + "learning_rate": 0.00044863105175292156, + "loss": 1.3732, + "loss_base2": 1.9811, + "loss_pixel": 0.1591, + "loss_text": 1.2141, + "ppl": 3.948, + "step": 12508 + }, + { + "epoch": 0.06, + "global_step": 12509, + "learning_rate": 0.000448626878130217, + "loss": 1.3754, + "loss_base2": 1.9843, + "loss_pixel": 0.1588, + "loss_text": 1.2166, + "ppl": 3.9567, + "step": 12509 + }, + { + "epoch": 0.06, + "global_step": 12510, + "learning_rate": 0.0004486227045075125, + "loss": 1.3706, + "loss_base2": 1.9774, + "loss_pixel": 0.1572, + "loss_text": 1.2134, + "ppl": 3.9377, + "step": 12510 + }, + { + "epoch": 0.06, + "global_step": 12511, + "learning_rate": 0.00044861853088480803, + "loss": 1.3733, + "loss_base2": 1.9813, + "loss_pixel": 0.1592, + "loss_text": 1.2141, + "ppl": 3.9484, + "step": 12511 + }, + { + "epoch": 0.06, + "global_step": 12512, + "learning_rate": 0.00044861435726210354, + "loss": 1.3812, + "loss_base2": 1.9927, + "loss_pixel": 0.1574, + "loss_text": 1.2238, + "ppl": 3.9797, + "step": 12512 + }, + { + "epoch": 0.06, + "global_step": 12513, + "learning_rate": 0.000448610183639399, + "loss": 1.3821, + "loss_base2": 1.9939, + "loss_pixel": 0.158, + "loss_text": 1.2241, + "ppl": 3.9833, + "step": 12513 + }, + { + "epoch": 0.06, + "global_step": 12514, + "learning_rate": 0.0004486060100166945, + "loss": 1.365, + "loss_base2": 1.9693, + "loss_pixel": 0.1577, + "loss_text": 1.2072, + "ppl": 3.9157, + "step": 12514 + }, + { + "epoch": 0.06, + "global_step": 12515, + "learning_rate": 0.00044860183639399, + "loss": 1.3605, + "loss_base2": 1.9628, + "loss_pixel": 0.1582, + "loss_text": 1.2023, + "ppl": 3.8981, + "step": 12515 + }, + { + "epoch": 0.06, + "global_step": 12516, + "learning_rate": 0.0004485976627712855, + "loss": 1.3626, + "loss_base2": 1.9658, + "loss_pixel": 0.1571, + "loss_text": 1.2055, + "ppl": 3.9063, + "step": 12516 + }, + { + "epoch": 0.06, + "global_step": 12517, + "learning_rate": 0.000448593489148581, + "loss": 1.3373, + "loss_base2": 1.9293, + "loss_pixel": 0.1575, + "loss_text": 1.1798, + "ppl": 3.8087, + "step": 12517 + }, + { + "epoch": 0.06, + "global_step": 12518, + "learning_rate": 0.0004485893155258765, + "loss": 1.3745, + "loss_base2": 1.983, + "loss_pixel": 0.1574, + "loss_text": 1.2172, + "ppl": 3.9531, + "step": 12518 + }, + { + "epoch": 0.06, + "global_step": 12519, + "learning_rate": 0.000448585141903172, + "loss": 1.3549, + "loss_base2": 1.9547, + "loss_pixel": 0.1574, + "loss_text": 1.1975, + "ppl": 3.8764, + "step": 12519 + }, + { + "epoch": 0.06, + "global_step": 12520, + "learning_rate": 0.00044858096828046743, + "loss": 1.5196, + "loss_base2": 2.1923, + "loss_pixel": 0.157, + "loss_text": 1.3626, + "ppl": 4.5704, + "step": 12520 + }, + { + "epoch": 0.06, + "global_step": 12521, + "learning_rate": 0.00044857679465776294, + "loss": 1.5148, + "loss_base2": 2.1854, + "loss_pixel": 0.1571, + "loss_text": 1.3578, + "ppl": 4.5485, + "step": 12521 + }, + { + "epoch": 0.06, + "global_step": 12522, + "learning_rate": 0.0004485726210350584, + "loss": 1.6228, + "loss_base2": 2.3412, + "loss_pixel": 0.1566, + "loss_text": 1.4662, + "ppl": 5.0673, + "step": 12522 + }, + { + "epoch": 0.06, + "global_step": 12523, + "learning_rate": 0.0004485684474123539, + "loss": 1.6412, + "loss_base2": 2.3678, + "loss_pixel": 0.1575, + "loss_text": 1.4837, + "ppl": 5.1614, + "step": 12523 + }, + { + "epoch": 0.06, + "global_step": 12524, + "learning_rate": 0.0004485642737896494, + "loss": 1.62, + "loss_base2": 2.3372, + "loss_pixel": 0.1587, + "loss_text": 1.4613, + "ppl": 5.0531, + "step": 12524 + }, + { + "epoch": 0.06, + "global_step": 12525, + "learning_rate": 0.0004485601001669449, + "loss": 1.6173, + "loss_base2": 2.3333, + "loss_pixel": 0.1587, + "loss_text": 1.4586, + "ppl": 5.0395, + "step": 12525 + }, + { + "epoch": 0.06, + "global_step": 12526, + "learning_rate": 0.0004485559265442404, + "loss": 1.6283, + "loss_base2": 2.3491, + "loss_pixel": 0.1578, + "loss_text": 1.4705, + "ppl": 5.0952, + "step": 12526 + }, + { + "epoch": 0.06, + "global_step": 12527, + "learning_rate": 0.0004485517529215359, + "loss": 1.6127, + "loss_base2": 2.3266, + "loss_pixel": 0.1585, + "loss_text": 1.4542, + "ppl": 5.0163, + "step": 12527 + }, + { + "epoch": 0.06, + "global_step": 12528, + "learning_rate": 0.0004485475792988314, + "loss": 1.6224, + "loss_base2": 2.3406, + "loss_pixel": 0.1579, + "loss_text": 1.4646, + "ppl": 5.0652, + "step": 12528 + }, + { + "epoch": 0.06, + "global_step": 12529, + "learning_rate": 0.0004485434056761269, + "loss": 1.6011, + "loss_base2": 2.3099, + "loss_pixel": 0.1579, + "loss_text": 1.4433, + "ppl": 4.9585, + "step": 12529 + }, + { + "epoch": 0.06, + "global_step": 12530, + "learning_rate": 0.0004485392320534224, + "loss": 1.6117, + "loss_base2": 2.3252, + "loss_pixel": 0.1573, + "loss_text": 1.4544, + "ppl": 5.0113, + "step": 12530 + }, + { + "epoch": 0.06, + "global_step": 12531, + "learning_rate": 0.00044853505843071785, + "loss": 1.6037, + "loss_base2": 2.3137, + "loss_pixel": 0.1584, + "loss_text": 1.4452, + "ppl": 4.9714, + "step": 12531 + }, + { + "epoch": 0.06, + "global_step": 12532, + "learning_rate": 0.00044853088480801336, + "loss": 1.6137, + "loss_base2": 2.3281, + "loss_pixel": 0.1584, + "loss_text": 1.4553, + "ppl": 5.0214, + "step": 12532 + }, + { + "epoch": 0.06, + "global_step": 12533, + "learning_rate": 0.00044852671118530887, + "loss": 1.6213, + "loss_base2": 2.339, + "loss_pixel": 0.1588, + "loss_text": 1.4624, + "ppl": 5.0597, + "step": 12533 + }, + { + "epoch": 0.06, + "global_step": 12534, + "learning_rate": 0.0004485225375626044, + "loss": 1.6053, + "loss_base2": 2.316, + "loss_pixel": 0.1591, + "loss_text": 1.4462, + "ppl": 4.9794, + "step": 12534 + }, + { + "epoch": 0.06, + "global_step": 12535, + "learning_rate": 0.0004485183639398999, + "loss": 1.6044, + "loss_base2": 2.3147, + "loss_pixel": 0.1585, + "loss_text": 1.4459, + "ppl": 4.9749, + "step": 12535 + }, + { + "epoch": 0.06, + "global_step": 12536, + "learning_rate": 0.00044851419031719533, + "loss": 1.605, + "loss_base2": 2.3155, + "loss_pixel": 0.1589, + "loss_text": 1.4461, + "ppl": 4.9779, + "step": 12536 + }, + { + "epoch": 0.06, + "global_step": 12537, + "learning_rate": 0.00044851001669449084, + "loss": 1.6173, + "loss_base2": 2.3333, + "loss_pixel": 0.1581, + "loss_text": 1.4592, + "ppl": 5.0395, + "step": 12537 + }, + { + "epoch": 0.06, + "global_step": 12538, + "learning_rate": 0.00044850584307178635, + "loss": 1.5873, + "loss_base2": 2.29, + "loss_pixel": 0.1586, + "loss_text": 1.4287, + "ppl": 4.8905, + "step": 12538 + }, + { + "epoch": 0.06, + "global_step": 12539, + "learning_rate": 0.0004485016694490818, + "loss": 1.6016, + "loss_base2": 2.3106, + "loss_pixel": 0.1576, + "loss_text": 1.444, + "ppl": 4.961, + "step": 12539 + }, + { + "epoch": 0.06, + "global_step": 12540, + "learning_rate": 0.00044849749582637726, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.1596, + "loss_text": 1.45, + "ppl": 5.0003, + "step": 12540 + }, + { + "epoch": 0.06, + "global_step": 12541, + "learning_rate": 0.00044849332220367276, + "loss": 1.6064, + "loss_base2": 2.3175, + "loss_pixel": 0.1569, + "loss_text": 1.4495, + "ppl": 4.9848, + "step": 12541 + }, + { + "epoch": 0.06, + "global_step": 12542, + "learning_rate": 0.00044848914858096827, + "loss": 1.5876, + "loss_base2": 2.2904, + "loss_pixel": 0.1575, + "loss_text": 1.4301, + "ppl": 4.892, + "step": 12542 + }, + { + "epoch": 0.06, + "global_step": 12543, + "learning_rate": 0.0004484849749582638, + "loss": 1.6192, + "loss_base2": 2.336, + "loss_pixel": 0.1577, + "loss_text": 1.4615, + "ppl": 5.049, + "step": 12543 + }, + { + "epoch": 0.06, + "global_step": 12544, + "learning_rate": 0.0004484808013355593, + "loss": 1.6115, + "loss_base2": 2.3249, + "loss_pixel": 0.1582, + "loss_text": 1.4533, + "ppl": 5.0103, + "step": 12544 + }, + { + "epoch": 0.06, + "global_step": 12545, + "learning_rate": 0.00044847662771285474, + "loss": 1.6091, + "loss_base2": 2.3214, + "loss_pixel": 0.1583, + "loss_text": 1.4508, + "ppl": 4.9983, + "step": 12545 + }, + { + "epoch": 0.06, + "global_step": 12546, + "learning_rate": 0.00044847245409015025, + "loss": 1.5937, + "loss_base2": 2.2992, + "loss_pixel": 0.1577, + "loss_text": 1.436, + "ppl": 4.9219, + "step": 12546 + }, + { + "epoch": 0.06, + "global_step": 12547, + "learning_rate": 0.00044846828046744575, + "loss": 1.5323, + "loss_base2": 2.2106, + "loss_pixel": 0.1576, + "loss_text": 1.3747, + "ppl": 4.6288, + "step": 12547 + }, + { + "epoch": 0.06, + "global_step": 12548, + "learning_rate": 0.00044846410684474126, + "loss": 1.5286, + "loss_base2": 2.2053, + "loss_pixel": 0.1571, + "loss_text": 1.3715, + "ppl": 4.6117, + "step": 12548 + }, + { + "epoch": 0.06, + "global_step": 12549, + "learning_rate": 0.00044845993322203677, + "loss": 1.5087, + "loss_base2": 2.1766, + "loss_pixel": 0.1567, + "loss_text": 1.352, + "ppl": 4.5208, + "step": 12549 + }, + { + "epoch": 0.06, + "global_step": 12550, + "learning_rate": 0.0004484557595993322, + "loss": 1.581, + "loss_base2": 2.2809, + "loss_pixel": 0.158, + "loss_text": 1.423, + "ppl": 4.8598, + "step": 12550 + }, + { + "epoch": 0.06, + "global_step": 12551, + "learning_rate": 0.00044845158597662773, + "loss": 1.6299, + "loss_base2": 2.3514, + "loss_pixel": 0.1579, + "loss_text": 1.4721, + "ppl": 5.1034, + "step": 12551 + }, + { + "epoch": 0.06, + "global_step": 12552, + "learning_rate": 0.00044844741235392324, + "loss": 1.5903, + "loss_base2": 2.2943, + "loss_pixel": 0.1578, + "loss_text": 1.4324, + "ppl": 4.9052, + "step": 12552 + }, + { + "epoch": 0.06, + "global_step": 12553, + "learning_rate": 0.00044844323873121874, + "loss": 1.6129, + "loss_base2": 2.3269, + "loss_pixel": 0.1576, + "loss_text": 1.4553, + "ppl": 5.0173, + "step": 12553 + }, + { + "epoch": 0.06, + "global_step": 12554, + "learning_rate": 0.0004484390651085142, + "loss": 1.6081, + "loss_base2": 2.32, + "loss_pixel": 0.1597, + "loss_text": 1.4484, + "ppl": 4.9933, + "step": 12554 + }, + { + "epoch": 0.06, + "global_step": 12555, + "learning_rate": 0.0004484348914858097, + "loss": 1.6169, + "loss_base2": 2.3327, + "loss_pixel": 0.1567, + "loss_text": 1.4602, + "ppl": 5.0374, + "step": 12555 + }, + { + "epoch": 0.06, + "global_step": 12556, + "learning_rate": 0.0004484307178631052, + "loss": 1.6031, + "loss_base2": 2.3128, + "loss_pixel": 0.1573, + "loss_text": 1.4459, + "ppl": 4.9684, + "step": 12556 + }, + { + "epoch": 0.06, + "global_step": 12557, + "learning_rate": 0.0004484265442404007, + "loss": 1.6087, + "loss_base2": 2.3209, + "loss_pixel": 0.1583, + "loss_text": 1.4503, + "ppl": 4.9963, + "step": 12557 + }, + { + "epoch": 0.06, + "global_step": 12558, + "learning_rate": 0.00044842237061769617, + "loss": 1.6087, + "loss_base2": 2.3209, + "loss_pixel": 0.1564, + "loss_text": 1.4524, + "ppl": 4.9963, + "step": 12558 + }, + { + "epoch": 0.06, + "global_step": 12559, + "learning_rate": 0.0004484181969949916, + "loss": 1.5868, + "loss_base2": 2.2893, + "loss_pixel": 0.1567, + "loss_text": 1.4301, + "ppl": 4.8881, + "step": 12559 + }, + { + "epoch": 0.06, + "global_step": 12560, + "learning_rate": 0.00044841402337228713, + "loss": 1.5871, + "loss_base2": 2.2897, + "loss_pixel": 0.1578, + "loss_text": 1.4293, + "ppl": 4.8895, + "step": 12560 + }, + { + "epoch": 0.06, + "global_step": 12561, + "learning_rate": 0.00044840984974958264, + "loss": 1.6138, + "loss_base2": 2.3282, + "loss_pixel": 0.1557, + "loss_text": 1.4581, + "ppl": 5.0219, + "step": 12561 + }, + { + "epoch": 0.06, + "global_step": 12562, + "learning_rate": 0.00044840567612687815, + "loss": 1.6126, + "loss_base2": 2.3265, + "loss_pixel": 0.1559, + "loss_text": 1.4566, + "ppl": 5.0158, + "step": 12562 + }, + { + "epoch": 0.06, + "global_step": 12563, + "learning_rate": 0.0004484015025041736, + "loss": 1.5945, + "loss_base2": 2.3004, + "loss_pixel": 0.1572, + "loss_text": 1.4374, + "ppl": 4.9259, + "step": 12563 + }, + { + "epoch": 0.06, + "global_step": 12564, + "learning_rate": 0.0004483973288814691, + "loss": 1.5953, + "loss_base2": 2.3015, + "loss_pixel": 0.1569, + "loss_text": 1.4385, + "ppl": 4.9298, + "step": 12564 + }, + { + "epoch": 0.06, + "global_step": 12565, + "learning_rate": 0.0004483931552587646, + "loss": 1.6008, + "loss_base2": 2.3095, + "loss_pixel": 0.1576, + "loss_text": 1.4432, + "ppl": 4.957, + "step": 12565 + }, + { + "epoch": 0.06, + "global_step": 12566, + "learning_rate": 0.0004483889816360601, + "loss": 1.6082, + "loss_base2": 2.3201, + "loss_pixel": 0.156, + "loss_text": 1.4522, + "ppl": 4.9938, + "step": 12566 + }, + { + "epoch": 0.06, + "global_step": 12567, + "learning_rate": 0.00044838480801335563, + "loss": 1.6088, + "loss_base2": 2.321, + "loss_pixel": 0.1579, + "loss_text": 1.4509, + "ppl": 4.9968, + "step": 12567 + }, + { + "epoch": 0.06, + "global_step": 12568, + "learning_rate": 0.0004483806343906511, + "loss": 1.6043, + "loss_base2": 2.3145, + "loss_pixel": 0.1558, + "loss_text": 1.4485, + "ppl": 4.9744, + "step": 12568 + }, + { + "epoch": 0.06, + "global_step": 12569, + "learning_rate": 0.0004483764607679466, + "loss": 1.5979, + "loss_base2": 2.3053, + "loss_pixel": 0.1571, + "loss_text": 1.4408, + "ppl": 4.9426, + "step": 12569 + }, + { + "epoch": 0.06, + "global_step": 12570, + "learning_rate": 0.0004483722871452421, + "loss": 1.6068, + "loss_base2": 2.3181, + "loss_pixel": 0.1551, + "loss_text": 1.4517, + "ppl": 4.9868, + "step": 12570 + }, + { + "epoch": 0.06, + "global_step": 12571, + "learning_rate": 0.0004483681135225376, + "loss": 1.5626, + "loss_base2": 2.2544, + "loss_pixel": 0.1579, + "loss_text": 1.4047, + "ppl": 4.7712, + "step": 12571 + }, + { + "epoch": 0.06, + "global_step": 12572, + "learning_rate": 0.00044836393989983306, + "loss": 1.3924, + "loss_base2": 2.0088, + "loss_pixel": 0.1573, + "loss_text": 1.2351, + "ppl": 4.0245, + "step": 12572 + }, + { + "epoch": 0.06, + "global_step": 12573, + "learning_rate": 0.00044835976627712856, + "loss": 1.3772, + "loss_base2": 1.9869, + "loss_pixel": 0.1569, + "loss_text": 1.2202, + "ppl": 3.9638, + "step": 12573 + }, + { + "epoch": 0.06, + "global_step": 12574, + "learning_rate": 0.00044835559265442407, + "loss": 1.3795, + "loss_base2": 1.9902, + "loss_pixel": 0.1566, + "loss_text": 1.2229, + "ppl": 3.9729, + "step": 12574 + }, + { + "epoch": 0.06, + "global_step": 12575, + "learning_rate": 0.0004483514190317196, + "loss": 1.3673, + "loss_base2": 1.9726, + "loss_pixel": 0.1582, + "loss_text": 1.2091, + "ppl": 3.9247, + "step": 12575 + }, + { + "epoch": 0.06, + "global_step": 12576, + "learning_rate": 0.0004483472454090151, + "loss": 1.3689, + "loss_base2": 1.9749, + "loss_pixel": 0.1576, + "loss_text": 1.2113, + "ppl": 3.931, + "step": 12576 + }, + { + "epoch": 0.06, + "global_step": 12577, + "learning_rate": 0.0004483430717863105, + "loss": 1.3466, + "loss_base2": 1.9427, + "loss_pixel": 0.1463, + "loss_text": 1.2002, + "ppl": 3.8443, + "step": 12577 + }, + { + "epoch": 0.06, + "global_step": 12578, + "learning_rate": 0.000448338898163606, + "loss": 1.3678, + "loss_base2": 1.9733, + "loss_pixel": 0.1519, + "loss_text": 1.2159, + "ppl": 3.9267, + "step": 12578 + }, + { + "epoch": 0.06, + "global_step": 12579, + "learning_rate": 0.0004483347245409015, + "loss": 1.3681, + "loss_base2": 1.9738, + "loss_pixel": 0.1492, + "loss_text": 1.2189, + "ppl": 3.9279, + "step": 12579 + }, + { + "epoch": 0.06, + "global_step": 12580, + "learning_rate": 0.000448330550918197, + "loss": 1.3574, + "loss_base2": 1.9583, + "loss_pixel": 0.1489, + "loss_text": 1.2085, + "ppl": 3.8861, + "step": 12580 + }, + { + "epoch": 0.06, + "global_step": 12581, + "learning_rate": 0.00044832637729549246, + "loss": 1.3571, + "loss_base2": 1.9579, + "loss_pixel": 0.1461, + "loss_text": 1.211, + "ppl": 3.8849, + "step": 12581 + }, + { + "epoch": 0.06, + "global_step": 12582, + "learning_rate": 0.00044832220367278797, + "loss": 1.3317, + "loss_base2": 1.9212, + "loss_pixel": 0.1475, + "loss_text": 1.1842, + "ppl": 3.7875, + "step": 12582 + }, + { + "epoch": 0.06, + "global_step": 12583, + "learning_rate": 0.0004483180300500835, + "loss": 1.3542, + "loss_base2": 1.9537, + "loss_pixel": 0.1476, + "loss_text": 1.2066, + "ppl": 3.8737, + "step": 12583 + }, + { + "epoch": 0.06, + "global_step": 12584, + "learning_rate": 0.000448313856427379, + "loss": 1.3565, + "loss_base2": 1.957, + "loss_pixel": 0.1475, + "loss_text": 1.209, + "ppl": 3.8826, + "step": 12584 + }, + { + "epoch": 0.06, + "global_step": 12585, + "learning_rate": 0.0004483096828046745, + "loss": 1.3659, + "loss_base2": 1.9706, + "loss_pixel": 0.1454, + "loss_text": 1.2206, + "ppl": 3.9192, + "step": 12585 + }, + { + "epoch": 0.06, + "global_step": 12586, + "learning_rate": 0.00044830550918196994, + "loss": 1.3633, + "loss_base2": 1.9668, + "loss_pixel": 0.1467, + "loss_text": 1.2165, + "ppl": 3.9091, + "step": 12586 + }, + { + "epoch": 0.06, + "global_step": 12587, + "learning_rate": 0.00044830133555926545, + "loss": 1.3401, + "loss_base2": 1.9334, + "loss_pixel": 0.1463, + "loss_text": 1.1938, + "ppl": 3.8194, + "step": 12587 + }, + { + "epoch": 0.06, + "global_step": 12588, + "learning_rate": 0.00044829716193656096, + "loss": 1.3416, + "loss_base2": 1.9355, + "loss_pixel": 0.1463, + "loss_text": 1.1953, + "ppl": 3.8252, + "step": 12588 + }, + { + "epoch": 0.06, + "global_step": 12589, + "learning_rate": 0.00044829298831385646, + "loss": 1.3547, + "loss_base2": 1.9544, + "loss_pixel": 0.1456, + "loss_text": 1.2091, + "ppl": 3.8756, + "step": 12589 + }, + { + "epoch": 0.06, + "global_step": 12590, + "learning_rate": 0.0004482888146911519, + "loss": 1.3529, + "loss_base2": 1.9518, + "loss_pixel": 0.1486, + "loss_text": 1.2043, + "ppl": 3.8686, + "step": 12590 + }, + { + "epoch": 0.06, + "global_step": 12591, + "learning_rate": 0.0004482846410684474, + "loss": 1.3588, + "loss_base2": 1.9603, + "loss_pixel": 0.1508, + "loss_text": 1.208, + "ppl": 3.8915, + "step": 12591 + }, + { + "epoch": 0.06, + "global_step": 12592, + "learning_rate": 0.00044828046744574293, + "loss": 1.3458, + "loss_base2": 1.9416, + "loss_pixel": 0.1464, + "loss_text": 1.1993, + "ppl": 3.8413, + "step": 12592 + }, + { + "epoch": 0.06, + "global_step": 12593, + "learning_rate": 0.00044827629382303844, + "loss": 1.3751, + "loss_base2": 1.9838, + "loss_pixel": 0.1541, + "loss_text": 1.2211, + "ppl": 3.9555, + "step": 12593 + }, + { + "epoch": 0.06, + "global_step": 12594, + "learning_rate": 0.00044827212020033395, + "loss": 1.3682, + "loss_base2": 1.9739, + "loss_pixel": 0.158, + "loss_text": 1.2102, + "ppl": 3.9283, + "step": 12594 + }, + { + "epoch": 0.06, + "global_step": 12595, + "learning_rate": 0.00044826794657762934, + "loss": 1.3538, + "loss_base2": 1.9531, + "loss_pixel": 0.1593, + "loss_text": 1.1946, + "ppl": 3.8721, + "step": 12595 + }, + { + "epoch": 0.06, + "global_step": 12596, + "learning_rate": 0.00044826377295492485, + "loss": 1.3852, + "loss_base2": 1.9984, + "loss_pixel": 0.1581, + "loss_text": 1.2271, + "ppl": 3.9956, + "step": 12596 + }, + { + "epoch": 0.06, + "global_step": 12597, + "learning_rate": 0.00044825959933222036, + "loss": 1.3679, + "loss_base2": 1.9735, + "loss_pixel": 0.1594, + "loss_text": 1.2086, + "ppl": 3.9271, + "step": 12597 + }, + { + "epoch": 0.06, + "global_step": 12598, + "learning_rate": 0.00044825542570951587, + "loss": 1.3718, + "loss_base2": 1.9791, + "loss_pixel": 0.1553, + "loss_text": 1.2165, + "ppl": 3.9424, + "step": 12598 + }, + { + "epoch": 0.06, + "global_step": 12599, + "learning_rate": 0.0004482512520868113, + "loss": 1.3591, + "loss_base2": 1.9608, + "loss_pixel": 0.1566, + "loss_text": 1.2024, + "ppl": 3.8927, + "step": 12599 + }, + { + "epoch": 0.06, + "global_step": 12600, + "learning_rate": 0.00044824707846410683, + "loss": 1.3675, + "loss_base2": 1.9729, + "loss_pixel": 0.1568, + "loss_text": 1.2107, + "ppl": 3.9255, + "step": 12600 + }, + { + "epoch": 0.06, + "global_step": 12601, + "learning_rate": 0.00044824290484140233, + "loss": 1.3542, + "loss_base2": 1.9537, + "loss_pixel": 0.1577, + "loss_text": 1.1965, + "ppl": 3.8737, + "step": 12601 + }, + { + "epoch": 0.06, + "global_step": 12602, + "learning_rate": 0.00044823873121869784, + "loss": 1.3676, + "loss_base2": 1.973, + "loss_pixel": 0.1579, + "loss_text": 1.2097, + "ppl": 3.9259, + "step": 12602 + }, + { + "epoch": 0.06, + "global_step": 12603, + "learning_rate": 0.00044823455759599335, + "loss": 1.3754, + "loss_base2": 1.9843, + "loss_pixel": 0.1569, + "loss_text": 1.2185, + "ppl": 3.9567, + "step": 12603 + }, + { + "epoch": 0.06, + "global_step": 12604, + "learning_rate": 0.0004482303839732888, + "loss": 1.3684, + "loss_base2": 1.9742, + "loss_pixel": 0.1585, + "loss_text": 1.2099, + "ppl": 3.9291, + "step": 12604 + }, + { + "epoch": 0.06, + "global_step": 12605, + "learning_rate": 0.0004482262103505843, + "loss": 1.3732, + "loss_base2": 1.9811, + "loss_pixel": 0.1566, + "loss_text": 1.2166, + "ppl": 3.948, + "step": 12605 + }, + { + "epoch": 0.06, + "global_step": 12606, + "learning_rate": 0.0004482220367278798, + "loss": 1.3506, + "loss_base2": 1.9485, + "loss_pixel": 0.1562, + "loss_text": 1.1944, + "ppl": 3.8597, + "step": 12606 + }, + { + "epoch": 0.06, + "global_step": 12607, + "learning_rate": 0.0004482178631051753, + "loss": 1.368, + "loss_base2": 1.9736, + "loss_pixel": 0.1565, + "loss_text": 1.2115, + "ppl": 3.9275, + "step": 12607 + }, + { + "epoch": 0.06, + "global_step": 12608, + "learning_rate": 0.00044821368948247083, + "loss": 1.3844, + "loss_base2": 1.9973, + "loss_pixel": 0.1611, + "loss_text": 1.2234, + "ppl": 3.9924, + "step": 12608 + }, + { + "epoch": 0.06, + "global_step": 12609, + "learning_rate": 0.0004482095158597663, + "loss": 1.3739, + "loss_base2": 1.9821, + "loss_pixel": 0.1568, + "loss_text": 1.2172, + "ppl": 3.9507, + "step": 12609 + }, + { + "epoch": 0.06, + "global_step": 12610, + "learning_rate": 0.0004482053422370618, + "loss": 1.3819, + "loss_base2": 1.9937, + "loss_pixel": 0.157, + "loss_text": 1.2249, + "ppl": 3.9825, + "step": 12610 + }, + { + "epoch": 0.06, + "global_step": 12611, + "learning_rate": 0.0004482011686143573, + "loss": 1.3727, + "loss_base2": 1.9804, + "loss_pixel": 0.1574, + "loss_text": 1.2153, + "ppl": 3.946, + "step": 12611 + }, + { + "epoch": 0.06, + "global_step": 12612, + "learning_rate": 0.0004481969949916528, + "loss": 1.383, + "loss_base2": 1.9952, + "loss_pixel": 0.1562, + "loss_text": 1.2268, + "ppl": 3.9868, + "step": 12612 + }, + { + "epoch": 0.06, + "global_step": 12613, + "learning_rate": 0.00044819282136894826, + "loss": 1.384, + "loss_base2": 1.9967, + "loss_pixel": 0.1571, + "loss_text": 1.2269, + "ppl": 3.9908, + "step": 12613 + }, + { + "epoch": 0.06, + "global_step": 12614, + "learning_rate": 0.0004481886477462437, + "loss": 1.3548, + "loss_base2": 1.9546, + "loss_pixel": 0.1566, + "loss_text": 1.1982, + "ppl": 3.876, + "step": 12614 + }, + { + "epoch": 0.06, + "global_step": 12615, + "learning_rate": 0.0004481844741235392, + "loss": 1.3771, + "loss_base2": 1.9867, + "loss_pixel": 0.1572, + "loss_text": 1.2199, + "ppl": 3.9634, + "step": 12615 + }, + { + "epoch": 0.06, + "global_step": 12616, + "learning_rate": 0.00044818030050083473, + "loss": 1.3461, + "loss_base2": 1.942, + "loss_pixel": 0.158, + "loss_text": 1.1881, + "ppl": 3.8424, + "step": 12616 + }, + { + "epoch": 0.06, + "global_step": 12617, + "learning_rate": 0.00044817612687813023, + "loss": 1.3675, + "loss_base2": 1.9729, + "loss_pixel": 0.1565, + "loss_text": 1.211, + "ppl": 3.9255, + "step": 12617 + }, + { + "epoch": 0.06, + "global_step": 12618, + "learning_rate": 0.0004481719532554257, + "loss": 1.365, + "loss_base2": 1.9693, + "loss_pixel": 0.157, + "loss_text": 1.2079, + "ppl": 3.9157, + "step": 12618 + }, + { + "epoch": 0.06, + "global_step": 12619, + "learning_rate": 0.0004481677796327212, + "loss": 1.3394, + "loss_base2": 1.9323, + "loss_pixel": 0.1583, + "loss_text": 1.1811, + "ppl": 3.8168, + "step": 12619 + }, + { + "epoch": 0.06, + "global_step": 12620, + "learning_rate": 0.0004481636060100167, + "loss": 1.6148, + "loss_base2": 2.3297, + "loss_pixel": 0.157, + "loss_text": 1.4578, + "ppl": 5.0269, + "step": 12620 + }, + { + "epoch": 0.06, + "global_step": 12621, + "learning_rate": 0.0004481594323873122, + "loss": 1.6087, + "loss_base2": 2.3209, + "loss_pixel": 0.1567, + "loss_text": 1.452, + "ppl": 4.9963, + "step": 12621 + }, + { + "epoch": 0.06, + "global_step": 12622, + "learning_rate": 0.00044815525876460766, + "loss": 1.6125, + "loss_base2": 2.3263, + "loss_pixel": 0.1565, + "loss_text": 1.456, + "ppl": 5.0153, + "step": 12622 + }, + { + "epoch": 0.06, + "global_step": 12623, + "learning_rate": 0.00044815108514190317, + "loss": 1.6029, + "loss_base2": 2.3125, + "loss_pixel": 0.1555, + "loss_text": 1.4474, + "ppl": 4.9674, + "step": 12623 + }, + { + "epoch": 0.06, + "global_step": 12624, + "learning_rate": 0.0004481469115191987, + "loss": 1.5994, + "loss_base2": 2.3074, + "loss_pixel": 0.1571, + "loss_text": 1.4423, + "ppl": 4.9501, + "step": 12624 + }, + { + "epoch": 0.06, + "global_step": 12625, + "learning_rate": 0.0004481427378964942, + "loss": 1.6053, + "loss_base2": 2.316, + "loss_pixel": 0.1582, + "loss_text": 1.4471, + "ppl": 4.9794, + "step": 12625 + }, + { + "epoch": 0.06, + "global_step": 12626, + "learning_rate": 0.0004481385642737897, + "loss": 1.5872, + "loss_base2": 2.2898, + "loss_pixel": 0.1571, + "loss_text": 1.43, + "ppl": 4.89, + "step": 12626 + }, + { + "epoch": 0.06, + "global_step": 12627, + "learning_rate": 0.00044813439065108515, + "loss": 1.6102, + "loss_base2": 2.323, + "loss_pixel": 0.158, + "loss_text": 1.4523, + "ppl": 5.0038, + "step": 12627 + }, + { + "epoch": 0.06, + "global_step": 12628, + "learning_rate": 0.00044813021702838065, + "loss": 1.615, + "loss_base2": 2.33, + "loss_pixel": 0.1561, + "loss_text": 1.4589, + "ppl": 5.0279, + "step": 12628 + }, + { + "epoch": 0.06, + "global_step": 12629, + "learning_rate": 0.00044812604340567616, + "loss": 1.6042, + "loss_base2": 2.3144, + "loss_pixel": 0.1575, + "loss_text": 1.4467, + "ppl": 4.9739, + "step": 12629 + }, + { + "epoch": 0.06, + "global_step": 12630, + "learning_rate": 0.00044812186978297167, + "loss": 1.586, + "loss_base2": 2.2881, + "loss_pixel": 0.1556, + "loss_text": 1.4304, + "ppl": 4.8842, + "step": 12630 + }, + { + "epoch": 0.06, + "global_step": 12631, + "learning_rate": 0.0004481176961602671, + "loss": 1.6109, + "loss_base2": 2.324, + "loss_pixel": 0.1563, + "loss_text": 1.4547, + "ppl": 5.0073, + "step": 12631 + }, + { + "epoch": 0.06, + "global_step": 12632, + "learning_rate": 0.00044811352253756263, + "loss": 1.6067, + "loss_base2": 2.318, + "loss_pixel": 0.1566, + "loss_text": 1.4501, + "ppl": 4.9863, + "step": 12632 + }, + { + "epoch": 0.06, + "global_step": 12633, + "learning_rate": 0.0004481093489148581, + "loss": 1.5777, + "loss_base2": 2.2761, + "loss_pixel": 0.1561, + "loss_text": 1.4216, + "ppl": 4.8438, + "step": 12633 + }, + { + "epoch": 0.06, + "global_step": 12634, + "learning_rate": 0.0004481051752921536, + "loss": 1.5882, + "loss_base2": 2.2913, + "loss_pixel": 0.1555, + "loss_text": 1.4327, + "ppl": 4.8949, + "step": 12634 + }, + { + "epoch": 0.06, + "global_step": 12635, + "learning_rate": 0.0004481010016694491, + "loss": 1.6111, + "loss_base2": 2.3243, + "loss_pixel": 0.1575, + "loss_text": 1.4536, + "ppl": 5.0083, + "step": 12635 + }, + { + "epoch": 0.06, + "global_step": 12636, + "learning_rate": 0.00044809682804674455, + "loss": 1.5973, + "loss_base2": 2.3044, + "loss_pixel": 0.1574, + "loss_text": 1.4399, + "ppl": 4.9397, + "step": 12636 + }, + { + "epoch": 0.06, + "global_step": 12637, + "learning_rate": 0.00044809265442404006, + "loss": 1.6047, + "loss_base2": 2.3151, + "loss_pixel": 0.1555, + "loss_text": 1.4492, + "ppl": 4.9764, + "step": 12637 + }, + { + "epoch": 0.06, + "global_step": 12638, + "learning_rate": 0.00044808848080133556, + "loss": 1.6019, + "loss_base2": 2.3111, + "loss_pixel": 0.1585, + "loss_text": 1.4434, + "ppl": 4.9625, + "step": 12638 + }, + { + "epoch": 0.06, + "global_step": 12639, + "learning_rate": 0.00044808430717863107, + "loss": 1.6141, + "loss_base2": 2.3287, + "loss_pixel": 0.1577, + "loss_text": 1.4564, + "ppl": 5.0234, + "step": 12639 + }, + { + "epoch": 0.06, + "global_step": 12640, + "learning_rate": 0.0004480801335559265, + "loss": 1.5936, + "loss_base2": 2.2991, + "loss_pixel": 0.1569, + "loss_text": 1.4368, + "ppl": 4.9214, + "step": 12640 + }, + { + "epoch": 0.06, + "global_step": 12641, + "learning_rate": 0.00044807595993322203, + "loss": 1.6116, + "loss_base2": 2.325, + "loss_pixel": 0.1555, + "loss_text": 1.4561, + "ppl": 5.0108, + "step": 12641 + }, + { + "epoch": 0.06, + "global_step": 12642, + "learning_rate": 0.00044807178631051754, + "loss": 1.597, + "loss_base2": 2.304, + "loss_pixel": 0.1583, + "loss_text": 1.4386, + "ppl": 4.9382, + "step": 12642 + }, + { + "epoch": 0.06, + "global_step": 12643, + "learning_rate": 0.00044806761268781305, + "loss": 1.5596, + "loss_base2": 2.25, + "loss_pixel": 0.1596, + "loss_text": 1.4001, + "ppl": 4.7569, + "step": 12643 + }, + { + "epoch": 0.06, + "global_step": 12644, + "learning_rate": 0.00044806343906510855, + "loss": 1.3875, + "loss_base2": 2.0017, + "loss_pixel": 0.1578, + "loss_text": 1.2297, + "ppl": 4.0048, + "step": 12644 + }, + { + "epoch": 0.06, + "global_step": 12645, + "learning_rate": 0.000448059265442404, + "loss": 1.3772, + "loss_base2": 1.9869, + "loss_pixel": 0.1593, + "loss_text": 1.2179, + "ppl": 3.9638, + "step": 12645 + }, + { + "epoch": 0.06, + "global_step": 12646, + "learning_rate": 0.0004480550918196995, + "loss": 1.3645, + "loss_base2": 1.9686, + "loss_pixel": 0.1589, + "loss_text": 1.2056, + "ppl": 3.9138, + "step": 12646 + }, + { + "epoch": 0.06, + "global_step": 12647, + "learning_rate": 0.000448050918196995, + "loss": 1.3779, + "loss_base2": 1.9879, + "loss_pixel": 0.1565, + "loss_text": 1.2214, + "ppl": 3.9666, + "step": 12647 + }, + { + "epoch": 0.06, + "global_step": 12648, + "learning_rate": 0.00044804674457429053, + "loss": 1.3626, + "loss_base2": 1.9658, + "loss_pixel": 0.1589, + "loss_text": 1.2037, + "ppl": 3.9063, + "step": 12648 + }, + { + "epoch": 0.06, + "global_step": 12649, + "learning_rate": 0.000448042570951586, + "loss": 1.3786, + "loss_base2": 1.9889, + "loss_pixel": 0.1595, + "loss_text": 1.2191, + "ppl": 3.9693, + "step": 12649 + }, + { + "epoch": 0.06, + "global_step": 12650, + "learning_rate": 0.0004480383973288815, + "loss": 1.3532, + "loss_base2": 1.9523, + "loss_pixel": 0.1598, + "loss_text": 1.1933, + "ppl": 3.8698, + "step": 12650 + }, + { + "epoch": 0.06, + "global_step": 12651, + "learning_rate": 0.000448034223706177, + "loss": 1.4531, + "loss_base2": 2.0964, + "loss_pixel": 0.1589, + "loss_text": 1.2942, + "ppl": 4.2764, + "step": 12651 + }, + { + "epoch": 0.06, + "global_step": 12652, + "learning_rate": 0.00044803005008347245, + "loss": 1.4152, + "loss_base2": 2.0417, + "loss_pixel": 0.1585, + "loss_text": 1.2567, + "ppl": 4.1173, + "step": 12652 + }, + { + "epoch": 0.06, + "global_step": 12653, + "learning_rate": 0.00044802587646076796, + "loss": 1.375, + "loss_base2": 1.9837, + "loss_pixel": 0.1583, + "loss_text": 1.2167, + "ppl": 3.9551, + "step": 12653 + }, + { + "epoch": 0.06, + "global_step": 12654, + "learning_rate": 0.0004480217028380634, + "loss": 1.3691, + "loss_base2": 1.9752, + "loss_pixel": 0.1582, + "loss_text": 1.2108, + "ppl": 3.9318, + "step": 12654 + }, + { + "epoch": 0.06, + "global_step": 12655, + "learning_rate": 0.0004480175292153589, + "loss": 1.3841, + "loss_base2": 1.9968, + "loss_pixel": 0.1585, + "loss_text": 1.2256, + "ppl": 3.9912, + "step": 12655 + }, + { + "epoch": 0.06, + "global_step": 12656, + "learning_rate": 0.0004480133555926544, + "loss": 1.3454, + "loss_base2": 1.941, + "loss_pixel": 0.1606, + "loss_text": 1.1848, + "ppl": 3.8397, + "step": 12656 + }, + { + "epoch": 0.06, + "global_step": 12657, + "learning_rate": 0.00044800918196994993, + "loss": 1.362, + "loss_base2": 1.965, + "loss_pixel": 0.1643, + "loss_text": 1.1977, + "ppl": 3.904, + "step": 12657 + }, + { + "epoch": 0.06, + "global_step": 12658, + "learning_rate": 0.0004480050083472454, + "loss": 1.3766, + "loss_base2": 1.986, + "loss_pixel": 0.1609, + "loss_text": 1.2157, + "ppl": 3.9614, + "step": 12658 + }, + { + "epoch": 0.06, + "global_step": 12659, + "learning_rate": 0.0004480008347245409, + "loss": 1.3675, + "loss_base2": 1.9729, + "loss_pixel": 0.1612, + "loss_text": 1.2064, + "ppl": 3.9255, + "step": 12659 + }, + { + "epoch": 0.06, + "global_step": 12660, + "learning_rate": 0.0004479966611018364, + "loss": 1.3623, + "loss_base2": 1.9654, + "loss_pixel": 0.1628, + "loss_text": 1.1995, + "ppl": 3.9052, + "step": 12660 + }, + { + "epoch": 0.06, + "global_step": 12661, + "learning_rate": 0.0004479924874791319, + "loss": 1.382, + "loss_base2": 1.9938, + "loss_pixel": 0.1629, + "loss_text": 1.2191, + "ppl": 3.9829, + "step": 12661 + }, + { + "epoch": 0.06, + "global_step": 12662, + "learning_rate": 0.0004479883138564274, + "loss": 1.3734, + "loss_base2": 1.9814, + "loss_pixel": 0.1527, + "loss_text": 1.2207, + "ppl": 3.9488, + "step": 12662 + }, + { + "epoch": 0.06, + "global_step": 12663, + "learning_rate": 0.00044798414023372287, + "loss": 1.3589, + "loss_base2": 1.9605, + "loss_pixel": 0.1521, + "loss_text": 1.2068, + "ppl": 3.8919, + "step": 12663 + }, + { + "epoch": 0.06, + "global_step": 12664, + "learning_rate": 0.0004479799666110184, + "loss": 1.3434, + "loss_base2": 1.9381, + "loss_pixel": 0.1523, + "loss_text": 1.1911, + "ppl": 3.8321, + "step": 12664 + }, + { + "epoch": 0.06, + "global_step": 12665, + "learning_rate": 0.0004479757929883139, + "loss": 1.3623, + "loss_base2": 1.9654, + "loss_pixel": 0.1495, + "loss_text": 1.2128, + "ppl": 3.9052, + "step": 12665 + }, + { + "epoch": 0.06, + "global_step": 12666, + "learning_rate": 0.0004479716193656094, + "loss": 1.3545, + "loss_base2": 1.9541, + "loss_pixel": 0.1532, + "loss_text": 1.2013, + "ppl": 3.8748, + "step": 12666 + }, + { + "epoch": 0.06, + "global_step": 12667, + "learning_rate": 0.0004479674457429049, + "loss": 1.3458, + "loss_base2": 1.9416, + "loss_pixel": 0.1493, + "loss_text": 1.1965, + "ppl": 3.8413, + "step": 12667 + }, + { + "epoch": 0.06, + "global_step": 12668, + "learning_rate": 0.00044796327212020035, + "loss": 1.341, + "loss_base2": 1.9347, + "loss_pixel": 0.1495, + "loss_text": 1.1915, + "ppl": 3.8229, + "step": 12668 + }, + { + "epoch": 0.06, + "global_step": 12669, + "learning_rate": 0.00044795909849749586, + "loss": 1.3721, + "loss_base2": 1.9795, + "loss_pixel": 0.1473, + "loss_text": 1.2248, + "ppl": 3.9436, + "step": 12669 + }, + { + "epoch": 0.06, + "global_step": 12670, + "learning_rate": 0.0004479549248747913, + "loss": 1.6144, + "loss_base2": 2.3291, + "loss_pixel": 0.1469, + "loss_text": 1.4675, + "ppl": 5.0249, + "step": 12670 + }, + { + "epoch": 0.06, + "global_step": 12671, + "learning_rate": 0.0004479507512520868, + "loss": 1.6174, + "loss_base2": 2.3334, + "loss_pixel": 0.1473, + "loss_text": 1.47, + "ppl": 5.04, + "step": 12671 + }, + { + "epoch": 0.06, + "global_step": 12672, + "learning_rate": 0.00044794657762938227, + "loss": 1.5846, + "loss_base2": 2.2861, + "loss_pixel": 0.1464, + "loss_text": 1.4381, + "ppl": 4.8773, + "step": 12672 + }, + { + "epoch": 0.06, + "global_step": 12673, + "learning_rate": 0.0004479424040066778, + "loss": 1.6264, + "loss_base2": 2.3464, + "loss_pixel": 0.1475, + "loss_text": 1.4789, + "ppl": 5.0855, + "step": 12673 + }, + { + "epoch": 0.06, + "global_step": 12674, + "learning_rate": 0.0004479382303839733, + "loss": 1.6026, + "loss_base2": 2.3121, + "loss_pixel": 0.1483, + "loss_text": 1.4543, + "ppl": 4.9659, + "step": 12674 + }, + { + "epoch": 0.06, + "global_step": 12675, + "learning_rate": 0.0004479340567612688, + "loss": 1.5966, + "loss_base2": 2.3034, + "loss_pixel": 0.1511, + "loss_text": 1.4455, + "ppl": 4.9362, + "step": 12675 + }, + { + "epoch": 0.06, + "global_step": 12676, + "learning_rate": 0.0004479298831385643, + "loss": 1.6237, + "loss_base2": 2.3425, + "loss_pixel": 0.1476, + "loss_text": 1.4761, + "ppl": 5.0718, + "step": 12676 + }, + { + "epoch": 0.06, + "global_step": 12677, + "learning_rate": 0.00044792570951585975, + "loss": 1.5995, + "loss_base2": 2.3076, + "loss_pixel": 0.1479, + "loss_text": 1.4516, + "ppl": 4.9506, + "step": 12677 + }, + { + "epoch": 0.06, + "global_step": 12678, + "learning_rate": 0.00044792153589315526, + "loss": 1.5993, + "loss_base2": 2.3073, + "loss_pixel": 0.1477, + "loss_text": 1.4516, + "ppl": 4.9496, + "step": 12678 + }, + { + "epoch": 0.06, + "global_step": 12679, + "learning_rate": 0.00044791736227045077, + "loss": 1.5846, + "loss_base2": 2.2861, + "loss_pixel": 0.1461, + "loss_text": 1.4385, + "ppl": 4.8773, + "step": 12679 + }, + { + "epoch": 0.06, + "global_step": 12680, + "learning_rate": 0.0004479131886477463, + "loss": 1.6069, + "loss_base2": 2.3183, + "loss_pixel": 0.1472, + "loss_text": 1.4597, + "ppl": 4.9873, + "step": 12680 + }, + { + "epoch": 0.06, + "global_step": 12681, + "learning_rate": 0.00044790901502504173, + "loss": 1.5997, + "loss_base2": 2.3079, + "loss_pixel": 0.1459, + "loss_text": 1.4537, + "ppl": 4.9515, + "step": 12681 + }, + { + "epoch": 0.06, + "global_step": 12682, + "learning_rate": 0.00044790484140233723, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.1467, + "loss_text": 1.4593, + "ppl": 4.9823, + "step": 12682 + }, + { + "epoch": 0.06, + "global_step": 12683, + "learning_rate": 0.00044790066777963274, + "loss": 1.5815, + "loss_base2": 2.2816, + "loss_pixel": 0.1461, + "loss_text": 1.4355, + "ppl": 4.8622, + "step": 12683 + }, + { + "epoch": 0.06, + "global_step": 12684, + "learning_rate": 0.00044789649415692825, + "loss": 1.6001, + "loss_base2": 2.3085, + "loss_pixel": 0.1465, + "loss_text": 1.4535, + "ppl": 4.9535, + "step": 12684 + }, + { + "epoch": 0.06, + "global_step": 12685, + "learning_rate": 0.00044789232053422376, + "loss": 1.5856, + "loss_base2": 2.2875, + "loss_pixel": 0.1464, + "loss_text": 1.4392, + "ppl": 4.8822, + "step": 12685 + }, + { + "epoch": 0.06, + "global_step": 12686, + "learning_rate": 0.0004478881469115192, + "loss": 1.6044, + "loss_base2": 2.3147, + "loss_pixel": 0.1472, + "loss_text": 1.4572, + "ppl": 4.9749, + "step": 12686 + }, + { + "epoch": 0.06, + "global_step": 12687, + "learning_rate": 0.0004478839732888147, + "loss": 1.5827, + "loss_base2": 2.2834, + "loss_pixel": 0.1428, + "loss_text": 1.4399, + "ppl": 4.8681, + "step": 12687 + }, + { + "epoch": 0.06, + "global_step": 12688, + "learning_rate": 0.0004478797996661102, + "loss": 1.6044, + "loss_base2": 2.3147, + "loss_pixel": 0.1467, + "loss_text": 1.4578, + "ppl": 4.9749, + "step": 12688 + }, + { + "epoch": 0.06, + "global_step": 12689, + "learning_rate": 0.0004478756260434057, + "loss": 1.5752, + "loss_base2": 2.2725, + "loss_pixel": 0.1448, + "loss_text": 1.4305, + "ppl": 4.8317, + "step": 12689 + }, + { + "epoch": 0.06, + "global_step": 12690, + "learning_rate": 0.00044787145242070113, + "loss": 1.5881, + "loss_base2": 2.2911, + "loss_pixel": 0.1465, + "loss_text": 1.4416, + "ppl": 4.8944, + "step": 12690 + }, + { + "epoch": 0.06, + "global_step": 12691, + "learning_rate": 0.00044786727879799664, + "loss": 1.6119, + "loss_base2": 2.3255, + "loss_pixel": 0.1452, + "loss_text": 1.4666, + "ppl": 5.0123, + "step": 12691 + }, + { + "epoch": 0.06, + "global_step": 12692, + "learning_rate": 0.00044786310517529215, + "loss": 1.5889, + "loss_base2": 2.2923, + "loss_pixel": 0.146, + "loss_text": 1.4429, + "ppl": 4.8984, + "step": 12692 + }, + { + "epoch": 0.06, + "global_step": 12693, + "learning_rate": 0.00044785893155258765, + "loss": 1.5858, + "loss_base2": 2.2878, + "loss_pixel": 0.1459, + "loss_text": 1.44, + "ppl": 4.8832, + "step": 12693 + }, + { + "epoch": 0.06, + "global_step": 12694, + "learning_rate": 0.00044785475792988316, + "loss": 1.5938, + "loss_base2": 2.2994, + "loss_pixel": 0.1448, + "loss_text": 1.449, + "ppl": 4.9224, + "step": 12694 + }, + { + "epoch": 0.06, + "global_step": 12695, + "learning_rate": 0.0004478505843071786, + "loss": 1.497, + "loss_base2": 2.1597, + "loss_pixel": 0.1464, + "loss_text": 1.3506, + "ppl": 4.4683, + "step": 12695 + }, + { + "epoch": 0.06, + "global_step": 12696, + "learning_rate": 0.0004478464106844741, + "loss": 1.3736, + "loss_base2": 1.9817, + "loss_pixel": 0.1464, + "loss_text": 1.2272, + "ppl": 3.9495, + "step": 12696 + }, + { + "epoch": 0.06, + "global_step": 12697, + "learning_rate": 0.00044784223706176963, + "loss": 1.3588, + "loss_base2": 1.9603, + "loss_pixel": 0.1464, + "loss_text": 1.2124, + "ppl": 3.8915, + "step": 12697 + }, + { + "epoch": 0.06, + "global_step": 12698, + "learning_rate": 0.00044783806343906514, + "loss": 1.3688, + "loss_base2": 1.9748, + "loss_pixel": 0.1433, + "loss_text": 1.2255, + "ppl": 3.9306, + "step": 12698 + }, + { + "epoch": 0.06, + "global_step": 12699, + "learning_rate": 0.0004478338898163606, + "loss": 1.3639, + "loss_base2": 1.9677, + "loss_pixel": 0.1434, + "loss_text": 1.2205, + "ppl": 3.9114, + "step": 12699 + }, + { + "epoch": 0.06, + "global_step": 12700, + "learning_rate": 0.0004478297161936561, + "loss": 1.3402, + "loss_base2": 1.9335, + "loss_pixel": 0.1453, + "loss_text": 1.1949, + "ppl": 3.8198, + "step": 12700 + }, + { + "epoch": 0.06, + "global_step": 12701, + "learning_rate": 0.0004478255425709516, + "loss": 1.3825, + "loss_base2": 1.9945, + "loss_pixel": 0.147, + "loss_text": 1.2355, + "ppl": 3.9849, + "step": 12701 + }, + { + "epoch": 0.06, + "global_step": 12702, + "learning_rate": 0.0004478213689482471, + "loss": 1.3477, + "loss_base2": 1.9443, + "loss_pixel": 0.145, + "loss_text": 1.2027, + "ppl": 3.8486, + "step": 12702 + }, + { + "epoch": 0.06, + "global_step": 12703, + "learning_rate": 0.0004478171953255426, + "loss": 1.3348, + "loss_base2": 1.9257, + "loss_pixel": 0.145, + "loss_text": 1.1898, + "ppl": 3.7992, + "step": 12703 + }, + { + "epoch": 0.06, + "global_step": 12704, + "learning_rate": 0.00044781302170283807, + "loss": 1.3458, + "loss_base2": 1.9416, + "loss_pixel": 0.1446, + "loss_text": 1.2012, + "ppl": 3.8413, + "step": 12704 + }, + { + "epoch": 0.06, + "global_step": 12705, + "learning_rate": 0.0004478088480801336, + "loss": 1.3635, + "loss_base2": 1.9671, + "loss_pixel": 0.1437, + "loss_text": 1.2198, + "ppl": 3.9099, + "step": 12705 + }, + { + "epoch": 0.06, + "global_step": 12706, + "learning_rate": 0.0004478046744574291, + "loss": 1.3251, + "loss_base2": 1.9117, + "loss_pixel": 0.1444, + "loss_text": 1.1807, + "ppl": 3.7626, + "step": 12706 + }, + { + "epoch": 0.06, + "global_step": 12707, + "learning_rate": 0.0004478005008347246, + "loss": 1.3546, + "loss_base2": 1.9543, + "loss_pixel": 0.1439, + "loss_text": 1.2107, + "ppl": 3.8752, + "step": 12707 + }, + { + "epoch": 0.06, + "global_step": 12708, + "learning_rate": 0.00044779632721202, + "loss": 1.3535, + "loss_base2": 1.9527, + "loss_pixel": 0.1457, + "loss_text": 1.2077, + "ppl": 3.871, + "step": 12708 + }, + { + "epoch": 0.06, + "global_step": 12709, + "learning_rate": 0.0004477921535893155, + "loss": 1.3582, + "loss_base2": 1.9595, + "loss_pixel": 0.1454, + "loss_text": 1.2129, + "ppl": 3.8892, + "step": 12709 + }, + { + "epoch": 0.06, + "global_step": 12710, + "learning_rate": 0.000447787979966611, + "loss": 1.3465, + "loss_base2": 1.9426, + "loss_pixel": 0.1431, + "loss_text": 1.2034, + "ppl": 3.8439, + "step": 12710 + }, + { + "epoch": 0.06, + "global_step": 12711, + "learning_rate": 0.0004477838063439065, + "loss": 1.5241, + "loss_base2": 2.1988, + "loss_pixel": 0.1448, + "loss_text": 1.3793, + "ppl": 4.591, + "step": 12711 + }, + { + "epoch": 0.06, + "global_step": 12712, + "learning_rate": 0.000447779632721202, + "loss": 1.6251, + "loss_base2": 2.3445, + "loss_pixel": 0.1564, + "loss_text": 1.4687, + "ppl": 5.0789, + "step": 12712 + }, + { + "epoch": 0.06, + "global_step": 12713, + "learning_rate": 0.0004477754590984975, + "loss": 1.604, + "loss_base2": 2.3141, + "loss_pixel": 0.1567, + "loss_text": 1.4473, + "ppl": 4.9729, + "step": 12713 + }, + { + "epoch": 0.06, + "global_step": 12714, + "learning_rate": 0.000447771285475793, + "loss": 1.6247, + "loss_base2": 2.3439, + "loss_pixel": 0.1577, + "loss_text": 1.467, + "ppl": 5.0769, + "step": 12714 + }, + { + "epoch": 0.06, + "global_step": 12715, + "learning_rate": 0.0004477671118530885, + "loss": 1.6077, + "loss_base2": 2.3194, + "loss_pixel": 0.1586, + "loss_text": 1.4491, + "ppl": 4.9913, + "step": 12715 + }, + { + "epoch": 0.06, + "global_step": 12716, + "learning_rate": 0.000447762938230384, + "loss": 1.6155, + "loss_base2": 2.3307, + "loss_pixel": 0.1586, + "loss_text": 1.4569, + "ppl": 5.0304, + "step": 12716 + }, + { + "epoch": 0.06, + "global_step": 12717, + "learning_rate": 0.00044775876460767945, + "loss": 1.6143, + "loss_base2": 2.3289, + "loss_pixel": 0.1574, + "loss_text": 1.4568, + "ppl": 5.0244, + "step": 12717 + }, + { + "epoch": 0.06, + "global_step": 12718, + "learning_rate": 0.00044775459098497496, + "loss": 1.6062, + "loss_base2": 2.3173, + "loss_pixel": 0.1575, + "loss_text": 1.4487, + "ppl": 4.9838, + "step": 12718 + }, + { + "epoch": 0.06, + "global_step": 12719, + "learning_rate": 0.00044775041736227046, + "loss": 1.6003, + "loss_base2": 2.3087, + "loss_pixel": 0.1583, + "loss_text": 1.442, + "ppl": 4.9545, + "step": 12719 + }, + { + "epoch": 0.06, + "global_step": 12720, + "learning_rate": 0.00044774624373956597, + "loss": 1.6096, + "loss_base2": 2.3222, + "loss_pixel": 0.158, + "loss_text": 1.4516, + "ppl": 5.0008, + "step": 12720 + }, + { + "epoch": 0.06, + "global_step": 12721, + "learning_rate": 0.0004477420701168615, + "loss": 1.6056, + "loss_base2": 2.3164, + "loss_pixel": 0.1583, + "loss_text": 1.4474, + "ppl": 4.9808, + "step": 12721 + }, + { + "epoch": 0.06, + "global_step": 12722, + "learning_rate": 0.00044773789649415693, + "loss": 1.6098, + "loss_base2": 2.3225, + "loss_pixel": 0.1571, + "loss_text": 1.4527, + "ppl": 5.0018, + "step": 12722 + }, + { + "epoch": 0.06, + "global_step": 12723, + "learning_rate": 0.00044773372287145244, + "loss": 1.6045, + "loss_base2": 2.3148, + "loss_pixel": 0.1583, + "loss_text": 1.4463, + "ppl": 4.9754, + "step": 12723 + }, + { + "epoch": 0.06, + "global_step": 12724, + "learning_rate": 0.00044772954924874795, + "loss": 1.6087, + "loss_base2": 2.3209, + "loss_pixel": 0.1574, + "loss_text": 1.4513, + "ppl": 4.9963, + "step": 12724 + }, + { + "epoch": 0.06, + "global_step": 12725, + "learning_rate": 0.00044772537562604345, + "loss": 1.6058, + "loss_base2": 2.3167, + "loss_pixel": 0.1581, + "loss_text": 1.4478, + "ppl": 4.9818, + "step": 12725 + }, + { + "epoch": 0.06, + "global_step": 12726, + "learning_rate": 0.00044772120200333896, + "loss": 1.6012, + "loss_base2": 2.31, + "loss_pixel": 0.1575, + "loss_text": 1.4437, + "ppl": 4.959, + "step": 12726 + }, + { + "epoch": 0.06, + "global_step": 12727, + "learning_rate": 0.00044771702838063436, + "loss": 1.6198, + "loss_base2": 2.3369, + "loss_pixel": 0.1571, + "loss_text": 1.4627, + "ppl": 5.0521, + "step": 12727 + }, + { + "epoch": 0.06, + "global_step": 12728, + "learning_rate": 0.00044771285475792987, + "loss": 1.6099, + "loss_base2": 2.3226, + "loss_pixel": 0.1564, + "loss_text": 1.4535, + "ppl": 5.0023, + "step": 12728 + }, + { + "epoch": 0.06, + "global_step": 12729, + "learning_rate": 0.0004477086811352254, + "loss": 1.6149, + "loss_base2": 2.3298, + "loss_pixel": 0.1559, + "loss_text": 1.459, + "ppl": 5.0274, + "step": 12729 + }, + { + "epoch": 0.06, + "global_step": 12730, + "learning_rate": 0.0004477045075125209, + "loss": 1.6196, + "loss_base2": 2.3366, + "loss_pixel": 0.1581, + "loss_text": 1.4615, + "ppl": 5.0511, + "step": 12730 + }, + { + "epoch": 0.06, + "global_step": 12731, + "learning_rate": 0.00044770033388981633, + "loss": 1.6154, + "loss_base2": 2.3305, + "loss_pixel": 0.1575, + "loss_text": 1.4579, + "ppl": 5.0299, + "step": 12731 + }, + { + "epoch": 0.06, + "global_step": 12732, + "learning_rate": 0.00044769616026711184, + "loss": 1.585, + "loss_base2": 2.2867, + "loss_pixel": 0.1561, + "loss_text": 1.4289, + "ppl": 4.8793, + "step": 12732 + }, + { + "epoch": 0.06, + "global_step": 12733, + "learning_rate": 0.00044769198664440735, + "loss": 1.6, + "loss_base2": 2.3083, + "loss_pixel": 0.1574, + "loss_text": 1.4426, + "ppl": 4.953, + "step": 12733 + }, + { + "epoch": 0.06, + "global_step": 12734, + "learning_rate": 0.00044768781302170286, + "loss": 1.6144, + "loss_base2": 2.3291, + "loss_pixel": 0.156, + "loss_text": 1.4584, + "ppl": 5.0249, + "step": 12734 + }, + { + "epoch": 0.06, + "global_step": 12735, + "learning_rate": 0.00044768363939899836, + "loss": 1.6043, + "loss_base2": 2.3145, + "loss_pixel": 0.1562, + "loss_text": 1.4482, + "ppl": 4.9744, + "step": 12735 + }, + { + "epoch": 0.06, + "global_step": 12736, + "learning_rate": 0.0004476794657762938, + "loss": 1.3739, + "loss_base2": 1.9821, + "loss_pixel": 0.1575, + "loss_text": 1.2165, + "ppl": 3.9507, + "step": 12736 + }, + { + "epoch": 0.06, + "global_step": 12737, + "learning_rate": 0.0004476752921535893, + "loss": 1.3728, + "loss_base2": 1.9805, + "loss_pixel": 0.1573, + "loss_text": 1.2155, + "ppl": 3.9464, + "step": 12737 + }, + { + "epoch": 0.06, + "global_step": 12738, + "learning_rate": 0.00044767111853088483, + "loss": 1.3798, + "loss_base2": 1.9906, + "loss_pixel": 0.1565, + "loss_text": 1.2232, + "ppl": 3.9741, + "step": 12738 + }, + { + "epoch": 0.06, + "global_step": 12739, + "learning_rate": 0.00044766694490818034, + "loss": 1.375, + "loss_base2": 1.9837, + "loss_pixel": 0.156, + "loss_text": 1.219, + "ppl": 3.9551, + "step": 12739 + }, + { + "epoch": 0.06, + "global_step": 12740, + "learning_rate": 0.0004476627712854758, + "loss": 1.3652, + "loss_base2": 1.9696, + "loss_pixel": 0.1557, + "loss_text": 1.2095, + "ppl": 3.9165, + "step": 12740 + }, + { + "epoch": 0.06, + "global_step": 12741, + "learning_rate": 0.0004476585976627713, + "loss": 1.3696, + "loss_base2": 1.9759, + "loss_pixel": 0.1576, + "loss_text": 1.212, + "ppl": 3.9338, + "step": 12741 + }, + { + "epoch": 0.06, + "global_step": 12742, + "learning_rate": 0.0004476544240400668, + "loss": 1.3679, + "loss_base2": 1.9735, + "loss_pixel": 0.1567, + "loss_text": 1.2112, + "ppl": 3.9271, + "step": 12742 + }, + { + "epoch": 0.06, + "global_step": 12743, + "learning_rate": 0.0004476502504173623, + "loss": 1.3788, + "loss_base2": 1.9892, + "loss_pixel": 0.1566, + "loss_text": 1.2222, + "ppl": 3.9701, + "step": 12743 + }, + { + "epoch": 0.06, + "global_step": 12744, + "learning_rate": 0.0004476460767946578, + "loss": 1.3671, + "loss_base2": 1.9723, + "loss_pixel": 0.1559, + "loss_text": 1.2113, + "ppl": 3.924, + "step": 12744 + }, + { + "epoch": 0.06, + "global_step": 12745, + "learning_rate": 0.0004476419031719532, + "loss": 1.3898, + "loss_base2": 2.0051, + "loss_pixel": 0.1569, + "loss_text": 1.2329, + "ppl": 4.014, + "step": 12745 + }, + { + "epoch": 0.06, + "global_step": 12746, + "learning_rate": 0.00044763772954924873, + "loss": 1.3629, + "loss_base2": 1.9662, + "loss_pixel": 0.1559, + "loss_text": 1.207, + "ppl": 3.9075, + "step": 12746 + }, + { + "epoch": 0.06, + "global_step": 12747, + "learning_rate": 0.00044763355592654423, + "loss": 1.3531, + "loss_base2": 1.9521, + "loss_pixel": 0.1542, + "loss_text": 1.199, + "ppl": 3.8694, + "step": 12747 + }, + { + "epoch": 0.06, + "global_step": 12748, + "learning_rate": 0.00044762938230383974, + "loss": 1.3768, + "loss_base2": 1.9863, + "loss_pixel": 0.1557, + "loss_text": 1.221, + "ppl": 3.9622, + "step": 12748 + }, + { + "epoch": 0.06, + "global_step": 12749, + "learning_rate": 0.0004476252086811352, + "loss": 1.3758, + "loss_base2": 1.9849, + "loss_pixel": 0.1572, + "loss_text": 1.2185, + "ppl": 3.9582, + "step": 12749 + }, + { + "epoch": 0.06, + "global_step": 12750, + "learning_rate": 0.0004476210350584307, + "loss": 1.3566, + "loss_base2": 1.9572, + "loss_pixel": 0.1558, + "loss_text": 1.2008, + "ppl": 3.883, + "step": 12750 + }, + { + "epoch": 0.06, + "global_step": 12751, + "learning_rate": 0.0004476168614357262, + "loss": 1.3458, + "loss_base2": 1.9416, + "loss_pixel": 0.1574, + "loss_text": 1.1883, + "ppl": 3.8413, + "step": 12751 + }, + { + "epoch": 0.06, + "global_step": 12752, + "learning_rate": 0.0004476126878130217, + "loss": 1.6253, + "loss_base2": 2.3448, + "loss_pixel": 0.1546, + "loss_text": 1.4707, + "ppl": 5.0799, + "step": 12752 + }, + { + "epoch": 0.06, + "global_step": 12753, + "learning_rate": 0.0004476085141903172, + "loss": 1.6226, + "loss_base2": 2.3409, + "loss_pixel": 0.1556, + "loss_text": 1.4669, + "ppl": 5.0662, + "step": 12753 + }, + { + "epoch": 0.06, + "global_step": 12754, + "learning_rate": 0.0004476043405676127, + "loss": 1.6084, + "loss_base2": 2.3204, + "loss_pixel": 0.1568, + "loss_text": 1.4517, + "ppl": 4.9948, + "step": 12754 + }, + { + "epoch": 0.06, + "global_step": 12755, + "learning_rate": 0.0004476001669449082, + "loss": 1.6093, + "loss_base2": 2.3217, + "loss_pixel": 0.1562, + "loss_text": 1.4531, + "ppl": 4.9993, + "step": 12755 + }, + { + "epoch": 0.06, + "global_step": 12756, + "learning_rate": 0.0004475959933222037, + "loss": 1.5977, + "loss_base2": 2.305, + "loss_pixel": 0.1571, + "loss_text": 1.4406, + "ppl": 4.9417, + "step": 12756 + }, + { + "epoch": 0.06, + "global_step": 12757, + "learning_rate": 0.0004475918196994992, + "loss": 1.5913, + "loss_base2": 2.2958, + "loss_pixel": 0.1547, + "loss_text": 1.4366, + "ppl": 4.9101, + "step": 12757 + }, + { + "epoch": 0.06, + "global_step": 12758, + "learning_rate": 0.00044758764607679465, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.1571, + "loss_text": 1.4524, + "ppl": 5.0003, + "step": 12758 + }, + { + "epoch": 0.06, + "global_step": 12759, + "learning_rate": 0.00044758347245409016, + "loss": 1.6085, + "loss_base2": 2.3206, + "loss_pixel": 0.1563, + "loss_text": 1.4522, + "ppl": 4.9953, + "step": 12759 + }, + { + "epoch": 0.06, + "global_step": 12760, + "learning_rate": 0.00044757929883138567, + "loss": 1.5948, + "loss_base2": 2.3008, + "loss_pixel": 0.1563, + "loss_text": 1.4386, + "ppl": 4.9273, + "step": 12760 + }, + { + "epoch": 0.06, + "global_step": 12761, + "learning_rate": 0.0004475751252086812, + "loss": 1.6068, + "loss_base2": 2.3181, + "loss_pixel": 0.1562, + "loss_text": 1.4505, + "ppl": 4.9868, + "step": 12761 + }, + { + "epoch": 0.06, + "global_step": 12762, + "learning_rate": 0.0004475709515859767, + "loss": 1.6096, + "loss_base2": 2.3222, + "loss_pixel": 0.1556, + "loss_text": 1.454, + "ppl": 5.0008, + "step": 12762 + }, + { + "epoch": 0.06, + "global_step": 12763, + "learning_rate": 0.00044756677796327214, + "loss": 1.605, + "loss_base2": 2.3155, + "loss_pixel": 0.156, + "loss_text": 1.449, + "ppl": 4.9779, + "step": 12763 + }, + { + "epoch": 0.06, + "global_step": 12764, + "learning_rate": 0.0004475626043405676, + "loss": 1.6052, + "loss_base2": 2.3158, + "loss_pixel": 0.1574, + "loss_text": 1.4479, + "ppl": 4.9789, + "step": 12764 + }, + { + "epoch": 0.06, + "global_step": 12765, + "learning_rate": 0.0004475584307178631, + "loss": 1.597, + "loss_base2": 2.304, + "loss_pixel": 0.1568, + "loss_text": 1.4402, + "ppl": 4.9382, + "step": 12765 + }, + { + "epoch": 0.06, + "global_step": 12766, + "learning_rate": 0.0004475542570951586, + "loss": 1.6117, + "loss_base2": 2.3252, + "loss_pixel": 0.1557, + "loss_text": 1.456, + "ppl": 5.0113, + "step": 12766 + }, + { + "epoch": 0.06, + "global_step": 12767, + "learning_rate": 0.00044755008347245406, + "loss": 1.6064, + "loss_base2": 2.3175, + "loss_pixel": 0.1558, + "loss_text": 1.4506, + "ppl": 4.9848, + "step": 12767 + }, + { + "epoch": 0.06, + "global_step": 12768, + "learning_rate": 0.00044754590984974956, + "loss": 1.6156, + "loss_base2": 2.3308, + "loss_pixel": 0.1574, + "loss_text": 1.4582, + "ppl": 5.0309, + "step": 12768 + }, + { + "epoch": 0.06, + "global_step": 12769, + "learning_rate": 0.00044754173622704507, + "loss": 1.6073, + "loss_base2": 2.3188, + "loss_pixel": 0.1581, + "loss_text": 1.4492, + "ppl": 4.9893, + "step": 12769 + }, + { + "epoch": 0.06, + "global_step": 12770, + "learning_rate": 0.0004475375626043406, + "loss": 1.5887, + "loss_base2": 2.292, + "loss_pixel": 0.155, + "loss_text": 1.4337, + "ppl": 4.8974, + "step": 12770 + }, + { + "epoch": 0.06, + "global_step": 12771, + "learning_rate": 0.0004475333889816361, + "loss": 1.5942, + "loss_base2": 2.2999, + "loss_pixel": 0.1581, + "loss_text": 1.4362, + "ppl": 4.9244, + "step": 12771 + }, + { + "epoch": 0.06, + "global_step": 12772, + "learning_rate": 0.00044752921535893154, + "loss": 1.6112, + "loss_base2": 2.3245, + "loss_pixel": 0.1562, + "loss_text": 1.455, + "ppl": 5.0088, + "step": 12772 + }, + { + "epoch": 0.06, + "global_step": 12773, + "learning_rate": 0.00044752504173622705, + "loss": 1.611, + "loss_base2": 2.3242, + "loss_pixel": 0.1585, + "loss_text": 1.4525, + "ppl": 5.0078, + "step": 12773 + }, + { + "epoch": 0.06, + "global_step": 12774, + "learning_rate": 0.00044752086811352255, + "loss": 1.5872, + "loss_base2": 2.2898, + "loss_pixel": 0.156, + "loss_text": 1.4312, + "ppl": 4.89, + "step": 12774 + }, + { + "epoch": 0.06, + "global_step": 12775, + "learning_rate": 0.00044751669449081806, + "loss": 1.6067, + "loss_base2": 2.318, + "loss_pixel": 0.1562, + "loss_text": 1.4504, + "ppl": 4.9863, + "step": 12775 + }, + { + "epoch": 0.06, + "global_step": 12776, + "learning_rate": 0.00044751252086811357, + "loss": 1.6158, + "loss_base2": 2.3311, + "loss_pixel": 0.1568, + "loss_text": 1.459, + "ppl": 5.0319, + "step": 12776 + }, + { + "epoch": 0.06, + "global_step": 12777, + "learning_rate": 0.000447508347245409, + "loss": 1.5877, + "loss_base2": 2.2906, + "loss_pixel": 0.157, + "loss_text": 1.4307, + "ppl": 4.8925, + "step": 12777 + }, + { + "epoch": 0.06, + "global_step": 12778, + "learning_rate": 0.00044750417362270453, + "loss": 1.5983, + "loss_base2": 2.3059, + "loss_pixel": 0.1553, + "loss_text": 1.443, + "ppl": 4.9446, + "step": 12778 + }, + { + "epoch": 0.06, + "global_step": 12779, + "learning_rate": 0.00044750000000000004, + "loss": 1.5833, + "loss_base2": 2.2842, + "loss_pixel": 0.1532, + "loss_text": 1.43, + "ppl": 4.871, + "step": 12779 + }, + { + "epoch": 0.06, + "global_step": 12780, + "learning_rate": 0.00044749582637729554, + "loss": 1.5888, + "loss_base2": 2.2922, + "loss_pixel": 0.1462, + "loss_text": 1.4426, + "ppl": 4.8979, + "step": 12780 + }, + { + "epoch": 0.06, + "global_step": 12781, + "learning_rate": 0.000447491652754591, + "loss": 1.5933, + "loss_base2": 2.2986, + "loss_pixel": 0.1465, + "loss_text": 1.4468, + "ppl": 4.92, + "step": 12781 + }, + { + "epoch": 0.06, + "global_step": 12782, + "learning_rate": 0.0004474874791318865, + "loss": 1.5806, + "loss_base2": 2.2803, + "loss_pixel": 0.1453, + "loss_text": 1.4354, + "ppl": 4.8579, + "step": 12782 + }, + { + "epoch": 0.06, + "global_step": 12783, + "learning_rate": 0.00044748330550918196, + "loss": 1.5994, + "loss_base2": 2.3074, + "loss_pixel": 0.1464, + "loss_text": 1.4529, + "ppl": 4.9501, + "step": 12783 + }, + { + "epoch": 0.06, + "global_step": 12784, + "learning_rate": 0.00044747913188647746, + "loss": 1.5985, + "loss_base2": 2.3061, + "loss_pixel": 0.1473, + "loss_text": 1.4512, + "ppl": 4.9456, + "step": 12784 + }, + { + "epoch": 0.06, + "global_step": 12785, + "learning_rate": 0.00044747495826377297, + "loss": 1.5969, + "loss_base2": 2.3038, + "loss_pixel": 0.1459, + "loss_text": 1.451, + "ppl": 4.9377, + "step": 12785 + }, + { + "epoch": 0.06, + "global_step": 12786, + "learning_rate": 0.0004474707846410684, + "loss": 1.5802, + "loss_base2": 2.2797, + "loss_pixel": 0.145, + "loss_text": 1.4353, + "ppl": 4.8559, + "step": 12786 + }, + { + "epoch": 0.06, + "global_step": 12787, + "learning_rate": 0.00044746661101836393, + "loss": 1.5723, + "loss_base2": 2.2683, + "loss_pixel": 0.1467, + "loss_text": 1.4256, + "ppl": 4.8177, + "step": 12787 + }, + { + "epoch": 0.06, + "global_step": 12788, + "learning_rate": 0.00044746243739565944, + "loss": 1.5692, + "loss_base2": 2.2639, + "loss_pixel": 0.1447, + "loss_text": 1.4245, + "ppl": 4.8028, + "step": 12788 + }, + { + "epoch": 0.06, + "global_step": 12789, + "learning_rate": 0.00044745826377295495, + "loss": 1.6, + "loss_base2": 2.3083, + "loss_pixel": 0.1443, + "loss_text": 1.4556, + "ppl": 4.953, + "step": 12789 + }, + { + "epoch": 0.06, + "global_step": 12790, + "learning_rate": 0.0004474540901502504, + "loss": 1.5833, + "loss_base2": 2.2842, + "loss_pixel": 0.1462, + "loss_text": 1.4371, + "ppl": 4.871, + "step": 12790 + }, + { + "epoch": 0.06, + "global_step": 12791, + "learning_rate": 0.0004474499165275459, + "loss": 1.5875, + "loss_base2": 2.2903, + "loss_pixel": 0.1435, + "loss_text": 1.444, + "ppl": 4.8915, + "step": 12791 + }, + { + "epoch": 0.06, + "global_step": 12792, + "learning_rate": 0.0004474457429048414, + "loss": 1.5849, + "loss_base2": 2.2865, + "loss_pixel": 0.1456, + "loss_text": 1.4393, + "ppl": 4.8788, + "step": 12792 + }, + { + "epoch": 0.06, + "global_step": 12793, + "learning_rate": 0.0004474415692821369, + "loss": 1.6091, + "loss_base2": 2.3214, + "loss_pixel": 0.1473, + "loss_text": 1.4619, + "ppl": 4.9983, + "step": 12793 + }, + { + "epoch": 0.06, + "global_step": 12794, + "learning_rate": 0.00044743739565943243, + "loss": 1.5918, + "loss_base2": 2.2965, + "loss_pixel": 0.1463, + "loss_text": 1.4455, + "ppl": 4.9126, + "step": 12794 + }, + { + "epoch": 0.06, + "global_step": 12795, + "learning_rate": 0.0004474332220367279, + "loss": 1.5939, + "loss_base2": 2.2995, + "loss_pixel": 0.1463, + "loss_text": 1.4476, + "ppl": 4.9229, + "step": 12795 + }, + { + "epoch": 0.06, + "global_step": 12796, + "learning_rate": 0.0004474290484140234, + "loss": 1.5974, + "loss_base2": 2.3046, + "loss_pixel": 0.1587, + "loss_text": 1.4387, + "ppl": 4.9402, + "step": 12796 + }, + { + "epoch": 0.06, + "global_step": 12797, + "learning_rate": 0.0004474248747913189, + "loss": 1.5679, + "loss_base2": 2.262, + "loss_pixel": 0.1581, + "loss_text": 1.4099, + "ppl": 4.7966, + "step": 12797 + }, + { + "epoch": 0.06, + "global_step": 12798, + "learning_rate": 0.0004474207011686144, + "loss": 1.6136, + "loss_base2": 2.3279, + "loss_pixel": 0.1578, + "loss_text": 1.4558, + "ppl": 5.0209, + "step": 12798 + }, + { + "epoch": 0.06, + "global_step": 12799, + "learning_rate": 0.00044741652754590986, + "loss": 1.611, + "loss_base2": 2.3242, + "loss_pixel": 0.1568, + "loss_text": 1.4543, + "ppl": 5.0078, + "step": 12799 + }, + { + "epoch": 0.06, + "global_step": 12800, + "learning_rate": 0.00044741235392320536, + "loss": 1.6077, + "loss_base2": 2.3194, + "loss_pixel": 0.1582, + "loss_text": 1.4495, + "ppl": 4.9913, + "step": 12800 + }, + { + "epoch": 0.06, + "global_step": 12801, + "learning_rate": 0.00044740818030050087, + "loss": 1.6057, + "loss_base2": 2.3165, + "loss_pixel": 0.1579, + "loss_text": 1.4478, + "ppl": 4.9813, + "step": 12801 + }, + { + "epoch": 0.06, + "global_step": 12802, + "learning_rate": 0.0004474040066777963, + "loss": 1.5978, + "loss_base2": 2.3051, + "loss_pixel": 0.1566, + "loss_text": 1.4412, + "ppl": 4.9421, + "step": 12802 + }, + { + "epoch": 0.06, + "global_step": 12803, + "learning_rate": 0.00044739983305509183, + "loss": 1.5927, + "loss_base2": 2.2978, + "loss_pixel": 0.1577, + "loss_text": 1.4351, + "ppl": 4.917, + "step": 12803 + }, + { + "epoch": 0.06, + "global_step": 12804, + "learning_rate": 0.0004473956594323873, + "loss": 1.588, + "loss_base2": 2.291, + "loss_pixel": 0.1582, + "loss_text": 1.4299, + "ppl": 4.894, + "step": 12804 + }, + { + "epoch": 0.06, + "global_step": 12805, + "learning_rate": 0.0004473914858096828, + "loss": 1.6091, + "loss_base2": 2.3214, + "loss_pixel": 0.1564, + "loss_text": 1.4527, + "ppl": 4.9983, + "step": 12805 + }, + { + "epoch": 0.06, + "global_step": 12806, + "learning_rate": 0.0004473873121869783, + "loss": 1.5975, + "loss_base2": 2.3047, + "loss_pixel": 0.1588, + "loss_text": 1.4386, + "ppl": 4.9407, + "step": 12806 + }, + { + "epoch": 0.06, + "global_step": 12807, + "learning_rate": 0.0004473831385642738, + "loss": 1.5962, + "loss_base2": 2.3028, + "loss_pixel": 0.1572, + "loss_text": 1.439, + "ppl": 4.9342, + "step": 12807 + }, + { + "epoch": 0.06, + "global_step": 12808, + "learning_rate": 0.00044737896494156926, + "loss": 1.582, + "loss_base2": 2.2823, + "loss_pixel": 0.1564, + "loss_text": 1.4256, + "ppl": 4.8647, + "step": 12808 + }, + { + "epoch": 0.06, + "global_step": 12809, + "learning_rate": 0.00044737479131886477, + "loss": 1.5924, + "loss_base2": 2.2973, + "loss_pixel": 0.1563, + "loss_text": 1.4361, + "ppl": 4.9155, + "step": 12809 + }, + { + "epoch": 0.06, + "global_step": 12810, + "learning_rate": 0.0004473706176961603, + "loss": 1.5923, + "loss_base2": 2.2972, + "loss_pixel": 0.1557, + "loss_text": 1.4365, + "ppl": 4.915, + "step": 12810 + }, + { + "epoch": 0.06, + "global_step": 12811, + "learning_rate": 0.0004473664440734558, + "loss": 1.5901, + "loss_base2": 2.294, + "loss_pixel": 0.156, + "loss_text": 1.4341, + "ppl": 4.9042, + "step": 12811 + }, + { + "epoch": 0.06, + "global_step": 12812, + "learning_rate": 0.0004473622704507513, + "loss": 1.6133, + "loss_base2": 2.3275, + "loss_pixel": 0.1555, + "loss_text": 1.4578, + "ppl": 5.0193, + "step": 12812 + }, + { + "epoch": 0.06, + "global_step": 12813, + "learning_rate": 0.00044735809682804674, + "loss": 1.5957, + "loss_base2": 2.3021, + "loss_pixel": 0.1569, + "loss_text": 1.4388, + "ppl": 4.9318, + "step": 12813 + }, + { + "epoch": 0.06, + "global_step": 12814, + "learning_rate": 0.00044735392320534225, + "loss": 1.5958, + "loss_base2": 2.3023, + "loss_pixel": 0.1557, + "loss_text": 1.4401, + "ppl": 4.9323, + "step": 12814 + }, + { + "epoch": 0.06, + "global_step": 12815, + "learning_rate": 0.00044734974958263776, + "loss": 1.5983, + "loss_base2": 2.3059, + "loss_pixel": 0.1576, + "loss_text": 1.4407, + "ppl": 4.9446, + "step": 12815 + }, + { + "epoch": 0.06, + "global_step": 12816, + "learning_rate": 0.00044734557595993326, + "loss": 1.6048, + "loss_base2": 2.3152, + "loss_pixel": 0.1557, + "loss_text": 1.4491, + "ppl": 4.9769, + "step": 12816 + }, + { + "epoch": 0.06, + "global_step": 12817, + "learning_rate": 0.0004473414023372287, + "loss": 1.5936, + "loss_base2": 2.2991, + "loss_pixel": 0.1575, + "loss_text": 1.4361, + "ppl": 4.9214, + "step": 12817 + }, + { + "epoch": 0.06, + "global_step": 12818, + "learning_rate": 0.0004473372287145242, + "loss": 1.589, + "loss_base2": 2.2924, + "loss_pixel": 0.1562, + "loss_text": 1.4328, + "ppl": 4.8988, + "step": 12818 + }, + { + "epoch": 0.06, + "global_step": 12819, + "learning_rate": 0.00044733305509181973, + "loss": 1.6134, + "loss_base2": 2.3276, + "loss_pixel": 0.1561, + "loss_text": 1.4572, + "ppl": 5.0198, + "step": 12819 + }, + { + "epoch": 0.06, + "global_step": 12820, + "learning_rate": 0.0004473288814691152, + "loss": 1.5918, + "loss_base2": 2.2965, + "loss_pixel": 0.1565, + "loss_text": 1.4353, + "ppl": 4.9126, + "step": 12820 + }, + { + "epoch": 0.06, + "global_step": 12821, + "learning_rate": 0.0004473247078464107, + "loss": 1.5942, + "loss_base2": 2.2999, + "loss_pixel": 0.157, + "loss_text": 1.4372, + "ppl": 4.9244, + "step": 12821 + }, + { + "epoch": 0.06, + "global_step": 12822, + "learning_rate": 0.00044732053422370615, + "loss": 1.5999, + "loss_base2": 2.3082, + "loss_pixel": 0.1557, + "loss_text": 1.4442, + "ppl": 4.9525, + "step": 12822 + }, + { + "epoch": 0.06, + "global_step": 12823, + "learning_rate": 0.00044731636060100165, + "loss": 1.6127, + "loss_base2": 2.3266, + "loss_pixel": 0.1561, + "loss_text": 1.4565, + "ppl": 5.0163, + "step": 12823 + }, + { + "epoch": 0.06, + "global_step": 12824, + "learning_rate": 0.00044731218697829716, + "loss": 1.6113, + "loss_base2": 2.3246, + "loss_pixel": 0.1558, + "loss_text": 1.4555, + "ppl": 5.0093, + "step": 12824 + }, + { + "epoch": 0.06, + "global_step": 12825, + "learning_rate": 0.00044730801335559267, + "loss": 1.5993, + "loss_base2": 2.3073, + "loss_pixel": 0.1563, + "loss_text": 1.443, + "ppl": 4.9496, + "step": 12825 + }, + { + "epoch": 0.06, + "global_step": 12826, + "learning_rate": 0.0004473038397328881, + "loss": 1.5852, + "loss_base2": 2.287, + "loss_pixel": 0.1558, + "loss_text": 1.4294, + "ppl": 4.8803, + "step": 12826 + }, + { + "epoch": 0.06, + "global_step": 12827, + "learning_rate": 0.00044729966611018363, + "loss": 1.6002, + "loss_base2": 2.3086, + "loss_pixel": 0.1555, + "loss_text": 1.4447, + "ppl": 4.954, + "step": 12827 + }, + { + "epoch": 0.06, + "global_step": 12828, + "learning_rate": 0.00044729549248747914, + "loss": 1.5858, + "loss_base2": 2.2878, + "loss_pixel": 0.1562, + "loss_text": 1.4296, + "ppl": 4.8832, + "step": 12828 + }, + { + "epoch": 0.06, + "global_step": 12829, + "learning_rate": 0.00044729131886477464, + "loss": 1.5937, + "loss_base2": 2.2992, + "loss_pixel": 0.1555, + "loss_text": 1.4382, + "ppl": 4.9219, + "step": 12829 + }, + { + "epoch": 0.06, + "global_step": 12830, + "learning_rate": 0.00044728714524207015, + "loss": 1.5846, + "loss_base2": 2.2861, + "loss_pixel": 0.1563, + "loss_text": 1.4283, + "ppl": 4.8773, + "step": 12830 + }, + { + "epoch": 0.06, + "global_step": 12831, + "learning_rate": 0.0004472829716193656, + "loss": 1.6022, + "loss_base2": 2.3115, + "loss_pixel": 0.1576, + "loss_text": 1.4446, + "ppl": 4.9639, + "step": 12831 + }, + { + "epoch": 0.06, + "global_step": 12832, + "learning_rate": 0.0004472787979966611, + "loss": 1.5868, + "loss_base2": 2.2893, + "loss_pixel": 0.1592, + "loss_text": 1.4276, + "ppl": 4.8881, + "step": 12832 + }, + { + "epoch": 0.06, + "global_step": 12833, + "learning_rate": 0.0004472746243739566, + "loss": 1.5909, + "loss_base2": 2.2952, + "loss_pixel": 0.1576, + "loss_text": 1.4334, + "ppl": 4.9082, + "step": 12833 + }, + { + "epoch": 0.06, + "global_step": 12834, + "learning_rate": 0.0004472704507512521, + "loss": 1.5966, + "loss_base2": 2.3034, + "loss_pixel": 0.1576, + "loss_text": 1.439, + "ppl": 4.9362, + "step": 12834 + }, + { + "epoch": 0.06, + "global_step": 12835, + "learning_rate": 0.00044726627712854763, + "loss": 1.5954, + "loss_base2": 2.3017, + "loss_pixel": 0.1573, + "loss_text": 1.4381, + "ppl": 4.9303, + "step": 12835 + }, + { + "epoch": 0.06, + "global_step": 12836, + "learning_rate": 0.0004472621035058431, + "loss": 1.6018, + "loss_base2": 2.3109, + "loss_pixel": 0.1576, + "loss_text": 1.4442, + "ppl": 4.962, + "step": 12836 + }, + { + "epoch": 0.06, + "global_step": 12837, + "learning_rate": 0.0004472579298831386, + "loss": 1.5954, + "loss_base2": 2.3017, + "loss_pixel": 0.1563, + "loss_text": 1.4391, + "ppl": 4.9303, + "step": 12837 + }, + { + "epoch": 0.06, + "global_step": 12838, + "learning_rate": 0.0004472537562604341, + "loss": 1.602, + "loss_base2": 2.3112, + "loss_pixel": 0.157, + "loss_text": 1.4451, + "ppl": 4.9629, + "step": 12838 + }, + { + "epoch": 0.06, + "global_step": 12839, + "learning_rate": 0.00044724958263772955, + "loss": 1.6105, + "loss_base2": 2.3235, + "loss_pixel": 0.1566, + "loss_text": 1.4539, + "ppl": 5.0053, + "step": 12839 + }, + { + "epoch": 0.06, + "global_step": 12840, + "learning_rate": 0.000447245409015025, + "loss": 1.6076, + "loss_base2": 2.3193, + "loss_pixel": 0.1573, + "loss_text": 1.4504, + "ppl": 4.9908, + "step": 12840 + }, + { + "epoch": 0.06, + "global_step": 12841, + "learning_rate": 0.0004472412353923205, + "loss": 1.5759, + "loss_base2": 2.2735, + "loss_pixel": 0.1561, + "loss_text": 1.4198, + "ppl": 4.8351, + "step": 12841 + }, + { + "epoch": 0.06, + "global_step": 12842, + "learning_rate": 0.000447237061769616, + "loss": 1.6062, + "loss_base2": 2.3173, + "loss_pixel": 0.1566, + "loss_text": 1.4496, + "ppl": 4.9838, + "step": 12842 + }, + { + "epoch": 0.06, + "global_step": 12843, + "learning_rate": 0.00044723288814691153, + "loss": 1.5929, + "loss_base2": 2.2981, + "loss_pixel": 0.1563, + "loss_text": 1.4366, + "ppl": 4.918, + "step": 12843 + }, + { + "epoch": 0.06, + "global_step": 12844, + "learning_rate": 0.00044722871452420704, + "loss": 1.6028, + "loss_base2": 2.3124, + "loss_pixel": 0.1558, + "loss_text": 1.4471, + "ppl": 4.9669, + "step": 12844 + }, + { + "epoch": 0.06, + "global_step": 12845, + "learning_rate": 0.0004472245409015025, + "loss": 1.5787, + "loss_base2": 2.2776, + "loss_pixel": 0.1553, + "loss_text": 1.4234, + "ppl": 4.8486, + "step": 12845 + }, + { + "epoch": 0.06, + "global_step": 12846, + "learning_rate": 0.000447220367278798, + "loss": 1.5914, + "loss_base2": 2.2959, + "loss_pixel": 0.1564, + "loss_text": 1.4351, + "ppl": 4.9106, + "step": 12846 + }, + { + "epoch": 0.06, + "global_step": 12847, + "learning_rate": 0.0004472161936560935, + "loss": 1.5871, + "loss_base2": 2.2897, + "loss_pixel": 0.1564, + "loss_text": 1.4307, + "ppl": 4.8895, + "step": 12847 + }, + { + "epoch": 0.06, + "global_step": 12848, + "learning_rate": 0.000447212020033389, + "loss": 1.5923, + "loss_base2": 2.2972, + "loss_pixel": 0.1554, + "loss_text": 1.437, + "ppl": 4.915, + "step": 12848 + }, + { + "epoch": 0.06, + "global_step": 12849, + "learning_rate": 0.00044720784641068446, + "loss": 1.5776, + "loss_base2": 2.276, + "loss_pixel": 0.1565, + "loss_text": 1.4211, + "ppl": 4.8433, + "step": 12849 + }, + { + "epoch": 0.07, + "global_step": 12850, + "learning_rate": 0.00044720367278797997, + "loss": 1.5934, + "loss_base2": 2.2988, + "loss_pixel": 0.155, + "loss_text": 1.4384, + "ppl": 4.9205, + "step": 12850 + }, + { + "epoch": 0.07, + "global_step": 12851, + "learning_rate": 0.0004471994991652755, + "loss": 1.4474, + "loss_base2": 2.0882, + "loss_pixel": 0.1551, + "loss_text": 1.2923, + "ppl": 4.252, + "step": 12851 + }, + { + "epoch": 0.07, + "global_step": 12852, + "learning_rate": 0.000447195325542571, + "loss": 1.362, + "loss_base2": 1.965, + "loss_pixel": 0.1554, + "loss_text": 1.2066, + "ppl": 3.904, + "step": 12852 + }, + { + "epoch": 0.07, + "global_step": 12853, + "learning_rate": 0.0004471911519198665, + "loss": 1.3687, + "loss_base2": 1.9746, + "loss_pixel": 0.1559, + "loss_text": 1.2127, + "ppl": 3.9302, + "step": 12853 + }, + { + "epoch": 0.07, + "global_step": 12854, + "learning_rate": 0.00044718697829716195, + "loss": 1.3555, + "loss_base2": 1.9556, + "loss_pixel": 0.1558, + "loss_text": 1.1997, + "ppl": 3.8787, + "step": 12854 + }, + { + "epoch": 0.07, + "global_step": 12855, + "learning_rate": 0.00044718280467445745, + "loss": 1.3636, + "loss_base2": 1.9673, + "loss_pixel": 0.1558, + "loss_text": 1.2078, + "ppl": 3.9102, + "step": 12855 + }, + { + "epoch": 0.07, + "global_step": 12856, + "learning_rate": 0.00044717863105175296, + "loss": 1.3477, + "loss_base2": 1.9443, + "loss_pixel": 0.1574, + "loss_text": 1.1903, + "ppl": 3.8486, + "step": 12856 + }, + { + "epoch": 0.07, + "global_step": 12857, + "learning_rate": 0.00044717445742904847, + "loss": 1.3794, + "loss_base2": 1.9901, + "loss_pixel": 0.1566, + "loss_text": 1.2228, + "ppl": 3.9725, + "step": 12857 + }, + { + "epoch": 0.07, + "global_step": 12858, + "learning_rate": 0.00044717028380634387, + "loss": 1.3499, + "loss_base2": 1.9475, + "loss_pixel": 0.1551, + "loss_text": 1.1948, + "ppl": 3.857, + "step": 12858 + }, + { + "epoch": 0.07, + "global_step": 12859, + "learning_rate": 0.0004471661101836394, + "loss": 1.3478, + "loss_base2": 1.9445, + "loss_pixel": 0.1551, + "loss_text": 1.1928, + "ppl": 3.8489, + "step": 12859 + }, + { + "epoch": 0.07, + "global_step": 12860, + "learning_rate": 0.0004471619365609349, + "loss": 1.3908, + "loss_base2": 2.0065, + "loss_pixel": 0.156, + "loss_text": 1.2347, + "ppl": 4.0181, + "step": 12860 + }, + { + "epoch": 0.07, + "global_step": 12861, + "learning_rate": 0.0004471577629382304, + "loss": 1.3691, + "loss_base2": 1.9752, + "loss_pixel": 0.1558, + "loss_text": 1.2134, + "ppl": 3.9318, + "step": 12861 + }, + { + "epoch": 0.07, + "global_step": 12862, + "learning_rate": 0.0004471535893155259, + "loss": 1.369, + "loss_base2": 1.975, + "loss_pixel": 0.1557, + "loss_text": 1.2133, + "ppl": 3.9314, + "step": 12862 + }, + { + "epoch": 0.07, + "global_step": 12863, + "learning_rate": 0.00044714941569282135, + "loss": 1.3831, + "loss_base2": 1.9954, + "loss_pixel": 0.1563, + "loss_text": 1.2268, + "ppl": 3.9872, + "step": 12863 + }, + { + "epoch": 0.07, + "global_step": 12864, + "learning_rate": 0.00044714524207011686, + "loss": 1.3692, + "loss_base2": 1.9753, + "loss_pixel": 0.1562, + "loss_text": 1.2131, + "ppl": 3.9322, + "step": 12864 + }, + { + "epoch": 0.07, + "global_step": 12865, + "learning_rate": 0.00044714106844741236, + "loss": 1.362, + "loss_base2": 1.965, + "loss_pixel": 0.1549, + "loss_text": 1.2071, + "ppl": 3.904, + "step": 12865 + }, + { + "epoch": 0.07, + "global_step": 12866, + "learning_rate": 0.00044713689482470787, + "loss": 1.3595, + "loss_base2": 1.9613, + "loss_pixel": 0.1543, + "loss_text": 1.2052, + "ppl": 3.8942, + "step": 12866 + }, + { + "epoch": 0.07, + "global_step": 12867, + "learning_rate": 0.0004471327212020033, + "loss": 1.3601, + "loss_base2": 1.9622, + "loss_pixel": 0.1563, + "loss_text": 1.2038, + "ppl": 3.8966, + "step": 12867 + }, + { + "epoch": 0.07, + "global_step": 12868, + "learning_rate": 0.00044712854757929883, + "loss": 1.3708, + "loss_base2": 1.9776, + "loss_pixel": 0.1566, + "loss_text": 1.2142, + "ppl": 3.9385, + "step": 12868 + }, + { + "epoch": 0.07, + "global_step": 12869, + "learning_rate": 0.00044712437395659434, + "loss": 1.5065, + "loss_base2": 2.1734, + "loss_pixel": 0.157, + "loss_text": 1.3496, + "ppl": 4.5109, + "step": 12869 + }, + { + "epoch": 0.07, + "global_step": 12870, + "learning_rate": 0.00044712020033388985, + "loss": 1.3754, + "loss_base2": 1.9843, + "loss_pixel": 0.1545, + "loss_text": 1.221, + "ppl": 3.9567, + "step": 12870 + }, + { + "epoch": 0.07, + "global_step": 12871, + "learning_rate": 0.00044711602671118535, + "loss": 1.3655, + "loss_base2": 1.97, + "loss_pixel": 0.1549, + "loss_text": 1.2106, + "ppl": 3.9177, + "step": 12871 + }, + { + "epoch": 0.07, + "global_step": 12872, + "learning_rate": 0.0004471118530884808, + "loss": 1.3561, + "loss_base2": 1.9564, + "loss_pixel": 0.1555, + "loss_text": 1.2006, + "ppl": 3.881, + "step": 12872 + }, + { + "epoch": 0.07, + "global_step": 12873, + "learning_rate": 0.0004471076794657763, + "loss": 1.3693, + "loss_base2": 1.9755, + "loss_pixel": 0.1557, + "loss_text": 1.2136, + "ppl": 3.9326, + "step": 12873 + }, + { + "epoch": 0.07, + "global_step": 12874, + "learning_rate": 0.0004471035058430718, + "loss": 1.3752, + "loss_base2": 1.984, + "loss_pixel": 0.1564, + "loss_text": 1.2188, + "ppl": 3.9559, + "step": 12874 + }, + { + "epoch": 0.07, + "global_step": 12875, + "learning_rate": 0.00044709933222036733, + "loss": 1.3696, + "loss_base2": 1.9759, + "loss_pixel": 0.1561, + "loss_text": 1.2135, + "ppl": 3.9338, + "step": 12875 + }, + { + "epoch": 0.07, + "global_step": 12876, + "learning_rate": 0.00044709515859766273, + "loss": 1.3871, + "loss_base2": 2.0012, + "loss_pixel": 0.1562, + "loss_text": 1.2309, + "ppl": 4.0032, + "step": 12876 + }, + { + "epoch": 0.07, + "global_step": 12877, + "learning_rate": 0.00044709098497495823, + "loss": 1.6045, + "loss_base2": 2.3148, + "loss_pixel": 0.1569, + "loss_text": 1.4476, + "ppl": 4.9754, + "step": 12877 + }, + { + "epoch": 0.07, + "global_step": 12878, + "learning_rate": 0.00044708681135225374, + "loss": 1.6162, + "loss_base2": 2.3317, + "loss_pixel": 0.1547, + "loss_text": 1.4615, + "ppl": 5.0339, + "step": 12878 + }, + { + "epoch": 0.07, + "global_step": 12879, + "learning_rate": 0.00044708263772954925, + "loss": 1.6334, + "loss_base2": 2.3565, + "loss_pixel": 0.1552, + "loss_text": 1.4783, + "ppl": 5.1213, + "step": 12879 + }, + { + "epoch": 0.07, + "global_step": 12880, + "learning_rate": 0.00044707846410684476, + "loss": 1.6008, + "loss_base2": 2.3095, + "loss_pixel": 0.155, + "loss_text": 1.4457, + "ppl": 4.957, + "step": 12880 + }, + { + "epoch": 0.07, + "global_step": 12881, + "learning_rate": 0.0004470742904841402, + "loss": 1.6217, + "loss_base2": 2.3396, + "loss_pixel": 0.157, + "loss_text": 1.4647, + "ppl": 5.0617, + "step": 12881 + }, + { + "epoch": 0.07, + "global_step": 12882, + "learning_rate": 0.0004470701168614357, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.1555, + "loss_text": 1.4541, + "ppl": 5.0003, + "step": 12882 + }, + { + "epoch": 0.07, + "global_step": 12883, + "learning_rate": 0.0004470659432387312, + "loss": 1.6164, + "loss_base2": 2.332, + "loss_pixel": 0.1554, + "loss_text": 1.461, + "ppl": 5.0349, + "step": 12883 + }, + { + "epoch": 0.07, + "global_step": 12884, + "learning_rate": 0.00044706176961602673, + "loss": 1.6047, + "loss_base2": 2.3151, + "loss_pixel": 0.1559, + "loss_text": 1.4488, + "ppl": 4.9764, + "step": 12884 + }, + { + "epoch": 0.07, + "global_step": 12885, + "learning_rate": 0.0004470575959933222, + "loss": 1.61, + "loss_base2": 2.3227, + "loss_pixel": 0.1569, + "loss_text": 1.4531, + "ppl": 5.0028, + "step": 12885 + }, + { + "epoch": 0.07, + "global_step": 12886, + "learning_rate": 0.0004470534223706177, + "loss": 1.6249, + "loss_base2": 2.3442, + "loss_pixel": 0.1567, + "loss_text": 1.4682, + "ppl": 5.0779, + "step": 12886 + }, + { + "epoch": 0.07, + "global_step": 12887, + "learning_rate": 0.0004470492487479132, + "loss": 1.5918, + "loss_base2": 2.2965, + "loss_pixel": 0.1558, + "loss_text": 1.436, + "ppl": 4.9126, + "step": 12887 + }, + { + "epoch": 0.07, + "global_step": 12888, + "learning_rate": 0.0004470450751252087, + "loss": 1.5954, + "loss_base2": 2.3017, + "loss_pixel": 0.1563, + "loss_text": 1.4391, + "ppl": 4.9303, + "step": 12888 + }, + { + "epoch": 0.07, + "global_step": 12889, + "learning_rate": 0.0004470409015025042, + "loss": 1.6039, + "loss_base2": 2.3139, + "loss_pixel": 0.1552, + "loss_text": 1.4487, + "ppl": 4.9724, + "step": 12889 + }, + { + "epoch": 0.07, + "global_step": 12890, + "learning_rate": 0.00044703672787979967, + "loss": 1.588, + "loss_base2": 2.291, + "loss_pixel": 0.1567, + "loss_text": 1.4313, + "ppl": 4.894, + "step": 12890 + }, + { + "epoch": 0.07, + "global_step": 12891, + "learning_rate": 0.0004470325542570952, + "loss": 1.5981, + "loss_base2": 2.3056, + "loss_pixel": 0.1549, + "loss_text": 1.4432, + "ppl": 4.9436, + "step": 12891 + }, + { + "epoch": 0.07, + "global_step": 12892, + "learning_rate": 0.0004470283806343907, + "loss": 1.5945, + "loss_base2": 2.3004, + "loss_pixel": 0.1569, + "loss_text": 1.4376, + "ppl": 4.9259, + "step": 12892 + }, + { + "epoch": 0.07, + "global_step": 12893, + "learning_rate": 0.0004470242070116862, + "loss": 1.6046, + "loss_base2": 2.3149, + "loss_pixel": 0.1551, + "loss_text": 1.4495, + "ppl": 4.9759, + "step": 12893 + }, + { + "epoch": 0.07, + "global_step": 12894, + "learning_rate": 0.0004470200333889817, + "loss": 1.5937, + "loss_base2": 2.2992, + "loss_pixel": 0.1567, + "loss_text": 1.437, + "ppl": 4.9219, + "step": 12894 + }, + { + "epoch": 0.07, + "global_step": 12895, + "learning_rate": 0.0004470158597662771, + "loss": 1.5999, + "loss_base2": 2.3082, + "loss_pixel": 0.1569, + "loss_text": 1.443, + "ppl": 4.9525, + "step": 12895 + }, + { + "epoch": 0.07, + "global_step": 12896, + "learning_rate": 0.0004470116861435726, + "loss": 1.6191, + "loss_base2": 2.3359, + "loss_pixel": 0.1551, + "loss_text": 1.464, + "ppl": 5.0485, + "step": 12896 + }, + { + "epoch": 0.07, + "global_step": 12897, + "learning_rate": 0.0004470075125208681, + "loss": 1.5849, + "loss_base2": 2.2865, + "loss_pixel": 0.1549, + "loss_text": 1.43, + "ppl": 4.8788, + "step": 12897 + }, + { + "epoch": 0.07, + "global_step": 12898, + "learning_rate": 0.0004470033388981636, + "loss": 1.5322, + "loss_base2": 2.2105, + "loss_pixel": 0.157, + "loss_text": 1.3752, + "ppl": 4.6283, + "step": 12898 + }, + { + "epoch": 0.07, + "global_step": 12899, + "learning_rate": 0.00044699916527545907, + "loss": 1.4018, + "loss_base2": 2.0224, + "loss_pixel": 0.1559, + "loss_text": 1.2459, + "ppl": 4.0625, + "step": 12899 + }, + { + "epoch": 0.07, + "global_step": 12900, + "learning_rate": 0.0004469949916527546, + "loss": 1.3685, + "loss_base2": 1.9743, + "loss_pixel": 0.1564, + "loss_text": 1.212, + "ppl": 3.9295, + "step": 12900 + }, + { + "epoch": 0.07, + "global_step": 12901, + "learning_rate": 0.0004469908180300501, + "loss": 1.3705, + "loss_base2": 1.9772, + "loss_pixel": 0.1571, + "loss_text": 1.2135, + "ppl": 3.9373, + "step": 12901 + }, + { + "epoch": 0.07, + "global_step": 12902, + "learning_rate": 0.0004469866444073456, + "loss": 1.3667, + "loss_base2": 1.9717, + "loss_pixel": 0.1561, + "loss_text": 1.2106, + "ppl": 3.9224, + "step": 12902 + }, + { + "epoch": 0.07, + "global_step": 12903, + "learning_rate": 0.0004469824707846411, + "loss": 1.3551, + "loss_base2": 1.955, + "loss_pixel": 0.1564, + "loss_text": 1.1988, + "ppl": 3.8771, + "step": 12903 + }, + { + "epoch": 0.07, + "global_step": 12904, + "learning_rate": 0.00044697829716193655, + "loss": 1.3644, + "loss_base2": 1.9684, + "loss_pixel": 0.1569, + "loss_text": 1.2075, + "ppl": 3.9134, + "step": 12904 + }, + { + "epoch": 0.07, + "global_step": 12905, + "learning_rate": 0.00044697412353923206, + "loss": 1.3524, + "loss_base2": 1.9511, + "loss_pixel": 0.1555, + "loss_text": 1.1969, + "ppl": 3.8667, + "step": 12905 + }, + { + "epoch": 0.07, + "global_step": 12906, + "learning_rate": 0.00044696994991652757, + "loss": 1.5198, + "loss_base2": 2.1926, + "loss_pixel": 0.1559, + "loss_text": 1.364, + "ppl": 4.5713, + "step": 12906 + }, + { + "epoch": 0.07, + "global_step": 12907, + "learning_rate": 0.0004469657762938231, + "loss": 1.6156, + "loss_base2": 2.3308, + "loss_pixel": 0.1543, + "loss_text": 1.4613, + "ppl": 5.0309, + "step": 12907 + }, + { + "epoch": 0.07, + "global_step": 12908, + "learning_rate": 0.00044696160267111853, + "loss": 1.6042, + "loss_base2": 2.3144, + "loss_pixel": 0.1571, + "loss_text": 1.447, + "ppl": 4.9739, + "step": 12908 + }, + { + "epoch": 0.07, + "global_step": 12909, + "learning_rate": 0.00044695742904841404, + "loss": 1.618, + "loss_base2": 2.3343, + "loss_pixel": 0.1569, + "loss_text": 1.461, + "ppl": 5.043, + "step": 12909 + }, + { + "epoch": 0.07, + "global_step": 12910, + "learning_rate": 0.00044695325542570954, + "loss": 1.6256, + "loss_base2": 2.3452, + "loss_pixel": 0.157, + "loss_text": 1.4686, + "ppl": 5.0815, + "step": 12910 + }, + { + "epoch": 0.07, + "global_step": 12911, + "learning_rate": 0.00044694908180300505, + "loss": 1.6095, + "loss_base2": 2.322, + "loss_pixel": 0.1553, + "loss_text": 1.4542, + "ppl": 5.0003, + "step": 12911 + }, + { + "epoch": 0.07, + "global_step": 12912, + "learning_rate": 0.00044694490818030056, + "loss": 1.5931, + "loss_base2": 2.2984, + "loss_pixel": 0.1572, + "loss_text": 1.436, + "ppl": 4.919, + "step": 12912 + }, + { + "epoch": 0.07, + "global_step": 12913, + "learning_rate": 0.000446940734557596, + "loss": 1.6004, + "loss_base2": 2.3089, + "loss_pixel": 0.156, + "loss_text": 1.4444, + "ppl": 4.955, + "step": 12913 + }, + { + "epoch": 0.07, + "global_step": 12914, + "learning_rate": 0.00044693656093489146, + "loss": 1.5894, + "loss_base2": 2.293, + "loss_pixel": 0.156, + "loss_text": 1.4334, + "ppl": 4.9008, + "step": 12914 + }, + { + "epoch": 0.07, + "global_step": 12915, + "learning_rate": 0.00044693238731218697, + "loss": 1.6168, + "loss_base2": 2.3325, + "loss_pixel": 0.1554, + "loss_text": 1.4614, + "ppl": 5.0369, + "step": 12915 + }, + { + "epoch": 0.07, + "global_step": 12916, + "learning_rate": 0.0004469282136894825, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1555, + "loss_text": 1.4468, + "ppl": 4.9649, + "step": 12916 + }, + { + "epoch": 0.07, + "global_step": 12917, + "learning_rate": 0.00044692404006677793, + "loss": 1.5822, + "loss_base2": 2.2826, + "loss_pixel": 0.1562, + "loss_text": 1.426, + "ppl": 4.8656, + "step": 12917 + }, + { + "epoch": 0.07, + "global_step": 12918, + "learning_rate": 0.00044691986644407344, + "loss": 1.5994, + "loss_base2": 2.3074, + "loss_pixel": 0.1559, + "loss_text": 1.4435, + "ppl": 4.9501, + "step": 12918 + }, + { + "epoch": 0.07, + "global_step": 12919, + "learning_rate": 0.00044691569282136895, + "loss": 1.5823, + "loss_base2": 2.2828, + "loss_pixel": 0.157, + "loss_text": 1.4253, + "ppl": 4.8661, + "step": 12919 + }, + { + "epoch": 0.07, + "global_step": 12920, + "learning_rate": 0.00044691151919866445, + "loss": 1.5931, + "loss_base2": 2.2984, + "loss_pixel": 0.1559, + "loss_text": 1.4372, + "ppl": 4.919, + "step": 12920 + }, + { + "epoch": 0.07, + "global_step": 12921, + "learning_rate": 0.00044690734557595996, + "loss": 1.6063, + "loss_base2": 2.3174, + "loss_pixel": 0.1581, + "loss_text": 1.4482, + "ppl": 4.9843, + "step": 12921 + }, + { + "epoch": 0.07, + "global_step": 12922, + "learning_rate": 0.0004469031719532554, + "loss": 1.5867, + "loss_base2": 2.2891, + "loss_pixel": 0.1566, + "loss_text": 1.4301, + "ppl": 4.8876, + "step": 12922 + }, + { + "epoch": 0.07, + "global_step": 12923, + "learning_rate": 0.0004468989983305509, + "loss": 1.5842, + "loss_base2": 2.2855, + "loss_pixel": 0.1555, + "loss_text": 1.4287, + "ppl": 4.8754, + "step": 12923 + }, + { + "epoch": 0.07, + "global_step": 12924, + "learning_rate": 0.00044689482470784643, + "loss": 1.6022, + "loss_base2": 2.3115, + "loss_pixel": 0.1555, + "loss_text": 1.4468, + "ppl": 4.9639, + "step": 12924 + }, + { + "epoch": 0.07, + "global_step": 12925, + "learning_rate": 0.00044689065108514194, + "loss": 1.5985, + "loss_base2": 2.3061, + "loss_pixel": 0.1572, + "loss_text": 1.4413, + "ppl": 4.9456, + "step": 12925 + }, + { + "epoch": 0.07, + "global_step": 12926, + "learning_rate": 0.0004468864774624374, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.1556, + "loss_text": 1.4503, + "ppl": 4.9823, + "step": 12926 + }, + { + "epoch": 0.07, + "global_step": 12927, + "learning_rate": 0.0004468823038397329, + "loss": 1.5958, + "loss_base2": 2.3023, + "loss_pixel": 0.1561, + "loss_text": 1.4397, + "ppl": 4.9323, + "step": 12927 + }, + { + "epoch": 0.07, + "global_step": 12928, + "learning_rate": 0.0004468781302170284, + "loss": 1.6063, + "loss_base2": 2.3174, + "loss_pixel": 0.155, + "loss_text": 1.4513, + "ppl": 4.9843, + "step": 12928 + }, + { + "epoch": 0.07, + "global_step": 12929, + "learning_rate": 0.0004468739565943239, + "loss": 1.5866, + "loss_base2": 2.289, + "loss_pixel": 0.1557, + "loss_text": 1.4309, + "ppl": 4.8871, + "step": 12929 + }, + { + "epoch": 0.07, + "global_step": 12930, + "learning_rate": 0.0004468697829716194, + "loss": 1.5897, + "loss_base2": 2.2935, + "loss_pixel": 0.1538, + "loss_text": 1.4359, + "ppl": 4.9023, + "step": 12930 + }, + { + "epoch": 0.07, + "global_step": 12931, + "learning_rate": 0.00044686560934891487, + "loss": 1.5846, + "loss_base2": 2.2861, + "loss_pixel": 0.154, + "loss_text": 1.4305, + "ppl": 4.8773, + "step": 12931 + }, + { + "epoch": 0.07, + "global_step": 12932, + "learning_rate": 0.0004468614357262104, + "loss": 1.5725, + "loss_base2": 2.2686, + "loss_pixel": 0.155, + "loss_text": 1.4175, + "ppl": 4.8187, + "step": 12932 + }, + { + "epoch": 0.07, + "global_step": 12933, + "learning_rate": 0.00044685726210350583, + "loss": 1.5946, + "loss_base2": 2.3005, + "loss_pixel": 0.1555, + "loss_text": 1.4391, + "ppl": 4.9264, + "step": 12933 + }, + { + "epoch": 0.07, + "global_step": 12934, + "learning_rate": 0.00044685308848080134, + "loss": 1.5846, + "loss_base2": 2.2861, + "loss_pixel": 0.1557, + "loss_text": 1.4289, + "ppl": 4.8773, + "step": 12934 + }, + { + "epoch": 0.07, + "global_step": 12935, + "learning_rate": 0.0004468489148580968, + "loss": 1.5887, + "loss_base2": 2.292, + "loss_pixel": 0.1506, + "loss_text": 1.4381, + "ppl": 4.8974, + "step": 12935 + }, + { + "epoch": 0.07, + "global_step": 12936, + "learning_rate": 0.0004468447412353923, + "loss": 1.5594, + "loss_base2": 2.2497, + "loss_pixel": 0.1464, + "loss_text": 1.4131, + "ppl": 4.756, + "step": 12936 + }, + { + "epoch": 0.07, + "global_step": 12937, + "learning_rate": 0.0004468405676126878, + "loss": 1.5574, + "loss_base2": 2.2469, + "loss_pixel": 0.146, + "loss_text": 1.4114, + "ppl": 4.7465, + "step": 12937 + }, + { + "epoch": 0.07, + "global_step": 12938, + "learning_rate": 0.0004468363939899833, + "loss": 1.5953, + "loss_base2": 2.3015, + "loss_pixel": 0.1476, + "loss_text": 1.4478, + "ppl": 4.9298, + "step": 12938 + }, + { + "epoch": 0.07, + "global_step": 12939, + "learning_rate": 0.0004468322203672788, + "loss": 1.5899, + "loss_base2": 2.2937, + "loss_pixel": 0.1466, + "loss_text": 1.4434, + "ppl": 4.9033, + "step": 12939 + }, + { + "epoch": 0.07, + "global_step": 12940, + "learning_rate": 0.0004468280467445743, + "loss": 1.5815, + "loss_base2": 2.2816, + "loss_pixel": 0.1447, + "loss_text": 1.4368, + "ppl": 4.8622, + "step": 12940 + }, + { + "epoch": 0.07, + "global_step": 12941, + "learning_rate": 0.0004468238731218698, + "loss": 1.5964, + "loss_base2": 2.3031, + "loss_pixel": 0.1454, + "loss_text": 1.4511, + "ppl": 4.9352, + "step": 12941 + }, + { + "epoch": 0.07, + "global_step": 12942, + "learning_rate": 0.0004468196994991653, + "loss": 1.5885, + "loss_base2": 2.2917, + "loss_pixel": 0.1465, + "loss_text": 1.442, + "ppl": 4.8964, + "step": 12942 + }, + { + "epoch": 0.07, + "global_step": 12943, + "learning_rate": 0.0004468155258764608, + "loss": 1.5907, + "loss_base2": 2.2949, + "loss_pixel": 0.1462, + "loss_text": 1.4445, + "ppl": 4.9072, + "step": 12943 + }, + { + "epoch": 0.07, + "global_step": 12944, + "learning_rate": 0.00044681135225375625, + "loss": 1.5866, + "loss_base2": 2.289, + "loss_pixel": 0.1457, + "loss_text": 1.441, + "ppl": 4.8871, + "step": 12944 + }, + { + "epoch": 0.07, + "global_step": 12945, + "learning_rate": 0.00044680717863105176, + "loss": 1.5897, + "loss_base2": 2.2935, + "loss_pixel": 0.1441, + "loss_text": 1.4456, + "ppl": 4.9023, + "step": 12945 + }, + { + "epoch": 0.07, + "global_step": 12946, + "learning_rate": 0.00044680300500834726, + "loss": 1.5853, + "loss_base2": 2.2871, + "loss_pixel": 0.1461, + "loss_text": 1.4392, + "ppl": 4.8808, + "step": 12946 + }, + { + "epoch": 0.07, + "global_step": 12947, + "learning_rate": 0.00044679883138564277, + "loss": 1.6083, + "loss_base2": 2.3203, + "loss_pixel": 0.1446, + "loss_text": 1.4636, + "ppl": 4.9943, + "step": 12947 + }, + { + "epoch": 0.07, + "global_step": 12948, + "learning_rate": 0.0004467946577629383, + "loss": 1.5973, + "loss_base2": 2.3044, + "loss_pixel": 0.1454, + "loss_text": 1.4519, + "ppl": 4.9397, + "step": 12948 + }, + { + "epoch": 0.07, + "global_step": 12949, + "learning_rate": 0.00044679048414023373, + "loss": 1.5876, + "loss_base2": 2.2904, + "loss_pixel": 0.1431, + "loss_text": 1.4445, + "ppl": 4.892, + "step": 12949 + }, + { + "epoch": 0.07, + "global_step": 12950, + "learning_rate": 0.00044678631051752924, + "loss": 1.5956, + "loss_base2": 2.302, + "loss_pixel": 0.1449, + "loss_text": 1.4506, + "ppl": 4.9313, + "step": 12950 + }, + { + "epoch": 0.07, + "global_step": 12951, + "learning_rate": 0.00044678213689482475, + "loss": 1.5841, + "loss_base2": 2.2854, + "loss_pixel": 0.147, + "loss_text": 1.4371, + "ppl": 4.8749, + "step": 12951 + }, + { + "epoch": 0.07, + "global_step": 12952, + "learning_rate": 0.0004467779632721202, + "loss": 1.5788, + "loss_base2": 2.2777, + "loss_pixel": 0.1449, + "loss_text": 1.4339, + "ppl": 4.8491, + "step": 12952 + }, + { + "epoch": 0.07, + "global_step": 12953, + "learning_rate": 0.0004467737896494157, + "loss": 1.5657, + "loss_base2": 2.2588, + "loss_pixel": 0.1438, + "loss_text": 1.422, + "ppl": 4.786, + "step": 12953 + }, + { + "epoch": 0.07, + "global_step": 12954, + "learning_rate": 0.00044676961602671116, + "loss": 1.5753, + "loss_base2": 2.2727, + "loss_pixel": 0.1447, + "loss_text": 1.4306, + "ppl": 4.8322, + "step": 12954 + }, + { + "epoch": 0.07, + "global_step": 12955, + "learning_rate": 0.00044676544240400667, + "loss": 1.5993, + "loss_base2": 2.3073, + "loss_pixel": 0.1459, + "loss_text": 1.4534, + "ppl": 4.9496, + "step": 12955 + }, + { + "epoch": 0.07, + "global_step": 12956, + "learning_rate": 0.0004467612687813022, + "loss": 1.5784, + "loss_base2": 2.2771, + "loss_pixel": 0.1447, + "loss_text": 1.4338, + "ppl": 4.8472, + "step": 12956 + }, + { + "epoch": 0.07, + "global_step": 12957, + "learning_rate": 0.0004467570951585977, + "loss": 1.5737, + "loss_base2": 2.2704, + "loss_pixel": 0.1444, + "loss_text": 1.4293, + "ppl": 4.8245, + "step": 12957 + }, + { + "epoch": 0.07, + "global_step": 12958, + "learning_rate": 0.00044675292153589313, + "loss": 1.5861, + "loss_base2": 2.2883, + "loss_pixel": 0.1437, + "loss_text": 1.4424, + "ppl": 4.8847, + "step": 12958 + }, + { + "epoch": 0.07, + "global_step": 12959, + "learning_rate": 0.00044674874791318864, + "loss": 1.5878, + "loss_base2": 2.2907, + "loss_pixel": 0.1428, + "loss_text": 1.445, + "ppl": 4.893, + "step": 12959 + }, + { + "epoch": 0.07, + "global_step": 12960, + "learning_rate": 0.00044674457429048415, + "loss": 1.5763, + "loss_base2": 2.2741, + "loss_pixel": 0.1443, + "loss_text": 1.432, + "ppl": 4.837, + "step": 12960 + }, + { + "epoch": 0.07, + "global_step": 12961, + "learning_rate": 0.00044674040066777966, + "loss": 1.579, + "loss_base2": 2.278, + "loss_pixel": 0.1452, + "loss_text": 1.4338, + "ppl": 4.8501, + "step": 12961 + }, + { + "epoch": 0.07, + "global_step": 12962, + "learning_rate": 0.00044673622704507516, + "loss": 1.5949, + "loss_base2": 2.301, + "loss_pixel": 0.1431, + "loss_text": 1.4518, + "ppl": 4.9278, + "step": 12962 + }, + { + "epoch": 0.07, + "global_step": 12963, + "learning_rate": 0.0004467320534223706, + "loss": 1.5789, + "loss_base2": 2.2779, + "loss_pixel": 0.1441, + "loss_text": 1.4348, + "ppl": 4.8496, + "step": 12963 + }, + { + "epoch": 0.07, + "global_step": 12964, + "learning_rate": 0.0004467278797996661, + "loss": 1.5879, + "loss_base2": 2.2909, + "loss_pixel": 0.141, + "loss_text": 1.4469, + "ppl": 4.8935, + "step": 12964 + }, + { + "epoch": 0.07, + "global_step": 12965, + "learning_rate": 0.00044672370617696163, + "loss": 1.5682, + "loss_base2": 2.2624, + "loss_pixel": 0.1441, + "loss_text": 1.4241, + "ppl": 4.798, + "step": 12965 + }, + { + "epoch": 0.07, + "global_step": 12966, + "learning_rate": 0.00044671953255425714, + "loss": 1.5964, + "loss_base2": 2.3031, + "loss_pixel": 0.143, + "loss_text": 1.4534, + "ppl": 4.9352, + "step": 12966 + }, + { + "epoch": 0.07, + "global_step": 12967, + "learning_rate": 0.0004467153589315526, + "loss": 1.5678, + "loss_base2": 2.2619, + "loss_pixel": 0.1431, + "loss_text": 1.4246, + "ppl": 4.7961, + "step": 12967 + }, + { + "epoch": 0.07, + "global_step": 12968, + "learning_rate": 0.0004467111853088481, + "loss": 1.5731, + "loss_base2": 2.2695, + "loss_pixel": 0.144, + "loss_text": 1.429, + "ppl": 4.8216, + "step": 12968 + }, + { + "epoch": 0.07, + "global_step": 12969, + "learning_rate": 0.0004467070116861436, + "loss": 1.5874, + "loss_base2": 2.2901, + "loss_pixel": 0.1428, + "loss_text": 1.4446, + "ppl": 4.891, + "step": 12969 + }, + { + "epoch": 0.07, + "global_step": 12970, + "learning_rate": 0.0004467028380634391, + "loss": 1.5735, + "loss_base2": 2.2701, + "loss_pixel": 0.143, + "loss_text": 1.4304, + "ppl": 4.8235, + "step": 12970 + }, + { + "epoch": 0.07, + "global_step": 12971, + "learning_rate": 0.00044669866444073457, + "loss": 1.5944, + "loss_base2": 2.3002, + "loss_pixel": 0.1454, + "loss_text": 1.449, + "ppl": 4.9254, + "step": 12971 + }, + { + "epoch": 0.07, + "global_step": 12972, + "learning_rate": 0.00044669449081803, + "loss": 1.5885, + "loss_base2": 2.2917, + "loss_pixel": 0.1437, + "loss_text": 1.4448, + "ppl": 4.8964, + "step": 12972 + }, + { + "epoch": 0.07, + "global_step": 12973, + "learning_rate": 0.00044669031719532553, + "loss": 1.5389, + "loss_base2": 2.2202, + "loss_pixel": 0.1436, + "loss_text": 1.3953, + "ppl": 4.6595, + "step": 12973 + }, + { + "epoch": 0.07, + "global_step": 12974, + "learning_rate": 0.00044668614357262104, + "loss": 1.5347, + "loss_base2": 2.2141, + "loss_pixel": 0.1465, + "loss_text": 1.3882, + "ppl": 4.6399, + "step": 12974 + }, + { + "epoch": 0.07, + "global_step": 12975, + "learning_rate": 0.00044668196994991654, + "loss": 1.585, + "loss_base2": 2.2867, + "loss_pixel": 0.1434, + "loss_text": 1.4416, + "ppl": 4.8793, + "step": 12975 + }, + { + "epoch": 0.07, + "global_step": 12976, + "learning_rate": 0.000446677796327212, + "loss": 1.5972, + "loss_base2": 2.3043, + "loss_pixel": 0.1429, + "loss_text": 1.4543, + "ppl": 4.9392, + "step": 12976 + }, + { + "epoch": 0.07, + "global_step": 12977, + "learning_rate": 0.0004466736227045075, + "loss": 1.5833, + "loss_base2": 2.2842, + "loss_pixel": 0.1451, + "loss_text": 1.4382, + "ppl": 4.871, + "step": 12977 + }, + { + "epoch": 0.07, + "global_step": 12978, + "learning_rate": 0.000446669449081803, + "loss": 1.5719, + "loss_base2": 2.2678, + "loss_pixel": 0.1436, + "loss_text": 1.4284, + "ppl": 4.8158, + "step": 12978 + }, + { + "epoch": 0.07, + "global_step": 12979, + "learning_rate": 0.0004466652754590985, + "loss": 1.5879, + "loss_base2": 2.2909, + "loss_pixel": 0.1453, + "loss_text": 1.4427, + "ppl": 4.8935, + "step": 12979 + }, + { + "epoch": 0.07, + "global_step": 12980, + "learning_rate": 0.000446661101836394, + "loss": 1.5658, + "loss_base2": 2.259, + "loss_pixel": 0.1407, + "loss_text": 1.4251, + "ppl": 4.7865, + "step": 12980 + }, + { + "epoch": 0.07, + "global_step": 12981, + "learning_rate": 0.0004466569282136895, + "loss": 1.5764, + "loss_base2": 2.2743, + "loss_pixel": 0.1441, + "loss_text": 1.4324, + "ppl": 4.8375, + "step": 12981 + }, + { + "epoch": 0.07, + "global_step": 12982, + "learning_rate": 0.000446652754590985, + "loss": 1.5753, + "loss_base2": 2.2727, + "loss_pixel": 0.1416, + "loss_text": 1.4336, + "ppl": 4.8322, + "step": 12982 + }, + { + "epoch": 0.07, + "global_step": 12983, + "learning_rate": 0.0004466485809682805, + "loss": 1.5974, + "loss_base2": 2.3046, + "loss_pixel": 0.1426, + "loss_text": 1.4548, + "ppl": 4.9402, + "step": 12983 + }, + { + "epoch": 0.07, + "global_step": 12984, + "learning_rate": 0.000446644407345576, + "loss": 1.5874, + "loss_base2": 2.2901, + "loss_pixel": 0.1455, + "loss_text": 1.4419, + "ppl": 4.891, + "step": 12984 + }, + { + "epoch": 0.07, + "global_step": 12985, + "learning_rate": 0.00044664023372287145, + "loss": 1.5819, + "loss_base2": 2.2822, + "loss_pixel": 0.1445, + "loss_text": 1.4374, + "ppl": 4.8642, + "step": 12985 + }, + { + "epoch": 0.07, + "global_step": 12986, + "learning_rate": 0.00044663606010016696, + "loss": 1.5742, + "loss_base2": 2.2711, + "loss_pixel": 0.1455, + "loss_text": 1.4287, + "ppl": 4.8269, + "step": 12986 + }, + { + "epoch": 0.07, + "global_step": 12987, + "learning_rate": 0.00044663188647746247, + "loss": 1.5981, + "loss_base2": 2.3056, + "loss_pixel": 0.1408, + "loss_text": 1.4573, + "ppl": 4.9436, + "step": 12987 + }, + { + "epoch": 0.07, + "global_step": 12988, + "learning_rate": 0.000446627712854758, + "loss": 1.5823, + "loss_base2": 2.2828, + "loss_pixel": 0.1431, + "loss_text": 1.4392, + "ppl": 4.8661, + "step": 12988 + }, + { + "epoch": 0.07, + "global_step": 12989, + "learning_rate": 0.00044662353923205343, + "loss": 1.5759, + "loss_base2": 2.2735, + "loss_pixel": 0.143, + "loss_text": 1.4329, + "ppl": 4.8351, + "step": 12989 + }, + { + "epoch": 0.07, + "global_step": 12990, + "learning_rate": 0.0004466193656093489, + "loss": 1.5664, + "loss_base2": 2.2598, + "loss_pixel": 0.1437, + "loss_text": 1.4228, + "ppl": 4.7894, + "step": 12990 + }, + { + "epoch": 0.07, + "global_step": 12991, + "learning_rate": 0.0004466151919866444, + "loss": 1.5696, + "loss_base2": 2.2645, + "loss_pixel": 0.1436, + "loss_text": 1.426, + "ppl": 4.8047, + "step": 12991 + }, + { + "epoch": 0.07, + "global_step": 12992, + "learning_rate": 0.0004466110183639399, + "loss": 1.5859, + "loss_base2": 2.288, + "loss_pixel": 0.1476, + "loss_text": 1.4383, + "ppl": 4.8837, + "step": 12992 + }, + { + "epoch": 0.07, + "global_step": 12993, + "learning_rate": 0.0004466068447412354, + "loss": 1.5769, + "loss_base2": 2.275, + "loss_pixel": 0.1446, + "loss_text": 1.4323, + "ppl": 4.8399, + "step": 12993 + }, + { + "epoch": 0.07, + "global_step": 12994, + "learning_rate": 0.00044660267111853086, + "loss": 1.5872, + "loss_base2": 2.2898, + "loss_pixel": 0.1426, + "loss_text": 1.4445, + "ppl": 4.89, + "step": 12994 + }, + { + "epoch": 0.07, + "global_step": 12995, + "learning_rate": 0.00044659849749582636, + "loss": 1.5864, + "loss_base2": 2.2887, + "loss_pixel": 0.1445, + "loss_text": 1.4419, + "ppl": 4.8861, + "step": 12995 + }, + { + "epoch": 0.07, + "global_step": 12996, + "learning_rate": 0.00044659432387312187, + "loss": 1.5834, + "loss_base2": 2.2844, + "loss_pixel": 0.1445, + "loss_text": 1.4389, + "ppl": 4.8715, + "step": 12996 + }, + { + "epoch": 0.07, + "global_step": 12997, + "learning_rate": 0.0004465901502504174, + "loss": 1.4904, + "loss_base2": 2.1502, + "loss_pixel": 0.1433, + "loss_text": 1.3472, + "ppl": 4.4389, + "step": 12997 + }, + { + "epoch": 0.07, + "global_step": 12998, + "learning_rate": 0.0004465859766277129, + "loss": 1.3619, + "loss_base2": 1.9648, + "loss_pixel": 0.1404, + "loss_text": 1.2215, + "ppl": 3.9036, + "step": 12998 + }, + { + "epoch": 0.07, + "global_step": 12999, + "learning_rate": 0.00044658180300500834, + "loss": 1.3658, + "loss_base2": 1.9704, + "loss_pixel": 0.1439, + "loss_text": 1.2218, + "ppl": 3.9189, + "step": 12999 + }, + { + "epoch": 0.07, + "global_step": 13000, + "learning_rate": 0.00044657762938230385, + "loss": 1.3518, + "loss_base2": 1.9502, + "loss_pixel": 0.1427, + "loss_text": 1.2091, + "ppl": 3.8644, + "step": 13000 + }, + { + "epoch": 0.07, + "global_step": 13001, + "learning_rate": 0.00044657345575959935, + "loss": 1.357, + "loss_base2": 1.9577, + "loss_pixel": 0.1419, + "loss_text": 1.2151, + "ppl": 3.8845, + "step": 13001 + }, + { + "epoch": 0.07, + "global_step": 13002, + "learning_rate": 0.00044656928213689486, + "loss": 1.3504, + "loss_base2": 1.9482, + "loss_pixel": 0.1411, + "loss_text": 1.2092, + "ppl": 3.859, + "step": 13002 + }, + { + "epoch": 0.07, + "global_step": 13003, + "learning_rate": 0.0004465651085141903, + "loss": 1.342, + "loss_base2": 1.9361, + "loss_pixel": 0.1437, + "loss_text": 1.1983, + "ppl": 3.8267, + "step": 13003 + }, + { + "epoch": 0.07, + "global_step": 13004, + "learning_rate": 0.0004465609348914858, + "loss": 1.355, + "loss_base2": 1.9549, + "loss_pixel": 0.1442, + "loss_text": 1.2108, + "ppl": 3.8768, + "step": 13004 + }, + { + "epoch": 0.07, + "global_step": 13005, + "learning_rate": 0.00044655676126878133, + "loss": 1.3491, + "loss_base2": 1.9463, + "loss_pixel": 0.1536, + "loss_text": 1.1955, + "ppl": 3.854, + "step": 13005 + }, + { + "epoch": 0.07, + "global_step": 13006, + "learning_rate": 0.00044655258764607684, + "loss": 1.3619, + "loss_base2": 1.9648, + "loss_pixel": 0.1573, + "loss_text": 1.2047, + "ppl": 3.9036, + "step": 13006 + }, + { + "epoch": 0.07, + "global_step": 13007, + "learning_rate": 0.00044654841402337234, + "loss": 1.369, + "loss_base2": 1.975, + "loss_pixel": 0.1571, + "loss_text": 1.2119, + "ppl": 3.9314, + "step": 13007 + }, + { + "epoch": 0.07, + "global_step": 13008, + "learning_rate": 0.00044654424040066774, + "loss": 1.3864, + "loss_base2": 2.0002, + "loss_pixel": 0.1575, + "loss_text": 1.2289, + "ppl": 4.0004, + "step": 13008 + }, + { + "epoch": 0.07, + "global_step": 13009, + "learning_rate": 0.00044654006677796325, + "loss": 1.3699, + "loss_base2": 1.9763, + "loss_pixel": 0.1584, + "loss_text": 1.2115, + "ppl": 3.935, + "step": 13009 + }, + { + "epoch": 0.07, + "global_step": 13010, + "learning_rate": 0.00044653589315525876, + "loss": 1.3548, + "loss_base2": 1.9546, + "loss_pixel": 0.1576, + "loss_text": 1.1972, + "ppl": 3.876, + "step": 13010 + }, + { + "epoch": 0.07, + "global_step": 13011, + "learning_rate": 0.00044653171953255426, + "loss": 1.3531, + "loss_base2": 1.9521, + "loss_pixel": 0.1573, + "loss_text": 1.1959, + "ppl": 3.8694, + "step": 13011 + }, + { + "epoch": 0.07, + "global_step": 13012, + "learning_rate": 0.00044652754590984977, + "loss": 1.3848, + "loss_base2": 1.9978, + "loss_pixel": 0.1575, + "loss_text": 1.2273, + "ppl": 3.994, + "step": 13012 + }, + { + "epoch": 0.07, + "global_step": 13013, + "learning_rate": 0.0004465233722871452, + "loss": 1.3688, + "loss_base2": 1.9748, + "loss_pixel": 0.1587, + "loss_text": 1.2101, + "ppl": 3.9306, + "step": 13013 + }, + { + "epoch": 0.07, + "global_step": 13014, + "learning_rate": 0.00044651919866444073, + "loss": 1.6119, + "loss_base2": 2.3255, + "loss_pixel": 0.1576, + "loss_text": 1.4543, + "ppl": 5.0123, + "step": 13014 + }, + { + "epoch": 0.07, + "global_step": 13015, + "learning_rate": 0.00044651502504173624, + "loss": 1.6395, + "loss_base2": 2.3653, + "loss_pixel": 0.1566, + "loss_text": 1.4829, + "ppl": 5.1526, + "step": 13015 + }, + { + "epoch": 0.07, + "global_step": 13016, + "learning_rate": 0.00044651085141903175, + "loss": 1.6157, + "loss_base2": 2.331, + "loss_pixel": 0.1574, + "loss_text": 1.4583, + "ppl": 5.0314, + "step": 13016 + }, + { + "epoch": 0.07, + "global_step": 13017, + "learning_rate": 0.0004465066777963272, + "loss": 1.5823, + "loss_base2": 2.2828, + "loss_pixel": 0.1572, + "loss_text": 1.4251, + "ppl": 4.8661, + "step": 13017 + }, + { + "epoch": 0.07, + "global_step": 13018, + "learning_rate": 0.0004465025041736227, + "loss": 1.6107, + "loss_base2": 2.3237, + "loss_pixel": 0.157, + "loss_text": 1.4537, + "ppl": 5.0063, + "step": 13018 + }, + { + "epoch": 0.07, + "global_step": 13019, + "learning_rate": 0.0004464983305509182, + "loss": 1.5977, + "loss_base2": 2.305, + "loss_pixel": 0.1572, + "loss_text": 1.4405, + "ppl": 4.9417, + "step": 13019 + }, + { + "epoch": 0.07, + "global_step": 13020, + "learning_rate": 0.0004464941569282137, + "loss": 1.5871, + "loss_base2": 2.2897, + "loss_pixel": 0.1575, + "loss_text": 1.4296, + "ppl": 4.8895, + "step": 13020 + }, + { + "epoch": 0.07, + "global_step": 13021, + "learning_rate": 0.00044648998330550923, + "loss": 1.5911, + "loss_base2": 2.2955, + "loss_pixel": 0.1588, + "loss_text": 1.4323, + "ppl": 4.9091, + "step": 13021 + }, + { + "epoch": 0.07, + "global_step": 13022, + "learning_rate": 0.0004464858096828047, + "loss": 1.5967, + "loss_base2": 2.3036, + "loss_pixel": 0.1594, + "loss_text": 1.4373, + "ppl": 4.9367, + "step": 13022 + }, + { + "epoch": 0.07, + "global_step": 13023, + "learning_rate": 0.0004464816360601002, + "loss": 1.5989, + "loss_base2": 2.3067, + "loss_pixel": 0.157, + "loss_text": 1.4419, + "ppl": 4.9476, + "step": 13023 + }, + { + "epoch": 0.07, + "global_step": 13024, + "learning_rate": 0.0004464774624373957, + "loss": 1.5953, + "loss_base2": 2.3015, + "loss_pixel": 0.1577, + "loss_text": 1.4376, + "ppl": 4.9298, + "step": 13024 + }, + { + "epoch": 0.07, + "global_step": 13025, + "learning_rate": 0.0004464732888146912, + "loss": 1.5994, + "loss_base2": 2.3074, + "loss_pixel": 0.159, + "loss_text": 1.4404, + "ppl": 4.9501, + "step": 13025 + }, + { + "epoch": 0.07, + "global_step": 13026, + "learning_rate": 0.00044646911519198666, + "loss": 1.6015, + "loss_base2": 2.3105, + "loss_pixel": 0.1584, + "loss_text": 1.4432, + "ppl": 4.9605, + "step": 13026 + }, + { + "epoch": 0.07, + "global_step": 13027, + "learning_rate": 0.0004464649415692821, + "loss": 1.6133, + "loss_base2": 2.3275, + "loss_pixel": 0.1572, + "loss_text": 1.4561, + "ppl": 5.0193, + "step": 13027 + }, + { + "epoch": 0.07, + "global_step": 13028, + "learning_rate": 0.0004464607679465776, + "loss": 1.6129, + "loss_base2": 2.3269, + "loss_pixel": 0.159, + "loss_text": 1.4539, + "ppl": 5.0173, + "step": 13028 + }, + { + "epoch": 0.07, + "global_step": 13029, + "learning_rate": 0.0004464565943238731, + "loss": 1.5922, + "loss_base2": 2.2971, + "loss_pixel": 0.159, + "loss_text": 1.4333, + "ppl": 4.9145, + "step": 13029 + }, + { + "epoch": 0.07, + "global_step": 13030, + "learning_rate": 0.00044645242070116863, + "loss": 1.603, + "loss_base2": 2.3126, + "loss_pixel": 0.158, + "loss_text": 1.4449, + "ppl": 4.9679, + "step": 13030 + }, + { + "epoch": 0.07, + "global_step": 13031, + "learning_rate": 0.0004464482470784641, + "loss": 1.6202, + "loss_base2": 2.3375, + "loss_pixel": 0.159, + "loss_text": 1.4613, + "ppl": 5.0541, + "step": 13031 + }, + { + "epoch": 0.07, + "global_step": 13032, + "learning_rate": 0.0004464440734557596, + "loss": 1.5953, + "loss_base2": 2.3015, + "loss_pixel": 0.1576, + "loss_text": 1.4377, + "ppl": 4.9298, + "step": 13032 + }, + { + "epoch": 0.07, + "global_step": 13033, + "learning_rate": 0.0004464398998330551, + "loss": 1.5806, + "loss_base2": 2.2803, + "loss_pixel": 0.1588, + "loss_text": 1.4218, + "ppl": 4.8579, + "step": 13033 + }, + { + "epoch": 0.07, + "global_step": 13034, + "learning_rate": 0.0004464357262103506, + "loss": 1.6033, + "loss_base2": 2.3131, + "loss_pixel": 0.1577, + "loss_text": 1.4456, + "ppl": 4.9694, + "step": 13034 + }, + { + "epoch": 0.07, + "global_step": 13035, + "learning_rate": 0.00044643155258764606, + "loss": 1.4814, + "loss_base2": 2.1372, + "loss_pixel": 0.1569, + "loss_text": 1.3245, + "ppl": 4.3991, + "step": 13035 + }, + { + "epoch": 0.07, + "global_step": 13036, + "learning_rate": 0.00044642737896494157, + "loss": 1.4046, + "loss_base2": 2.0264, + "loss_pixel": 0.1572, + "loss_text": 1.2474, + "ppl": 4.0739, + "step": 13036 + }, + { + "epoch": 0.07, + "global_step": 13037, + "learning_rate": 0.0004464232053422371, + "loss": 1.3871, + "loss_base2": 2.0012, + "loss_pixel": 0.1577, + "loss_text": 1.2294, + "ppl": 4.0032, + "step": 13037 + }, + { + "epoch": 0.07, + "global_step": 13038, + "learning_rate": 0.0004464190317195326, + "loss": 1.3824, + "loss_base2": 1.9944, + "loss_pixel": 0.1574, + "loss_text": 1.225, + "ppl": 3.9845, + "step": 13038 + }, + { + "epoch": 0.07, + "global_step": 13039, + "learning_rate": 0.0004464148580968281, + "loss": 1.3492, + "loss_base2": 1.9465, + "loss_pixel": 0.1567, + "loss_text": 1.1925, + "ppl": 3.8543, + "step": 13039 + }, + { + "epoch": 0.07, + "global_step": 13040, + "learning_rate": 0.00044641068447412354, + "loss": 1.3721, + "loss_base2": 1.9795, + "loss_pixel": 0.1584, + "loss_text": 1.2137, + "ppl": 3.9436, + "step": 13040 + }, + { + "epoch": 0.07, + "global_step": 13041, + "learning_rate": 0.00044640651085141905, + "loss": 1.3477, + "loss_base2": 1.9443, + "loss_pixel": 0.157, + "loss_text": 1.1907, + "ppl": 3.8486, + "step": 13041 + }, + { + "epoch": 0.07, + "global_step": 13042, + "learning_rate": 0.00044640233722871456, + "loss": 1.3656, + "loss_base2": 1.9701, + "loss_pixel": 0.1581, + "loss_text": 1.2074, + "ppl": 3.9181, + "step": 13042 + }, + { + "epoch": 0.07, + "global_step": 13043, + "learning_rate": 0.00044639816360601006, + "loss": 1.368, + "loss_base2": 1.9736, + "loss_pixel": 0.1566, + "loss_text": 1.2114, + "ppl": 3.9275, + "step": 13043 + }, + { + "epoch": 0.07, + "global_step": 13044, + "learning_rate": 0.0004463939899833055, + "loss": 1.3788, + "loss_base2": 1.9892, + "loss_pixel": 0.1565, + "loss_text": 1.2223, + "ppl": 3.9701, + "step": 13044 + }, + { + "epoch": 0.07, + "global_step": 13045, + "learning_rate": 0.00044638981636060097, + "loss": 1.3829, + "loss_base2": 1.9951, + "loss_pixel": 0.1577, + "loss_text": 1.2251, + "ppl": 3.9864, + "step": 13045 + }, + { + "epoch": 0.07, + "global_step": 13046, + "learning_rate": 0.0004463856427378965, + "loss": 1.3569, + "loss_base2": 1.9576, + "loss_pixel": 0.1571, + "loss_text": 1.1998, + "ppl": 3.8841, + "step": 13046 + }, + { + "epoch": 0.07, + "global_step": 13047, + "learning_rate": 0.000446381469115192, + "loss": 1.3632, + "loss_base2": 1.9667, + "loss_pixel": 0.1567, + "loss_text": 1.2065, + "ppl": 3.9087, + "step": 13047 + }, + { + "epoch": 0.07, + "global_step": 13048, + "learning_rate": 0.0004463772954924875, + "loss": 1.3588, + "loss_base2": 1.9603, + "loss_pixel": 0.1559, + "loss_text": 1.2029, + "ppl": 3.8915, + "step": 13048 + }, + { + "epoch": 0.07, + "global_step": 13049, + "learning_rate": 0.00044637312186978295, + "loss": 1.345, + "loss_base2": 1.9404, + "loss_pixel": 0.1557, + "loss_text": 1.1893, + "ppl": 3.8382, + "step": 13049 + }, + { + "epoch": 0.07, + "global_step": 13050, + "learning_rate": 0.00044636894824707845, + "loss": 1.3559, + "loss_base2": 1.9562, + "loss_pixel": 0.1561, + "loss_text": 1.1998, + "ppl": 3.8803, + "step": 13050 + }, + { + "epoch": 0.07, + "global_step": 13051, + "learning_rate": 0.00044636477462437396, + "loss": 1.3726, + "loss_base2": 1.9802, + "loss_pixel": 0.1573, + "loss_text": 1.2153, + "ppl": 3.9456, + "step": 13051 + }, + { + "epoch": 0.07, + "global_step": 13052, + "learning_rate": 0.00044636060100166947, + "loss": 1.3716, + "loss_base2": 1.9788, + "loss_pixel": 0.1582, + "loss_text": 1.2134, + "ppl": 3.9417, + "step": 13052 + }, + { + "epoch": 0.07, + "global_step": 13053, + "learning_rate": 0.0004463564273789649, + "loss": 1.3791, + "loss_base2": 1.9896, + "loss_pixel": 0.1557, + "loss_text": 1.2234, + "ppl": 3.9713, + "step": 13053 + }, + { + "epoch": 0.07, + "global_step": 13054, + "learning_rate": 0.00044635225375626043, + "loss": 1.3699, + "loss_base2": 1.9763, + "loss_pixel": 0.1572, + "loss_text": 1.2128, + "ppl": 3.935, + "step": 13054 + }, + { + "epoch": 0.07, + "global_step": 13055, + "learning_rate": 0.00044634808013355594, + "loss": 1.3623, + "loss_base2": 1.9654, + "loss_pixel": 0.1564, + "loss_text": 1.206, + "ppl": 3.9052, + "step": 13055 + }, + { + "epoch": 0.07, + "global_step": 13056, + "learning_rate": 0.00044634390651085144, + "loss": 1.3577, + "loss_base2": 1.9587, + "loss_pixel": 0.1569, + "loss_text": 1.2007, + "ppl": 3.8872, + "step": 13056 + }, + { + "epoch": 0.07, + "global_step": 13057, + "learning_rate": 0.00044633973288814695, + "loss": 1.3619, + "loss_base2": 1.9648, + "loss_pixel": 0.1564, + "loss_text": 1.2055, + "ppl": 3.9036, + "step": 13057 + }, + { + "epoch": 0.07, + "global_step": 13058, + "learning_rate": 0.0004463355592654424, + "loss": 1.3579, + "loss_base2": 1.959, + "loss_pixel": 0.1553, + "loss_text": 1.2027, + "ppl": 3.888, + "step": 13058 + }, + { + "epoch": 0.07, + "global_step": 13059, + "learning_rate": 0.0004463313856427379, + "loss": 1.3793, + "loss_base2": 1.9899, + "loss_pixel": 0.156, + "loss_text": 1.2233, + "ppl": 3.9721, + "step": 13059 + }, + { + "epoch": 0.07, + "global_step": 13060, + "learning_rate": 0.0004463272120200334, + "loss": 1.3575, + "loss_base2": 1.9585, + "loss_pixel": 0.1551, + "loss_text": 1.2024, + "ppl": 3.8865, + "step": 13060 + }, + { + "epoch": 0.07, + "global_step": 13061, + "learning_rate": 0.0004463230383973289, + "loss": 1.3456, + "loss_base2": 1.9413, + "loss_pixel": 0.1558, + "loss_text": 1.1898, + "ppl": 3.8405, + "step": 13061 + }, + { + "epoch": 0.07, + "global_step": 13062, + "learning_rate": 0.0004463188647746244, + "loss": 1.3609, + "loss_base2": 1.9634, + "loss_pixel": 0.1565, + "loss_text": 1.2044, + "ppl": 3.8997, + "step": 13062 + }, + { + "epoch": 0.07, + "global_step": 13063, + "learning_rate": 0.0004463146911519199, + "loss": 1.3902, + "loss_base2": 2.0056, + "loss_pixel": 0.1561, + "loss_text": 1.2341, + "ppl": 4.0157, + "step": 13063 + }, + { + "epoch": 0.07, + "global_step": 13064, + "learning_rate": 0.00044631051752921534, + "loss": 1.3628, + "loss_base2": 1.9661, + "loss_pixel": 0.1574, + "loss_text": 1.2054, + "ppl": 3.9071, + "step": 13064 + }, + { + "epoch": 0.07, + "global_step": 13065, + "learning_rate": 0.00044630634390651085, + "loss": 1.3513, + "loss_base2": 1.9495, + "loss_pixel": 0.155, + "loss_text": 1.1963, + "ppl": 3.8624, + "step": 13065 + }, + { + "epoch": 0.07, + "global_step": 13066, + "learning_rate": 0.00044630217028380635, + "loss": 1.3549, + "loss_base2": 1.9547, + "loss_pixel": 0.1553, + "loss_text": 1.1996, + "ppl": 3.8764, + "step": 13066 + }, + { + "epoch": 0.07, + "global_step": 13067, + "learning_rate": 0.0004462979966611018, + "loss": 1.3376, + "loss_base2": 1.9297, + "loss_pixel": 0.1557, + "loss_text": 1.1819, + "ppl": 3.8099, + "step": 13067 + }, + { + "epoch": 0.07, + "global_step": 13068, + "learning_rate": 0.0004462938230383973, + "loss": 1.3653, + "loss_base2": 1.9697, + "loss_pixel": 0.1555, + "loss_text": 1.2098, + "ppl": 3.9169, + "step": 13068 + }, + { + "epoch": 0.07, + "global_step": 13069, + "learning_rate": 0.0004462896494156928, + "loss": 1.3576, + "loss_base2": 1.9586, + "loss_pixel": 0.157, + "loss_text": 1.2006, + "ppl": 3.8869, + "step": 13069 + }, + { + "epoch": 0.07, + "global_step": 13070, + "learning_rate": 0.00044628547579298833, + "loss": 1.3673, + "loss_base2": 1.9726, + "loss_pixel": 0.1566, + "loss_text": 1.2107, + "ppl": 3.9247, + "step": 13070 + }, + { + "epoch": 0.07, + "global_step": 13071, + "learning_rate": 0.00044628130217028384, + "loss": 1.3671, + "loss_base2": 1.9723, + "loss_pixel": 0.1547, + "loss_text": 1.2124, + "ppl": 3.924, + "step": 13071 + }, + { + "epoch": 0.07, + "global_step": 13072, + "learning_rate": 0.0004462771285475793, + "loss": 1.3669, + "loss_base2": 1.972, + "loss_pixel": 0.1565, + "loss_text": 1.2105, + "ppl": 3.9232, + "step": 13072 + }, + { + "epoch": 0.07, + "global_step": 13073, + "learning_rate": 0.0004462729549248748, + "loss": 1.3356, + "loss_base2": 1.9269, + "loss_pixel": 0.1547, + "loss_text": 1.1809, + "ppl": 3.8023, + "step": 13073 + }, + { + "epoch": 0.07, + "global_step": 13074, + "learning_rate": 0.0004462687813021703, + "loss": 1.4622, + "loss_base2": 2.1095, + "loss_pixel": 0.1578, + "loss_text": 1.3044, + "ppl": 4.3154, + "step": 13074 + }, + { + "epoch": 0.07, + "global_step": 13075, + "learning_rate": 0.0004462646076794658, + "loss": 1.6049, + "loss_base2": 2.3154, + "loss_pixel": 0.1502, + "loss_text": 1.4547, + "ppl": 4.9774, + "step": 13075 + }, + { + "epoch": 0.07, + "global_step": 13076, + "learning_rate": 0.00044626043405676126, + "loss": 1.5858, + "loss_base2": 2.2878, + "loss_pixel": 0.1456, + "loss_text": 1.4402, + "ppl": 4.8832, + "step": 13076 + }, + { + "epoch": 0.07, + "global_step": 13077, + "learning_rate": 0.00044625626043405677, + "loss": 1.6187, + "loss_base2": 2.3353, + "loss_pixel": 0.146, + "loss_text": 1.4727, + "ppl": 5.0465, + "step": 13077 + }, + { + "epoch": 0.07, + "global_step": 13078, + "learning_rate": 0.0004462520868113523, + "loss": 1.5916, + "loss_base2": 2.2962, + "loss_pixel": 0.1445, + "loss_text": 1.447, + "ppl": 4.9116, + "step": 13078 + }, + { + "epoch": 0.07, + "global_step": 13079, + "learning_rate": 0.0004462479131886478, + "loss": 1.5915, + "loss_base2": 2.296, + "loss_pixel": 0.1456, + "loss_text": 1.4459, + "ppl": 4.9111, + "step": 13079 + }, + { + "epoch": 0.07, + "global_step": 13080, + "learning_rate": 0.0004462437395659433, + "loss": 1.5982, + "loss_base2": 2.3057, + "loss_pixel": 0.1439, + "loss_text": 1.4543, + "ppl": 4.9441, + "step": 13080 + }, + { + "epoch": 0.07, + "global_step": 13081, + "learning_rate": 0.00044623956594323875, + "loss": 1.5738, + "loss_base2": 2.2705, + "loss_pixel": 0.144, + "loss_text": 1.4298, + "ppl": 4.8249, + "step": 13081 + }, + { + "epoch": 0.07, + "global_step": 13082, + "learning_rate": 0.00044623539232053425, + "loss": 1.5901, + "loss_base2": 2.294, + "loss_pixel": 0.1457, + "loss_text": 1.4444, + "ppl": 4.9042, + "step": 13082 + }, + { + "epoch": 0.07, + "global_step": 13083, + "learning_rate": 0.0004462312186978297, + "loss": 1.606, + "loss_base2": 2.317, + "loss_pixel": 0.1441, + "loss_text": 1.4618, + "ppl": 4.9828, + "step": 13083 + }, + { + "epoch": 0.07, + "global_step": 13084, + "learning_rate": 0.0004462270450751252, + "loss": 1.5886, + "loss_base2": 2.2919, + "loss_pixel": 0.1451, + "loss_text": 1.4435, + "ppl": 4.8969, + "step": 13084 + }, + { + "epoch": 0.07, + "global_step": 13085, + "learning_rate": 0.00044622287145242067, + "loss": 1.5929, + "loss_base2": 2.2981, + "loss_pixel": 0.1447, + "loss_text": 1.4481, + "ppl": 4.918, + "step": 13085 + }, + { + "epoch": 0.07, + "global_step": 13086, + "learning_rate": 0.0004462186978297162, + "loss": 1.5812, + "loss_base2": 2.2812, + "loss_pixel": 0.1471, + "loss_text": 1.4342, + "ppl": 4.8608, + "step": 13086 + }, + { + "epoch": 0.07, + "global_step": 13087, + "learning_rate": 0.0004462145242070117, + "loss": 1.5947, + "loss_base2": 2.3007, + "loss_pixel": 0.1456, + "loss_text": 1.449, + "ppl": 4.9269, + "step": 13087 + }, + { + "epoch": 0.07, + "global_step": 13088, + "learning_rate": 0.0004462103505843072, + "loss": 1.5932, + "loss_base2": 2.2985, + "loss_pixel": 0.143, + "loss_text": 1.4501, + "ppl": 4.9195, + "step": 13088 + }, + { + "epoch": 0.07, + "global_step": 13089, + "learning_rate": 0.0004462061769616027, + "loss": 1.5882, + "loss_base2": 2.2913, + "loss_pixel": 0.1445, + "loss_text": 1.4437, + "ppl": 4.8949, + "step": 13089 + }, + { + "epoch": 0.07, + "global_step": 13090, + "learning_rate": 0.00044620200333889815, + "loss": 1.5809, + "loss_base2": 2.2808, + "loss_pixel": 0.1423, + "loss_text": 1.4387, + "ppl": 4.8593, + "step": 13090 + }, + { + "epoch": 0.07, + "global_step": 13091, + "learning_rate": 0.00044619782971619366, + "loss": 1.6028, + "loss_base2": 2.3124, + "loss_pixel": 0.1551, + "loss_text": 1.4477, + "ppl": 4.9669, + "step": 13091 + }, + { + "epoch": 0.07, + "global_step": 13092, + "learning_rate": 0.00044619365609348916, + "loss": 1.6046, + "loss_base2": 2.3149, + "loss_pixel": 0.1586, + "loss_text": 1.446, + "ppl": 4.9759, + "step": 13092 + }, + { + "epoch": 0.07, + "global_step": 13093, + "learning_rate": 0.00044618948247078467, + "loss": 1.6103, + "loss_base2": 2.3232, + "loss_pixel": 0.1572, + "loss_text": 1.4531, + "ppl": 5.0043, + "step": 13093 + }, + { + "epoch": 0.07, + "global_step": 13094, + "learning_rate": 0.0004461853088480801, + "loss": 1.5879, + "loss_base2": 2.2909, + "loss_pixel": 0.157, + "loss_text": 1.4309, + "ppl": 4.8935, + "step": 13094 + }, + { + "epoch": 0.07, + "global_step": 13095, + "learning_rate": 0.00044618113522537563, + "loss": 1.5942, + "loss_base2": 2.2999, + "loss_pixel": 0.1569, + "loss_text": 1.4373, + "ppl": 4.9244, + "step": 13095 + }, + { + "epoch": 0.07, + "global_step": 13096, + "learning_rate": 0.00044617696160267114, + "loss": 1.6047, + "loss_base2": 2.3151, + "loss_pixel": 0.1547, + "loss_text": 1.4499, + "ppl": 4.9764, + "step": 13096 + }, + { + "epoch": 0.07, + "global_step": 13097, + "learning_rate": 0.00044617278797996665, + "loss": 1.6043, + "loss_base2": 2.3145, + "loss_pixel": 0.1562, + "loss_text": 1.4481, + "ppl": 4.9744, + "step": 13097 + }, + { + "epoch": 0.07, + "global_step": 13098, + "learning_rate": 0.00044616861435726215, + "loss": 1.6003, + "loss_base2": 2.3087, + "loss_pixel": 0.1571, + "loss_text": 1.4432, + "ppl": 4.9545, + "step": 13098 + }, + { + "epoch": 0.07, + "global_step": 13099, + "learning_rate": 0.0004461644407345576, + "loss": 1.6066, + "loss_base2": 2.3178, + "loss_pixel": 0.1559, + "loss_text": 1.4506, + "ppl": 4.9858, + "step": 13099 + }, + { + "epoch": 0.07, + "global_step": 13100, + "learning_rate": 0.0004461602671118531, + "loss": 1.593, + "loss_base2": 2.2982, + "loss_pixel": 0.1556, + "loss_text": 1.4374, + "ppl": 4.9185, + "step": 13100 + }, + { + "epoch": 0.07, + "global_step": 13101, + "learning_rate": 0.0004461560934891486, + "loss": 1.5898, + "loss_base2": 2.2936, + "loss_pixel": 0.1558, + "loss_text": 1.4339, + "ppl": 4.9028, + "step": 13101 + }, + { + "epoch": 0.07, + "global_step": 13102, + "learning_rate": 0.0004461519198664441, + "loss": 1.5753, + "loss_base2": 2.2727, + "loss_pixel": 0.1559, + "loss_text": 1.4194, + "ppl": 4.8322, + "step": 13102 + }, + { + "epoch": 0.07, + "global_step": 13103, + "learning_rate": 0.00044614774624373953, + "loss": 1.6036, + "loss_base2": 2.3135, + "loss_pixel": 0.1574, + "loss_text": 1.4462, + "ppl": 4.9709, + "step": 13103 + }, + { + "epoch": 0.07, + "global_step": 13104, + "learning_rate": 0.00044614357262103504, + "loss": 1.598, + "loss_base2": 2.3054, + "loss_pixel": 0.1553, + "loss_text": 1.4427, + "ppl": 4.9431, + "step": 13104 + }, + { + "epoch": 0.07, + "global_step": 13105, + "learning_rate": 0.00044613939899833054, + "loss": 1.5954, + "loss_base2": 2.3017, + "loss_pixel": 0.1548, + "loss_text": 1.4406, + "ppl": 4.9303, + "step": 13105 + }, + { + "epoch": 0.07, + "global_step": 13106, + "learning_rate": 0.00044613522537562605, + "loss": 1.5879, + "loss_base2": 2.2909, + "loss_pixel": 0.1564, + "loss_text": 1.4315, + "ppl": 4.8935, + "step": 13106 + }, + { + "epoch": 0.07, + "global_step": 13107, + "learning_rate": 0.00044613105175292156, + "loss": 1.6061, + "loss_base2": 2.3171, + "loss_pixel": 0.1563, + "loss_text": 1.4498, + "ppl": 4.9833, + "step": 13107 + }, + { + "epoch": 0.07, + "global_step": 13108, + "learning_rate": 0.000446126878130217, + "loss": 1.5905, + "loss_base2": 2.2946, + "loss_pixel": 0.1558, + "loss_text": 1.4347, + "ppl": 4.9062, + "step": 13108 + }, + { + "epoch": 0.07, + "global_step": 13109, + "learning_rate": 0.0004461227045075125, + "loss": 1.5917, + "loss_base2": 2.2963, + "loss_pixel": 0.1571, + "loss_text": 1.4346, + "ppl": 4.9121, + "step": 13109 + }, + { + "epoch": 0.07, + "global_step": 13110, + "learning_rate": 0.000446118530884808, + "loss": 1.5873, + "loss_base2": 2.29, + "loss_pixel": 0.1562, + "loss_text": 1.4311, + "ppl": 4.8905, + "step": 13110 + }, + { + "epoch": 0.07, + "global_step": 13111, + "learning_rate": 0.00044611435726210353, + "loss": 1.5817, + "loss_base2": 2.2819, + "loss_pixel": 0.1573, + "loss_text": 1.4245, + "ppl": 4.8632, + "step": 13111 + }, + { + "epoch": 0.07, + "global_step": 13112, + "learning_rate": 0.000446110183639399, + "loss": 1.5741, + "loss_base2": 2.2709, + "loss_pixel": 0.1556, + "loss_text": 1.4185, + "ppl": 4.8264, + "step": 13112 + }, + { + "epoch": 0.07, + "global_step": 13113, + "learning_rate": 0.0004461060100166945, + "loss": 1.5955, + "loss_base2": 2.3018, + "loss_pixel": 0.1567, + "loss_text": 1.4388, + "ppl": 4.9308, + "step": 13113 + }, + { + "epoch": 0.07, + "global_step": 13114, + "learning_rate": 0.00044610183639399, + "loss": 1.61, + "loss_base2": 2.3227, + "loss_pixel": 0.1552, + "loss_text": 1.4548, + "ppl": 5.0028, + "step": 13114 + }, + { + "epoch": 0.07, + "global_step": 13115, + "learning_rate": 0.0004460976627712855, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.1576, + "loss_text": 1.4483, + "ppl": 4.9823, + "step": 13115 + }, + { + "epoch": 0.07, + "global_step": 13116, + "learning_rate": 0.000446093489148581, + "loss": 1.6036, + "loss_base2": 2.3135, + "loss_pixel": 0.1565, + "loss_text": 1.4471, + "ppl": 4.9709, + "step": 13116 + }, + { + "epoch": 0.07, + "global_step": 13117, + "learning_rate": 0.00044608931552587647, + "loss": 1.6107, + "loss_base2": 2.3237, + "loss_pixel": 0.1559, + "loss_text": 1.4549, + "ppl": 5.0063, + "step": 13117 + }, + { + "epoch": 0.07, + "global_step": 13118, + "learning_rate": 0.000446085141903172, + "loss": 1.5921, + "loss_base2": 2.2969, + "loss_pixel": 0.1573, + "loss_text": 1.4348, + "ppl": 4.9141, + "step": 13118 + }, + { + "epoch": 0.07, + "global_step": 13119, + "learning_rate": 0.0004460809682804675, + "loss": 1.5922, + "loss_base2": 2.2971, + "loss_pixel": 0.1565, + "loss_text": 1.4358, + "ppl": 4.9145, + "step": 13119 + }, + { + "epoch": 0.07, + "global_step": 13120, + "learning_rate": 0.000446076794657763, + "loss": 1.598, + "loss_base2": 2.3054, + "loss_pixel": 0.1559, + "loss_text": 1.4421, + "ppl": 4.9431, + "step": 13120 + }, + { + "epoch": 0.07, + "global_step": 13121, + "learning_rate": 0.0004460726210350584, + "loss": 1.5922, + "loss_base2": 2.2971, + "loss_pixel": 0.1553, + "loss_text": 1.4368, + "ppl": 4.9145, + "step": 13121 + }, + { + "epoch": 0.07, + "global_step": 13122, + "learning_rate": 0.0004460684474123539, + "loss": 1.5818, + "loss_base2": 2.2821, + "loss_pixel": 0.1561, + "loss_text": 1.4258, + "ppl": 4.8637, + "step": 13122 + }, + { + "epoch": 0.07, + "global_step": 13123, + "learning_rate": 0.0004460642737896494, + "loss": 1.5904, + "loss_base2": 2.2945, + "loss_pixel": 0.1563, + "loss_text": 1.434, + "ppl": 4.9057, + "step": 13123 + }, + { + "epoch": 0.07, + "global_step": 13124, + "learning_rate": 0.0004460601001669449, + "loss": 1.5826, + "loss_base2": 2.2832, + "loss_pixel": 0.1567, + "loss_text": 1.4259, + "ppl": 4.8676, + "step": 13124 + }, + { + "epoch": 0.07, + "global_step": 13125, + "learning_rate": 0.0004460559265442404, + "loss": 1.5709, + "loss_base2": 2.2663, + "loss_pixel": 0.1543, + "loss_text": 1.4166, + "ppl": 4.811, + "step": 13125 + }, + { + "epoch": 0.07, + "global_step": 13126, + "learning_rate": 0.00044605175292153587, + "loss": 1.5793, + "loss_base2": 2.2784, + "loss_pixel": 0.1559, + "loss_text": 1.4234, + "ppl": 4.8516, + "step": 13126 + }, + { + "epoch": 0.07, + "global_step": 13127, + "learning_rate": 0.0004460475792988314, + "loss": 1.6018, + "loss_base2": 2.3109, + "loss_pixel": 0.1565, + "loss_text": 1.4454, + "ppl": 4.962, + "step": 13127 + }, + { + "epoch": 0.07, + "global_step": 13128, + "learning_rate": 0.0004460434056761269, + "loss": 1.5923, + "loss_base2": 2.2972, + "loss_pixel": 0.1568, + "loss_text": 1.4355, + "ppl": 4.915, + "step": 13128 + }, + { + "epoch": 0.07, + "global_step": 13129, + "learning_rate": 0.0004460392320534224, + "loss": 1.5857, + "loss_base2": 2.2877, + "loss_pixel": 0.1558, + "loss_text": 1.4299, + "ppl": 4.8827, + "step": 13129 + }, + { + "epoch": 0.07, + "global_step": 13130, + "learning_rate": 0.0004460350584307179, + "loss": 1.5876, + "loss_base2": 2.2904, + "loss_pixel": 0.1579, + "loss_text": 1.4297, + "ppl": 4.892, + "step": 13130 + }, + { + "epoch": 0.07, + "global_step": 13131, + "learning_rate": 0.00044603088480801335, + "loss": 1.5922, + "loss_base2": 2.2971, + "loss_pixel": 0.1564, + "loss_text": 1.4358, + "ppl": 4.9145, + "step": 13131 + }, + { + "epoch": 0.07, + "global_step": 13132, + "learning_rate": 0.00044602671118530886, + "loss": 1.5934, + "loss_base2": 2.2988, + "loss_pixel": 0.158, + "loss_text": 1.4354, + "ppl": 4.9205, + "step": 13132 + }, + { + "epoch": 0.07, + "global_step": 13133, + "learning_rate": 0.00044602253756260437, + "loss": 1.5904, + "loss_base2": 2.2945, + "loss_pixel": 0.1563, + "loss_text": 1.434, + "ppl": 4.9057, + "step": 13133 + }, + { + "epoch": 0.07, + "global_step": 13134, + "learning_rate": 0.0004460183639398999, + "loss": 1.6051, + "loss_base2": 2.3157, + "loss_pixel": 0.1569, + "loss_text": 1.4482, + "ppl": 4.9784, + "step": 13134 + }, + { + "epoch": 0.07, + "global_step": 13135, + "learning_rate": 0.00044601419031719533, + "loss": 1.5823, + "loss_base2": 2.2828, + "loss_pixel": 0.1555, + "loss_text": 1.4268, + "ppl": 4.8661, + "step": 13135 + }, + { + "epoch": 0.07, + "global_step": 13136, + "learning_rate": 0.00044601001669449084, + "loss": 1.6035, + "loss_base2": 2.3134, + "loss_pixel": 0.1559, + "loss_text": 1.4476, + "ppl": 4.9704, + "step": 13136 + }, + { + "epoch": 0.07, + "global_step": 13137, + "learning_rate": 0.00044600584307178634, + "loss": 1.5784, + "loss_base2": 2.2771, + "loss_pixel": 0.1566, + "loss_text": 1.4218, + "ppl": 4.8472, + "step": 13137 + }, + { + "epoch": 0.07, + "global_step": 13138, + "learning_rate": 0.00044600166944908185, + "loss": 1.5797, + "loss_base2": 2.279, + "loss_pixel": 0.1542, + "loss_text": 1.4255, + "ppl": 4.8535, + "step": 13138 + }, + { + "epoch": 0.07, + "global_step": 13139, + "learning_rate": 0.00044599749582637736, + "loss": 1.59, + "loss_base2": 2.2939, + "loss_pixel": 0.1559, + "loss_text": 1.4341, + "ppl": 4.9037, + "step": 13139 + }, + { + "epoch": 0.07, + "global_step": 13140, + "learning_rate": 0.00044599332220367276, + "loss": 1.6094, + "loss_base2": 2.3219, + "loss_pixel": 0.156, + "loss_text": 1.4534, + "ppl": 4.9998, + "step": 13140 + }, + { + "epoch": 0.07, + "global_step": 13141, + "learning_rate": 0.00044598914858096826, + "loss": 1.5782, + "loss_base2": 2.2769, + "loss_pixel": 0.1554, + "loss_text": 1.4228, + "ppl": 4.8462, + "step": 13141 + }, + { + "epoch": 0.07, + "global_step": 13142, + "learning_rate": 0.00044598497495826377, + "loss": 1.6041, + "loss_base2": 2.3142, + "loss_pixel": 0.1562, + "loss_text": 1.4478, + "ppl": 4.9734, + "step": 13142 + }, + { + "epoch": 0.07, + "global_step": 13143, + "learning_rate": 0.0004459808013355593, + "loss": 1.5718, + "loss_base2": 2.2676, + "loss_pixel": 0.1552, + "loss_text": 1.4166, + "ppl": 4.8153, + "step": 13143 + }, + { + "epoch": 0.07, + "global_step": 13144, + "learning_rate": 0.00044597662771285473, + "loss": 1.5458, + "loss_base2": 2.2301, + "loss_pixel": 0.1558, + "loss_text": 1.39, + "ppl": 4.6917, + "step": 13144 + }, + { + "epoch": 0.07, + "global_step": 13145, + "learning_rate": 0.00044597245409015024, + "loss": 1.5939, + "loss_base2": 2.2995, + "loss_pixel": 0.1565, + "loss_text": 1.4373, + "ppl": 4.9229, + "step": 13145 + }, + { + "epoch": 0.07, + "global_step": 13146, + "learning_rate": 0.00044596828046744575, + "loss": 1.5885, + "loss_base2": 2.2917, + "loss_pixel": 0.156, + "loss_text": 1.4326, + "ppl": 4.8964, + "step": 13146 + }, + { + "epoch": 0.07, + "global_step": 13147, + "learning_rate": 0.00044596410684474125, + "loss": 1.5879, + "loss_base2": 2.2909, + "loss_pixel": 0.1561, + "loss_text": 1.4318, + "ppl": 4.8935, + "step": 13147 + }, + { + "epoch": 0.07, + "global_step": 13148, + "learning_rate": 0.00044595993322203676, + "loss": 1.6032, + "loss_base2": 2.3129, + "loss_pixel": 0.1562, + "loss_text": 1.447, + "ppl": 4.9689, + "step": 13148 + }, + { + "epoch": 0.07, + "global_step": 13149, + "learning_rate": 0.0004459557595993322, + "loss": 1.5859, + "loss_base2": 2.288, + "loss_pixel": 0.1555, + "loss_text": 1.4304, + "ppl": 4.8837, + "step": 13149 + }, + { + "epoch": 0.07, + "global_step": 13150, + "learning_rate": 0.0004459515859766277, + "loss": 1.5792, + "loss_base2": 2.2783, + "loss_pixel": 0.155, + "loss_text": 1.4242, + "ppl": 4.8511, + "step": 13150 + }, + { + "epoch": 0.07, + "global_step": 13151, + "learning_rate": 0.00044594741235392323, + "loss": 1.6039, + "loss_base2": 2.3139, + "loss_pixel": 0.1544, + "loss_text": 1.4496, + "ppl": 4.9724, + "step": 13151 + }, + { + "epoch": 0.07, + "global_step": 13152, + "learning_rate": 0.00044594323873121874, + "loss": 1.5894, + "loss_base2": 2.293, + "loss_pixel": 0.1559, + "loss_text": 1.4335, + "ppl": 4.9008, + "step": 13152 + }, + { + "epoch": 0.07, + "global_step": 13153, + "learning_rate": 0.0004459390651085142, + "loss": 1.5891, + "loss_base2": 2.2926, + "loss_pixel": 0.1567, + "loss_text": 1.4325, + "ppl": 4.8993, + "step": 13153 + }, + { + "epoch": 0.07, + "global_step": 13154, + "learning_rate": 0.0004459348914858097, + "loss": 1.592, + "loss_base2": 2.2968, + "loss_pixel": 0.1553, + "loss_text": 1.4367, + "ppl": 4.9136, + "step": 13154 + }, + { + "epoch": 0.07, + "global_step": 13155, + "learning_rate": 0.0004459307178631052, + "loss": 1.5992, + "loss_base2": 2.3072, + "loss_pixel": 0.155, + "loss_text": 1.4442, + "ppl": 4.9491, + "step": 13155 + }, + { + "epoch": 0.07, + "global_step": 13156, + "learning_rate": 0.0004459265442404007, + "loss": 1.5922, + "loss_base2": 2.2971, + "loss_pixel": 0.1604, + "loss_text": 1.4318, + "ppl": 4.9145, + "step": 13156 + }, + { + "epoch": 0.07, + "global_step": 13157, + "learning_rate": 0.0004459223706176962, + "loss": 1.5787, + "loss_base2": 2.2776, + "loss_pixel": 0.1567, + "loss_text": 1.422, + "ppl": 4.8486, + "step": 13157 + }, + { + "epoch": 0.07, + "global_step": 13158, + "learning_rate": 0.0004459181969949916, + "loss": 1.5838, + "loss_base2": 2.2849, + "loss_pixel": 0.1549, + "loss_text": 1.4288, + "ppl": 4.8734, + "step": 13158 + }, + { + "epoch": 0.07, + "global_step": 13159, + "learning_rate": 0.0004459140233722871, + "loss": 1.6037, + "loss_base2": 2.3137, + "loss_pixel": 0.1557, + "loss_text": 1.448, + "ppl": 4.9714, + "step": 13159 + }, + { + "epoch": 0.07, + "global_step": 13160, + "learning_rate": 0.00044590984974958263, + "loss": 1.5763, + "loss_base2": 2.2741, + "loss_pixel": 0.1537, + "loss_text": 1.4227, + "ppl": 4.837, + "step": 13160 + }, + { + "epoch": 0.07, + "global_step": 13161, + "learning_rate": 0.00044590567612687814, + "loss": 1.5921, + "loss_base2": 2.2969, + "loss_pixel": 0.1551, + "loss_text": 1.437, + "ppl": 4.9141, + "step": 13161 + }, + { + "epoch": 0.07, + "global_step": 13162, + "learning_rate": 0.0004459015025041736, + "loss": 1.5889, + "loss_base2": 2.2923, + "loss_pixel": 0.1556, + "loss_text": 1.4333, + "ppl": 4.8984, + "step": 13162 + }, + { + "epoch": 0.07, + "global_step": 13163, + "learning_rate": 0.0004458973288814691, + "loss": 1.5854, + "loss_base2": 2.2872, + "loss_pixel": 0.1563, + "loss_text": 1.4291, + "ppl": 4.8812, + "step": 13163 + }, + { + "epoch": 0.07, + "global_step": 13164, + "learning_rate": 0.0004458931552587646, + "loss": 1.589, + "loss_base2": 2.2924, + "loss_pixel": 0.1559, + "loss_text": 1.433, + "ppl": 4.8988, + "step": 13164 + }, + { + "epoch": 0.07, + "global_step": 13165, + "learning_rate": 0.0004458889816360601, + "loss": 1.5866, + "loss_base2": 2.289, + "loss_pixel": 0.1543, + "loss_text": 1.4323, + "ppl": 4.8871, + "step": 13165 + }, + { + "epoch": 0.07, + "global_step": 13166, + "learning_rate": 0.0004458848080133556, + "loss": 1.5897, + "loss_base2": 2.2935, + "loss_pixel": 0.1555, + "loss_text": 1.4342, + "ppl": 4.9023, + "step": 13166 + }, + { + "epoch": 0.07, + "global_step": 13167, + "learning_rate": 0.0004458806343906511, + "loss": 1.6037, + "loss_base2": 2.3137, + "loss_pixel": 0.1556, + "loss_text": 1.4481, + "ppl": 4.9714, + "step": 13167 + }, + { + "epoch": 0.07, + "global_step": 13168, + "learning_rate": 0.0004458764607679466, + "loss": 1.6054, + "loss_base2": 2.3161, + "loss_pixel": 0.1559, + "loss_text": 1.4495, + "ppl": 4.9799, + "step": 13168 + }, + { + "epoch": 0.07, + "global_step": 13169, + "learning_rate": 0.0004458722871452421, + "loss": 1.4834, + "loss_base2": 2.1401, + "loss_pixel": 0.1558, + "loss_text": 1.3276, + "ppl": 4.4079, + "step": 13169 + }, + { + "epoch": 0.07, + "global_step": 13170, + "learning_rate": 0.0004458681135225376, + "loss": 1.3463, + "loss_base2": 1.9423, + "loss_pixel": 0.1568, + "loss_text": 1.1895, + "ppl": 3.8432, + "step": 13170 + }, + { + "epoch": 0.07, + "global_step": 13171, + "learning_rate": 0.00044586393989983305, + "loss": 1.3635, + "loss_base2": 1.9671, + "loss_pixel": 0.1556, + "loss_text": 1.2079, + "ppl": 3.9099, + "step": 13171 + }, + { + "epoch": 0.07, + "global_step": 13172, + "learning_rate": 0.00044585976627712856, + "loss": 1.3447, + "loss_base2": 1.94, + "loss_pixel": 0.1554, + "loss_text": 1.1893, + "ppl": 3.837, + "step": 13172 + }, + { + "epoch": 0.07, + "global_step": 13173, + "learning_rate": 0.00044585559265442406, + "loss": 1.3488, + "loss_base2": 1.9459, + "loss_pixel": 0.1559, + "loss_text": 1.1929, + "ppl": 3.8528, + "step": 13173 + }, + { + "epoch": 0.07, + "global_step": 13174, + "learning_rate": 0.00044585141903171957, + "loss": 1.3622, + "loss_base2": 1.9652, + "loss_pixel": 0.1561, + "loss_text": 1.2061, + "ppl": 3.9048, + "step": 13174 + }, + { + "epoch": 0.07, + "global_step": 13175, + "learning_rate": 0.0004458472454090151, + "loss": 1.3606, + "loss_base2": 1.9629, + "loss_pixel": 0.1558, + "loss_text": 1.2048, + "ppl": 3.8985, + "step": 13175 + }, + { + "epoch": 0.07, + "global_step": 13176, + "learning_rate": 0.00044584307178631053, + "loss": 1.3474, + "loss_base2": 1.9439, + "loss_pixel": 0.1549, + "loss_text": 1.1925, + "ppl": 3.8474, + "step": 13176 + }, + { + "epoch": 0.07, + "global_step": 13177, + "learning_rate": 0.000445838898163606, + "loss": 1.4682, + "loss_base2": 2.1182, + "loss_pixel": 0.155, + "loss_text": 1.3132, + "ppl": 4.3414, + "step": 13177 + }, + { + "epoch": 0.07, + "global_step": 13178, + "learning_rate": 0.0004458347245409015, + "loss": 1.608, + "loss_base2": 2.3199, + "loss_pixel": 0.1566, + "loss_text": 1.4514, + "ppl": 4.9928, + "step": 13178 + }, + { + "epoch": 0.07, + "global_step": 13179, + "learning_rate": 0.000445830550918197, + "loss": 1.5919, + "loss_base2": 2.2966, + "loss_pixel": 0.1558, + "loss_text": 1.4361, + "ppl": 4.9131, + "step": 13179 + }, + { + "epoch": 0.07, + "global_step": 13180, + "learning_rate": 0.00044582637729549245, + "loss": 1.6036, + "loss_base2": 2.3135, + "loss_pixel": 0.1547, + "loss_text": 1.4489, + "ppl": 4.9709, + "step": 13180 + }, + { + "epoch": 0.07, + "global_step": 13181, + "learning_rate": 0.00044582220367278796, + "loss": 1.5944, + "loss_base2": 2.3002, + "loss_pixel": 0.1555, + "loss_text": 1.4389, + "ppl": 4.9254, + "step": 13181 + }, + { + "epoch": 0.07, + "global_step": 13182, + "learning_rate": 0.00044581803005008347, + "loss": 1.5755, + "loss_base2": 2.273, + "loss_pixel": 0.1557, + "loss_text": 1.4198, + "ppl": 4.8332, + "step": 13182 + }, + { + "epoch": 0.07, + "global_step": 13183, + "learning_rate": 0.000445813856427379, + "loss": 1.5872, + "loss_base2": 2.2898, + "loss_pixel": 0.1547, + "loss_text": 1.4324, + "ppl": 4.89, + "step": 13183 + }, + { + "epoch": 0.07, + "global_step": 13184, + "learning_rate": 0.0004458096828046745, + "loss": 1.6045, + "loss_base2": 2.3148, + "loss_pixel": 0.1553, + "loss_text": 1.4492, + "ppl": 4.9754, + "step": 13184 + }, + { + "epoch": 0.07, + "global_step": 13185, + "learning_rate": 0.00044580550918196994, + "loss": 1.5719, + "loss_base2": 2.2678, + "loss_pixel": 0.1551, + "loss_text": 1.4168, + "ppl": 4.8158, + "step": 13185 + }, + { + "epoch": 0.07, + "global_step": 13186, + "learning_rate": 0.00044580133555926544, + "loss": 1.5861, + "loss_base2": 2.2883, + "loss_pixel": 0.1558, + "loss_text": 1.4303, + "ppl": 4.8847, + "step": 13186 + }, + { + "epoch": 0.07, + "global_step": 13187, + "learning_rate": 0.00044579716193656095, + "loss": 1.6005, + "loss_base2": 2.309, + "loss_pixel": 0.1548, + "loss_text": 1.4457, + "ppl": 4.9555, + "step": 13187 + }, + { + "epoch": 0.07, + "global_step": 13188, + "learning_rate": 0.00044579298831385646, + "loss": 1.5887, + "loss_base2": 2.292, + "loss_pixel": 0.154, + "loss_text": 1.4347, + "ppl": 4.8974, + "step": 13188 + }, + { + "epoch": 0.07, + "global_step": 13189, + "learning_rate": 0.00044578881469115196, + "loss": 1.6097, + "loss_base2": 2.3223, + "loss_pixel": 0.1563, + "loss_text": 1.4534, + "ppl": 5.0013, + "step": 13189 + }, + { + "epoch": 0.07, + "global_step": 13190, + "learning_rate": 0.0004457846410684474, + "loss": 1.5936, + "loss_base2": 2.2991, + "loss_pixel": 0.1563, + "loss_text": 1.4373, + "ppl": 4.9214, + "step": 13190 + }, + { + "epoch": 0.07, + "global_step": 13191, + "learning_rate": 0.0004457804674457429, + "loss": 1.5776, + "loss_base2": 2.276, + "loss_pixel": 0.1554, + "loss_text": 1.4222, + "ppl": 4.8433, + "step": 13191 + }, + { + "epoch": 0.07, + "global_step": 13192, + "learning_rate": 0.00044577629382303843, + "loss": 1.5861, + "loss_base2": 2.2883, + "loss_pixel": 0.1544, + "loss_text": 1.4317, + "ppl": 4.8847, + "step": 13192 + }, + { + "epoch": 0.07, + "global_step": 13193, + "learning_rate": 0.00044577212020033394, + "loss": 1.5911, + "loss_base2": 2.2955, + "loss_pixel": 0.1548, + "loss_text": 1.4363, + "ppl": 4.9091, + "step": 13193 + }, + { + "epoch": 0.07, + "global_step": 13194, + "learning_rate": 0.0004457679465776294, + "loss": 1.5945, + "loss_base2": 2.3004, + "loss_pixel": 0.1547, + "loss_text": 1.4398, + "ppl": 4.9259, + "step": 13194 + }, + { + "epoch": 0.07, + "global_step": 13195, + "learning_rate": 0.0004457637729549249, + "loss": 1.5894, + "loss_base2": 2.293, + "loss_pixel": 0.1562, + "loss_text": 1.4332, + "ppl": 4.9008, + "step": 13195 + }, + { + "epoch": 0.07, + "global_step": 13196, + "learning_rate": 0.00044575959933222035, + "loss": 1.5767, + "loss_base2": 2.2747, + "loss_pixel": 0.1542, + "loss_text": 1.4224, + "ppl": 4.839, + "step": 13196 + }, + { + "epoch": 0.07, + "global_step": 13197, + "learning_rate": 0.00044575542570951586, + "loss": 1.5877, + "loss_base2": 2.2906, + "loss_pixel": 0.1548, + "loss_text": 1.4329, + "ppl": 4.8925, + "step": 13197 + }, + { + "epoch": 0.07, + "global_step": 13198, + "learning_rate": 0.00044575125208681137, + "loss": 1.6054, + "loss_base2": 2.3161, + "loss_pixel": 0.1553, + "loss_text": 1.4501, + "ppl": 4.9799, + "step": 13198 + }, + { + "epoch": 0.07, + "global_step": 13199, + "learning_rate": 0.0004457470784641068, + "loss": 1.5862, + "loss_base2": 2.2884, + "loss_pixel": 0.1558, + "loss_text": 1.4304, + "ppl": 4.8852, + "step": 13199 + }, + { + "epoch": 0.07, + "global_step": 13200, + "learning_rate": 0.00044574290484140233, + "loss": 1.5872, + "loss_base2": 2.2898, + "loss_pixel": 0.156, + "loss_text": 1.4312, + "ppl": 4.89, + "step": 13200 + }, + { + "epoch": 0.07, + "global_step": 13201, + "learning_rate": 0.00044573873121869784, + "loss": 1.5944, + "loss_base2": 2.3002, + "loss_pixel": 0.1542, + "loss_text": 1.4401, + "ppl": 4.9254, + "step": 13201 + }, + { + "epoch": 0.07, + "global_step": 13202, + "learning_rate": 0.00044573455759599334, + "loss": 1.5182, + "loss_base2": 2.1903, + "loss_pixel": 0.1564, + "loss_text": 1.3617, + "ppl": 4.564, + "step": 13202 + }, + { + "epoch": 0.07, + "global_step": 13203, + "learning_rate": 0.0004457303839732888, + "loss": 1.3827, + "loss_base2": 1.9948, + "loss_pixel": 0.1553, + "loss_text": 1.2274, + "ppl": 3.9856, + "step": 13203 + }, + { + "epoch": 0.07, + "global_step": 13204, + "learning_rate": 0.0004457262103505843, + "loss": 1.3833, + "loss_base2": 1.9957, + "loss_pixel": 0.1558, + "loss_text": 1.2274, + "ppl": 3.988, + "step": 13204 + }, + { + "epoch": 0.07, + "global_step": 13205, + "learning_rate": 0.0004457220367278798, + "loss": 1.3732, + "loss_base2": 1.9811, + "loss_pixel": 0.155, + "loss_text": 1.2181, + "ppl": 3.948, + "step": 13205 + }, + { + "epoch": 0.07, + "global_step": 13206, + "learning_rate": 0.0004457178631051753, + "loss": 1.3691, + "loss_base2": 1.9752, + "loss_pixel": 0.154, + "loss_text": 1.215, + "ppl": 3.9318, + "step": 13206 + }, + { + "epoch": 0.07, + "global_step": 13207, + "learning_rate": 0.0004457136894824708, + "loss": 1.3594, + "loss_base2": 1.9612, + "loss_pixel": 0.1552, + "loss_text": 1.2042, + "ppl": 3.8939, + "step": 13207 + }, + { + "epoch": 0.07, + "global_step": 13208, + "learning_rate": 0.0004457095158597663, + "loss": 1.3282, + "loss_base2": 1.9162, + "loss_pixel": 0.1581, + "loss_text": 1.1701, + "ppl": 3.7742, + "step": 13208 + }, + { + "epoch": 0.07, + "global_step": 13209, + "learning_rate": 0.0004457053422370618, + "loss": 1.3761, + "loss_base2": 1.9853, + "loss_pixel": 0.1559, + "loss_text": 1.2202, + "ppl": 3.9594, + "step": 13209 + }, + { + "epoch": 0.07, + "global_step": 13210, + "learning_rate": 0.0004457011686143573, + "loss": 1.3625, + "loss_base2": 1.9657, + "loss_pixel": 0.1556, + "loss_text": 1.2069, + "ppl": 3.9059, + "step": 13210 + }, + { + "epoch": 0.07, + "global_step": 13211, + "learning_rate": 0.0004456969949916528, + "loss": 1.5945, + "loss_base2": 2.3004, + "loss_pixel": 0.1562, + "loss_text": 1.4382, + "ppl": 4.9259, + "step": 13211 + }, + { + "epoch": 0.07, + "global_step": 13212, + "learning_rate": 0.00044569282136894825, + "loss": 1.5862, + "loss_base2": 2.2884, + "loss_pixel": 0.1495, + "loss_text": 1.4367, + "ppl": 4.8852, + "step": 13212 + }, + { + "epoch": 0.07, + "global_step": 13213, + "learning_rate": 0.00044568864774624376, + "loss": 1.589, + "loss_base2": 2.2924, + "loss_pixel": 0.147, + "loss_text": 1.442, + "ppl": 4.8988, + "step": 13213 + }, + { + "epoch": 0.07, + "global_step": 13214, + "learning_rate": 0.0004456844741235392, + "loss": 1.595, + "loss_base2": 2.3011, + "loss_pixel": 0.146, + "loss_text": 1.449, + "ppl": 4.9283, + "step": 13214 + }, + { + "epoch": 0.07, + "global_step": 13215, + "learning_rate": 0.0004456803005008347, + "loss": 1.5754, + "loss_base2": 2.2728, + "loss_pixel": 0.1476, + "loss_text": 1.4278, + "ppl": 4.8327, + "step": 13215 + }, + { + "epoch": 0.07, + "global_step": 13216, + "learning_rate": 0.00044567612687813023, + "loss": 1.5908, + "loss_base2": 2.295, + "loss_pixel": 0.1443, + "loss_text": 1.4466, + "ppl": 4.9077, + "step": 13216 + }, + { + "epoch": 0.07, + "global_step": 13217, + "learning_rate": 0.0004456719532554257, + "loss": 1.5634, + "loss_base2": 2.2555, + "loss_pixel": 0.1447, + "loss_text": 1.4186, + "ppl": 4.775, + "step": 13217 + }, + { + "epoch": 0.07, + "global_step": 13218, + "learning_rate": 0.0004456677796327212, + "loss": 1.5865, + "loss_base2": 2.2888, + "loss_pixel": 0.1453, + "loss_text": 1.4412, + "ppl": 4.8866, + "step": 13218 + }, + { + "epoch": 0.07, + "global_step": 13219, + "learning_rate": 0.0004456636060100167, + "loss": 1.5835, + "loss_base2": 2.2845, + "loss_pixel": 0.1451, + "loss_text": 1.4384, + "ppl": 4.872, + "step": 13219 + }, + { + "epoch": 0.07, + "global_step": 13220, + "learning_rate": 0.0004456594323873122, + "loss": 1.5877, + "loss_base2": 2.2906, + "loss_pixel": 0.1453, + "loss_text": 1.4425, + "ppl": 4.8925, + "step": 13220 + }, + { + "epoch": 0.07, + "global_step": 13221, + "learning_rate": 0.00044565525876460766, + "loss": 1.5766, + "loss_base2": 2.2746, + "loss_pixel": 0.1427, + "loss_text": 1.4339, + "ppl": 4.8385, + "step": 13221 + }, + { + "epoch": 0.07, + "global_step": 13222, + "learning_rate": 0.00044565108514190316, + "loss": 1.5857, + "loss_base2": 2.2877, + "loss_pixel": 0.1438, + "loss_text": 1.4419, + "ppl": 4.8827, + "step": 13222 + }, + { + "epoch": 0.07, + "global_step": 13223, + "learning_rate": 0.00044564691151919867, + "loss": 1.5935, + "loss_base2": 2.2989, + "loss_pixel": 0.1454, + "loss_text": 1.4481, + "ppl": 4.9209, + "step": 13223 + }, + { + "epoch": 0.07, + "global_step": 13224, + "learning_rate": 0.0004456427378964942, + "loss": 1.599, + "loss_base2": 2.3069, + "loss_pixel": 0.1429, + "loss_text": 1.456, + "ppl": 4.9481, + "step": 13224 + }, + { + "epoch": 0.07, + "global_step": 13225, + "learning_rate": 0.0004456385642737897, + "loss": 1.5922, + "loss_base2": 2.2971, + "loss_pixel": 0.1458, + "loss_text": 1.4463, + "ppl": 4.9145, + "step": 13225 + }, + { + "epoch": 0.07, + "global_step": 13226, + "learning_rate": 0.00044563439065108514, + "loss": 1.5965, + "loss_base2": 2.3033, + "loss_pixel": 0.1421, + "loss_text": 1.4545, + "ppl": 4.9357, + "step": 13226 + }, + { + "epoch": 0.07, + "global_step": 13227, + "learning_rate": 0.00044563021702838065, + "loss": 1.5771, + "loss_base2": 2.2753, + "loss_pixel": 0.1444, + "loss_text": 1.4327, + "ppl": 4.8409, + "step": 13227 + }, + { + "epoch": 0.07, + "global_step": 13228, + "learning_rate": 0.00044562604340567615, + "loss": 1.5883, + "loss_base2": 2.2914, + "loss_pixel": 0.1475, + "loss_text": 1.4409, + "ppl": 4.8954, + "step": 13228 + }, + { + "epoch": 0.07, + "global_step": 13229, + "learning_rate": 0.00044562186978297166, + "loss": 1.6112, + "loss_base2": 2.3245, + "loss_pixel": 0.1628, + "loss_text": 1.4484, + "ppl": 5.0088, + "step": 13229 + }, + { + "epoch": 0.07, + "global_step": 13230, + "learning_rate": 0.0004456176961602671, + "loss": 1.5967, + "loss_base2": 2.3036, + "loss_pixel": 0.1614, + "loss_text": 1.4353, + "ppl": 4.9367, + "step": 13230 + }, + { + "epoch": 0.07, + "global_step": 13231, + "learning_rate": 0.0004456135225375626, + "loss": 1.6026, + "loss_base2": 2.3121, + "loss_pixel": 0.1587, + "loss_text": 1.4439, + "ppl": 4.9659, + "step": 13231 + }, + { + "epoch": 0.07, + "global_step": 13232, + "learning_rate": 0.00044560934891485813, + "loss": 1.6097, + "loss_base2": 2.3223, + "loss_pixel": 0.1569, + "loss_text": 1.4529, + "ppl": 5.0013, + "step": 13232 + }, + { + "epoch": 0.07, + "global_step": 13233, + "learning_rate": 0.0004456051752921536, + "loss": 1.6063, + "loss_base2": 2.3174, + "loss_pixel": 0.1567, + "loss_text": 1.4496, + "ppl": 4.9843, + "step": 13233 + }, + { + "epoch": 0.07, + "global_step": 13234, + "learning_rate": 0.0004456010016694491, + "loss": 1.5293, + "loss_base2": 2.2063, + "loss_pixel": 0.1561, + "loss_text": 1.3732, + "ppl": 4.6149, + "step": 13234 + }, + { + "epoch": 0.07, + "global_step": 13235, + "learning_rate": 0.00044559682804674454, + "loss": 1.391, + "loss_base2": 2.0068, + "loss_pixel": 0.1583, + "loss_text": 1.2327, + "ppl": 4.0189, + "step": 13235 + }, + { + "epoch": 0.07, + "global_step": 13236, + "learning_rate": 0.00044559265442404005, + "loss": 1.3808, + "loss_base2": 1.9921, + "loss_pixel": 0.1545, + "loss_text": 1.2264, + "ppl": 3.9781, + "step": 13236 + }, + { + "epoch": 0.07, + "global_step": 13237, + "learning_rate": 0.00044558848080133556, + "loss": 1.3809, + "loss_base2": 1.9922, + "loss_pixel": 0.1561, + "loss_text": 1.2247, + "ppl": 3.9785, + "step": 13237 + }, + { + "epoch": 0.07, + "global_step": 13238, + "learning_rate": 0.00044558430717863106, + "loss": 1.3593, + "loss_base2": 1.9611, + "loss_pixel": 0.1576, + "loss_text": 1.2017, + "ppl": 3.8935, + "step": 13238 + }, + { + "epoch": 0.07, + "global_step": 13239, + "learning_rate": 0.00044558013355592657, + "loss": 1.3518, + "loss_base2": 1.9502, + "loss_pixel": 0.1568, + "loss_text": 1.195, + "ppl": 3.8644, + "step": 13239 + }, + { + "epoch": 0.07, + "global_step": 13240, + "learning_rate": 0.000445575959933222, + "loss": 1.3498, + "loss_base2": 1.9473, + "loss_pixel": 0.156, + "loss_text": 1.1938, + "ppl": 3.8567, + "step": 13240 + }, + { + "epoch": 0.07, + "global_step": 13241, + "learning_rate": 0.00044557178631051753, + "loss": 1.3519, + "loss_base2": 1.9504, + "loss_pixel": 0.1559, + "loss_text": 1.196, + "ppl": 3.8648, + "step": 13241 + }, + { + "epoch": 0.07, + "global_step": 13242, + "learning_rate": 0.00044556761268781304, + "loss": 1.3647, + "loss_base2": 1.9688, + "loss_pixel": 0.1559, + "loss_text": 1.2089, + "ppl": 3.9145, + "step": 13242 + }, + { + "epoch": 0.07, + "global_step": 13243, + "learning_rate": 0.00044556343906510855, + "loss": 1.5092, + "loss_base2": 2.1773, + "loss_pixel": 0.1551, + "loss_text": 1.3541, + "ppl": 4.5231, + "step": 13243 + }, + { + "epoch": 0.07, + "global_step": 13244, + "learning_rate": 0.000445559265442404, + "loss": 1.6022, + "loss_base2": 2.3115, + "loss_pixel": 0.1561, + "loss_text": 1.4461, + "ppl": 4.9639, + "step": 13244 + }, + { + "epoch": 0.07, + "global_step": 13245, + "learning_rate": 0.0004455550918196995, + "loss": 1.5976, + "loss_base2": 2.3048, + "loss_pixel": 0.1577, + "loss_text": 1.4399, + "ppl": 4.9412, + "step": 13245 + }, + { + "epoch": 0.07, + "global_step": 13246, + "learning_rate": 0.000445550918196995, + "loss": 1.621, + "loss_base2": 2.3386, + "loss_pixel": 0.1559, + "loss_text": 1.4651, + "ppl": 5.0581, + "step": 13246 + }, + { + "epoch": 0.07, + "global_step": 13247, + "learning_rate": 0.0004455467445742905, + "loss": 1.6066, + "loss_base2": 2.3178, + "loss_pixel": 0.1554, + "loss_text": 1.4512, + "ppl": 4.9858, + "step": 13247 + }, + { + "epoch": 0.07, + "global_step": 13248, + "learning_rate": 0.00044554257095158603, + "loss": 1.6004, + "loss_base2": 2.3089, + "loss_pixel": 0.1553, + "loss_text": 1.4451, + "ppl": 4.955, + "step": 13248 + }, + { + "epoch": 0.07, + "global_step": 13249, + "learning_rate": 0.0004455383973288815, + "loss": 1.6074, + "loss_base2": 2.319, + "loss_pixel": 0.1548, + "loss_text": 1.4525, + "ppl": 4.9898, + "step": 13249 + }, + { + "epoch": 0.07, + "global_step": 13250, + "learning_rate": 0.000445534223706177, + "loss": 1.6081, + "loss_base2": 2.32, + "loss_pixel": 0.1562, + "loss_text": 1.452, + "ppl": 4.9933, + "step": 13250 + }, + { + "epoch": 0.07, + "global_step": 13251, + "learning_rate": 0.0004455300500834725, + "loss": 1.6164, + "loss_base2": 2.332, + "loss_pixel": 0.1563, + "loss_text": 1.4601, + "ppl": 5.0349, + "step": 13251 + }, + { + "epoch": 0.07, + "global_step": 13252, + "learning_rate": 0.00044552587646076795, + "loss": 1.5918, + "loss_base2": 2.2965, + "loss_pixel": 0.1561, + "loss_text": 1.4357, + "ppl": 4.9126, + "step": 13252 + }, + { + "epoch": 0.07, + "global_step": 13253, + "learning_rate": 0.0004455217028380634, + "loss": 1.6119, + "loss_base2": 2.3255, + "loss_pixel": 0.1564, + "loss_text": 1.4555, + "ppl": 5.0123, + "step": 13253 + }, + { + "epoch": 0.07, + "global_step": 13254, + "learning_rate": 0.0004455175292153589, + "loss": 1.6145, + "loss_base2": 2.3292, + "loss_pixel": 0.1551, + "loss_text": 1.4594, + "ppl": 5.0254, + "step": 13254 + }, + { + "epoch": 0.07, + "global_step": 13255, + "learning_rate": 0.0004455133555926544, + "loss": 1.5897, + "loss_base2": 2.2935, + "loss_pixel": 0.1556, + "loss_text": 1.4341, + "ppl": 4.9023, + "step": 13255 + }, + { + "epoch": 0.07, + "global_step": 13256, + "learning_rate": 0.0004455091819699499, + "loss": 1.5932, + "loss_base2": 2.2985, + "loss_pixel": 0.156, + "loss_text": 1.4371, + "ppl": 4.9195, + "step": 13256 + }, + { + "epoch": 0.07, + "global_step": 13257, + "learning_rate": 0.00044550500834724543, + "loss": 1.6089, + "loss_base2": 2.3212, + "loss_pixel": 0.1573, + "loss_text": 1.4516, + "ppl": 4.9973, + "step": 13257 + }, + { + "epoch": 0.07, + "global_step": 13258, + "learning_rate": 0.0004455008347245409, + "loss": 1.5999, + "loss_base2": 2.3082, + "loss_pixel": 0.1558, + "loss_text": 1.4441, + "ppl": 4.9525, + "step": 13258 + }, + { + "epoch": 0.07, + "global_step": 13259, + "learning_rate": 0.0004454966611018364, + "loss": 1.5985, + "loss_base2": 2.3061, + "loss_pixel": 0.1547, + "loss_text": 1.4439, + "ppl": 4.9456, + "step": 13259 + }, + { + "epoch": 0.07, + "global_step": 13260, + "learning_rate": 0.0004454924874791319, + "loss": 1.6141, + "loss_base2": 2.3287, + "loss_pixel": 0.1546, + "loss_text": 1.4595, + "ppl": 5.0234, + "step": 13260 + }, + { + "epoch": 0.07, + "global_step": 13261, + "learning_rate": 0.0004454883138564274, + "loss": 1.5775, + "loss_base2": 2.2759, + "loss_pixel": 0.157, + "loss_text": 1.4205, + "ppl": 4.8428, + "step": 13261 + }, + { + "epoch": 0.07, + "global_step": 13262, + "learning_rate": 0.00044548414023372286, + "loss": 1.5976, + "loss_base2": 2.3048, + "loss_pixel": 0.1557, + "loss_text": 1.4419, + "ppl": 4.9412, + "step": 13262 + }, + { + "epoch": 0.07, + "global_step": 13263, + "learning_rate": 0.00044547996661101837, + "loss": 1.5872, + "loss_base2": 2.2898, + "loss_pixel": 0.1582, + "loss_text": 1.429, + "ppl": 4.89, + "step": 13263 + }, + { + "epoch": 0.07, + "global_step": 13264, + "learning_rate": 0.0004454757929883139, + "loss": 1.596, + "loss_base2": 2.3025, + "loss_pixel": 0.1559, + "loss_text": 1.4401, + "ppl": 4.9333, + "step": 13264 + }, + { + "epoch": 0.07, + "global_step": 13265, + "learning_rate": 0.0004454716193656094, + "loss": 1.5831, + "loss_base2": 2.2839, + "loss_pixel": 0.156, + "loss_text": 1.4271, + "ppl": 4.87, + "step": 13265 + }, + { + "epoch": 0.07, + "global_step": 13266, + "learning_rate": 0.0004454674457429049, + "loss": 1.5916, + "loss_base2": 2.2962, + "loss_pixel": 0.1562, + "loss_text": 1.4354, + "ppl": 4.9116, + "step": 13266 + }, + { + "epoch": 0.07, + "global_step": 13267, + "learning_rate": 0.00044546327212020034, + "loss": 1.5963, + "loss_base2": 2.303, + "loss_pixel": 0.1548, + "loss_text": 1.4415, + "ppl": 4.9347, + "step": 13267 + }, + { + "epoch": 0.07, + "global_step": 13268, + "learning_rate": 0.00044545909849749585, + "loss": 1.4996, + "loss_base2": 2.1635, + "loss_pixel": 0.1545, + "loss_text": 1.3451, + "ppl": 4.4799, + "step": 13268 + }, + { + "epoch": 0.07, + "global_step": 13269, + "learning_rate": 0.00044545492487479136, + "loss": 1.3662, + "loss_base2": 1.971, + "loss_pixel": 0.1543, + "loss_text": 1.2119, + "ppl": 3.9204, + "step": 13269 + }, + { + "epoch": 0.07, + "global_step": 13270, + "learning_rate": 0.00044545075125208686, + "loss": 1.3837, + "loss_base2": 1.9963, + "loss_pixel": 0.1545, + "loss_text": 1.2293, + "ppl": 3.9896, + "step": 13270 + }, + { + "epoch": 0.07, + "global_step": 13271, + "learning_rate": 0.00044544657762938226, + "loss": 1.3672, + "loss_base2": 1.9725, + "loss_pixel": 0.1553, + "loss_text": 1.212, + "ppl": 3.9243, + "step": 13271 + }, + { + "epoch": 0.07, + "global_step": 13272, + "learning_rate": 0.00044544240400667777, + "loss": 1.354, + "loss_base2": 1.9534, + "loss_pixel": 0.1552, + "loss_text": 1.1988, + "ppl": 3.8729, + "step": 13272 + }, + { + "epoch": 0.07, + "global_step": 13273, + "learning_rate": 0.0004454382303839733, + "loss": 1.3799, + "loss_base2": 1.9908, + "loss_pixel": 0.1549, + "loss_text": 1.2249, + "ppl": 3.9745, + "step": 13273 + }, + { + "epoch": 0.07, + "global_step": 13274, + "learning_rate": 0.0004454340567612688, + "loss": 1.3574, + "loss_base2": 1.9583, + "loss_pixel": 0.1562, + "loss_text": 1.2012, + "ppl": 3.8861, + "step": 13274 + }, + { + "epoch": 0.07, + "global_step": 13275, + "learning_rate": 0.0004454298831385643, + "loss": 1.3588, + "loss_base2": 1.9603, + "loss_pixel": 0.1557, + "loss_text": 1.203, + "ppl": 3.8915, + "step": 13275 + }, + { + "epoch": 0.07, + "global_step": 13276, + "learning_rate": 0.00044542570951585975, + "loss": 1.391, + "loss_base2": 2.0068, + "loss_pixel": 0.1566, + "loss_text": 1.2344, + "ppl": 4.0189, + "step": 13276 + }, + { + "epoch": 0.07, + "global_step": 13277, + "learning_rate": 0.00044542153589315525, + "loss": 1.6074, + "loss_base2": 2.319, + "loss_pixel": 0.1556, + "loss_text": 1.4518, + "ppl": 4.9898, + "step": 13277 + }, + { + "epoch": 0.07, + "global_step": 13278, + "learning_rate": 0.00044541736227045076, + "loss": 1.5872, + "loss_base2": 2.2898, + "loss_pixel": 0.1558, + "loss_text": 1.4313, + "ppl": 4.89, + "step": 13278 + }, + { + "epoch": 0.07, + "global_step": 13279, + "learning_rate": 0.00044541318864774627, + "loss": 1.6046, + "loss_base2": 2.3149, + "loss_pixel": 0.1557, + "loss_text": 1.4489, + "ppl": 4.9759, + "step": 13279 + }, + { + "epoch": 0.07, + "global_step": 13280, + "learning_rate": 0.0004454090150250417, + "loss": 1.5863, + "loss_base2": 2.2885, + "loss_pixel": 0.1556, + "loss_text": 1.4307, + "ppl": 4.8856, + "step": 13280 + }, + { + "epoch": 0.07, + "global_step": 13281, + "learning_rate": 0.00044540484140233723, + "loss": 1.6002, + "loss_base2": 2.3086, + "loss_pixel": 0.156, + "loss_text": 1.4442, + "ppl": 4.954, + "step": 13281 + }, + { + "epoch": 0.07, + "global_step": 13282, + "learning_rate": 0.00044540066777963274, + "loss": 1.5948, + "loss_base2": 2.3008, + "loss_pixel": 0.1571, + "loss_text": 1.4376, + "ppl": 4.9273, + "step": 13282 + }, + { + "epoch": 0.07, + "global_step": 13283, + "learning_rate": 0.00044539649415692824, + "loss": 1.6079, + "loss_base2": 2.3197, + "loss_pixel": 0.1569, + "loss_text": 1.451, + "ppl": 4.9923, + "step": 13283 + }, + { + "epoch": 0.07, + "global_step": 13284, + "learning_rate": 0.00044539232053422375, + "loss": 1.6088, + "loss_base2": 2.321, + "loss_pixel": 0.1551, + "loss_text": 1.4537, + "ppl": 4.9968, + "step": 13284 + }, + { + "epoch": 0.07, + "global_step": 13285, + "learning_rate": 0.0004453881469115192, + "loss": 1.6236, + "loss_base2": 2.3424, + "loss_pixel": 0.1568, + "loss_text": 1.4668, + "ppl": 5.0713, + "step": 13285 + }, + { + "epoch": 0.07, + "global_step": 13286, + "learning_rate": 0.0004453839732888147, + "loss": 1.6132, + "loss_base2": 2.3274, + "loss_pixel": 0.1555, + "loss_text": 1.4577, + "ppl": 5.0188, + "step": 13286 + }, + { + "epoch": 0.07, + "global_step": 13287, + "learning_rate": 0.0004453797996661102, + "loss": 1.6053, + "loss_base2": 2.316, + "loss_pixel": 0.1549, + "loss_text": 1.4504, + "ppl": 4.9794, + "step": 13287 + }, + { + "epoch": 0.07, + "global_step": 13288, + "learning_rate": 0.0004453756260434057, + "loss": 1.5962, + "loss_base2": 2.3028, + "loss_pixel": 0.1552, + "loss_text": 1.4411, + "ppl": 4.9342, + "step": 13288 + }, + { + "epoch": 0.07, + "global_step": 13289, + "learning_rate": 0.0004453714524207011, + "loss": 1.6021, + "loss_base2": 2.3113, + "loss_pixel": 0.1554, + "loss_text": 1.4467, + "ppl": 4.9634, + "step": 13289 + }, + { + "epoch": 0.07, + "global_step": 13290, + "learning_rate": 0.00044536727879799663, + "loss": 1.5878, + "loss_base2": 2.2907, + "loss_pixel": 0.1595, + "loss_text": 1.4283, + "ppl": 4.893, + "step": 13290 + }, + { + "epoch": 0.07, + "global_step": 13291, + "learning_rate": 0.00044536310517529214, + "loss": 1.5935, + "loss_base2": 2.2989, + "loss_pixel": 0.1591, + "loss_text": 1.4343, + "ppl": 4.9209, + "step": 13291 + }, + { + "epoch": 0.07, + "global_step": 13292, + "learning_rate": 0.00044535893155258765, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.1594, + "loss_text": 1.4465, + "ppl": 4.9823, + "step": 13292 + }, + { + "epoch": 0.07, + "global_step": 13293, + "learning_rate": 0.00044535475792988315, + "loss": 1.6124, + "loss_base2": 2.3262, + "loss_pixel": 0.1561, + "loss_text": 1.4564, + "ppl": 5.0148, + "step": 13293 + }, + { + "epoch": 0.07, + "global_step": 13294, + "learning_rate": 0.0004453505843071786, + "loss": 1.5853, + "loss_base2": 2.2871, + "loss_pixel": 0.1542, + "loss_text": 1.4311, + "ppl": 4.8808, + "step": 13294 + }, + { + "epoch": 0.07, + "global_step": 13295, + "learning_rate": 0.0004453464106844741, + "loss": 1.6005, + "loss_base2": 2.309, + "loss_pixel": 0.1572, + "loss_text": 1.4433, + "ppl": 4.9555, + "step": 13295 + }, + { + "epoch": 0.07, + "global_step": 13296, + "learning_rate": 0.0004453422370617696, + "loss": 1.5934, + "loss_base2": 2.2988, + "loss_pixel": 0.1549, + "loss_text": 1.4384, + "ppl": 4.9205, + "step": 13296 + }, + { + "epoch": 0.07, + "global_step": 13297, + "learning_rate": 0.00044533806343906513, + "loss": 1.5808, + "loss_base2": 2.2806, + "loss_pixel": 0.1566, + "loss_text": 1.4243, + "ppl": 4.8588, + "step": 13297 + }, + { + "epoch": 0.07, + "global_step": 13298, + "learning_rate": 0.00044533388981636064, + "loss": 1.6134, + "loss_base2": 2.3276, + "loss_pixel": 0.156, + "loss_text": 1.4574, + "ppl": 5.0198, + "step": 13298 + }, + { + "epoch": 0.07, + "global_step": 13299, + "learning_rate": 0.0004453297161936561, + "loss": 1.5232, + "loss_base2": 2.1975, + "loss_pixel": 0.1554, + "loss_text": 1.3678, + "ppl": 4.5869, + "step": 13299 + }, + { + "epoch": 0.07, + "global_step": 13300, + "learning_rate": 0.0004453255425709516, + "loss": 1.3898, + "loss_base2": 2.0051, + "loss_pixel": 0.1558, + "loss_text": 1.234, + "ppl": 4.014, + "step": 13300 + }, + { + "epoch": 0.07, + "global_step": 13301, + "learning_rate": 0.0004453213689482471, + "loss": 1.3781, + "loss_base2": 1.9882, + "loss_pixel": 0.1556, + "loss_text": 1.2225, + "ppl": 3.9674, + "step": 13301 + }, + { + "epoch": 0.07, + "global_step": 13302, + "learning_rate": 0.0004453171953255426, + "loss": 1.7125, + "loss_base2": 2.4706, + "loss_pixel": 0.155, + "loss_text": 1.5575, + "ppl": 5.5428, + "step": 13302 + }, + { + "epoch": 0.07, + "global_step": 13303, + "learning_rate": 0.00044531302170283806, + "loss": 1.4025, + "loss_base2": 2.0234, + "loss_pixel": 0.1547, + "loss_text": 1.2478, + "ppl": 4.0654, + "step": 13303 + }, + { + "epoch": 0.07, + "global_step": 13304, + "learning_rate": 0.00044530884808013357, + "loss": 1.3749, + "loss_base2": 1.9836, + "loss_pixel": 0.155, + "loss_text": 1.2199, + "ppl": 3.9547, + "step": 13304 + }, + { + "epoch": 0.07, + "global_step": 13305, + "learning_rate": 0.0004453046744574291, + "loss": 1.3803, + "loss_base2": 1.9914, + "loss_pixel": 0.1559, + "loss_text": 1.2244, + "ppl": 3.9761, + "step": 13305 + }, + { + "epoch": 0.07, + "global_step": 13306, + "learning_rate": 0.0004453005008347246, + "loss": 1.3795, + "loss_base2": 1.9902, + "loss_pixel": 0.1553, + "loss_text": 1.2241, + "ppl": 3.9729, + "step": 13306 + }, + { + "epoch": 0.07, + "global_step": 13307, + "learning_rate": 0.0004452963272120201, + "loss": 1.4071, + "loss_base2": 2.03, + "loss_pixel": 0.1555, + "loss_text": 1.2516, + "ppl": 4.0841, + "step": 13307 + }, + { + "epoch": 0.07, + "global_step": 13308, + "learning_rate": 0.0004452921535893155, + "loss": 1.373, + "loss_base2": 1.9808, + "loss_pixel": 0.156, + "loss_text": 1.217, + "ppl": 3.9472, + "step": 13308 + }, + { + "epoch": 0.07, + "global_step": 13309, + "learning_rate": 0.000445287979966611, + "loss": 1.3763, + "loss_base2": 1.9856, + "loss_pixel": 0.1548, + "loss_text": 1.2215, + "ppl": 3.9602, + "step": 13309 + }, + { + "epoch": 0.07, + "global_step": 13310, + "learning_rate": 0.0004452838063439065, + "loss": 1.3787, + "loss_base2": 1.989, + "loss_pixel": 0.1558, + "loss_text": 1.2228, + "ppl": 3.9697, + "step": 13310 + }, + { + "epoch": 0.07, + "global_step": 13311, + "learning_rate": 0.000445279632721202, + "loss": 1.3777, + "loss_base2": 1.9876, + "loss_pixel": 0.156, + "loss_text": 1.2217, + "ppl": 3.9658, + "step": 13311 + }, + { + "epoch": 0.07, + "global_step": 13312, + "learning_rate": 0.00044527545909849747, + "loss": 1.3881, + "loss_base2": 2.0026, + "loss_pixel": 0.157, + "loss_text": 1.2311, + "ppl": 4.0072, + "step": 13312 + }, + { + "epoch": 0.07, + "global_step": 13313, + "learning_rate": 0.000445271285475793, + "loss": 1.3711, + "loss_base2": 1.9781, + "loss_pixel": 0.156, + "loss_text": 1.2151, + "ppl": 3.9397, + "step": 13313 + }, + { + "epoch": 0.07, + "global_step": 13314, + "learning_rate": 0.0004452671118530885, + "loss": 1.3538, + "loss_base2": 1.9531, + "loss_pixel": 0.1545, + "loss_text": 1.1993, + "ppl": 3.8721, + "step": 13314 + }, + { + "epoch": 0.07, + "global_step": 13315, + "learning_rate": 0.000445262938230384, + "loss": 1.3941, + "loss_base2": 2.0113, + "loss_pixel": 0.1539, + "loss_text": 1.2401, + "ppl": 4.0313, + "step": 13315 + }, + { + "epoch": 0.07, + "global_step": 13316, + "learning_rate": 0.0004452587646076795, + "loss": 1.3365, + "loss_base2": 1.9282, + "loss_pixel": 0.1552, + "loss_text": 1.1813, + "ppl": 3.8057, + "step": 13316 + }, + { + "epoch": 0.07, + "global_step": 13317, + "learning_rate": 0.00044525459098497495, + "loss": 1.3682, + "loss_base2": 1.9739, + "loss_pixel": 0.155, + "loss_text": 1.2132, + "ppl": 3.9283, + "step": 13317 + }, + { + "epoch": 0.07, + "global_step": 13318, + "learning_rate": 0.00044525041736227046, + "loss": 1.3675, + "loss_base2": 1.9729, + "loss_pixel": 0.1546, + "loss_text": 1.2129, + "ppl": 3.9255, + "step": 13318 + }, + { + "epoch": 0.07, + "global_step": 13319, + "learning_rate": 0.00044524624373956596, + "loss": 1.3667, + "loss_base2": 1.9717, + "loss_pixel": 0.1557, + "loss_text": 1.211, + "ppl": 3.9224, + "step": 13319 + }, + { + "epoch": 0.07, + "global_step": 13320, + "learning_rate": 0.00044524207011686147, + "loss": 1.3712, + "loss_base2": 1.9782, + "loss_pixel": 0.1553, + "loss_text": 1.2159, + "ppl": 3.9401, + "step": 13320 + }, + { + "epoch": 0.07, + "global_step": 13321, + "learning_rate": 0.0004452378964941569, + "loss": 1.3885, + "loss_base2": 2.0032, + "loss_pixel": 0.1553, + "loss_text": 1.2333, + "ppl": 4.0088, + "step": 13321 + }, + { + "epoch": 0.07, + "global_step": 13322, + "learning_rate": 0.00044523372287145243, + "loss": 1.3446, + "loss_base2": 1.9398, + "loss_pixel": 0.1562, + "loss_text": 1.1884, + "ppl": 3.8367, + "step": 13322 + }, + { + "epoch": 0.07, + "global_step": 13323, + "learning_rate": 0.00044522954924874794, + "loss": 1.4317, + "loss_base2": 2.0655, + "loss_pixel": 0.156, + "loss_text": 1.2756, + "ppl": 4.1858, + "step": 13323 + }, + { + "epoch": 0.07, + "global_step": 13324, + "learning_rate": 0.00044522537562604345, + "loss": 1.6097, + "loss_base2": 2.3223, + "loss_pixel": 0.1532, + "loss_text": 1.4564, + "ppl": 5.0013, + "step": 13324 + }, + { + "epoch": 0.07, + "global_step": 13325, + "learning_rate": 0.00044522120200333895, + "loss": 1.609, + "loss_base2": 2.3213, + "loss_pixel": 0.1561, + "loss_text": 1.4529, + "ppl": 4.9978, + "step": 13325 + }, + { + "epoch": 0.07, + "global_step": 13326, + "learning_rate": 0.0004452170283806344, + "loss": 1.6165, + "loss_base2": 2.3321, + "loss_pixel": 0.1553, + "loss_text": 1.4611, + "ppl": 5.0354, + "step": 13326 + }, + { + "epoch": 0.07, + "global_step": 13327, + "learning_rate": 0.00044521285475792986, + "loss": 1.5993, + "loss_base2": 2.3073, + "loss_pixel": 0.1564, + "loss_text": 1.4429, + "ppl": 4.9496, + "step": 13327 + }, + { + "epoch": 0.07, + "global_step": 13328, + "learning_rate": 0.00044520868113522537, + "loss": 1.6192, + "loss_base2": 2.336, + "loss_pixel": 0.155, + "loss_text": 1.4642, + "ppl": 5.049, + "step": 13328 + }, + { + "epoch": 0.07, + "global_step": 13329, + "learning_rate": 0.0004452045075125209, + "loss": 1.6081, + "loss_base2": 2.32, + "loss_pixel": 0.1575, + "loss_text": 1.4506, + "ppl": 4.9933, + "step": 13329 + }, + { + "epoch": 0.07, + "global_step": 13330, + "learning_rate": 0.00044520033388981633, + "loss": 1.6112, + "loss_base2": 2.3245, + "loss_pixel": 0.1547, + "loss_text": 1.4565, + "ppl": 5.0088, + "step": 13330 + }, + { + "epoch": 0.07, + "global_step": 13331, + "learning_rate": 0.00044519616026711184, + "loss": 1.6163, + "loss_base2": 2.3318, + "loss_pixel": 0.1558, + "loss_text": 1.4605, + "ppl": 5.0344, + "step": 13331 + }, + { + "epoch": 0.07, + "global_step": 13332, + "learning_rate": 0.00044519198664440734, + "loss": 1.6, + "loss_base2": 2.3083, + "loss_pixel": 0.1554, + "loss_text": 1.4446, + "ppl": 4.953, + "step": 13332 + }, + { + "epoch": 0.07, + "global_step": 13333, + "learning_rate": 0.00044518781302170285, + "loss": 1.5971, + "loss_base2": 2.3041, + "loss_pixel": 0.1552, + "loss_text": 1.4419, + "ppl": 4.9387, + "step": 13333 + }, + { + "epoch": 0.07, + "global_step": 13334, + "learning_rate": 0.00044518363939899836, + "loss": 1.6203, + "loss_base2": 2.3376, + "loss_pixel": 0.1559, + "loss_text": 1.4644, + "ppl": 5.0546, + "step": 13334 + }, + { + "epoch": 0.07, + "global_step": 13335, + "learning_rate": 0.0004451794657762938, + "loss": 1.5887, + "loss_base2": 2.292, + "loss_pixel": 0.1549, + "loss_text": 1.4338, + "ppl": 4.8974, + "step": 13335 + }, + { + "epoch": 0.07, + "global_step": 13336, + "learning_rate": 0.0004451752921535893, + "loss": 1.5879, + "loss_base2": 2.2909, + "loss_pixel": 0.155, + "loss_text": 1.4329, + "ppl": 4.8935, + "step": 13336 + }, + { + "epoch": 0.07, + "global_step": 13337, + "learning_rate": 0.0004451711185308848, + "loss": 1.607, + "loss_base2": 2.3184, + "loss_pixel": 0.1544, + "loss_text": 1.4526, + "ppl": 4.9878, + "step": 13337 + }, + { + "epoch": 0.07, + "global_step": 13338, + "learning_rate": 0.00044516694490818033, + "loss": 1.5945, + "loss_base2": 2.3004, + "loss_pixel": 0.1536, + "loss_text": 1.4408, + "ppl": 4.9259, + "step": 13338 + }, + { + "epoch": 0.07, + "global_step": 13339, + "learning_rate": 0.0004451627712854758, + "loss": 1.6064, + "loss_base2": 2.3175, + "loss_pixel": 0.1548, + "loss_text": 1.4515, + "ppl": 4.9848, + "step": 13339 + }, + { + "epoch": 0.07, + "global_step": 13340, + "learning_rate": 0.0004451585976627713, + "loss": 1.5977, + "loss_base2": 2.305, + "loss_pixel": 0.1538, + "loss_text": 1.4439, + "ppl": 4.9417, + "step": 13340 + }, + { + "epoch": 0.07, + "global_step": 13341, + "learning_rate": 0.0004451544240400668, + "loss": 1.6063, + "loss_base2": 2.3174, + "loss_pixel": 0.156, + "loss_text": 1.4503, + "ppl": 4.9843, + "step": 13341 + }, + { + "epoch": 0.07, + "global_step": 13342, + "learning_rate": 0.0004451502504173623, + "loss": 1.6016, + "loss_base2": 2.3106, + "loss_pixel": 0.1549, + "loss_text": 1.4467, + "ppl": 4.961, + "step": 13342 + }, + { + "epoch": 0.07, + "global_step": 13343, + "learning_rate": 0.0004451460767946578, + "loss": 1.6059, + "loss_base2": 2.3168, + "loss_pixel": 0.1564, + "loss_text": 1.4495, + "ppl": 4.9823, + "step": 13343 + }, + { + "epoch": 0.07, + "global_step": 13344, + "learning_rate": 0.00044514190317195327, + "loss": 1.5845, + "loss_base2": 2.286, + "loss_pixel": 0.1551, + "loss_text": 1.4294, + "ppl": 4.8769, + "step": 13344 + }, + { + "epoch": 0.07, + "global_step": 13345, + "learning_rate": 0.0004451377295492488, + "loss": 1.5975, + "loss_base2": 2.3047, + "loss_pixel": 0.1564, + "loss_text": 1.4411, + "ppl": 4.9407, + "step": 13345 + }, + { + "epoch": 0.07, + "global_step": 13346, + "learning_rate": 0.00044513355592654423, + "loss": 1.3852, + "loss_base2": 1.9984, + "loss_pixel": 0.1549, + "loss_text": 1.2302, + "ppl": 3.9956, + "step": 13346 + }, + { + "epoch": 0.07, + "global_step": 13347, + "learning_rate": 0.00044512938230383974, + "loss": 1.3762, + "loss_base2": 1.9854, + "loss_pixel": 0.1542, + "loss_text": 1.222, + "ppl": 3.9598, + "step": 13347 + }, + { + "epoch": 0.07, + "global_step": 13348, + "learning_rate": 0.0004451252086811352, + "loss": 1.3736, + "loss_base2": 1.9817, + "loss_pixel": 0.1554, + "loss_text": 1.2182, + "ppl": 3.9495, + "step": 13348 + }, + { + "epoch": 0.07, + "global_step": 13349, + "learning_rate": 0.0004451210350584307, + "loss": 1.3748, + "loss_base2": 1.9834, + "loss_pixel": 0.1551, + "loss_text": 1.2197, + "ppl": 3.9543, + "step": 13349 + }, + { + "epoch": 0.07, + "global_step": 13350, + "learning_rate": 0.0004451168614357262, + "loss": 1.3605, + "loss_base2": 1.9628, + "loss_pixel": 0.1548, + "loss_text": 1.2057, + "ppl": 3.8981, + "step": 13350 + }, + { + "epoch": 0.07, + "global_step": 13351, + "learning_rate": 0.0004451126878130217, + "loss": 1.364, + "loss_base2": 1.9678, + "loss_pixel": 0.1537, + "loss_text": 1.2103, + "ppl": 3.9118, + "step": 13351 + }, + { + "epoch": 0.07, + "global_step": 13352, + "learning_rate": 0.0004451085141903172, + "loss": 1.3646, + "loss_base2": 1.9687, + "loss_pixel": 0.156, + "loss_text": 1.2086, + "ppl": 3.9142, + "step": 13352 + }, + { + "epoch": 0.07, + "global_step": 13353, + "learning_rate": 0.00044510434056761267, + "loss": 1.3825, + "loss_base2": 1.9945, + "loss_pixel": 0.1549, + "loss_text": 1.2276, + "ppl": 3.9849, + "step": 13353 + }, + { + "epoch": 0.07, + "global_step": 13354, + "learning_rate": 0.0004451001669449082, + "loss": 1.3654, + "loss_base2": 1.9699, + "loss_pixel": 0.1562, + "loss_text": 1.2092, + "ppl": 3.9173, + "step": 13354 + }, + { + "epoch": 0.07, + "global_step": 13355, + "learning_rate": 0.0004450959933222037, + "loss": 1.3582, + "loss_base2": 1.9595, + "loss_pixel": 0.1544, + "loss_text": 1.2038, + "ppl": 3.8892, + "step": 13355 + }, + { + "epoch": 0.07, + "global_step": 13356, + "learning_rate": 0.0004450918196994992, + "loss": 1.3744, + "loss_base2": 1.9828, + "loss_pixel": 0.1563, + "loss_text": 1.2182, + "ppl": 3.9527, + "step": 13356 + }, + { + "epoch": 0.07, + "global_step": 13357, + "learning_rate": 0.0004450876460767947, + "loss": 1.3599, + "loss_base2": 1.9619, + "loss_pixel": 0.1555, + "loss_text": 1.2044, + "ppl": 3.8958, + "step": 13357 + }, + { + "epoch": 0.07, + "global_step": 13358, + "learning_rate": 0.00044508347245409015, + "loss": 1.3687, + "loss_base2": 1.9746, + "loss_pixel": 0.1548, + "loss_text": 1.214, + "ppl": 3.9302, + "step": 13358 + }, + { + "epoch": 0.07, + "global_step": 13359, + "learning_rate": 0.00044507929883138566, + "loss": 1.356, + "loss_base2": 1.9563, + "loss_pixel": 0.1548, + "loss_text": 1.2012, + "ppl": 3.8806, + "step": 13359 + }, + { + "epoch": 0.07, + "global_step": 13360, + "learning_rate": 0.00044507512520868117, + "loss": 1.3543, + "loss_base2": 1.9538, + "loss_pixel": 0.156, + "loss_text": 1.1983, + "ppl": 3.874, + "step": 13360 + }, + { + "epoch": 0.07, + "global_step": 13361, + "learning_rate": 0.0004450709515859767, + "loss": 1.3456, + "loss_base2": 1.9413, + "loss_pixel": 0.1565, + "loss_text": 1.1891, + "ppl": 3.8405, + "step": 13361 + }, + { + "epoch": 0.07, + "global_step": 13362, + "learning_rate": 0.00044506677796327213, + "loss": 1.3648, + "loss_base2": 1.969, + "loss_pixel": 0.1539, + "loss_text": 1.2109, + "ppl": 3.9149, + "step": 13362 + }, + { + "epoch": 0.07, + "global_step": 13363, + "learning_rate": 0.00044506260434056764, + "loss": 1.493, + "loss_base2": 2.1539, + "loss_pixel": 0.1564, + "loss_text": 1.3367, + "ppl": 4.4504, + "step": 13363 + }, + { + "epoch": 0.07, + "global_step": 13364, + "learning_rate": 0.00044505843071786314, + "loss": 1.606, + "loss_base2": 2.317, + "loss_pixel": 0.1553, + "loss_text": 1.4508, + "ppl": 4.9828, + "step": 13364 + }, + { + "epoch": 0.07, + "global_step": 13365, + "learning_rate": 0.0004450542570951586, + "loss": 1.6099, + "loss_base2": 2.3226, + "loss_pixel": 0.1542, + "loss_text": 1.4557, + "ppl": 5.0023, + "step": 13365 + }, + { + "epoch": 0.07, + "global_step": 13366, + "learning_rate": 0.0004450500834724541, + "loss": 1.6165, + "loss_base2": 2.3321, + "loss_pixel": 0.1536, + "loss_text": 1.4629, + "ppl": 5.0354, + "step": 13366 + }, + { + "epoch": 0.07, + "global_step": 13367, + "learning_rate": 0.00044504590984974956, + "loss": 1.5718, + "loss_base2": 2.2676, + "loss_pixel": 0.1557, + "loss_text": 1.4161, + "ppl": 4.8153, + "step": 13367 + }, + { + "epoch": 0.07, + "global_step": 13368, + "learning_rate": 0.00044504173622704506, + "loss": 1.6087, + "loss_base2": 2.3209, + "loss_pixel": 0.1555, + "loss_text": 1.4531, + "ppl": 4.9963, + "step": 13368 + }, + { + "epoch": 0.07, + "global_step": 13369, + "learning_rate": 0.00044503756260434057, + "loss": 1.6276, + "loss_base2": 2.3481, + "loss_pixel": 0.1559, + "loss_text": 1.4717, + "ppl": 5.0916, + "step": 13369 + }, + { + "epoch": 0.07, + "global_step": 13370, + "learning_rate": 0.0004450333889816361, + "loss": 1.5849, + "loss_base2": 2.2865, + "loss_pixel": 0.1545, + "loss_text": 1.4304, + "ppl": 4.8788, + "step": 13370 + }, + { + "epoch": 0.07, + "global_step": 13371, + "learning_rate": 0.00044502921535893153, + "loss": 1.5506, + "loss_base2": 2.237, + "loss_pixel": 0.154, + "loss_text": 1.3966, + "ppl": 4.7143, + "step": 13371 + }, + { + "epoch": 0.07, + "global_step": 13372, + "learning_rate": 0.00044502504173622704, + "loss": 1.6106, + "loss_base2": 2.3236, + "loss_pixel": 0.1546, + "loss_text": 1.456, + "ppl": 5.0058, + "step": 13372 + }, + { + "epoch": 0.07, + "global_step": 13373, + "learning_rate": 0.00044502086811352255, + "loss": 1.5947, + "loss_base2": 2.3007, + "loss_pixel": 0.154, + "loss_text": 1.4407, + "ppl": 4.9269, + "step": 13373 + }, + { + "epoch": 0.07, + "global_step": 13374, + "learning_rate": 0.00044501669449081805, + "loss": 1.6017, + "loss_base2": 2.3108, + "loss_pixel": 0.1543, + "loss_text": 1.4473, + "ppl": 4.9615, + "step": 13374 + }, + { + "epoch": 0.07, + "global_step": 13375, + "learning_rate": 0.00044501252086811356, + "loss": 1.6061, + "loss_base2": 2.3171, + "loss_pixel": 0.154, + "loss_text": 1.4521, + "ppl": 4.9833, + "step": 13375 + }, + { + "epoch": 0.07, + "global_step": 13376, + "learning_rate": 0.000445008347245409, + "loss": 1.6119, + "loss_base2": 2.3255, + "loss_pixel": 0.1549, + "loss_text": 1.457, + "ppl": 5.0123, + "step": 13376 + }, + { + "epoch": 0.07, + "global_step": 13377, + "learning_rate": 0.0004450041736227045, + "loss": 1.6038, + "loss_base2": 2.3138, + "loss_pixel": 0.1543, + "loss_text": 1.4495, + "ppl": 4.9719, + "step": 13377 + }, + { + "epoch": 0.07, + "global_step": 13378, + "learning_rate": 0.00044500000000000003, + "loss": 1.6002, + "loss_base2": 2.3086, + "loss_pixel": 0.1559, + "loss_text": 1.4443, + "ppl": 4.954, + "step": 13378 + }, + { + "epoch": 0.07, + "global_step": 13379, + "learning_rate": 0.00044499582637729554, + "loss": 1.6109, + "loss_base2": 2.324, + "loss_pixel": 0.1552, + "loss_text": 1.4557, + "ppl": 5.0073, + "step": 13379 + }, + { + "epoch": 0.07, + "global_step": 13380, + "learning_rate": 0.000444991652754591, + "loss": 1.6113, + "loss_base2": 2.3246, + "loss_pixel": 0.1554, + "loss_text": 1.4559, + "ppl": 5.0093, + "step": 13380 + }, + { + "epoch": 0.07, + "global_step": 13381, + "learning_rate": 0.0004449874791318865, + "loss": 1.604, + "loss_base2": 2.3141, + "loss_pixel": 0.1547, + "loss_text": 1.4493, + "ppl": 4.9729, + "step": 13381 + }, + { + "epoch": 0.07, + "global_step": 13382, + "learning_rate": 0.000444983305509182, + "loss": 1.6153, + "loss_base2": 2.3304, + "loss_pixel": 0.1559, + "loss_text": 1.4595, + "ppl": 5.0294, + "step": 13382 + }, + { + "epoch": 0.07, + "global_step": 13383, + "learning_rate": 0.00044497913188647746, + "loss": 1.6029, + "loss_base2": 2.3125, + "loss_pixel": 0.1562, + "loss_text": 1.4467, + "ppl": 4.9674, + "step": 13383 + }, + { + "epoch": 0.07, + "global_step": 13384, + "learning_rate": 0.00044497495826377296, + "loss": 1.5983, + "loss_base2": 2.3059, + "loss_pixel": 0.1543, + "loss_text": 1.4441, + "ppl": 4.9446, + "step": 13384 + }, + { + "epoch": 0.07, + "global_step": 13385, + "learning_rate": 0.0004449707846410684, + "loss": 1.5952, + "loss_base2": 2.3014, + "loss_pixel": 0.1548, + "loss_text": 1.4404, + "ppl": 4.9293, + "step": 13385 + }, + { + "epoch": 0.07, + "global_step": 13386, + "learning_rate": 0.0004449666110183639, + "loss": 1.6026, + "loss_base2": 2.3121, + "loss_pixel": 0.1598, + "loss_text": 1.4428, + "ppl": 4.9659, + "step": 13386 + }, + { + "epoch": 0.07, + "global_step": 13387, + "learning_rate": 0.00044496243739565943, + "loss": 1.6037, + "loss_base2": 2.3137, + "loss_pixel": 0.161, + "loss_text": 1.4427, + "ppl": 4.9714, + "step": 13387 + }, + { + "epoch": 0.07, + "global_step": 13388, + "learning_rate": 0.00044495826377295494, + "loss": 1.6001, + "loss_base2": 2.3085, + "loss_pixel": 0.1632, + "loss_text": 1.437, + "ppl": 4.9535, + "step": 13388 + }, + { + "epoch": 0.07, + "global_step": 13389, + "learning_rate": 0.0004449540901502504, + "loss": 1.5039, + "loss_base2": 2.1697, + "loss_pixel": 0.1628, + "loss_text": 1.341, + "ppl": 4.4992, + "step": 13389 + }, + { + "epoch": 0.07, + "global_step": 13390, + "learning_rate": 0.0004449499165275459, + "loss": 1.3986, + "loss_base2": 2.0178, + "loss_pixel": 0.1879, + "loss_text": 1.2107, + "ppl": 4.0495, + "step": 13390 + }, + { + "epoch": 0.07, + "global_step": 13391, + "learning_rate": 0.0004449457429048414, + "loss": 1.4731, + "loss_base2": 2.1252, + "loss_pixel": 0.2662, + "loss_text": 1.2069, + "ppl": 4.3627, + "step": 13391 + }, + { + "epoch": 0.07, + "global_step": 13392, + "learning_rate": 0.0004449415692821369, + "loss": 1.5396, + "loss_base2": 2.2212, + "loss_pixel": 0.3157, + "loss_text": 1.2239, + "ppl": 4.6627, + "step": 13392 + }, + { + "epoch": 0.07, + "global_step": 13393, + "learning_rate": 0.0004449373956594324, + "loss": 1.5337, + "loss_base2": 2.2127, + "loss_pixel": 0.3204, + "loss_text": 1.2133, + "ppl": 4.6353, + "step": 13393 + }, + { + "epoch": 0.07, + "global_step": 13394, + "learning_rate": 0.0004449332220367279, + "loss": 1.5616, + "loss_base2": 2.2529, + "loss_pixel": 0.3409, + "loss_text": 1.2207, + "ppl": 4.7664, + "step": 13394 + }, + { + "epoch": 0.07, + "global_step": 13395, + "learning_rate": 0.0004449290484140234, + "loss": 1.5598, + "loss_base2": 2.2503, + "loss_pixel": 0.357, + "loss_text": 1.2029, + "ppl": 4.7579, + "step": 13395 + }, + { + "epoch": 0.07, + "global_step": 13396, + "learning_rate": 0.0004449248747913189, + "loss": 1.5695, + "loss_base2": 2.2643, + "loss_pixel": 0.352, + "loss_text": 1.2175, + "ppl": 4.8042, + "step": 13396 + }, + { + "epoch": 0.07, + "global_step": 13397, + "learning_rate": 0.0004449207011686144, + "loss": 1.5714, + "loss_base2": 2.2671, + "loss_pixel": 0.3438, + "loss_text": 1.2276, + "ppl": 4.8134, + "step": 13397 + }, + { + "epoch": 0.07, + "global_step": 13398, + "learning_rate": 0.00044491652754590985, + "loss": 1.5336, + "loss_base2": 2.2125, + "loss_pixel": 0.337, + "loss_text": 1.1966, + "ppl": 4.6348, + "step": 13398 + }, + { + "epoch": 0.07, + "global_step": 13399, + "learning_rate": 0.00044491235392320536, + "loss": 1.5817, + "loss_base2": 2.2819, + "loss_pixel": 0.3539, + "loss_text": 1.2279, + "ppl": 4.8632, + "step": 13399 + }, + { + "epoch": 0.07, + "global_step": 13400, + "learning_rate": 0.00044490818030050086, + "loss": 1.5623, + "loss_base2": 2.2539, + "loss_pixel": 0.3492, + "loss_text": 1.2131, + "ppl": 4.7698, + "step": 13400 + }, + { + "epoch": 0.07, + "global_step": 13401, + "learning_rate": 0.00044490400667779637, + "loss": 1.5786, + "loss_base2": 2.2774, + "loss_pixel": 0.348, + "loss_text": 1.2307, + "ppl": 4.8482, + "step": 13401 + }, + { + "epoch": 0.07, + "global_step": 13402, + "learning_rate": 0.0004448998330550918, + "loss": 1.5427, + "loss_base2": 2.2256, + "loss_pixel": 0.3417, + "loss_text": 1.201, + "ppl": 4.6772, + "step": 13402 + }, + { + "epoch": 0.07, + "global_step": 13403, + "learning_rate": 0.0004448956594323873, + "loss": 1.5298, + "loss_base2": 2.207, + "loss_pixel": 0.3388, + "loss_text": 1.1909, + "ppl": 4.6173, + "step": 13403 + }, + { + "epoch": 0.07, + "global_step": 13404, + "learning_rate": 0.0004448914858096828, + "loss": 1.5819, + "loss_base2": 2.2822, + "loss_pixel": 0.3525, + "loss_text": 1.2295, + "ppl": 4.8642, + "step": 13404 + }, + { + "epoch": 0.07, + "global_step": 13405, + "learning_rate": 0.0004448873121869783, + "loss": 1.7369, + "loss_base2": 2.5058, + "loss_pixel": 0.3664, + "loss_text": 1.3706, + "ppl": 5.6797, + "step": 13405 + }, + { + "epoch": 0.07, + "global_step": 13406, + "learning_rate": 0.0004448831385642738, + "loss": 1.8275, + "loss_base2": 2.6365, + "loss_pixel": 0.3633, + "loss_text": 1.4641, + "ppl": 6.2183, + "step": 13406 + }, + { + "epoch": 0.07, + "global_step": 13407, + "learning_rate": 0.00044487896494156925, + "loss": 1.8431, + "loss_base2": 2.659, + "loss_pixel": 0.3577, + "loss_text": 1.4854, + "ppl": 6.3161, + "step": 13407 + }, + { + "epoch": 0.07, + "global_step": 13408, + "learning_rate": 0.00044487479131886476, + "loss": 1.8388, + "loss_base2": 2.6528, + "loss_pixel": 0.3541, + "loss_text": 1.4847, + "ppl": 6.289, + "step": 13408 + }, + { + "epoch": 0.07, + "global_step": 13409, + "learning_rate": 0.00044487061769616027, + "loss": 1.87, + "loss_base2": 2.6978, + "loss_pixel": 0.3743, + "loss_text": 1.4957, + "ppl": 6.4883, + "step": 13409 + }, + { + "epoch": 0.07, + "global_step": 13410, + "learning_rate": 0.0004448664440734558, + "loss": 1.8585, + "loss_base2": 2.6812, + "loss_pixel": 0.3676, + "loss_text": 1.4909, + "ppl": 6.4141, + "step": 13410 + }, + { + "epoch": 0.07, + "global_step": 13411, + "learning_rate": 0.0004448622704507513, + "loss": 1.8799, + "loss_base2": 2.7121, + "loss_pixel": 0.3622, + "loss_text": 1.5177, + "ppl": 6.5528, + "step": 13411 + }, + { + "epoch": 0.07, + "global_step": 13412, + "learning_rate": 0.00044485809682804674, + "loss": 1.8661, + "loss_base2": 2.6922, + "loss_pixel": 0.356, + "loss_text": 1.51, + "ppl": 6.463, + "step": 13412 + }, + { + "epoch": 0.07, + "global_step": 13413, + "learning_rate": 0.00044485392320534224, + "loss": 1.8627, + "loss_base2": 2.6873, + "loss_pixel": 0.3534, + "loss_text": 1.5092, + "ppl": 6.4411, + "step": 13413 + }, + { + "epoch": 0.07, + "global_step": 13414, + "learning_rate": 0.00044484974958263775, + "loss": 1.9132, + "loss_base2": 2.7602, + "loss_pixel": 0.3525, + "loss_text": 1.5607, + "ppl": 6.7747, + "step": 13414 + }, + { + "epoch": 0.07, + "global_step": 13415, + "learning_rate": 0.00044484557595993326, + "loss": 1.8593, + "loss_base2": 2.6824, + "loss_pixel": 0.3473, + "loss_text": 1.5121, + "ppl": 6.4192, + "step": 13415 + }, + { + "epoch": 0.07, + "global_step": 13416, + "learning_rate": 0.00044484140233722876, + "loss": 1.8501, + "loss_base2": 2.6691, + "loss_pixel": 0.3423, + "loss_text": 1.5078, + "ppl": 6.3605, + "step": 13416 + }, + { + "epoch": 0.07, + "global_step": 13417, + "learning_rate": 0.0004448372287145242, + "loss": 1.8438, + "loss_base2": 2.66, + "loss_pixel": 0.3382, + "loss_text": 1.5056, + "ppl": 6.3205, + "step": 13417 + }, + { + "epoch": 0.07, + "global_step": 13418, + "learning_rate": 0.0004448330550918197, + "loss": 1.8397, + "loss_base2": 2.6541, + "loss_pixel": 0.3389, + "loss_text": 1.5008, + "ppl": 6.2946, + "step": 13418 + }, + { + "epoch": 0.07, + "global_step": 13419, + "learning_rate": 0.00044482888146911523, + "loss": 1.8377, + "loss_base2": 2.6512, + "loss_pixel": 0.3406, + "loss_text": 1.4971, + "ppl": 6.2821, + "step": 13419 + }, + { + "epoch": 0.07, + "global_step": 13420, + "learning_rate": 0.00044482470784641074, + "loss": 1.8299, + "loss_base2": 2.64, + "loss_pixel": 0.3322, + "loss_text": 1.4977, + "ppl": 6.2333, + "step": 13420 + }, + { + "epoch": 0.07, + "global_step": 13421, + "learning_rate": 0.00044482053422370614, + "loss": 1.8391, + "loss_base2": 2.6533, + "loss_pixel": 0.3307, + "loss_text": 1.5083, + "ppl": 6.2909, + "step": 13421 + }, + { + "epoch": 0.07, + "global_step": 13422, + "learning_rate": 0.00044481636060100165, + "loss": 1.8294, + "loss_base2": 2.6393, + "loss_pixel": 0.328, + "loss_text": 1.5014, + "ppl": 6.2301, + "step": 13422 + }, + { + "epoch": 0.07, + "global_step": 13423, + "learning_rate": 0.00044481218697829715, + "loss": 1.8268, + "loss_base2": 2.6355, + "loss_pixel": 0.3252, + "loss_text": 1.5015, + "ppl": 6.214, + "step": 13423 + }, + { + "epoch": 0.07, + "global_step": 13424, + "learning_rate": 0.00044480801335559266, + "loss": 1.8264, + "loss_base2": 2.6349, + "loss_pixel": 0.3277, + "loss_text": 1.4987, + "ppl": 6.2115, + "step": 13424 + }, + { + "epoch": 0.07, + "global_step": 13425, + "learning_rate": 0.00044480383973288817, + "loss": 1.8073, + "loss_base2": 2.6074, + "loss_pixel": 0.3226, + "loss_text": 1.4847, + "ppl": 6.094, + "step": 13425 + }, + { + "epoch": 0.07, + "global_step": 13426, + "learning_rate": 0.0004447996661101836, + "loss": 1.8047, + "loss_base2": 2.6036, + "loss_pixel": 0.3203, + "loss_text": 1.4845, + "ppl": 6.0781, + "step": 13426 + }, + { + "epoch": 0.07, + "global_step": 13427, + "learning_rate": 0.00044479549248747913, + "loss": 1.7916, + "loss_base2": 2.5847, + "loss_pixel": 0.3171, + "loss_text": 1.4745, + "ppl": 5.999, + "step": 13427 + }, + { + "epoch": 0.07, + "global_step": 13428, + "learning_rate": 0.00044479131886477464, + "loss": 1.7779, + "loss_base2": 2.565, + "loss_pixel": 0.3124, + "loss_text": 1.4656, + "ppl": 5.9174, + "step": 13428 + }, + { + "epoch": 0.07, + "global_step": 13429, + "learning_rate": 0.00044478714524207014, + "loss": 1.7833, + "loss_base2": 2.5728, + "loss_pixel": 0.3122, + "loss_text": 1.4711, + "ppl": 5.9495, + "step": 13429 + }, + { + "epoch": 0.07, + "global_step": 13430, + "learning_rate": 0.0004447829716193656, + "loss": 1.7921, + "loss_base2": 2.5855, + "loss_pixel": 0.3094, + "loss_text": 1.4827, + "ppl": 6.002, + "step": 13430 + }, + { + "epoch": 0.07, + "global_step": 13431, + "learning_rate": 0.0004447787979966611, + "loss": 1.7588, + "loss_base2": 2.5374, + "loss_pixel": 0.3061, + "loss_text": 1.4527, + "ppl": 5.8055, + "step": 13431 + }, + { + "epoch": 0.07, + "global_step": 13432, + "learning_rate": 0.0004447746243739566, + "loss": 1.7946, + "loss_base2": 2.5891, + "loss_pixel": 0.3067, + "loss_text": 1.4879, + "ppl": 6.0171, + "step": 13432 + }, + { + "epoch": 0.07, + "global_step": 13433, + "learning_rate": 0.0004447704507512521, + "loss": 1.7768, + "loss_base2": 2.5634, + "loss_pixel": 0.303, + "loss_text": 1.4738, + "ppl": 5.9109, + "step": 13433 + }, + { + "epoch": 0.07, + "global_step": 13434, + "learning_rate": 0.0004447662771285476, + "loss": 1.764, + "loss_base2": 2.5449, + "loss_pixel": 0.3009, + "loss_text": 1.4631, + "ppl": 5.8357, + "step": 13434 + }, + { + "epoch": 0.07, + "global_step": 13435, + "learning_rate": 0.0004447621035058431, + "loss": 1.7787, + "loss_base2": 2.5661, + "loss_pixel": 0.3002, + "loss_text": 1.4785, + "ppl": 5.9222, + "step": 13435 + }, + { + "epoch": 0.07, + "global_step": 13436, + "learning_rate": 0.0004447579298831386, + "loss": 1.7758, + "loss_base2": 2.5619, + "loss_pixel": 0.2978, + "loss_text": 1.478, + "ppl": 5.905, + "step": 13436 + }, + { + "epoch": 0.07, + "global_step": 13437, + "learning_rate": 0.0004447537562604341, + "loss": 1.7577, + "loss_base2": 2.5358, + "loss_pixel": 0.2984, + "loss_text": 1.4593, + "ppl": 5.7991, + "step": 13437 + }, + { + "epoch": 0.07, + "global_step": 13438, + "learning_rate": 0.0004447495826377296, + "loss": 1.745, + "loss_base2": 2.5175, + "loss_pixel": 0.2997, + "loss_text": 1.4453, + "ppl": 5.7259, + "step": 13438 + }, + { + "epoch": 0.07, + "global_step": 13439, + "learning_rate": 0.000444745409015025, + "loss": 1.768, + "loss_base2": 2.5507, + "loss_pixel": 0.2971, + "loss_text": 1.4709, + "ppl": 5.8591, + "step": 13439 + }, + { + "epoch": 0.07, + "global_step": 13440, + "learning_rate": 0.0004447412353923205, + "loss": 1.7281, + "loss_base2": 2.4931, + "loss_pixel": 0.2983, + "loss_text": 1.4297, + "ppl": 5.6299, + "step": 13440 + }, + { + "epoch": 0.07, + "global_step": 13441, + "learning_rate": 0.000444737061769616, + "loss": 1.7599, + "loss_base2": 2.539, + "loss_pixel": 0.2965, + "loss_text": 1.4634, + "ppl": 5.8119, + "step": 13441 + }, + { + "epoch": 0.07, + "global_step": 13442, + "learning_rate": 0.0004447328881469115, + "loss": 1.7409, + "loss_base2": 2.5116, + "loss_pixel": 0.2955, + "loss_text": 1.4455, + "ppl": 5.7025, + "step": 13442 + }, + { + "epoch": 0.07, + "global_step": 13443, + "learning_rate": 0.00044472871452420703, + "loss": 1.7591, + "loss_base2": 2.5378, + "loss_pixel": 0.2944, + "loss_text": 1.4647, + "ppl": 5.8072, + "step": 13443 + }, + { + "epoch": 0.07, + "global_step": 13444, + "learning_rate": 0.0004447245409015025, + "loss": 1.7439, + "loss_base2": 2.5159, + "loss_pixel": 0.2926, + "loss_text": 1.4513, + "ppl": 5.7196, + "step": 13444 + }, + { + "epoch": 0.07, + "global_step": 13445, + "learning_rate": 0.000444720367278798, + "loss": 1.7503, + "loss_base2": 2.5251, + "loss_pixel": 0.2903, + "loss_text": 1.46, + "ppl": 5.7563, + "step": 13445 + }, + { + "epoch": 0.07, + "global_step": 13446, + "learning_rate": 0.0004447161936560935, + "loss": 1.7329, + "loss_base2": 2.5, + "loss_pixel": 0.2883, + "loss_text": 1.4446, + "ppl": 5.657, + "step": 13446 + }, + { + "epoch": 0.07, + "global_step": 13447, + "learning_rate": 0.000444712020033389, + "loss": 1.74, + "loss_base2": 2.5103, + "loss_pixel": 0.2868, + "loss_text": 1.4532, + "ppl": 5.6973, + "step": 13447 + }, + { + "epoch": 0.07, + "global_step": 13448, + "learning_rate": 0.00044470784641068446, + "loss": 1.7435, + "loss_base2": 2.5153, + "loss_pixel": 0.2856, + "loss_text": 1.4579, + "ppl": 5.7173, + "step": 13448 + }, + { + "epoch": 0.07, + "global_step": 13449, + "learning_rate": 0.00044470367278797996, + "loss": 1.6914, + "loss_base2": 2.4402, + "loss_pixel": 0.2832, + "loss_text": 1.4082, + "ppl": 5.4271, + "step": 13449 + }, + { + "epoch": 0.07, + "global_step": 13450, + "learning_rate": 0.00044469949916527547, + "loss": 1.4987, + "loss_base2": 2.1622, + "loss_pixel": 0.2812, + "loss_text": 1.2175, + "ppl": 4.4759, + "step": 13450 + }, + { + "epoch": 0.07, + "global_step": 13451, + "learning_rate": 0.000444695325542571, + "loss": 1.5263, + "loss_base2": 2.202, + "loss_pixel": 0.2807, + "loss_text": 1.2457, + "ppl": 4.6011, + "step": 13451 + }, + { + "epoch": 0.07, + "global_step": 13452, + "learning_rate": 0.0004446911519198665, + "loss": 1.5421, + "loss_base2": 2.2248, + "loss_pixel": 0.2791, + "loss_text": 1.263, + "ppl": 4.6744, + "step": 13452 + }, + { + "epoch": 0.07, + "global_step": 13453, + "learning_rate": 0.00044468697829716194, + "loss": 1.4793, + "loss_base2": 2.1342, + "loss_pixel": 0.2788, + "loss_text": 1.2005, + "ppl": 4.3899, + "step": 13453 + }, + { + "epoch": 0.07, + "global_step": 13454, + "learning_rate": 0.00044468280467445745, + "loss": 1.4907, + "loss_base2": 2.1506, + "loss_pixel": 0.2785, + "loss_text": 1.2122, + "ppl": 4.4402, + "step": 13454 + }, + { + "epoch": 0.07, + "global_step": 13455, + "learning_rate": 0.00044467863105175295, + "loss": 1.4884, + "loss_base2": 2.1473, + "loss_pixel": 0.2862, + "loss_text": 1.2022, + "ppl": 4.43, + "step": 13455 + }, + { + "epoch": 0.07, + "global_step": 13456, + "learning_rate": 0.00044467445742904846, + "loss": 1.4893, + "loss_base2": 2.1486, + "loss_pixel": 0.2894, + "loss_text": 1.1999, + "ppl": 4.434, + "step": 13456 + }, + { + "epoch": 0.07, + "global_step": 13457, + "learning_rate": 0.0004446702838063439, + "loss": 1.5079, + "loss_base2": 2.1754, + "loss_pixel": 0.2999, + "loss_text": 1.208, + "ppl": 4.5172, + "step": 13457 + }, + { + "epoch": 0.07, + "global_step": 13458, + "learning_rate": 0.00044466611018363937, + "loss": 1.6425, + "loss_base2": 2.3696, + "loss_pixel": 0.2996, + "loss_text": 1.343, + "ppl": 5.1681, + "step": 13458 + }, + { + "epoch": 0.07, + "global_step": 13459, + "learning_rate": 0.0004446619365609349, + "loss": 1.7564, + "loss_base2": 2.5339, + "loss_pixel": 0.2947, + "loss_text": 1.4618, + "ppl": 5.7916, + "step": 13459 + }, + { + "epoch": 0.07, + "global_step": 13460, + "learning_rate": 0.0004446577629382304, + "loss": 1.7503, + "loss_base2": 2.5251, + "loss_pixel": 0.291, + "loss_text": 1.4593, + "ppl": 5.7563, + "step": 13460 + }, + { + "epoch": 0.07, + "global_step": 13461, + "learning_rate": 0.0004446535893155259, + "loss": 1.7534, + "loss_base2": 2.5296, + "loss_pixel": 0.2881, + "loss_text": 1.4653, + "ppl": 5.7742, + "step": 13461 + }, + { + "epoch": 0.07, + "global_step": 13462, + "learning_rate": 0.00044464941569282134, + "loss": 1.7556, + "loss_base2": 2.5328, + "loss_pixel": 0.2865, + "loss_text": 1.4691, + "ppl": 5.7869, + "step": 13462 + }, + { + "epoch": 0.07, + "global_step": 13463, + "learning_rate": 0.00044464524207011685, + "loss": 1.7399, + "loss_base2": 2.5101, + "loss_pixel": 0.2852, + "loss_text": 1.4547, + "ppl": 5.6968, + "step": 13463 + }, + { + "epoch": 0.07, + "global_step": 13464, + "learning_rate": 0.00044464106844741236, + "loss": 1.7339, + "loss_base2": 2.5015, + "loss_pixel": 0.2819, + "loss_text": 1.452, + "ppl": 5.6627, + "step": 13464 + }, + { + "epoch": 0.07, + "global_step": 13465, + "learning_rate": 0.00044463689482470786, + "loss": 1.7475, + "loss_base2": 2.5211, + "loss_pixel": 0.281, + "loss_text": 1.4665, + "ppl": 5.7402, + "step": 13465 + }, + { + "epoch": 0.07, + "global_step": 13466, + "learning_rate": 0.0004446327212020033, + "loss": 1.7463, + "loss_base2": 2.5194, + "loss_pixel": 0.2806, + "loss_text": 1.4658, + "ppl": 5.7333, + "step": 13466 + }, + { + "epoch": 0.07, + "global_step": 13467, + "learning_rate": 0.0004446285475792988, + "loss": 1.7373, + "loss_base2": 2.5064, + "loss_pixel": 0.2783, + "loss_text": 1.459, + "ppl": 5.682, + "step": 13467 + }, + { + "epoch": 0.07, + "global_step": 13468, + "learning_rate": 0.00044462437395659433, + "loss": 1.7332, + "loss_base2": 2.5005, + "loss_pixel": 0.2773, + "loss_text": 1.4559, + "ppl": 5.6587, + "step": 13468 + }, + { + "epoch": 0.07, + "global_step": 13469, + "learning_rate": 0.00044462020033388984, + "loss": 1.7123, + "loss_base2": 2.4703, + "loss_pixel": 0.2763, + "loss_text": 1.436, + "ppl": 5.5417, + "step": 13469 + }, + { + "epoch": 0.07, + "global_step": 13470, + "learning_rate": 0.00044461602671118535, + "loss": 1.7327, + "loss_base2": 2.4998, + "loss_pixel": 0.2747, + "loss_text": 1.458, + "ppl": 5.6559, + "step": 13470 + }, + { + "epoch": 0.07, + "global_step": 13471, + "learning_rate": 0.0004446118530884808, + "loss": 1.7242, + "loss_base2": 2.4875, + "loss_pixel": 0.273, + "loss_text": 1.4512, + "ppl": 5.608, + "step": 13471 + }, + { + "epoch": 0.07, + "global_step": 13472, + "learning_rate": 0.0004446076794657763, + "loss": 1.7445, + "loss_base2": 2.5168, + "loss_pixel": 0.2724, + "loss_text": 1.4721, + "ppl": 5.723, + "step": 13472 + }, + { + "epoch": 0.07, + "global_step": 13473, + "learning_rate": 0.0004446035058430718, + "loss": 1.7189, + "loss_base2": 2.4798, + "loss_pixel": 0.2705, + "loss_text": 1.4484, + "ppl": 5.5784, + "step": 13473 + }, + { + "epoch": 0.07, + "global_step": 13474, + "learning_rate": 0.0004445993322203673, + "loss": 1.7168, + "loss_base2": 2.4768, + "loss_pixel": 0.2701, + "loss_text": 1.4467, + "ppl": 5.5667, + "step": 13474 + }, + { + "epoch": 0.07, + "global_step": 13475, + "learning_rate": 0.00044459515859766283, + "loss": 1.7287, + "loss_base2": 2.494, + "loss_pixel": 0.269, + "loss_text": 1.4597, + "ppl": 5.6333, + "step": 13475 + }, + { + "epoch": 0.07, + "global_step": 13476, + "learning_rate": 0.0004445909849749583, + "loss": 1.7271, + "loss_base2": 2.4917, + "loss_pixel": 0.2683, + "loss_text": 1.4588, + "ppl": 5.6243, + "step": 13476 + }, + { + "epoch": 0.07, + "global_step": 13477, + "learning_rate": 0.00044458681135225374, + "loss": 1.7236, + "loss_base2": 2.4866, + "loss_pixel": 0.2691, + "loss_text": 1.4545, + "ppl": 5.6047, + "step": 13477 + }, + { + "epoch": 0.07, + "global_step": 13478, + "learning_rate": 0.00044458263772954924, + "loss": 1.7176, + "loss_base2": 2.478, + "loss_pixel": 0.2706, + "loss_text": 1.4471, + "ppl": 5.5711, + "step": 13478 + }, + { + "epoch": 0.07, + "global_step": 13479, + "learning_rate": 0.00044457846410684475, + "loss": 1.7186, + "loss_base2": 2.4794, + "loss_pixel": 0.2681, + "loss_text": 1.4505, + "ppl": 5.5767, + "step": 13479 + }, + { + "epoch": 0.07, + "global_step": 13480, + "learning_rate": 0.0004445742904841402, + "loss": 1.6897, + "loss_base2": 2.4377, + "loss_pixel": 0.2669, + "loss_text": 1.4229, + "ppl": 5.4179, + "step": 13480 + }, + { + "epoch": 0.07, + "global_step": 13481, + "learning_rate": 0.0004445701168614357, + "loss": 1.7324, + "loss_base2": 2.4993, + "loss_pixel": 0.2675, + "loss_text": 1.4649, + "ppl": 5.6542, + "step": 13481 + }, + { + "epoch": 0.07, + "global_step": 13482, + "learning_rate": 0.0004445659432387312, + "loss": 1.7014, + "loss_base2": 2.4546, + "loss_pixel": 0.2651, + "loss_text": 1.4363, + "ppl": 5.4816, + "step": 13482 + }, + { + "epoch": 0.07, + "global_step": 13483, + "learning_rate": 0.0004445617696160267, + "loss": 1.7125, + "loss_base2": 2.4706, + "loss_pixel": 0.2632, + "loss_text": 1.4493, + "ppl": 5.5428, + "step": 13483 + }, + { + "epoch": 0.07, + "global_step": 13484, + "learning_rate": 0.00044455759599332223, + "loss": 1.6907, + "loss_base2": 2.4392, + "loss_pixel": 0.2627, + "loss_text": 1.428, + "ppl": 5.4233, + "step": 13484 + }, + { + "epoch": 0.07, + "global_step": 13485, + "learning_rate": 0.0004445534223706177, + "loss": 1.6934, + "loss_base2": 2.4431, + "loss_pixel": 0.2619, + "loss_text": 1.4315, + "ppl": 5.4379, + "step": 13485 + }, + { + "epoch": 0.07, + "global_step": 13486, + "learning_rate": 0.0004445492487479132, + "loss": 1.7056, + "loss_base2": 2.4607, + "loss_pixel": 0.2615, + "loss_text": 1.4441, + "ppl": 5.5047, + "step": 13486 + }, + { + "epoch": 0.07, + "global_step": 13487, + "learning_rate": 0.0004445450751252087, + "loss": 1.7119, + "loss_base2": 2.4697, + "loss_pixel": 0.2599, + "loss_text": 1.452, + "ppl": 5.5395, + "step": 13487 + }, + { + "epoch": 0.07, + "global_step": 13488, + "learning_rate": 0.0004445409015025042, + "loss": 1.7148, + "loss_base2": 2.4739, + "loss_pixel": 0.259, + "loss_text": 1.4558, + "ppl": 5.5556, + "step": 13488 + }, + { + "epoch": 0.07, + "global_step": 13489, + "learning_rate": 0.00044453672787979966, + "loss": 1.7267, + "loss_base2": 2.4911, + "loss_pixel": 0.2583, + "loss_text": 1.4684, + "ppl": 5.6221, + "step": 13489 + }, + { + "epoch": 0.07, + "global_step": 13490, + "learning_rate": 0.00044453255425709517, + "loss": 1.7093, + "loss_base2": 2.466, + "loss_pixel": 0.2588, + "loss_text": 1.4505, + "ppl": 5.5251, + "step": 13490 + }, + { + "epoch": 0.07, + "global_step": 13491, + "learning_rate": 0.0004445283806343907, + "loss": 1.7352, + "loss_base2": 2.5034, + "loss_pixel": 0.2675, + "loss_text": 1.4677, + "ppl": 5.6701, + "step": 13491 + }, + { + "epoch": 0.07, + "global_step": 13492, + "learning_rate": 0.0004445242070116862, + "loss": 1.7073, + "loss_base2": 2.4631, + "loss_pixel": 0.2626, + "loss_text": 1.4447, + "ppl": 5.5141, + "step": 13492 + }, + { + "epoch": 0.07, + "global_step": 13493, + "learning_rate": 0.0004445200333889817, + "loss": 1.7075, + "loss_base2": 2.4634, + "loss_pixel": 0.2643, + "loss_text": 1.4431, + "ppl": 5.5152, + "step": 13493 + }, + { + "epoch": 0.07, + "global_step": 13494, + "learning_rate": 0.00044451585976627714, + "loss": 1.6896, + "loss_base2": 2.4376, + "loss_pixel": 0.2604, + "loss_text": 1.4292, + "ppl": 5.4173, + "step": 13494 + }, + { + "epoch": 0.07, + "global_step": 13495, + "learning_rate": 0.00044451168614357265, + "loss": 1.6921, + "loss_base2": 2.4412, + "loss_pixel": 0.2596, + "loss_text": 1.4325, + "ppl": 5.4309, + "step": 13495 + }, + { + "epoch": 0.07, + "global_step": 13496, + "learning_rate": 0.0004445075125208681, + "loss": 1.6961, + "loss_base2": 2.447, + "loss_pixel": 0.2582, + "loss_text": 1.4379, + "ppl": 5.4526, + "step": 13496 + }, + { + "epoch": 0.07, + "global_step": 13497, + "learning_rate": 0.0004445033388981636, + "loss": 1.6974, + "loss_base2": 2.4488, + "loss_pixel": 0.2574, + "loss_text": 1.44, + "ppl": 5.4597, + "step": 13497 + }, + { + "epoch": 0.07, + "global_step": 13498, + "learning_rate": 0.00044449916527545906, + "loss": 1.6948, + "loss_base2": 2.4451, + "loss_pixel": 0.2559, + "loss_text": 1.4389, + "ppl": 5.4456, + "step": 13498 + }, + { + "epoch": 0.07, + "global_step": 13499, + "learning_rate": 0.00044449499165275457, + "loss": 1.7002, + "loss_base2": 2.4529, + "loss_pixel": 0.2549, + "loss_text": 1.4452, + "ppl": 5.475, + "step": 13499 + }, + { + "epoch": 0.07, + "global_step": 13500, + "learning_rate": 0.0004444908180300501, + "loss": 1.6844, + "loss_base2": 2.4301, + "loss_pixel": 0.2534, + "loss_text": 1.4309, + "ppl": 5.3892, + "step": 13500 + }, + { + "epoch": 0.07, + "global_step": 13501, + "learning_rate": 0.0004444866444073456, + "loss": 1.6768, + "loss_base2": 2.4191, + "loss_pixel": 0.2546, + "loss_text": 1.4222, + "ppl": 5.3484, + "step": 13501 + }, + { + "epoch": 0.07, + "global_step": 13502, + "learning_rate": 0.0004444824707846411, + "loss": 1.4866, + "loss_base2": 2.1447, + "loss_pixel": 0.2513, + "loss_text": 1.2353, + "ppl": 4.422, + "step": 13502 + }, + { + "epoch": 0.07, + "global_step": 13503, + "learning_rate": 0.00044447829716193655, + "loss": 1.4956, + "loss_base2": 2.1577, + "loss_pixel": 0.2504, + "loss_text": 1.2453, + "ppl": 4.462, + "step": 13503 + }, + { + "epoch": 0.07, + "global_step": 13504, + "learning_rate": 0.00044447412353923205, + "loss": 1.4786, + "loss_base2": 2.1332, + "loss_pixel": 0.2496, + "loss_text": 1.2291, + "ppl": 4.3868, + "step": 13504 + }, + { + "epoch": 0.07, + "global_step": 13505, + "learning_rate": 0.00044446994991652756, + "loss": 1.4508, + "loss_base2": 2.0931, + "loss_pixel": 0.2492, + "loss_text": 1.2016, + "ppl": 4.2665, + "step": 13505 + }, + { + "epoch": 0.07, + "global_step": 13506, + "learning_rate": 0.00044446577629382307, + "loss": 1.4447, + "loss_base2": 2.0843, + "loss_pixel": 0.2497, + "loss_text": 1.195, + "ppl": 4.2406, + "step": 13506 + }, + { + "epoch": 0.07, + "global_step": 13507, + "learning_rate": 0.0004444616026711185, + "loss": 1.4447, + "loss_base2": 2.0843, + "loss_pixel": 0.2481, + "loss_text": 1.1966, + "ppl": 4.2406, + "step": 13507 + }, + { + "epoch": 0.07, + "global_step": 13508, + "learning_rate": 0.00044445742904841403, + "loss": 1.4688, + "loss_base2": 2.119, + "loss_pixel": 0.2472, + "loss_text": 1.2217, + "ppl": 4.344, + "step": 13508 + }, + { + "epoch": 0.07, + "global_step": 13509, + "learning_rate": 0.00044445325542570954, + "loss": 1.4592, + "loss_base2": 2.1052, + "loss_pixel": 0.245, + "loss_text": 1.2142, + "ppl": 4.3025, + "step": 13509 + }, + { + "epoch": 0.07, + "global_step": 13510, + "learning_rate": 0.00044444908180300504, + "loss": 1.5808, + "loss_base2": 2.2806, + "loss_pixel": 0.2454, + "loss_text": 1.3354, + "ppl": 4.8588, + "step": 13510 + }, + { + "epoch": 0.07, + "global_step": 13511, + "learning_rate": 0.00044444490818030055, + "loss": 1.6874, + "loss_base2": 2.4344, + "loss_pixel": 0.2459, + "loss_text": 1.4415, + "ppl": 5.4054, + "step": 13511 + }, + { + "epoch": 0.07, + "global_step": 13512, + "learning_rate": 0.000444440734557596, + "loss": 1.7171, + "loss_base2": 2.4773, + "loss_pixel": 0.2465, + "loss_text": 1.4706, + "ppl": 5.5684, + "step": 13512 + }, + { + "epoch": 0.07, + "global_step": 13513, + "learning_rate": 0.0004444365609348915, + "loss": 1.6851, + "loss_base2": 2.4311, + "loss_pixel": 0.2448, + "loss_text": 1.4404, + "ppl": 5.393, + "step": 13513 + }, + { + "epoch": 0.07, + "global_step": 13514, + "learning_rate": 0.000444432387312187, + "loss": 1.7121, + "loss_base2": 2.47, + "loss_pixel": 0.2442, + "loss_text": 1.4679, + "ppl": 5.5406, + "step": 13514 + }, + { + "epoch": 0.07, + "global_step": 13515, + "learning_rate": 0.00044442821368948247, + "loss": 1.6848, + "loss_base2": 2.4307, + "loss_pixel": 0.2441, + "loss_text": 1.4407, + "ppl": 5.3914, + "step": 13515 + }, + { + "epoch": 0.07, + "global_step": 13516, + "learning_rate": 0.0004444240400667779, + "loss": 1.6971, + "loss_base2": 2.4484, + "loss_pixel": 0.2427, + "loss_text": 1.4544, + "ppl": 5.4581, + "step": 13516 + }, + { + "epoch": 0.07, + "global_step": 13517, + "learning_rate": 0.00044441986644407343, + "loss": 1.7085, + "loss_base2": 2.4648, + "loss_pixel": 0.2399, + "loss_text": 1.4686, + "ppl": 5.5207, + "step": 13517 + }, + { + "epoch": 0.07, + "global_step": 13518, + "learning_rate": 0.00044441569282136894, + "loss": 1.69, + "loss_base2": 2.4382, + "loss_pixel": 0.2404, + "loss_text": 1.4496, + "ppl": 5.4195, + "step": 13518 + }, + { + "epoch": 0.07, + "global_step": 13519, + "learning_rate": 0.00044441151919866445, + "loss": 1.6871, + "loss_base2": 2.434, + "loss_pixel": 0.2367, + "loss_text": 1.4505, + "ppl": 5.4038, + "step": 13519 + }, + { + "epoch": 0.07, + "global_step": 13520, + "learning_rate": 0.00044440734557595995, + "loss": 1.6954, + "loss_base2": 2.4459, + "loss_pixel": 0.2375, + "loss_text": 1.4579, + "ppl": 5.4488, + "step": 13520 + }, + { + "epoch": 0.07, + "global_step": 13521, + "learning_rate": 0.0004444031719532554, + "loss": 1.6566, + "loss_base2": 2.39, + "loss_pixel": 0.2357, + "loss_text": 1.4209, + "ppl": 5.2415, + "step": 13521 + }, + { + "epoch": 0.07, + "global_step": 13522, + "learning_rate": 0.0004443989983305509, + "loss": 1.6783, + "loss_base2": 2.4213, + "loss_pixel": 0.2334, + "loss_text": 1.445, + "ppl": 5.3564, + "step": 13522 + }, + { + "epoch": 0.07, + "global_step": 13523, + "learning_rate": 0.0004443948247078464, + "loss": 1.6749, + "loss_base2": 2.4164, + "loss_pixel": 0.2301, + "loss_text": 1.4448, + "ppl": 5.3383, + "step": 13523 + }, + { + "epoch": 0.07, + "global_step": 13524, + "learning_rate": 0.00044439065108514193, + "loss": 1.6787, + "loss_base2": 2.4219, + "loss_pixel": 0.2295, + "loss_text": 1.4492, + "ppl": 5.3586, + "step": 13524 + }, + { + "epoch": 0.07, + "global_step": 13525, + "learning_rate": 0.0004443864774624374, + "loss": 1.6568, + "loss_base2": 2.3903, + "loss_pixel": 0.2286, + "loss_text": 1.4282, + "ppl": 5.2425, + "step": 13525 + }, + { + "epoch": 0.07, + "global_step": 13526, + "learning_rate": 0.0004443823038397329, + "loss": 1.6757, + "loss_base2": 2.4175, + "loss_pixel": 0.2279, + "loss_text": 1.4477, + "ppl": 5.3425, + "step": 13526 + }, + { + "epoch": 0.07, + "global_step": 13527, + "learning_rate": 0.0004443781302170284, + "loss": 1.6798, + "loss_base2": 2.4234, + "loss_pixel": 0.2408, + "loss_text": 1.439, + "ppl": 5.3645, + "step": 13527 + }, + { + "epoch": 0.07, + "global_step": 13528, + "learning_rate": 0.0004443739565943239, + "loss": 1.6806, + "loss_base2": 2.4246, + "loss_pixel": 0.2489, + "loss_text": 1.4317, + "ppl": 5.3688, + "step": 13528 + }, + { + "epoch": 0.07, + "global_step": 13529, + "learning_rate": 0.0004443697829716194, + "loss": 1.708, + "loss_base2": 2.4641, + "loss_pixel": 0.2639, + "loss_text": 1.4441, + "ppl": 5.5179, + "step": 13529 + }, + { + "epoch": 0.07, + "global_step": 13530, + "learning_rate": 0.00044436560934891486, + "loss": 1.6974, + "loss_base2": 2.4488, + "loss_pixel": 0.2645, + "loss_text": 1.4329, + "ppl": 5.4597, + "step": 13530 + }, + { + "epoch": 0.07, + "global_step": 13531, + "learning_rate": 0.00044436143572621037, + "loss": 1.7063, + "loss_base2": 2.4617, + "loss_pixel": 0.2678, + "loss_text": 1.4384, + "ppl": 5.5085, + "step": 13531 + }, + { + "epoch": 0.07, + "global_step": 13532, + "learning_rate": 0.0004443572621035059, + "loss": 1.7214, + "loss_base2": 2.4835, + "loss_pixel": 0.2637, + "loss_text": 1.4578, + "ppl": 5.5924, + "step": 13532 + }, + { + "epoch": 0.07, + "global_step": 13533, + "learning_rate": 0.0004443530884808014, + "loss": 1.7119, + "loss_base2": 2.4697, + "loss_pixel": 0.2586, + "loss_text": 1.4533, + "ppl": 5.5395, + "step": 13533 + }, + { + "epoch": 0.07, + "global_step": 13534, + "learning_rate": 0.00044434891485809684, + "loss": 1.6928, + "loss_base2": 2.4422, + "loss_pixel": 0.2537, + "loss_text": 1.4391, + "ppl": 5.4347, + "step": 13534 + }, + { + "epoch": 0.07, + "global_step": 13535, + "learning_rate": 0.0004443447412353923, + "loss": 1.6797, + "loss_base2": 2.4233, + "loss_pixel": 0.2525, + "loss_text": 1.4273, + "ppl": 5.3639, + "step": 13535 + }, + { + "epoch": 0.07, + "global_step": 13536, + "learning_rate": 0.0004443405676126878, + "loss": 1.7043, + "loss_base2": 2.4588, + "loss_pixel": 0.2498, + "loss_text": 1.4546, + "ppl": 5.4975, + "step": 13536 + }, + { + "epoch": 0.07, + "global_step": 13537, + "learning_rate": 0.0004443363939899833, + "loss": 1.6928, + "loss_base2": 2.4422, + "loss_pixel": 0.2471, + "loss_text": 1.4457, + "ppl": 5.4347, + "step": 13537 + }, + { + "epoch": 0.07, + "global_step": 13538, + "learning_rate": 0.0004443322203672788, + "loss": 1.6869, + "loss_base2": 2.4337, + "loss_pixel": 0.2449, + "loss_text": 1.4419, + "ppl": 5.4027, + "step": 13538 + }, + { + "epoch": 0.07, + "global_step": 13539, + "learning_rate": 0.00044432804674457427, + "loss": 1.6947, + "loss_base2": 2.4449, + "loss_pixel": 0.2417, + "loss_text": 1.453, + "ppl": 5.445, + "step": 13539 + }, + { + "epoch": 0.07, + "global_step": 13540, + "learning_rate": 0.0004443238731218698, + "loss": 1.6989, + "loss_base2": 2.451, + "loss_pixel": 0.2399, + "loss_text": 1.459, + "ppl": 5.4679, + "step": 13540 + }, + { + "epoch": 0.07, + "global_step": 13541, + "learning_rate": 0.0004443196994991653, + "loss": 1.666, + "loss_base2": 2.4035, + "loss_pixel": 0.2364, + "loss_text": 1.4297, + "ppl": 5.291, + "step": 13541 + }, + { + "epoch": 0.07, + "global_step": 13542, + "learning_rate": 0.0004443155258764608, + "loss": 1.6681, + "loss_base2": 2.4066, + "loss_pixel": 0.235, + "loss_text": 1.4331, + "ppl": 5.3021, + "step": 13542 + }, + { + "epoch": 0.07, + "global_step": 13543, + "learning_rate": 0.0004443113522537563, + "loss": 1.6399, + "loss_base2": 2.3659, + "loss_pixel": 0.2312, + "loss_text": 1.4087, + "ppl": 5.1547, + "step": 13543 + }, + { + "epoch": 0.07, + "global_step": 13544, + "learning_rate": 0.00044430717863105175, + "loss": 1.6739, + "loss_base2": 2.4149, + "loss_pixel": 0.2293, + "loss_text": 1.4446, + "ppl": 5.3329, + "step": 13544 + }, + { + "epoch": 0.07, + "global_step": 13545, + "learning_rate": 0.00044430300500834726, + "loss": 1.6488, + "loss_base2": 2.3787, + "loss_pixel": 0.225, + "loss_text": 1.4238, + "ppl": 5.2007, + "step": 13545 + }, + { + "epoch": 0.07, + "global_step": 13546, + "learning_rate": 0.00044429883138564276, + "loss": 1.6661, + "loss_base2": 2.4037, + "loss_pixel": 0.2223, + "loss_text": 1.4438, + "ppl": 5.2915, + "step": 13546 + }, + { + "epoch": 0.07, + "global_step": 13547, + "learning_rate": 0.00044429465776293827, + "loss": 1.6472, + "loss_base2": 2.3764, + "loss_pixel": 0.2202, + "loss_text": 1.427, + "ppl": 5.1924, + "step": 13547 + }, + { + "epoch": 0.07, + "global_step": 13548, + "learning_rate": 0.0004442904841402337, + "loss": 1.6502, + "loss_base2": 2.3807, + "loss_pixel": 0.2175, + "loss_text": 1.4326, + "ppl": 5.208, + "step": 13548 + }, + { + "epoch": 0.07, + "global_step": 13549, + "learning_rate": 0.00044428631051752923, + "loss": 1.6381, + "loss_base2": 2.3633, + "loss_pixel": 0.2146, + "loss_text": 1.4235, + "ppl": 5.1454, + "step": 13549 + }, + { + "epoch": 0.07, + "global_step": 13550, + "learning_rate": 0.00044428213689482474, + "loss": 1.6525, + "loss_base2": 2.3841, + "loss_pixel": 0.2221, + "loss_text": 1.4304, + "ppl": 5.22, + "step": 13550 + }, + { + "epoch": 0.07, + "global_step": 13551, + "learning_rate": 0.00044427796327212025, + "loss": 1.676, + "loss_base2": 2.418, + "loss_pixel": 0.2309, + "loss_text": 1.4452, + "ppl": 5.3441, + "step": 13551 + }, + { + "epoch": 0.07, + "global_step": 13552, + "learning_rate": 0.0004442737896494157, + "loss": 1.6893, + "loss_base2": 2.4371, + "loss_pixel": 0.2337, + "loss_text": 1.4556, + "ppl": 5.4157, + "step": 13552 + }, + { + "epoch": 0.07, + "global_step": 13553, + "learning_rate": 0.00044426961602671115, + "loss": 1.6858, + "loss_base2": 2.4321, + "loss_pixel": 0.2329, + "loss_text": 1.4529, + "ppl": 5.3968, + "step": 13553 + }, + { + "epoch": 0.07, + "global_step": 13554, + "learning_rate": 0.00044426544240400666, + "loss": 1.6627, + "loss_base2": 2.3988, + "loss_pixel": 0.2239, + "loss_text": 1.4388, + "ppl": 5.2735, + "step": 13554 + }, + { + "epoch": 0.07, + "global_step": 13555, + "learning_rate": 0.00044426126878130217, + "loss": 1.6692, + "loss_base2": 2.4081, + "loss_pixel": 0.2199, + "loss_text": 1.4493, + "ppl": 5.3079, + "step": 13555 + }, + { + "epoch": 0.07, + "global_step": 13556, + "learning_rate": 0.0004442570951585977, + "loss": 1.6721, + "loss_base2": 2.4123, + "loss_pixel": 0.215, + "loss_text": 1.4572, + "ppl": 5.3233, + "step": 13556 + }, + { + "epoch": 0.07, + "global_step": 13557, + "learning_rate": 0.00044425292153589313, + "loss": 1.6512, + "loss_base2": 2.3822, + "loss_pixel": 0.211, + "loss_text": 1.4402, + "ppl": 5.2132, + "step": 13557 + }, + { + "epoch": 0.07, + "global_step": 13558, + "learning_rate": 0.00044424874791318864, + "loss": 1.6541, + "loss_base2": 2.3864, + "loss_pixel": 0.2088, + "loss_text": 1.4453, + "ppl": 5.2284, + "step": 13558 + }, + { + "epoch": 0.07, + "global_step": 13559, + "learning_rate": 0.00044424457429048414, + "loss": 1.6116, + "loss_base2": 2.325, + "loss_pixel": 0.2039, + "loss_text": 1.4077, + "ppl": 5.0108, + "step": 13559 + }, + { + "epoch": 0.07, + "global_step": 13560, + "learning_rate": 0.00044424040066777965, + "loss": 1.639, + "loss_base2": 2.3646, + "loss_pixel": 0.2033, + "loss_text": 1.4356, + "ppl": 5.15, + "step": 13560 + }, + { + "epoch": 0.07, + "global_step": 13561, + "learning_rate": 0.00044423622704507516, + "loss": 1.651, + "loss_base2": 2.3819, + "loss_pixel": 0.2005, + "loss_text": 1.4504, + "ppl": 5.2122, + "step": 13561 + }, + { + "epoch": 0.07, + "global_step": 13562, + "learning_rate": 0.0004442320534223706, + "loss": 1.6285, + "loss_base2": 2.3494, + "loss_pixel": 0.1973, + "loss_text": 1.4312, + "ppl": 5.0962, + "step": 13562 + }, + { + "epoch": 0.07, + "global_step": 13563, + "learning_rate": 0.0004442278797996661, + "loss": 1.6003, + "loss_base2": 2.3087, + "loss_pixel": 0.1973, + "loss_text": 1.403, + "ppl": 4.9545, + "step": 13563 + }, + { + "epoch": 0.07, + "global_step": 13564, + "learning_rate": 0.0004442237061769616, + "loss": 1.6363, + "loss_base2": 2.3607, + "loss_pixel": 0.1928, + "loss_text": 1.4434, + "ppl": 5.1361, + "step": 13564 + }, + { + "epoch": 0.07, + "global_step": 13565, + "learning_rate": 0.00044421953255425713, + "loss": 1.612, + "loss_base2": 2.3256, + "loss_pixel": 0.1931, + "loss_text": 1.4189, + "ppl": 5.0128, + "step": 13565 + }, + { + "epoch": 0.07, + "global_step": 13566, + "learning_rate": 0.0004442153589315526, + "loss": 1.6532, + "loss_base2": 2.3851, + "loss_pixel": 0.1905, + "loss_text": 1.4627, + "ppl": 5.2237, + "step": 13566 + }, + { + "epoch": 0.07, + "global_step": 13567, + "learning_rate": 0.0004442111853088481, + "loss": 1.6356, + "loss_base2": 2.3597, + "loss_pixel": 0.1875, + "loss_text": 1.4482, + "ppl": 5.1325, + "step": 13567 + }, + { + "epoch": 0.07, + "global_step": 13568, + "learning_rate": 0.0004442070116861436, + "loss": 1.6261, + "loss_base2": 2.346, + "loss_pixel": 0.188, + "loss_text": 1.4381, + "ppl": 5.084, + "step": 13568 + }, + { + "epoch": 0.07, + "global_step": 13569, + "learning_rate": 0.0004442028380634391, + "loss": 1.619, + "loss_base2": 2.3357, + "loss_pixel": 0.1855, + "loss_text": 1.4335, + "ppl": 5.048, + "step": 13569 + }, + { + "epoch": 0.07, + "global_step": 13570, + "learning_rate": 0.0004441986644407346, + "loss": 1.6253, + "loss_base2": 2.3448, + "loss_pixel": 0.1848, + "loss_text": 1.4405, + "ppl": 5.0799, + "step": 13570 + }, + { + "epoch": 0.07, + "global_step": 13571, + "learning_rate": 0.00044419449081803, + "loss": 1.6387, + "loss_base2": 2.3641, + "loss_pixel": 0.1829, + "loss_text": 1.4557, + "ppl": 5.1485, + "step": 13571 + }, + { + "epoch": 0.07, + "global_step": 13572, + "learning_rate": 0.0004441903171953255, + "loss": 1.6279, + "loss_base2": 2.3486, + "loss_pixel": 0.1818, + "loss_text": 1.4461, + "ppl": 5.0932, + "step": 13572 + }, + { + "epoch": 0.07, + "global_step": 13573, + "learning_rate": 0.00044418614357262103, + "loss": 1.6223, + "loss_base2": 2.3405, + "loss_pixel": 0.1789, + "loss_text": 1.4433, + "ppl": 5.0647, + "step": 13573 + }, + { + "epoch": 0.07, + "global_step": 13574, + "learning_rate": 0.00044418196994991654, + "loss": 1.6217, + "loss_base2": 2.3396, + "loss_pixel": 0.1791, + "loss_text": 1.4427, + "ppl": 5.0617, + "step": 13574 + }, + { + "epoch": 0.07, + "global_step": 13575, + "learning_rate": 0.000444177796327212, + "loss": 1.6253, + "loss_base2": 2.3448, + "loss_pixel": 0.1775, + "loss_text": 1.4479, + "ppl": 5.0799, + "step": 13575 + }, + { + "epoch": 0.07, + "global_step": 13576, + "learning_rate": 0.0004441736227045075, + "loss": 1.6086, + "loss_base2": 2.3207, + "loss_pixel": 0.1783, + "loss_text": 1.4303, + "ppl": 4.9958, + "step": 13576 + }, + { + "epoch": 0.07, + "global_step": 13577, + "learning_rate": 0.000444169449081803, + "loss": 1.5922, + "loss_base2": 2.2971, + "loss_pixel": 0.1779, + "loss_text": 1.4143, + "ppl": 4.9145, + "step": 13577 + }, + { + "epoch": 0.07, + "global_step": 13578, + "learning_rate": 0.0004441652754590985, + "loss": 1.627, + "loss_base2": 2.3473, + "loss_pixel": 0.1769, + "loss_text": 1.4501, + "ppl": 5.0886, + "step": 13578 + }, + { + "epoch": 0.07, + "global_step": 13579, + "learning_rate": 0.000444161101836394, + "loss": 1.6322, + "loss_base2": 2.3548, + "loss_pixel": 0.1795, + "loss_text": 1.4526, + "ppl": 5.1151, + "step": 13579 + }, + { + "epoch": 0.07, + "global_step": 13580, + "learning_rate": 0.00044415692821368947, + "loss": 1.6034, + "loss_base2": 2.3132, + "loss_pixel": 0.1773, + "loss_text": 1.4261, + "ppl": 4.9699, + "step": 13580 + }, + { + "epoch": 0.07, + "global_step": 13581, + "learning_rate": 0.000444152754590985, + "loss": 1.6047, + "loss_base2": 2.3151, + "loss_pixel": 0.1758, + "loss_text": 1.4289, + "ppl": 4.9764, + "step": 13581 + }, + { + "epoch": 0.07, + "global_step": 13582, + "learning_rate": 0.0004441485809682805, + "loss": 1.6278, + "loss_base2": 2.3484, + "loss_pixel": 0.1756, + "loss_text": 1.4522, + "ppl": 5.0927, + "step": 13582 + }, + { + "epoch": 0.07, + "global_step": 13583, + "learning_rate": 0.000444144407345576, + "loss": 1.6202, + "loss_base2": 2.3375, + "loss_pixel": 0.1747, + "loss_text": 1.4455, + "ppl": 5.0541, + "step": 13583 + }, + { + "epoch": 0.07, + "global_step": 13584, + "learning_rate": 0.00044414023372287145, + "loss": 1.6037, + "loss_base2": 2.3137, + "loss_pixel": 0.1748, + "loss_text": 1.4289, + "ppl": 4.9714, + "step": 13584 + }, + { + "epoch": 0.07, + "global_step": 13585, + "learning_rate": 0.00044413606010016695, + "loss": 1.5999, + "loss_base2": 2.3082, + "loss_pixel": 0.1734, + "loss_text": 1.4265, + "ppl": 4.9525, + "step": 13585 + }, + { + "epoch": 0.07, + "global_step": 13586, + "learning_rate": 0.00044413188647746246, + "loss": 1.6214, + "loss_base2": 2.3392, + "loss_pixel": 0.1727, + "loss_text": 1.4487, + "ppl": 5.0602, + "step": 13586 + }, + { + "epoch": 0.07, + "global_step": 13587, + "learning_rate": 0.00044412771285475797, + "loss": 1.6006, + "loss_base2": 2.3092, + "loss_pixel": 0.1715, + "loss_text": 1.4291, + "ppl": 4.956, + "step": 13587 + }, + { + "epoch": 0.07, + "global_step": 13588, + "learning_rate": 0.0004441235392320535, + "loss": 1.6159, + "loss_base2": 2.3313, + "loss_pixel": 0.1716, + "loss_text": 1.4443, + "ppl": 5.0324, + "step": 13588 + }, + { + "epoch": 0.07, + "global_step": 13589, + "learning_rate": 0.00044411936560934893, + "loss": 1.6068, + "loss_base2": 2.3181, + "loss_pixel": 0.1713, + "loss_text": 1.4355, + "ppl": 4.9868, + "step": 13589 + }, + { + "epoch": 0.07, + "global_step": 13590, + "learning_rate": 0.0004441151919866444, + "loss": 1.5962, + "loss_base2": 2.3028, + "loss_pixel": 0.1684, + "loss_text": 1.4278, + "ppl": 4.9342, + "step": 13590 + }, + { + "epoch": 0.07, + "global_step": 13591, + "learning_rate": 0.0004441110183639399, + "loss": 1.6043, + "loss_base2": 2.3145, + "loss_pixel": 0.1692, + "loss_text": 1.4351, + "ppl": 4.9744, + "step": 13591 + }, + { + "epoch": 0.07, + "global_step": 13592, + "learning_rate": 0.0004441068447412354, + "loss": 1.6176, + "loss_base2": 2.3337, + "loss_pixel": 0.1696, + "loss_text": 1.448, + "ppl": 5.041, + "step": 13592 + }, + { + "epoch": 0.07, + "global_step": 13593, + "learning_rate": 0.0004441026711185309, + "loss": 1.6092, + "loss_base2": 2.3216, + "loss_pixel": 0.1695, + "loss_text": 1.4398, + "ppl": 4.9988, + "step": 13593 + }, + { + "epoch": 0.07, + "global_step": 13594, + "learning_rate": 0.00044409849749582636, + "loss": 1.6021, + "loss_base2": 2.3113, + "loss_pixel": 0.1685, + "loss_text": 1.4336, + "ppl": 4.9634, + "step": 13594 + }, + { + "epoch": 0.07, + "global_step": 13595, + "learning_rate": 0.00044409432387312186, + "loss": 1.6034, + "loss_base2": 2.3132, + "loss_pixel": 0.1673, + "loss_text": 1.4361, + "ppl": 4.9699, + "step": 13595 + }, + { + "epoch": 0.07, + "global_step": 13596, + "learning_rate": 0.00044409015025041737, + "loss": 1.5955, + "loss_base2": 2.3018, + "loss_pixel": 0.1675, + "loss_text": 1.4279, + "ppl": 4.9308, + "step": 13596 + }, + { + "epoch": 0.07, + "global_step": 13597, + "learning_rate": 0.0004440859766277129, + "loss": 1.612, + "loss_base2": 2.3256, + "loss_pixel": 0.1685, + "loss_text": 1.4435, + "ppl": 5.0128, + "step": 13597 + }, + { + "epoch": 0.07, + "global_step": 13598, + "learning_rate": 0.00044408180300500833, + "loss": 1.6196, + "loss_base2": 2.3366, + "loss_pixel": 0.1661, + "loss_text": 1.4535, + "ppl": 5.0511, + "step": 13598 + }, + { + "epoch": 0.07, + "global_step": 13599, + "learning_rate": 0.00044407762938230384, + "loss": 1.5988, + "loss_base2": 2.3066, + "loss_pixel": 0.167, + "loss_text": 1.4318, + "ppl": 4.9471, + "step": 13599 + }, + { + "epoch": 0.07, + "global_step": 13600, + "learning_rate": 0.00044407345575959935, + "loss": 1.5998, + "loss_base2": 2.308, + "loss_pixel": 0.1648, + "loss_text": 1.435, + "ppl": 4.952, + "step": 13600 + }, + { + "epoch": 0.07, + "global_step": 13601, + "learning_rate": 0.00044406928213689485, + "loss": 1.6185, + "loss_base2": 2.335, + "loss_pixel": 0.1672, + "loss_text": 1.4513, + "ppl": 5.0455, + "step": 13601 + }, + { + "epoch": 0.07, + "global_step": 13602, + "learning_rate": 0.00044406510851419036, + "loss": 1.5972, + "loss_base2": 2.3043, + "loss_pixel": 0.165, + "loss_text": 1.4322, + "ppl": 4.9392, + "step": 13602 + }, + { + "epoch": 0.07, + "global_step": 13603, + "learning_rate": 0.0004440609348914858, + "loss": 1.6111, + "loss_base2": 2.3243, + "loss_pixel": 0.1649, + "loss_text": 1.4463, + "ppl": 5.0083, + "step": 13603 + }, + { + "epoch": 0.07, + "global_step": 13604, + "learning_rate": 0.0004440567612687813, + "loss": 1.6206, + "loss_base2": 2.338, + "loss_pixel": 0.1643, + "loss_text": 1.4563, + "ppl": 5.0561, + "step": 13604 + }, + { + "epoch": 0.07, + "global_step": 13605, + "learning_rate": 0.00044405258764607683, + "loss": 1.5278, + "loss_base2": 2.2041, + "loss_pixel": 0.1649, + "loss_text": 1.3628, + "ppl": 4.608, + "step": 13605 + }, + { + "epoch": 0.07, + "global_step": 13606, + "learning_rate": 0.00044404841402337234, + "loss": 1.3894, + "loss_base2": 2.0045, + "loss_pixel": 0.1648, + "loss_text": 1.2246, + "ppl": 4.0124, + "step": 13606 + }, + { + "epoch": 0.07, + "global_step": 13607, + "learning_rate": 0.0004440442404006678, + "loss": 1.3644, + "loss_base2": 1.9684, + "loss_pixel": 0.1648, + "loss_text": 1.1996, + "ppl": 3.9134, + "step": 13607 + }, + { + "epoch": 0.07, + "global_step": 13608, + "learning_rate": 0.00044404006677796324, + "loss": 1.3954, + "loss_base2": 2.0131, + "loss_pixel": 0.1636, + "loss_text": 1.2318, + "ppl": 4.0366, + "step": 13608 + }, + { + "epoch": 0.07, + "global_step": 13609, + "learning_rate": 0.00044403589315525875, + "loss": 1.3712, + "loss_base2": 1.9782, + "loss_pixel": 0.1642, + "loss_text": 1.207, + "ppl": 3.9401, + "step": 13609 + }, + { + "epoch": 0.07, + "global_step": 13610, + "learning_rate": 0.00044403171953255426, + "loss": 1.3705, + "loss_base2": 1.9772, + "loss_pixel": 0.1648, + "loss_text": 1.2057, + "ppl": 3.9373, + "step": 13610 + }, + { + "epoch": 0.07, + "global_step": 13611, + "learning_rate": 0.00044402754590984976, + "loss": 1.3642, + "loss_base2": 1.9681, + "loss_pixel": 0.1639, + "loss_text": 1.2003, + "ppl": 3.9126, + "step": 13611 + }, + { + "epoch": 0.07, + "global_step": 13612, + "learning_rate": 0.0004440233722871452, + "loss": 1.3737, + "loss_base2": 1.9818, + "loss_pixel": 0.1646, + "loss_text": 1.2092, + "ppl": 3.9499, + "step": 13612 + }, + { + "epoch": 0.07, + "global_step": 13613, + "learning_rate": 0.0004440191986644407, + "loss": 1.3761, + "loss_base2": 1.9853, + "loss_pixel": 0.1634, + "loss_text": 1.2127, + "ppl": 3.9594, + "step": 13613 + }, + { + "epoch": 0.07, + "global_step": 13614, + "learning_rate": 0.00044401502504173623, + "loss": 1.3859, + "loss_base2": 1.9994, + "loss_pixel": 0.1657, + "loss_text": 1.2201, + "ppl": 3.9984, + "step": 13614 + }, + { + "epoch": 0.07, + "global_step": 13615, + "learning_rate": 0.00044401085141903174, + "loss": 1.391, + "loss_base2": 2.0068, + "loss_pixel": 0.163, + "loss_text": 1.2279, + "ppl": 4.0189, + "step": 13615 + }, + { + "epoch": 0.07, + "global_step": 13616, + "learning_rate": 0.0004440066777963272, + "loss": 1.3774, + "loss_base2": 1.9872, + "loss_pixel": 0.162, + "loss_text": 1.2154, + "ppl": 3.9646, + "step": 13616 + }, + { + "epoch": 0.07, + "global_step": 13617, + "learning_rate": 0.0004440025041736227, + "loss": 1.3671, + "loss_base2": 1.9723, + "loss_pixel": 0.1645, + "loss_text": 1.2027, + "ppl": 3.924, + "step": 13617 + }, + { + "epoch": 0.07, + "global_step": 13618, + "learning_rate": 0.0004439983305509182, + "loss": 1.3672, + "loss_base2": 1.9725, + "loss_pixel": 0.1623, + "loss_text": 1.205, + "ppl": 3.9243, + "step": 13618 + }, + { + "epoch": 0.07, + "global_step": 13619, + "learning_rate": 0.0004439941569282137, + "loss": 1.378, + "loss_base2": 1.988, + "loss_pixel": 0.1626, + "loss_text": 1.2154, + "ppl": 3.967, + "step": 13619 + }, + { + "epoch": 0.07, + "global_step": 13620, + "learning_rate": 0.0004439899833055092, + "loss": 1.3866, + "loss_base2": 2.0004, + "loss_pixel": 0.1622, + "loss_text": 1.2244, + "ppl": 4.0012, + "step": 13620 + }, + { + "epoch": 0.07, + "global_step": 13621, + "learning_rate": 0.0004439858096828047, + "loss": 1.3778, + "loss_base2": 1.9877, + "loss_pixel": 0.1636, + "loss_text": 1.2141, + "ppl": 3.9662, + "step": 13621 + }, + { + "epoch": 0.07, + "global_step": 13622, + "learning_rate": 0.0004439816360601002, + "loss": 1.5413, + "loss_base2": 2.2236, + "loss_pixel": 0.1627, + "loss_text": 1.3786, + "ppl": 4.6707, + "step": 13622 + }, + { + "epoch": 0.07, + "global_step": 13623, + "learning_rate": 0.0004439774624373957, + "loss": 1.5548, + "loss_base2": 2.2431, + "loss_pixel": 0.1619, + "loss_text": 1.3929, + "ppl": 4.7341, + "step": 13623 + }, + { + "epoch": 0.07, + "global_step": 13624, + "learning_rate": 0.0004439732888146912, + "loss": 1.4127, + "loss_base2": 2.0381, + "loss_pixel": 0.1609, + "loss_text": 1.2518, + "ppl": 4.107, + "step": 13624 + }, + { + "epoch": 0.07, + "global_step": 13625, + "learning_rate": 0.00044396911519198665, + "loss": 1.3784, + "loss_base2": 1.9886, + "loss_pixel": 0.1619, + "loss_text": 1.2165, + "ppl": 3.9685, + "step": 13625 + }, + { + "epoch": 0.07, + "global_step": 13626, + "learning_rate": 0.00044396494156928216, + "loss": 1.3726, + "loss_base2": 1.9802, + "loss_pixel": 0.1621, + "loss_text": 1.2105, + "ppl": 3.9456, + "step": 13626 + }, + { + "epoch": 0.07, + "global_step": 13627, + "learning_rate": 0.0004439607679465776, + "loss": 1.3674, + "loss_base2": 1.9727, + "loss_pixel": 0.1613, + "loss_text": 1.2061, + "ppl": 3.9251, + "step": 13627 + }, + { + "epoch": 0.07, + "global_step": 13628, + "learning_rate": 0.0004439565943238731, + "loss": 1.3698, + "loss_base2": 1.9762, + "loss_pixel": 0.1628, + "loss_text": 1.207, + "ppl": 3.9346, + "step": 13628 + }, + { + "epoch": 0.07, + "global_step": 13629, + "learning_rate": 0.0004439524207011686, + "loss": 1.382, + "loss_base2": 1.9938, + "loss_pixel": 0.1617, + "loss_text": 1.2203, + "ppl": 3.9829, + "step": 13629 + }, + { + "epoch": 0.07, + "global_step": 13630, + "learning_rate": 0.0004439482470784641, + "loss": 1.3955, + "loss_base2": 2.0133, + "loss_pixel": 0.1626, + "loss_text": 1.2328, + "ppl": 4.037, + "step": 13630 + }, + { + "epoch": 0.07, + "global_step": 13631, + "learning_rate": 0.0004439440734557596, + "loss": 1.3599, + "loss_base2": 1.9619, + "loss_pixel": 0.1625, + "loss_text": 1.1974, + "ppl": 3.8958, + "step": 13631 + }, + { + "epoch": 0.07, + "global_step": 13632, + "learning_rate": 0.0004439398998330551, + "loss": 1.3689, + "loss_base2": 1.9749, + "loss_pixel": 0.16, + "loss_text": 1.2089, + "ppl": 3.931, + "step": 13632 + }, + { + "epoch": 0.07, + "global_step": 13633, + "learning_rate": 0.0004439357262103506, + "loss": 1.3814, + "loss_base2": 1.9929, + "loss_pixel": 0.1611, + "loss_text": 1.2203, + "ppl": 3.9805, + "step": 13633 + }, + { + "epoch": 0.07, + "global_step": 13634, + "learning_rate": 0.00044393155258764605, + "loss": 1.4022, + "loss_base2": 2.0229, + "loss_pixel": 0.1618, + "loss_text": 1.2405, + "ppl": 4.0641, + "step": 13634 + }, + { + "epoch": 0.07, + "global_step": 13635, + "learning_rate": 0.00044392737896494156, + "loss": 1.3896, + "loss_base2": 2.0048, + "loss_pixel": 0.1632, + "loss_text": 1.2264, + "ppl": 4.0132, + "step": 13635 + }, + { + "epoch": 0.07, + "global_step": 13636, + "learning_rate": 0.00044392320534223707, + "loss": 1.3684, + "loss_base2": 1.9742, + "loss_pixel": 0.1605, + "loss_text": 1.2079, + "ppl": 3.9291, + "step": 13636 + }, + { + "epoch": 0.07, + "global_step": 13637, + "learning_rate": 0.0004439190317195326, + "loss": 1.3813, + "loss_base2": 1.9928, + "loss_pixel": 0.162, + "loss_text": 1.2193, + "ppl": 3.9801, + "step": 13637 + }, + { + "epoch": 0.07, + "global_step": 13638, + "learning_rate": 0.0004439148580968281, + "loss": 1.3561, + "loss_base2": 1.9564, + "loss_pixel": 0.1617, + "loss_text": 1.1944, + "ppl": 3.881, + "step": 13638 + }, + { + "epoch": 0.07, + "global_step": 13639, + "learning_rate": 0.00044391068447412354, + "loss": 1.5423, + "loss_base2": 2.2251, + "loss_pixel": 0.1612, + "loss_text": 1.3811, + "ppl": 4.6753, + "step": 13639 + }, + { + "epoch": 0.07, + "global_step": 13640, + "learning_rate": 0.00044390651085141904, + "loss": 1.4208, + "loss_base2": 2.0498, + "loss_pixel": 0.1622, + "loss_text": 1.2586, + "ppl": 4.1404, + "step": 13640 + }, + { + "epoch": 0.07, + "global_step": 13641, + "learning_rate": 0.00044390233722871455, + "loss": 1.3957, + "loss_base2": 2.0136, + "loss_pixel": 0.1603, + "loss_text": 1.2354, + "ppl": 4.0378, + "step": 13641 + }, + { + "epoch": 0.07, + "global_step": 13642, + "learning_rate": 0.00044389816360601006, + "loss": 1.3802, + "loss_base2": 1.9912, + "loss_pixel": 0.1605, + "loss_text": 1.2197, + "ppl": 3.9757, + "step": 13642 + }, + { + "epoch": 0.07, + "global_step": 13643, + "learning_rate": 0.00044389398998330557, + "loss": 1.341, + "loss_base2": 1.9347, + "loss_pixel": 0.1614, + "loss_text": 1.1796, + "ppl": 3.8229, + "step": 13643 + }, + { + "epoch": 0.07, + "global_step": 13644, + "learning_rate": 0.000443889816360601, + "loss": 1.3876, + "loss_base2": 2.0019, + "loss_pixel": 0.1613, + "loss_text": 1.2263, + "ppl": 4.0052, + "step": 13644 + }, + { + "epoch": 0.07, + "global_step": 13645, + "learning_rate": 0.0004438856427378965, + "loss": 1.3401, + "loss_base2": 1.9334, + "loss_pixel": 0.1611, + "loss_text": 1.1791, + "ppl": 3.8194, + "step": 13645 + }, + { + "epoch": 0.07, + "global_step": 13646, + "learning_rate": 0.000443881469115192, + "loss": 1.3761, + "loss_base2": 1.9853, + "loss_pixel": 0.1647, + "loss_text": 1.2114, + "ppl": 3.9594, + "step": 13646 + }, + { + "epoch": 0.07, + "global_step": 13647, + "learning_rate": 0.0004438772954924875, + "loss": 1.3578, + "loss_base2": 1.9589, + "loss_pixel": 0.1619, + "loss_text": 1.1959, + "ppl": 3.8876, + "step": 13647 + }, + { + "epoch": 0.07, + "global_step": 13648, + "learning_rate": 0.00044387312186978294, + "loss": 1.4735, + "loss_base2": 2.1258, + "loss_pixel": 0.1661, + "loss_text": 1.3074, + "ppl": 4.3645, + "step": 13648 + }, + { + "epoch": 0.07, + "global_step": 13649, + "learning_rate": 0.00044386894824707845, + "loss": 1.6627, + "loss_base2": 2.3988, + "loss_pixel": 0.1601, + "loss_text": 1.5026, + "ppl": 5.2735, + "step": 13649 + }, + { + "epoch": 0.07, + "global_step": 13650, + "learning_rate": 0.00044386477462437395, + "loss": 1.6455, + "loss_base2": 2.374, + "loss_pixel": 0.1607, + "loss_text": 1.4849, + "ppl": 5.1836, + "step": 13650 + }, + { + "epoch": 0.07, + "global_step": 13651, + "learning_rate": 0.00044386060100166946, + "loss": 1.6364, + "loss_base2": 2.3608, + "loss_pixel": 0.1607, + "loss_text": 1.4757, + "ppl": 5.1366, + "step": 13651 + }, + { + "epoch": 0.07, + "global_step": 13652, + "learning_rate": 0.00044385642737896497, + "loss": 1.6336, + "loss_base2": 2.3568, + "loss_pixel": 0.1602, + "loss_text": 1.4734, + "ppl": 5.1223, + "step": 13652 + }, + { + "epoch": 0.07, + "global_step": 13653, + "learning_rate": 0.0004438522537562604, + "loss": 1.6217, + "loss_base2": 2.3396, + "loss_pixel": 0.1586, + "loss_text": 1.4631, + "ppl": 5.0617, + "step": 13653 + }, + { + "epoch": 0.07, + "global_step": 13654, + "learning_rate": 0.00044384808013355593, + "loss": 1.6186, + "loss_base2": 2.3351, + "loss_pixel": 0.1605, + "loss_text": 1.458, + "ppl": 5.046, + "step": 13654 + }, + { + "epoch": 0.07, + "global_step": 13655, + "learning_rate": 0.00044384390651085144, + "loss": 1.6096, + "loss_base2": 2.3222, + "loss_pixel": 0.152, + "loss_text": 1.4576, + "ppl": 5.0008, + "step": 13655 + }, + { + "epoch": 0.07, + "global_step": 13656, + "learning_rate": 0.00044383973288814694, + "loss": 1.6171, + "loss_base2": 2.333, + "loss_pixel": 0.1568, + "loss_text": 1.4603, + "ppl": 5.0385, + "step": 13656 + }, + { + "epoch": 0.07, + "global_step": 13657, + "learning_rate": 0.0004438355592654424, + "loss": 1.5963, + "loss_base2": 2.303, + "loss_pixel": 0.1536, + "loss_text": 1.4426, + "ppl": 4.9347, + "step": 13657 + }, + { + "epoch": 0.07, + "global_step": 13658, + "learning_rate": 0.0004438313856427379, + "loss": 1.5861, + "loss_base2": 2.2883, + "loss_pixel": 0.1512, + "loss_text": 1.4349, + "ppl": 4.8847, + "step": 13658 + }, + { + "epoch": 0.07, + "global_step": 13659, + "learning_rate": 0.0004438272120200334, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1532, + "loss_text": 1.4493, + "ppl": 4.9649, + "step": 13659 + }, + { + "epoch": 0.07, + "global_step": 13660, + "learning_rate": 0.0004438230383973289, + "loss": 1.613, + "loss_base2": 2.3271, + "loss_pixel": 0.1528, + "loss_text": 1.4602, + "ppl": 5.0178, + "step": 13660 + }, + { + "epoch": 0.07, + "global_step": 13661, + "learning_rate": 0.0004438188647746244, + "loss": 1.6089, + "loss_base2": 2.3212, + "loss_pixel": 0.152, + "loss_text": 1.4569, + "ppl": 4.9973, + "step": 13661 + }, + { + "epoch": 0.07, + "global_step": 13662, + "learning_rate": 0.0004438146911519199, + "loss": 1.6202, + "loss_base2": 2.3375, + "loss_pixel": 0.151, + "loss_text": 1.4692, + "ppl": 5.0541, + "step": 13662 + }, + { + "epoch": 0.07, + "global_step": 13663, + "learning_rate": 0.0004438105175292154, + "loss": 1.6031, + "loss_base2": 2.3128, + "loss_pixel": 0.1514, + "loss_text": 1.4516, + "ppl": 4.9684, + "step": 13663 + }, + { + "epoch": 0.07, + "global_step": 13664, + "learning_rate": 0.0004438063439065109, + "loss": 1.6145, + "loss_base2": 2.3292, + "loss_pixel": 0.1517, + "loss_text": 1.4628, + "ppl": 5.0254, + "step": 13664 + }, + { + "epoch": 0.07, + "global_step": 13665, + "learning_rate": 0.00044380217028380635, + "loss": 1.6032, + "loss_base2": 2.3129, + "loss_pixel": 0.1513, + "loss_text": 1.4519, + "ppl": 4.9689, + "step": 13665 + }, + { + "epoch": 0.07, + "global_step": 13666, + "learning_rate": 0.0004437979966611018, + "loss": 1.6044, + "loss_base2": 2.3147, + "loss_pixel": 0.1513, + "loss_text": 1.4531, + "ppl": 4.9749, + "step": 13666 + }, + { + "epoch": 0.07, + "global_step": 13667, + "learning_rate": 0.0004437938230383973, + "loss": 1.6028, + "loss_base2": 2.3124, + "loss_pixel": 0.1496, + "loss_text": 1.4532, + "ppl": 4.9669, + "step": 13667 + }, + { + "epoch": 0.07, + "global_step": 13668, + "learning_rate": 0.0004437896494156928, + "loss": 1.6024, + "loss_base2": 2.3118, + "loss_pixel": 0.1544, + "loss_text": 1.4479, + "ppl": 4.9649, + "step": 13668 + }, + { + "epoch": 0.07, + "global_step": 13669, + "learning_rate": 0.0004437854757929883, + "loss": 1.6072, + "loss_base2": 2.3187, + "loss_pixel": 0.1641, + "loss_text": 1.443, + "ppl": 4.9888, + "step": 13669 + }, + { + "epoch": 0.07, + "global_step": 13670, + "learning_rate": 0.00044378130217028383, + "loss": 1.608, + "loss_base2": 2.3199, + "loss_pixel": 0.1613, + "loss_text": 1.4467, + "ppl": 4.9928, + "step": 13670 + }, + { + "epoch": 0.07, + "global_step": 13671, + "learning_rate": 0.0004437771285475793, + "loss": 1.6137, + "loss_base2": 2.3281, + "loss_pixel": 0.1624, + "loss_text": 1.4514, + "ppl": 5.0214, + "step": 13671 + }, + { + "epoch": 0.07, + "global_step": 13672, + "learning_rate": 0.0004437729549248748, + "loss": 1.6111, + "loss_base2": 2.3243, + "loss_pixel": 0.1597, + "loss_text": 1.4514, + "ppl": 5.0083, + "step": 13672 + }, + { + "epoch": 0.07, + "global_step": 13673, + "learning_rate": 0.0004437687813021703, + "loss": 1.6021, + "loss_base2": 2.3113, + "loss_pixel": 0.1614, + "loss_text": 1.4407, + "ppl": 4.9634, + "step": 13673 + }, + { + "epoch": 0.07, + "global_step": 13674, + "learning_rate": 0.0004437646076794658, + "loss": 1.5983, + "loss_base2": 2.3059, + "loss_pixel": 0.161, + "loss_text": 1.4373, + "ppl": 4.9446, + "step": 13674 + }, + { + "epoch": 0.07, + "global_step": 13675, + "learning_rate": 0.00044376043405676126, + "loss": 1.5983, + "loss_base2": 2.3059, + "loss_pixel": 0.1599, + "loss_text": 1.4384, + "ppl": 4.9446, + "step": 13675 + }, + { + "epoch": 0.07, + "global_step": 13676, + "learning_rate": 0.00044375626043405676, + "loss": 1.5883, + "loss_base2": 2.2914, + "loss_pixel": 0.1599, + "loss_text": 1.4284, + "ppl": 4.8954, + "step": 13676 + }, + { + "epoch": 0.07, + "global_step": 13677, + "learning_rate": 0.00044375208681135227, + "loss": 1.6034, + "loss_base2": 2.3132, + "loss_pixel": 0.1601, + "loss_text": 1.4433, + "ppl": 4.9699, + "step": 13677 + }, + { + "epoch": 0.07, + "global_step": 13678, + "learning_rate": 0.0004437479131886478, + "loss": 1.574, + "loss_base2": 2.2708, + "loss_pixel": 0.1615, + "loss_text": 1.4125, + "ppl": 4.8259, + "step": 13678 + }, + { + "epoch": 0.07, + "global_step": 13679, + "learning_rate": 0.0004437437395659433, + "loss": 1.5784, + "loss_base2": 2.2771, + "loss_pixel": 0.161, + "loss_text": 1.4174, + "ppl": 4.8472, + "step": 13679 + }, + { + "epoch": 0.07, + "global_step": 13680, + "learning_rate": 0.00044373956594323874, + "loss": 1.5904, + "loss_base2": 2.2945, + "loss_pixel": 0.1611, + "loss_text": 1.4292, + "ppl": 4.9057, + "step": 13680 + }, + { + "epoch": 0.07, + "global_step": 13681, + "learning_rate": 0.00044373539232053425, + "loss": 1.5921, + "loss_base2": 2.2969, + "loss_pixel": 0.1608, + "loss_text": 1.4313, + "ppl": 4.9141, + "step": 13681 + }, + { + "epoch": 0.07, + "global_step": 13682, + "learning_rate": 0.00044373121869782975, + "loss": 1.605, + "loss_base2": 2.3155, + "loss_pixel": 0.1611, + "loss_text": 1.444, + "ppl": 4.9779, + "step": 13682 + }, + { + "epoch": 0.07, + "global_step": 13683, + "learning_rate": 0.00044372704507512526, + "loss": 1.5835, + "loss_base2": 2.2845, + "loss_pixel": 0.1603, + "loss_text": 1.4232, + "ppl": 4.872, + "step": 13683 + }, + { + "epoch": 0.07, + "global_step": 13684, + "learning_rate": 0.00044372287145242066, + "loss": 1.5945, + "loss_base2": 2.3004, + "loss_pixel": 0.1602, + "loss_text": 1.4343, + "ppl": 4.9259, + "step": 13684 + }, + { + "epoch": 0.07, + "global_step": 13685, + "learning_rate": 0.00044371869782971617, + "loss": 1.6151, + "loss_base2": 2.3301, + "loss_pixel": 0.1586, + "loss_text": 1.4565, + "ppl": 5.0284, + "step": 13685 + }, + { + "epoch": 0.07, + "global_step": 13686, + "learning_rate": 0.0004437145242070117, + "loss": 1.5939, + "loss_base2": 2.2995, + "loss_pixel": 0.1606, + "loss_text": 1.4333, + "ppl": 4.9229, + "step": 13686 + }, + { + "epoch": 0.07, + "global_step": 13687, + "learning_rate": 0.0004437103505843072, + "loss": 1.5967, + "loss_base2": 2.3036, + "loss_pixel": 0.1604, + "loss_text": 1.4362, + "ppl": 4.9367, + "step": 13687 + }, + { + "epoch": 0.07, + "global_step": 13688, + "learning_rate": 0.0004437061769616027, + "loss": 1.598, + "loss_base2": 2.3054, + "loss_pixel": 0.1587, + "loss_text": 1.4393, + "ppl": 4.9431, + "step": 13688 + }, + { + "epoch": 0.07, + "global_step": 13689, + "learning_rate": 0.00044370200333889814, + "loss": 1.595, + "loss_base2": 2.3011, + "loss_pixel": 0.1594, + "loss_text": 1.4356, + "ppl": 4.9283, + "step": 13689 + }, + { + "epoch": 0.07, + "global_step": 13690, + "learning_rate": 0.00044369782971619365, + "loss": 1.593, + "loss_base2": 2.2982, + "loss_pixel": 0.1592, + "loss_text": 1.4338, + "ppl": 4.9185, + "step": 13690 + }, + { + "epoch": 0.07, + "global_step": 13691, + "learning_rate": 0.00044369365609348916, + "loss": 1.5962, + "loss_base2": 2.3028, + "loss_pixel": 0.159, + "loss_text": 1.4372, + "ppl": 4.9342, + "step": 13691 + }, + { + "epoch": 0.07, + "global_step": 13692, + "learning_rate": 0.00044368948247078466, + "loss": 1.6226, + "loss_base2": 2.3409, + "loss_pixel": 0.1607, + "loss_text": 1.4619, + "ppl": 5.0662, + "step": 13692 + }, + { + "epoch": 0.07, + "global_step": 13693, + "learning_rate": 0.0004436853088480801, + "loss": 1.5935, + "loss_base2": 2.2989, + "loss_pixel": 0.1606, + "loss_text": 1.4329, + "ppl": 4.9209, + "step": 13693 + }, + { + "epoch": 0.07, + "global_step": 13694, + "learning_rate": 0.0004436811352253756, + "loss": 1.6125, + "loss_base2": 2.3263, + "loss_pixel": 0.1589, + "loss_text": 1.4535, + "ppl": 5.0153, + "step": 13694 + }, + { + "epoch": 0.07, + "global_step": 13695, + "learning_rate": 0.00044367696160267113, + "loss": 1.6167, + "loss_base2": 2.3324, + "loss_pixel": 0.16, + "loss_text": 1.4567, + "ppl": 5.0364, + "step": 13695 + }, + { + "epoch": 0.07, + "global_step": 13696, + "learning_rate": 0.00044367278797996664, + "loss": 1.5873, + "loss_base2": 2.29, + "loss_pixel": 0.1601, + "loss_text": 1.4273, + "ppl": 4.8905, + "step": 13696 + }, + { + "epoch": 0.07, + "global_step": 13697, + "learning_rate": 0.00044366861435726215, + "loss": 1.6106, + "loss_base2": 2.3236, + "loss_pixel": 0.1601, + "loss_text": 1.4505, + "ppl": 5.0058, + "step": 13697 + }, + { + "epoch": 0.07, + "global_step": 13698, + "learning_rate": 0.0004436644407345576, + "loss": 1.5951, + "loss_base2": 2.3012, + "loss_pixel": 0.1603, + "loss_text": 1.4348, + "ppl": 4.9288, + "step": 13698 + }, + { + "epoch": 0.07, + "global_step": 13699, + "learning_rate": 0.0004436602671118531, + "loss": 1.606, + "loss_base2": 2.317, + "loss_pixel": 0.1584, + "loss_text": 1.4477, + "ppl": 4.9828, + "step": 13699 + }, + { + "epoch": 0.07, + "global_step": 13700, + "learning_rate": 0.0004436560934891486, + "loss": 1.5889, + "loss_base2": 2.2923, + "loss_pixel": 0.1594, + "loss_text": 1.4295, + "ppl": 4.8984, + "step": 13700 + }, + { + "epoch": 0.07, + "global_step": 13701, + "learning_rate": 0.0004436519198664441, + "loss": 1.5964, + "loss_base2": 2.3031, + "loss_pixel": 0.1585, + "loss_text": 1.4379, + "ppl": 4.9352, + "step": 13701 + }, + { + "epoch": 0.07, + "global_step": 13702, + "learning_rate": 0.00044364774624373963, + "loss": 1.6112, + "loss_base2": 2.3245, + "loss_pixel": 0.1584, + "loss_text": 1.4529, + "ppl": 5.0088, + "step": 13702 + }, + { + "epoch": 0.07, + "global_step": 13703, + "learning_rate": 0.00044364357262103503, + "loss": 1.6023, + "loss_base2": 2.3116, + "loss_pixel": 0.1586, + "loss_text": 1.4437, + "ppl": 4.9644, + "step": 13703 + }, + { + "epoch": 0.07, + "global_step": 13704, + "learning_rate": 0.00044363939899833054, + "loss": 1.6101, + "loss_base2": 2.3229, + "loss_pixel": 0.1582, + "loss_text": 1.4519, + "ppl": 5.0033, + "step": 13704 + }, + { + "epoch": 0.07, + "global_step": 13705, + "learning_rate": 0.00044363522537562604, + "loss": 1.6002, + "loss_base2": 2.3086, + "loss_pixel": 0.1593, + "loss_text": 1.4408, + "ppl": 4.954, + "step": 13705 + }, + { + "epoch": 0.07, + "global_step": 13706, + "learning_rate": 0.00044363105175292155, + "loss": 1.5936, + "loss_base2": 2.2991, + "loss_pixel": 0.1575, + "loss_text": 1.4361, + "ppl": 4.9214, + "step": 13706 + }, + { + "epoch": 0.07, + "global_step": 13707, + "learning_rate": 0.000443626878130217, + "loss": 1.6048, + "loss_base2": 2.3152, + "loss_pixel": 0.157, + "loss_text": 1.4479, + "ppl": 4.9769, + "step": 13707 + }, + { + "epoch": 0.07, + "global_step": 13708, + "learning_rate": 0.0004436227045075125, + "loss": 1.5862, + "loss_base2": 2.2884, + "loss_pixel": 0.1583, + "loss_text": 1.4279, + "ppl": 4.8852, + "step": 13708 + }, + { + "epoch": 0.07, + "global_step": 13709, + "learning_rate": 0.000443618530884808, + "loss": 1.6069, + "loss_base2": 2.3183, + "loss_pixel": 0.157, + "loss_text": 1.4499, + "ppl": 4.9873, + "step": 13709 + }, + { + "epoch": 0.07, + "global_step": 13710, + "learning_rate": 0.0004436143572621035, + "loss": 1.5939, + "loss_base2": 2.2995, + "loss_pixel": 0.1562, + "loss_text": 1.4377, + "ppl": 4.9229, + "step": 13710 + }, + { + "epoch": 0.07, + "global_step": 13711, + "learning_rate": 0.00044361018363939903, + "loss": 1.5873, + "loss_base2": 2.29, + "loss_pixel": 0.1577, + "loss_text": 1.4296, + "ppl": 4.8905, + "step": 13711 + }, + { + "epoch": 0.07, + "global_step": 13712, + "learning_rate": 0.0004436060100166945, + "loss": 1.5962, + "loss_base2": 2.3028, + "loss_pixel": 0.1587, + "loss_text": 1.4374, + "ppl": 4.9342, + "step": 13712 + }, + { + "epoch": 0.07, + "global_step": 13713, + "learning_rate": 0.00044360183639399, + "loss": 1.5814, + "loss_base2": 2.2815, + "loss_pixel": 0.1586, + "loss_text": 1.4228, + "ppl": 4.8618, + "step": 13713 + }, + { + "epoch": 0.07, + "global_step": 13714, + "learning_rate": 0.0004435976627712855, + "loss": 1.5822, + "loss_base2": 2.2826, + "loss_pixel": 0.1576, + "loss_text": 1.4245, + "ppl": 4.8656, + "step": 13714 + }, + { + "epoch": 0.07, + "global_step": 13715, + "learning_rate": 0.000443593489148581, + "loss": 1.5869, + "loss_base2": 2.2894, + "loss_pixel": 0.1582, + "loss_text": 1.4287, + "ppl": 4.8886, + "step": 13715 + }, + { + "epoch": 0.07, + "global_step": 13716, + "learning_rate": 0.00044358931552587646, + "loss": 1.6147, + "loss_base2": 2.3295, + "loss_pixel": 0.1587, + "loss_text": 1.4561, + "ppl": 5.0264, + "step": 13716 + }, + { + "epoch": 0.07, + "global_step": 13717, + "learning_rate": 0.00044358514190317197, + "loss": 1.5978, + "loss_base2": 2.3051, + "loss_pixel": 0.1591, + "loss_text": 1.4387, + "ppl": 4.9421, + "step": 13717 + }, + { + "epoch": 0.07, + "global_step": 13718, + "learning_rate": 0.0004435809682804675, + "loss": 1.5799, + "loss_base2": 2.2793, + "loss_pixel": 0.1581, + "loss_text": 1.4218, + "ppl": 4.8545, + "step": 13718 + }, + { + "epoch": 0.07, + "global_step": 13719, + "learning_rate": 0.000443576794657763, + "loss": 1.5688, + "loss_base2": 2.2633, + "loss_pixel": 0.1558, + "loss_text": 1.4131, + "ppl": 4.8009, + "step": 13719 + }, + { + "epoch": 0.07, + "global_step": 13720, + "learning_rate": 0.0004435726210350585, + "loss": 1.5817, + "loss_base2": 2.2819, + "loss_pixel": 0.1573, + "loss_text": 1.4244, + "ppl": 4.8632, + "step": 13720 + }, + { + "epoch": 0.07, + "global_step": 13721, + "learning_rate": 0.0004435684474123539, + "loss": 1.5909, + "loss_base2": 2.2952, + "loss_pixel": 0.1585, + "loss_text": 1.4324, + "ppl": 4.9082, + "step": 13721 + }, + { + "epoch": 0.07, + "global_step": 13722, + "learning_rate": 0.0004435642737896494, + "loss": 1.5954, + "loss_base2": 2.3017, + "loss_pixel": 0.1575, + "loss_text": 1.438, + "ppl": 4.9303, + "step": 13722 + }, + { + "epoch": 0.07, + "global_step": 13723, + "learning_rate": 0.0004435601001669449, + "loss": 1.5863, + "loss_base2": 2.2885, + "loss_pixel": 0.1577, + "loss_text": 1.4285, + "ppl": 4.8856, + "step": 13723 + }, + { + "epoch": 0.07, + "global_step": 13724, + "learning_rate": 0.0004435559265442404, + "loss": 1.6044, + "loss_base2": 2.3147, + "loss_pixel": 0.1572, + "loss_text": 1.4472, + "ppl": 4.9749, + "step": 13724 + }, + { + "epoch": 0.07, + "global_step": 13725, + "learning_rate": 0.00044355175292153586, + "loss": 1.6047, + "loss_base2": 2.3151, + "loss_pixel": 0.1592, + "loss_text": 1.4455, + "ppl": 4.9764, + "step": 13725 + }, + { + "epoch": 0.07, + "global_step": 13726, + "learning_rate": 0.00044354757929883137, + "loss": 1.5984, + "loss_base2": 2.306, + "loss_pixel": 0.1562, + "loss_text": 1.4422, + "ppl": 4.9451, + "step": 13726 + }, + { + "epoch": 0.07, + "global_step": 13727, + "learning_rate": 0.0004435434056761269, + "loss": 1.5994, + "loss_base2": 2.3074, + "loss_pixel": 0.1581, + "loss_text": 1.4413, + "ppl": 4.9501, + "step": 13727 + }, + { + "epoch": 0.07, + "global_step": 13728, + "learning_rate": 0.0004435392320534224, + "loss": 1.5909, + "loss_base2": 2.2952, + "loss_pixel": 0.1577, + "loss_text": 1.4332, + "ppl": 4.9082, + "step": 13728 + }, + { + "epoch": 0.07, + "global_step": 13729, + "learning_rate": 0.0004435350584307179, + "loss": 1.5845, + "loss_base2": 2.286, + "loss_pixel": 0.1573, + "loss_text": 1.4272, + "ppl": 4.8769, + "step": 13729 + }, + { + "epoch": 0.07, + "global_step": 13730, + "learning_rate": 0.00044353088480801335, + "loss": 1.5859, + "loss_base2": 2.288, + "loss_pixel": 0.157, + "loss_text": 1.4288, + "ppl": 4.8837, + "step": 13730 + }, + { + "epoch": 0.07, + "global_step": 13731, + "learning_rate": 0.00044352671118530885, + "loss": 1.5865, + "loss_base2": 2.2888, + "loss_pixel": 0.1585, + "loss_text": 1.428, + "ppl": 4.8866, + "step": 13731 + }, + { + "epoch": 0.07, + "global_step": 13732, + "learning_rate": 0.00044352253756260436, + "loss": 1.5926, + "loss_base2": 2.2976, + "loss_pixel": 0.1581, + "loss_text": 1.4345, + "ppl": 4.9165, + "step": 13732 + }, + { + "epoch": 0.07, + "global_step": 13733, + "learning_rate": 0.00044351836393989987, + "loss": 1.5842, + "loss_base2": 2.2855, + "loss_pixel": 0.1579, + "loss_text": 1.4263, + "ppl": 4.8754, + "step": 13733 + }, + { + "epoch": 0.07, + "global_step": 13734, + "learning_rate": 0.0004435141903171953, + "loss": 1.5911, + "loss_base2": 2.2955, + "loss_pixel": 0.1553, + "loss_text": 1.4359, + "ppl": 4.9091, + "step": 13734 + }, + { + "epoch": 0.07, + "global_step": 13735, + "learning_rate": 0.00044351001669449083, + "loss": 1.572, + "loss_base2": 2.2679, + "loss_pixel": 0.1505, + "loss_text": 1.4215, + "ppl": 4.8163, + "step": 13735 + }, + { + "epoch": 0.07, + "global_step": 13736, + "learning_rate": 0.00044350584307178634, + "loss": 1.5857, + "loss_base2": 2.2877, + "loss_pixel": 0.1505, + "loss_text": 1.4352, + "ppl": 4.8827, + "step": 13736 + }, + { + "epoch": 0.07, + "global_step": 13737, + "learning_rate": 0.00044350166944908184, + "loss": 1.5843, + "loss_base2": 2.2857, + "loss_pixel": 0.1495, + "loss_text": 1.4348, + "ppl": 4.8759, + "step": 13737 + }, + { + "epoch": 0.07, + "global_step": 13738, + "learning_rate": 0.00044349749582637735, + "loss": 1.5943, + "loss_base2": 2.3001, + "loss_pixel": 0.1464, + "loss_text": 1.4479, + "ppl": 4.9249, + "step": 13738 + }, + { + "epoch": 0.07, + "global_step": 13739, + "learning_rate": 0.0004434933222036728, + "loss": 1.5912, + "loss_base2": 2.2956, + "loss_pixel": 0.1486, + "loss_text": 1.4426, + "ppl": 4.9096, + "step": 13739 + }, + { + "epoch": 0.07, + "global_step": 13740, + "learning_rate": 0.00044348914858096826, + "loss": 1.5812, + "loss_base2": 2.2812, + "loss_pixel": 0.1495, + "loss_text": 1.4316, + "ppl": 4.8608, + "step": 13740 + }, + { + "epoch": 0.07, + "global_step": 13741, + "learning_rate": 0.00044348497495826376, + "loss": 1.5705, + "loss_base2": 2.2658, + "loss_pixel": 0.1465, + "loss_text": 1.4239, + "ppl": 4.8091, + "step": 13741 + }, + { + "epoch": 0.07, + "global_step": 13742, + "learning_rate": 0.00044348080133555927, + "loss": 1.4996, + "loss_base2": 2.1635, + "loss_pixel": 0.1478, + "loss_text": 1.3519, + "ppl": 4.4799, + "step": 13742 + }, + { + "epoch": 0.07, + "global_step": 13743, + "learning_rate": 0.0004434766277128547, + "loss": 1.5304, + "loss_base2": 2.2079, + "loss_pixel": 0.148, + "loss_text": 1.3824, + "ppl": 4.62, + "step": 13743 + }, + { + "epoch": 0.07, + "global_step": 13744, + "learning_rate": 0.00044347245409015023, + "loss": 1.5821, + "loss_base2": 2.2825, + "loss_pixel": 0.1483, + "loss_text": 1.4338, + "ppl": 4.8652, + "step": 13744 + }, + { + "epoch": 0.07, + "global_step": 13745, + "learning_rate": 0.00044346828046744574, + "loss": 1.5827, + "loss_base2": 2.2834, + "loss_pixel": 0.1475, + "loss_text": 1.4353, + "ppl": 4.8681, + "step": 13745 + }, + { + "epoch": 0.07, + "global_step": 13746, + "learning_rate": 0.00044346410684474125, + "loss": 1.5496, + "loss_base2": 2.2356, + "loss_pixel": 0.1491, + "loss_text": 1.4004, + "ppl": 4.7096, + "step": 13746 + }, + { + "epoch": 0.07, + "global_step": 13747, + "learning_rate": 0.00044345993322203675, + "loss": 1.5797, + "loss_base2": 2.279, + "loss_pixel": 0.1473, + "loss_text": 1.4324, + "ppl": 4.8535, + "step": 13747 + }, + { + "epoch": 0.07, + "global_step": 13748, + "learning_rate": 0.0004434557595993322, + "loss": 1.5901, + "loss_base2": 2.294, + "loss_pixel": 0.1474, + "loss_text": 1.4427, + "ppl": 4.9042, + "step": 13748 + }, + { + "epoch": 0.07, + "global_step": 13749, + "learning_rate": 0.0004434515859766277, + "loss": 1.5795, + "loss_base2": 2.2787, + "loss_pixel": 0.1468, + "loss_text": 1.4327, + "ppl": 4.8525, + "step": 13749 + }, + { + "epoch": 0.07, + "global_step": 13750, + "learning_rate": 0.0004434474123539232, + "loss": 1.5805, + "loss_base2": 2.2802, + "loss_pixel": 0.1458, + "loss_text": 1.4347, + "ppl": 4.8574, + "step": 13750 + } + ], + "logging_steps": 1.0, + "max_steps": 120000, + "num_input_tokens_seen": 0, + "num_train_epochs": 9223372036854775807, + "save_steps": 250, + "total_flos": 5.493394168086528e+19, + "train_batch_size": 16, + "trial_name": null, + "trial_params": null +}