{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "eval_steps": 500, "global_step": 8798, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 7.575757575757576e-07, "loss": 1.5995, "step": 1 }, { "epoch": 0.0, "learning_rate": 1.5151515151515152e-06, "loss": 1.6025, "step": 2 }, { "epoch": 0.0, "learning_rate": 2.2727272727272728e-06, "loss": 1.4831, "step": 3 }, { "epoch": 0.0, "learning_rate": 3.0303030303030305e-06, "loss": 1.4695, "step": 4 }, { "epoch": 0.0, "learning_rate": 3.7878787878787882e-06, "loss": 1.4307, "step": 5 }, { "epoch": 0.0, "learning_rate": 4.5454545454545455e-06, "loss": 1.6343, "step": 6 }, { "epoch": 0.0, "learning_rate": 5.303030303030304e-06, "loss": 1.5792, "step": 7 }, { "epoch": 0.0, "learning_rate": 6.060606060606061e-06, "loss": 1.6055, "step": 8 }, { "epoch": 0.0, "learning_rate": 6.818181818181818e-06, "loss": 1.5411, "step": 9 }, { "epoch": 0.0, "learning_rate": 7.5757575757575764e-06, "loss": 1.5648, "step": 10 }, { "epoch": 0.0, "learning_rate": 8.333333333333334e-06, "loss": 1.5765, "step": 11 }, { "epoch": 0.0, "learning_rate": 9.090909090909091e-06, "loss": 1.4917, "step": 12 }, { "epoch": 0.0, "learning_rate": 9.848484848484848e-06, "loss": 1.4627, "step": 13 }, { "epoch": 0.0, "learning_rate": 1.0606060606060607e-05, "loss": 1.535, "step": 14 }, { "epoch": 0.0, "learning_rate": 1.1363636363636365e-05, "loss": 1.5061, "step": 15 }, { "epoch": 0.0, "learning_rate": 1.2121212121212122e-05, "loss": 1.4243, "step": 16 }, { "epoch": 0.0, "learning_rate": 1.287878787878788e-05, "loss": 1.4347, "step": 17 }, { "epoch": 0.0, "learning_rate": 1.3636363636363637e-05, "loss": 1.392, "step": 18 }, { "epoch": 0.0, "learning_rate": 1.4393939393939396e-05, "loss": 1.286, "step": 19 }, { "epoch": 0.0, "learning_rate": 1.5151515151515153e-05, "loss": 1.361, "step": 20 }, { "epoch": 0.0, "learning_rate": 1.590909090909091e-05, "loss": 1.315, "step": 21 }, { "epoch": 0.0, "learning_rate": 1.6666666666666667e-05, "loss": 1.3442, "step": 22 }, { "epoch": 0.0, "learning_rate": 1.7424242424242425e-05, "loss": 1.3323, "step": 23 }, { "epoch": 0.0, "learning_rate": 1.8181818181818182e-05, "loss": 1.2389, "step": 24 }, { "epoch": 0.0, "learning_rate": 1.893939393939394e-05, "loss": 1.2699, "step": 25 }, { "epoch": 0.0, "learning_rate": 1.9696969696969697e-05, "loss": 1.3249, "step": 26 }, { "epoch": 0.0, "learning_rate": 2.0454545454545457e-05, "loss": 1.2126, "step": 27 }, { "epoch": 0.0, "learning_rate": 2.1212121212121215e-05, "loss": 1.119, "step": 28 }, { "epoch": 0.0, "learning_rate": 2.1969696969696972e-05, "loss": 1.2153, "step": 29 }, { "epoch": 0.0, "learning_rate": 2.272727272727273e-05, "loss": 1.1493, "step": 30 }, { "epoch": 0.0, "learning_rate": 2.3484848484848487e-05, "loss": 1.1045, "step": 31 }, { "epoch": 0.0, "learning_rate": 2.4242424242424244e-05, "loss": 1.2138, "step": 32 }, { "epoch": 0.0, "learning_rate": 2.5e-05, "loss": 1.198, "step": 33 }, { "epoch": 0.0, "learning_rate": 2.575757575757576e-05, "loss": 1.0751, "step": 34 }, { "epoch": 0.0, "learning_rate": 2.6515151515151516e-05, "loss": 1.1204, "step": 35 }, { "epoch": 0.0, "learning_rate": 2.7272727272727273e-05, "loss": 1.0627, "step": 36 }, { "epoch": 0.0, "learning_rate": 2.803030303030303e-05, "loss": 1.0095, "step": 37 }, { "epoch": 0.0, "learning_rate": 2.878787878787879e-05, "loss": 1.0867, "step": 38 }, { "epoch": 0.0, "learning_rate": 2.954545454545455e-05, "loss": 1.022, "step": 39 }, { "epoch": 0.0, "learning_rate": 3.0303030303030306e-05, "loss": 0.9918, "step": 40 }, { "epoch": 0.0, "learning_rate": 3.106060606060606e-05, "loss": 1.0799, "step": 41 }, { "epoch": 0.0, "learning_rate": 3.181818181818182e-05, "loss": 1.0433, "step": 42 }, { "epoch": 0.0, "learning_rate": 3.257575757575758e-05, "loss": 1.0452, "step": 43 }, { "epoch": 0.01, "learning_rate": 3.3333333333333335e-05, "loss": 1.0388, "step": 44 }, { "epoch": 0.01, "learning_rate": 3.409090909090909e-05, "loss": 0.9024, "step": 45 }, { "epoch": 0.01, "learning_rate": 3.484848484848485e-05, "loss": 0.9071, "step": 46 }, { "epoch": 0.01, "learning_rate": 3.560606060606061e-05, "loss": 0.9649, "step": 47 }, { "epoch": 0.01, "learning_rate": 3.6363636363636364e-05, "loss": 0.9558, "step": 48 }, { "epoch": 0.01, "learning_rate": 3.712121212121212e-05, "loss": 0.9204, "step": 49 }, { "epoch": 0.01, "learning_rate": 3.787878787878788e-05, "loss": 0.9331, "step": 50 }, { "epoch": 0.01, "learning_rate": 3.8636363636363636e-05, "loss": 0.9148, "step": 51 }, { "epoch": 0.01, "learning_rate": 3.939393939393939e-05, "loss": 0.9862, "step": 52 }, { "epoch": 0.01, "learning_rate": 4.015151515151515e-05, "loss": 0.8719, "step": 53 }, { "epoch": 0.01, "learning_rate": 4.0909090909090915e-05, "loss": 0.9002, "step": 54 }, { "epoch": 0.01, "learning_rate": 4.166666666666667e-05, "loss": 0.8577, "step": 55 }, { "epoch": 0.01, "learning_rate": 4.242424242424243e-05, "loss": 0.8679, "step": 56 }, { "epoch": 0.01, "learning_rate": 4.318181818181819e-05, "loss": 0.8387, "step": 57 }, { "epoch": 0.01, "learning_rate": 4.3939393939393944e-05, "loss": 0.8958, "step": 58 }, { "epoch": 0.01, "learning_rate": 4.46969696969697e-05, "loss": 0.9206, "step": 59 }, { "epoch": 0.01, "learning_rate": 4.545454545454546e-05, "loss": 0.8489, "step": 60 }, { "epoch": 0.01, "learning_rate": 4.621212121212121e-05, "loss": 0.8351, "step": 61 }, { "epoch": 0.01, "learning_rate": 4.696969696969697e-05, "loss": 0.7888, "step": 62 }, { "epoch": 0.01, "learning_rate": 4.772727272727273e-05, "loss": 0.8466, "step": 63 }, { "epoch": 0.01, "learning_rate": 4.848484848484849e-05, "loss": 0.8515, "step": 64 }, { "epoch": 0.01, "learning_rate": 4.9242424242424245e-05, "loss": 0.8029, "step": 65 }, { "epoch": 0.01, "learning_rate": 5e-05, "loss": 0.8999, "step": 66 }, { "epoch": 0.01, "learning_rate": 5.075757575757576e-05, "loss": 0.8562, "step": 67 }, { "epoch": 0.01, "learning_rate": 5.151515151515152e-05, "loss": 0.8236, "step": 68 }, { "epoch": 0.01, "learning_rate": 5.2272727272727274e-05, "loss": 0.7905, "step": 69 }, { "epoch": 0.01, "learning_rate": 5.303030303030303e-05, "loss": 0.7333, "step": 70 }, { "epoch": 0.01, "learning_rate": 5.378787878787879e-05, "loss": 0.8526, "step": 71 }, { "epoch": 0.01, "learning_rate": 5.4545454545454546e-05, "loss": 0.7108, "step": 72 }, { "epoch": 0.01, "learning_rate": 5.5303030303030304e-05, "loss": 0.7914, "step": 73 }, { "epoch": 0.01, "learning_rate": 5.606060606060606e-05, "loss": 0.7933, "step": 74 }, { "epoch": 0.01, "learning_rate": 5.6818181818181825e-05, "loss": 0.7208, "step": 75 }, { "epoch": 0.01, "learning_rate": 5.757575757575758e-05, "loss": 0.7895, "step": 76 }, { "epoch": 0.01, "learning_rate": 5.833333333333334e-05, "loss": 0.8261, "step": 77 }, { "epoch": 0.01, "learning_rate": 5.90909090909091e-05, "loss": 0.7813, "step": 78 }, { "epoch": 0.01, "learning_rate": 5.9848484848484854e-05, "loss": 0.843, "step": 79 }, { "epoch": 0.01, "learning_rate": 6.060606060606061e-05, "loss": 0.8309, "step": 80 }, { "epoch": 0.01, "learning_rate": 6.136363636363636e-05, "loss": 0.8095, "step": 81 }, { "epoch": 0.01, "learning_rate": 6.212121212121213e-05, "loss": 0.8043, "step": 82 }, { "epoch": 0.01, "learning_rate": 6.287878787878788e-05, "loss": 0.7685, "step": 83 }, { "epoch": 0.01, "learning_rate": 6.363636363636364e-05, "loss": 0.781, "step": 84 }, { "epoch": 0.01, "learning_rate": 6.439393939393939e-05, "loss": 0.7755, "step": 85 }, { "epoch": 0.01, "learning_rate": 6.515151515151516e-05, "loss": 0.8117, "step": 86 }, { "epoch": 0.01, "learning_rate": 6.59090909090909e-05, "loss": 0.7297, "step": 87 }, { "epoch": 0.01, "learning_rate": 6.666666666666667e-05, "loss": 0.6834, "step": 88 }, { "epoch": 0.01, "learning_rate": 6.742424242424242e-05, "loss": 0.7423, "step": 89 }, { "epoch": 0.01, "learning_rate": 6.818181818181818e-05, "loss": 0.7235, "step": 90 }, { "epoch": 0.01, "learning_rate": 6.893939393939395e-05, "loss": 0.7681, "step": 91 }, { "epoch": 0.01, "learning_rate": 6.96969696969697e-05, "loss": 0.8289, "step": 92 }, { "epoch": 0.01, "learning_rate": 7.045454545454546e-05, "loss": 0.7712, "step": 93 }, { "epoch": 0.01, "learning_rate": 7.121212121212121e-05, "loss": 0.8138, "step": 94 }, { "epoch": 0.01, "learning_rate": 7.196969696969698e-05, "loss": 0.8129, "step": 95 }, { "epoch": 0.01, "learning_rate": 7.272727272727273e-05, "loss": 0.7915, "step": 96 }, { "epoch": 0.01, "learning_rate": 7.348484848484849e-05, "loss": 0.7527, "step": 97 }, { "epoch": 0.01, "learning_rate": 7.424242424242424e-05, "loss": 0.728, "step": 98 }, { "epoch": 0.01, "learning_rate": 7.500000000000001e-05, "loss": 0.8122, "step": 99 }, { "epoch": 0.01, "learning_rate": 7.575757575757576e-05, "loss": 0.781, "step": 100 }, { "epoch": 0.01, "learning_rate": 7.651515151515152e-05, "loss": 0.8104, "step": 101 }, { "epoch": 0.01, "learning_rate": 7.727272727272727e-05, "loss": 0.7665, "step": 102 }, { "epoch": 0.01, "learning_rate": 7.803030303030304e-05, "loss": 0.7282, "step": 103 }, { "epoch": 0.01, "learning_rate": 7.878787878787879e-05, "loss": 0.773, "step": 104 }, { "epoch": 0.01, "learning_rate": 7.954545454545455e-05, "loss": 0.693, "step": 105 }, { "epoch": 0.01, "learning_rate": 8.03030303030303e-05, "loss": 0.7379, "step": 106 }, { "epoch": 0.01, "learning_rate": 8.106060606060607e-05, "loss": 0.8172, "step": 107 }, { "epoch": 0.01, "learning_rate": 8.181818181818183e-05, "loss": 0.7864, "step": 108 }, { "epoch": 0.01, "learning_rate": 8.257575757575758e-05, "loss": 0.7628, "step": 109 }, { "epoch": 0.01, "learning_rate": 8.333333333333334e-05, "loss": 0.7497, "step": 110 }, { "epoch": 0.01, "learning_rate": 8.40909090909091e-05, "loss": 0.7624, "step": 111 }, { "epoch": 0.01, "learning_rate": 8.484848484848486e-05, "loss": 0.7955, "step": 112 }, { "epoch": 0.01, "learning_rate": 8.560606060606061e-05, "loss": 0.7166, "step": 113 }, { "epoch": 0.01, "learning_rate": 8.636363636363637e-05, "loss": 0.7474, "step": 114 }, { "epoch": 0.01, "learning_rate": 8.712121212121212e-05, "loss": 0.7483, "step": 115 }, { "epoch": 0.01, "learning_rate": 8.787878787878789e-05, "loss": 0.7603, "step": 116 }, { "epoch": 0.01, "learning_rate": 8.863636363636364e-05, "loss": 0.6997, "step": 117 }, { "epoch": 0.01, "learning_rate": 8.93939393939394e-05, "loss": 0.7624, "step": 118 }, { "epoch": 0.01, "learning_rate": 9.015151515151515e-05, "loss": 0.8124, "step": 119 }, { "epoch": 0.01, "learning_rate": 9.090909090909092e-05, "loss": 0.7691, "step": 120 }, { "epoch": 0.01, "learning_rate": 9.166666666666667e-05, "loss": 0.7093, "step": 121 }, { "epoch": 0.01, "learning_rate": 9.242424242424242e-05, "loss": 0.7835, "step": 122 }, { "epoch": 0.01, "learning_rate": 9.318181818181818e-05, "loss": 0.7382, "step": 123 }, { "epoch": 0.01, "learning_rate": 9.393939393939395e-05, "loss": 0.7044, "step": 124 }, { "epoch": 0.01, "learning_rate": 9.469696969696971e-05, "loss": 0.7139, "step": 125 }, { "epoch": 0.01, "learning_rate": 9.545454545454546e-05, "loss": 0.7757, "step": 126 }, { "epoch": 0.01, "learning_rate": 9.621212121212123e-05, "loss": 0.7229, "step": 127 }, { "epoch": 0.01, "learning_rate": 9.696969696969698e-05, "loss": 0.7853, "step": 128 }, { "epoch": 0.01, "learning_rate": 9.772727272727274e-05, "loss": 0.7995, "step": 129 }, { "epoch": 0.01, "learning_rate": 9.848484848484849e-05, "loss": 0.7554, "step": 130 }, { "epoch": 0.01, "learning_rate": 9.924242424242425e-05, "loss": 0.7416, "step": 131 }, { "epoch": 0.02, "learning_rate": 0.0001, "loss": 0.818, "step": 132 }, { "epoch": 0.02, "learning_rate": 0.00010075757575757576, "loss": 0.7828, "step": 133 }, { "epoch": 0.02, "learning_rate": 0.00010151515151515152, "loss": 0.7223, "step": 134 }, { "epoch": 0.02, "learning_rate": 0.00010227272727272727, "loss": 0.7771, "step": 135 }, { "epoch": 0.02, "learning_rate": 0.00010303030303030303, "loss": 0.6789, "step": 136 }, { "epoch": 0.02, "learning_rate": 0.00010378787878787878, "loss": 0.6826, "step": 137 }, { "epoch": 0.02, "learning_rate": 0.00010454545454545455, "loss": 0.6783, "step": 138 }, { "epoch": 0.02, "learning_rate": 0.0001053030303030303, "loss": 0.7646, "step": 139 }, { "epoch": 0.02, "learning_rate": 0.00010606060606060606, "loss": 0.7434, "step": 140 }, { "epoch": 0.02, "learning_rate": 0.00010681818181818181, "loss": 0.7191, "step": 141 }, { "epoch": 0.02, "learning_rate": 0.00010757575757575758, "loss": 0.7552, "step": 142 }, { "epoch": 0.02, "learning_rate": 0.00010833333333333333, "loss": 0.7365, "step": 143 }, { "epoch": 0.02, "learning_rate": 0.00010909090909090909, "loss": 0.6914, "step": 144 }, { "epoch": 0.02, "learning_rate": 0.00010984848484848484, "loss": 0.7797, "step": 145 }, { "epoch": 0.02, "learning_rate": 0.00011060606060606061, "loss": 0.6578, "step": 146 }, { "epoch": 0.02, "learning_rate": 0.00011136363636363636, "loss": 0.7227, "step": 147 }, { "epoch": 0.02, "learning_rate": 0.00011212121212121212, "loss": 0.7927, "step": 148 }, { "epoch": 0.02, "learning_rate": 0.0001128787878787879, "loss": 0.7437, "step": 149 }, { "epoch": 0.02, "learning_rate": 0.00011363636363636365, "loss": 0.7025, "step": 150 }, { "epoch": 0.02, "learning_rate": 0.00011439393939393941, "loss": 0.7076, "step": 151 }, { "epoch": 0.02, "learning_rate": 0.00011515151515151516, "loss": 0.7536, "step": 152 }, { "epoch": 0.02, "learning_rate": 0.00011590909090909093, "loss": 0.7133, "step": 153 }, { "epoch": 0.02, "learning_rate": 0.00011666666666666668, "loss": 0.714, "step": 154 }, { "epoch": 0.02, "learning_rate": 0.00011742424242424244, "loss": 0.7317, "step": 155 }, { "epoch": 0.02, "learning_rate": 0.0001181818181818182, "loss": 0.7354, "step": 156 }, { "epoch": 0.02, "learning_rate": 0.00011893939393939394, "loss": 0.7589, "step": 157 }, { "epoch": 0.02, "learning_rate": 0.00011969696969696971, "loss": 0.7116, "step": 158 }, { "epoch": 0.02, "learning_rate": 0.00012045454545454546, "loss": 0.7484, "step": 159 }, { "epoch": 0.02, "learning_rate": 0.00012121212121212122, "loss": 0.798, "step": 160 }, { "epoch": 0.02, "learning_rate": 0.00012196969696969697, "loss": 0.7221, "step": 161 }, { "epoch": 0.02, "learning_rate": 0.00012272727272727272, "loss": 0.6626, "step": 162 }, { "epoch": 0.02, "learning_rate": 0.0001234848484848485, "loss": 0.6994, "step": 163 }, { "epoch": 0.02, "learning_rate": 0.00012424242424242425, "loss": 0.7012, "step": 164 }, { "epoch": 0.02, "learning_rate": 0.000125, "loss": 0.7106, "step": 165 }, { "epoch": 0.02, "learning_rate": 0.00012575757575757575, "loss": 0.692, "step": 166 }, { "epoch": 0.02, "learning_rate": 0.00012651515151515153, "loss": 0.7247, "step": 167 }, { "epoch": 0.02, "learning_rate": 0.00012727272727272728, "loss": 0.6732, "step": 168 }, { "epoch": 0.02, "learning_rate": 0.00012803030303030303, "loss": 0.6409, "step": 169 }, { "epoch": 0.02, "learning_rate": 0.00012878787878787878, "loss": 0.7322, "step": 170 }, { "epoch": 0.02, "learning_rate": 0.00012954545454545456, "loss": 0.7139, "step": 171 }, { "epoch": 0.02, "learning_rate": 0.0001303030303030303, "loss": 0.7374, "step": 172 }, { "epoch": 0.02, "learning_rate": 0.00013106060606060606, "loss": 0.7569, "step": 173 }, { "epoch": 0.02, "learning_rate": 0.0001318181818181818, "loss": 0.7279, "step": 174 }, { "epoch": 0.02, "learning_rate": 0.00013257575757575756, "loss": 0.7603, "step": 175 }, { "epoch": 0.02, "learning_rate": 0.00013333333333333334, "loss": 0.7119, "step": 176 }, { "epoch": 0.02, "learning_rate": 0.0001340909090909091, "loss": 0.7334, "step": 177 }, { "epoch": 0.02, "learning_rate": 0.00013484848484848484, "loss": 0.7814, "step": 178 }, { "epoch": 0.02, "learning_rate": 0.0001356060606060606, "loss": 0.7224, "step": 179 }, { "epoch": 0.02, "learning_rate": 0.00013636363636363637, "loss": 0.6868, "step": 180 }, { "epoch": 0.02, "learning_rate": 0.00013712121212121212, "loss": 0.6848, "step": 181 }, { "epoch": 0.02, "learning_rate": 0.0001378787878787879, "loss": 0.7315, "step": 182 }, { "epoch": 0.02, "learning_rate": 0.00013863636363636365, "loss": 0.7569, "step": 183 }, { "epoch": 0.02, "learning_rate": 0.0001393939393939394, "loss": 0.7048, "step": 184 }, { "epoch": 0.02, "learning_rate": 0.00014015151515151518, "loss": 0.7271, "step": 185 }, { "epoch": 0.02, "learning_rate": 0.00014090909090909093, "loss": 0.7272, "step": 186 }, { "epoch": 0.02, "learning_rate": 0.00014166666666666668, "loss": 0.6641, "step": 187 }, { "epoch": 0.02, "learning_rate": 0.00014242424242424243, "loss": 0.722, "step": 188 }, { "epoch": 0.02, "learning_rate": 0.0001431818181818182, "loss": 0.7036, "step": 189 }, { "epoch": 0.02, "learning_rate": 0.00014393939393939396, "loss": 0.7264, "step": 190 }, { "epoch": 0.02, "learning_rate": 0.0001446969696969697, "loss": 0.7525, "step": 191 }, { "epoch": 0.02, "learning_rate": 0.00014545454545454546, "loss": 0.7027, "step": 192 }, { "epoch": 0.02, "learning_rate": 0.00014621212121212123, "loss": 0.6899, "step": 193 }, { "epoch": 0.02, "learning_rate": 0.00014696969696969698, "loss": 0.7701, "step": 194 }, { "epoch": 0.02, "learning_rate": 0.00014772727272727274, "loss": 0.7382, "step": 195 }, { "epoch": 0.02, "learning_rate": 0.00014848484848484849, "loss": 0.7306, "step": 196 }, { "epoch": 0.02, "learning_rate": 0.00014924242424242426, "loss": 0.7352, "step": 197 }, { "epoch": 0.02, "learning_rate": 0.00015000000000000001, "loss": 0.6955, "step": 198 }, { "epoch": 0.02, "learning_rate": 0.00015075757575757576, "loss": 0.7586, "step": 199 }, { "epoch": 0.02, "learning_rate": 0.00015151515151515152, "loss": 0.6703, "step": 200 }, { "epoch": 0.02, "learning_rate": 0.00015227272727272727, "loss": 0.6897, "step": 201 }, { "epoch": 0.02, "learning_rate": 0.00015303030303030304, "loss": 0.7703, "step": 202 }, { "epoch": 0.02, "learning_rate": 0.0001537878787878788, "loss": 0.6606, "step": 203 }, { "epoch": 0.02, "learning_rate": 0.00015454545454545454, "loss": 0.6923, "step": 204 }, { "epoch": 0.02, "learning_rate": 0.0001553030303030303, "loss": 0.7373, "step": 205 }, { "epoch": 0.02, "learning_rate": 0.00015606060606060607, "loss": 0.7156, "step": 206 }, { "epoch": 0.02, "learning_rate": 0.00015681818181818182, "loss": 0.6811, "step": 207 }, { "epoch": 0.02, "learning_rate": 0.00015757575757575757, "loss": 0.8106, "step": 208 }, { "epoch": 0.02, "learning_rate": 0.00015833333333333332, "loss": 0.7062, "step": 209 }, { "epoch": 0.02, "learning_rate": 0.0001590909090909091, "loss": 0.6753, "step": 210 }, { "epoch": 0.02, "learning_rate": 0.00015984848484848485, "loss": 0.7017, "step": 211 }, { "epoch": 0.02, "learning_rate": 0.0001606060606060606, "loss": 0.7287, "step": 212 }, { "epoch": 0.02, "learning_rate": 0.00016136363636363635, "loss": 0.7194, "step": 213 }, { "epoch": 0.02, "learning_rate": 0.00016212121212121213, "loss": 0.6861, "step": 214 }, { "epoch": 0.02, "learning_rate": 0.0001628787878787879, "loss": 0.7645, "step": 215 }, { "epoch": 0.02, "learning_rate": 0.00016363636363636366, "loss": 0.7142, "step": 216 }, { "epoch": 0.02, "learning_rate": 0.0001643939393939394, "loss": 0.7509, "step": 217 }, { "epoch": 0.02, "learning_rate": 0.00016515151515151516, "loss": 0.7741, "step": 218 }, { "epoch": 0.02, "learning_rate": 0.00016590909090909094, "loss": 0.7265, "step": 219 }, { "epoch": 0.03, "learning_rate": 0.0001666666666666667, "loss": 0.7701, "step": 220 }, { "epoch": 0.03, "learning_rate": 0.00016742424242424244, "loss": 0.7368, "step": 221 }, { "epoch": 0.03, "learning_rate": 0.0001681818181818182, "loss": 0.7427, "step": 222 }, { "epoch": 0.03, "learning_rate": 0.00016893939393939394, "loss": 0.7352, "step": 223 }, { "epoch": 0.03, "learning_rate": 0.00016969696969696972, "loss": 0.723, "step": 224 }, { "epoch": 0.03, "learning_rate": 0.00017045454545454547, "loss": 0.7167, "step": 225 }, { "epoch": 0.03, "learning_rate": 0.00017121212121212122, "loss": 0.8083, "step": 226 }, { "epoch": 0.03, "learning_rate": 0.00017196969696969697, "loss": 0.7055, "step": 227 }, { "epoch": 0.03, "learning_rate": 0.00017272727272727275, "loss": 0.7748, "step": 228 }, { "epoch": 0.03, "learning_rate": 0.0001734848484848485, "loss": 0.73, "step": 229 }, { "epoch": 0.03, "learning_rate": 0.00017424242424242425, "loss": 0.7219, "step": 230 }, { "epoch": 0.03, "learning_rate": 0.000175, "loss": 0.7062, "step": 231 }, { "epoch": 0.03, "learning_rate": 0.00017575757575757578, "loss": 0.7143, "step": 232 }, { "epoch": 0.03, "learning_rate": 0.00017651515151515153, "loss": 0.6966, "step": 233 }, { "epoch": 0.03, "learning_rate": 0.00017727272727272728, "loss": 0.7514, "step": 234 }, { "epoch": 0.03, "learning_rate": 0.00017803030303030303, "loss": 0.7177, "step": 235 }, { "epoch": 0.03, "learning_rate": 0.0001787878787878788, "loss": 0.7685, "step": 236 }, { "epoch": 0.03, "learning_rate": 0.00017954545454545456, "loss": 0.7558, "step": 237 }, { "epoch": 0.03, "learning_rate": 0.0001803030303030303, "loss": 0.7791, "step": 238 }, { "epoch": 0.03, "learning_rate": 0.00018106060606060606, "loss": 0.7528, "step": 239 }, { "epoch": 0.03, "learning_rate": 0.00018181818181818183, "loss": 0.7807, "step": 240 }, { "epoch": 0.03, "learning_rate": 0.00018257575757575758, "loss": 0.7117, "step": 241 }, { "epoch": 0.03, "learning_rate": 0.00018333333333333334, "loss": 0.7482, "step": 242 }, { "epoch": 0.03, "learning_rate": 0.00018409090909090909, "loss": 0.7198, "step": 243 }, { "epoch": 0.03, "learning_rate": 0.00018484848484848484, "loss": 0.7819, "step": 244 }, { "epoch": 0.03, "learning_rate": 0.00018560606060606061, "loss": 0.7053, "step": 245 }, { "epoch": 0.03, "learning_rate": 0.00018636363636363636, "loss": 0.7614, "step": 246 }, { "epoch": 0.03, "learning_rate": 0.00018712121212121212, "loss": 0.748, "step": 247 }, { "epoch": 0.03, "learning_rate": 0.0001878787878787879, "loss": 0.7459, "step": 248 }, { "epoch": 0.03, "learning_rate": 0.00018863636363636364, "loss": 0.6916, "step": 249 }, { "epoch": 0.03, "learning_rate": 0.00018939393939393942, "loss": 0.681, "step": 250 }, { "epoch": 0.03, "learning_rate": 0.00019015151515151517, "loss": 0.7689, "step": 251 }, { "epoch": 0.03, "learning_rate": 0.00019090909090909092, "loss": 0.7515, "step": 252 }, { "epoch": 0.03, "learning_rate": 0.00019166666666666667, "loss": 0.7611, "step": 253 }, { "epoch": 0.03, "learning_rate": 0.00019242424242424245, "loss": 0.7107, "step": 254 }, { "epoch": 0.03, "learning_rate": 0.0001931818181818182, "loss": 0.7695, "step": 255 }, { "epoch": 0.03, "learning_rate": 0.00019393939393939395, "loss": 0.7917, "step": 256 }, { "epoch": 0.03, "learning_rate": 0.0001946969696969697, "loss": 0.7511, "step": 257 }, { "epoch": 0.03, "learning_rate": 0.00019545454545454548, "loss": 0.7098, "step": 258 }, { "epoch": 0.03, "learning_rate": 0.00019621212121212123, "loss": 0.6834, "step": 259 }, { "epoch": 0.03, "learning_rate": 0.00019696969696969698, "loss": 0.7538, "step": 260 }, { "epoch": 0.03, "learning_rate": 0.00019772727272727273, "loss": 0.6989, "step": 261 }, { "epoch": 0.03, "learning_rate": 0.0001984848484848485, "loss": 0.7197, "step": 262 }, { "epoch": 0.03, "learning_rate": 0.00019924242424242426, "loss": 0.6967, "step": 263 }, { "epoch": 0.03, "learning_rate": 0.0002, "loss": 0.7553, "step": 264 }, { "epoch": 0.03, "learning_rate": 0.00019999999322413935, "loss": 0.7642, "step": 265 }, { "epoch": 0.03, "learning_rate": 0.0001999999728965582, "loss": 0.6531, "step": 266 }, { "epoch": 0.03, "learning_rate": 0.0001999999390172594, "loss": 0.7051, "step": 267 }, { "epoch": 0.03, "learning_rate": 0.0001999998915862475, "loss": 0.749, "step": 268 }, { "epoch": 0.03, "learning_rate": 0.00019999983060352893, "loss": 0.7684, "step": 269 }, { "epoch": 0.03, "learning_rate": 0.00019999975606911193, "loss": 0.6728, "step": 270 }, { "epoch": 0.03, "learning_rate": 0.00019999966798300668, "loss": 0.6686, "step": 271 }, { "epoch": 0.03, "learning_rate": 0.00019999956634522502, "loss": 0.7544, "step": 272 }, { "epoch": 0.03, "learning_rate": 0.0001999994511557808, "loss": 0.6754, "step": 273 }, { "epoch": 0.03, "learning_rate": 0.00019999932241468956, "loss": 0.6706, "step": 274 }, { "epoch": 0.03, "learning_rate": 0.00019999918012196882, "loss": 0.666, "step": 275 }, { "epoch": 0.03, "learning_rate": 0.0001999990242776378, "loss": 0.6977, "step": 276 }, { "epoch": 0.03, "learning_rate": 0.0001999988548817177, "loss": 0.709, "step": 277 }, { "epoch": 0.03, "learning_rate": 0.00019999867193423138, "loss": 0.7909, "step": 278 }, { "epoch": 0.03, "learning_rate": 0.0001999984754352037, "loss": 0.7193, "step": 279 }, { "epoch": 0.03, "learning_rate": 0.00019999826538466125, "loss": 0.706, "step": 280 }, { "epoch": 0.03, "learning_rate": 0.0001999980417826325, "loss": 0.719, "step": 281 }, { "epoch": 0.03, "learning_rate": 0.00019999780462914778, "loss": 0.6676, "step": 282 }, { "epoch": 0.03, "learning_rate": 0.0001999975539242392, "loss": 0.677, "step": 283 }, { "epoch": 0.03, "learning_rate": 0.00019999728966794075, "loss": 0.6579, "step": 284 }, { "epoch": 0.03, "learning_rate": 0.00019999701186028824, "loss": 0.7432, "step": 285 }, { "epoch": 0.03, "learning_rate": 0.0001999967205013193, "loss": 0.6932, "step": 286 }, { "epoch": 0.03, "learning_rate": 0.00019999641559107344, "loss": 0.7486, "step": 287 }, { "epoch": 0.03, "learning_rate": 0.00019999609712959197, "loss": 0.6979, "step": 288 }, { "epoch": 0.03, "learning_rate": 0.00019999576511691808, "loss": 0.7139, "step": 289 }, { "epoch": 0.03, "learning_rate": 0.00019999541955309668, "loss": 0.6846, "step": 290 }, { "epoch": 0.03, "learning_rate": 0.00019999506043817466, "loss": 0.7428, "step": 291 }, { "epoch": 0.03, "learning_rate": 0.00019999468777220068, "loss": 0.7131, "step": 292 }, { "epoch": 0.03, "learning_rate": 0.00019999430155522526, "loss": 0.7232, "step": 293 }, { "epoch": 0.03, "learning_rate": 0.00019999390178730068, "loss": 0.7035, "step": 294 }, { "epoch": 0.03, "learning_rate": 0.0001999934884684812, "loss": 0.7583, "step": 295 }, { "epoch": 0.03, "learning_rate": 0.00019999306159882273, "loss": 0.6763, "step": 296 }, { "epoch": 0.03, "learning_rate": 0.0001999926211783832, "loss": 0.7212, "step": 297 }, { "epoch": 0.03, "learning_rate": 0.00019999216720722226, "loss": 0.7111, "step": 298 }, { "epoch": 0.03, "learning_rate": 0.00019999169968540144, "loss": 0.7161, "step": 299 }, { "epoch": 0.03, "learning_rate": 0.0001999912186129841, "loss": 0.7399, "step": 300 }, { "epoch": 0.03, "learning_rate": 0.00019999072399003547, "loss": 0.7176, "step": 301 }, { "epoch": 0.03, "learning_rate": 0.00019999021581662248, "loss": 0.7674, "step": 302 }, { "epoch": 0.03, "learning_rate": 0.0001999896940928141, "loss": 0.7091, "step": 303 }, { "epoch": 0.03, "learning_rate": 0.00019998915881868094, "loss": 0.697, "step": 304 }, { "epoch": 0.03, "learning_rate": 0.00019998860999429562, "loss": 0.7033, "step": 305 }, { "epoch": 0.03, "learning_rate": 0.0001999880476197325, "loss": 0.7153, "step": 306 }, { "epoch": 0.03, "learning_rate": 0.00019998747169506774, "loss": 0.7831, "step": 307 }, { "epoch": 0.04, "learning_rate": 0.0001999868822203794, "loss": 0.7075, "step": 308 }, { "epoch": 0.04, "learning_rate": 0.00019998627919574745, "loss": 0.7312, "step": 309 }, { "epoch": 0.04, "learning_rate": 0.0001999856626212535, "loss": 0.7604, "step": 310 }, { "epoch": 0.04, "learning_rate": 0.00019998503249698117, "loss": 0.7787, "step": 311 }, { "epoch": 0.04, "learning_rate": 0.00019998438882301583, "loss": 0.6982, "step": 312 }, { "epoch": 0.04, "learning_rate": 0.0001999837315994447, "loss": 0.7288, "step": 313 }, { "epoch": 0.04, "learning_rate": 0.00019998306082635688, "loss": 0.7258, "step": 314 }, { "epoch": 0.04, "learning_rate": 0.00019998237650384324, "loss": 0.6941, "step": 315 }, { "epoch": 0.04, "learning_rate": 0.00019998167863199653, "loss": 0.672, "step": 316 }, { "epoch": 0.04, "learning_rate": 0.00019998096721091132, "loss": 0.683, "step": 317 }, { "epoch": 0.04, "learning_rate": 0.00019998024224068402, "loss": 0.7613, "step": 318 }, { "epoch": 0.04, "learning_rate": 0.0001999795037214129, "loss": 0.7346, "step": 319 }, { "epoch": 0.04, "learning_rate": 0.000199978751653198, "loss": 0.7294, "step": 320 }, { "epoch": 0.04, "learning_rate": 0.00019997798603614122, "loss": 0.662, "step": 321 }, { "epoch": 0.04, "learning_rate": 0.0001999772068703464, "loss": 0.7724, "step": 322 }, { "epoch": 0.04, "learning_rate": 0.00019997641415591904, "loss": 0.646, "step": 323 }, { "epoch": 0.04, "learning_rate": 0.00019997560789296665, "loss": 0.7418, "step": 324 }, { "epoch": 0.04, "learning_rate": 0.00019997478808159844, "loss": 0.6962, "step": 325 }, { "epoch": 0.04, "learning_rate": 0.00019997395472192553, "loss": 0.7101, "step": 326 }, { "epoch": 0.04, "learning_rate": 0.0001999731078140608, "loss": 0.7226, "step": 327 }, { "epoch": 0.04, "learning_rate": 0.00019997224735811912, "loss": 0.7468, "step": 328 }, { "epoch": 0.04, "learning_rate": 0.000199971373354217, "loss": 0.7187, "step": 329 }, { "epoch": 0.04, "learning_rate": 0.00019997048580247295, "loss": 0.7544, "step": 330 }, { "epoch": 0.04, "learning_rate": 0.0001999695847030072, "loss": 0.7001, "step": 331 }, { "epoch": 0.04, "learning_rate": 0.0001999686700559419, "loss": 0.7345, "step": 332 }, { "epoch": 0.04, "learning_rate": 0.00019996774186140098, "loss": 0.7311, "step": 333 }, { "epoch": 0.04, "learning_rate": 0.00019996680011951027, "loss": 0.644, "step": 334 }, { "epoch": 0.04, "learning_rate": 0.00019996584483039732, "loss": 0.7856, "step": 335 }, { "epoch": 0.04, "learning_rate": 0.0001999648759941916, "loss": 0.7299, "step": 336 }, { "epoch": 0.04, "learning_rate": 0.0001999638936110245, "loss": 0.6912, "step": 337 }, { "epoch": 0.04, "learning_rate": 0.000199962897681029, "loss": 0.7478, "step": 338 }, { "epoch": 0.04, "learning_rate": 0.00019996188820434017, "loss": 0.6739, "step": 339 }, { "epoch": 0.04, "learning_rate": 0.00019996086518109482, "loss": 0.6303, "step": 340 }, { "epoch": 0.04, "learning_rate": 0.00019995982861143152, "loss": 0.7578, "step": 341 }, { "epoch": 0.04, "learning_rate": 0.00019995877849549078, "loss": 0.6493, "step": 342 }, { "epoch": 0.04, "learning_rate": 0.0001999577148334149, "loss": 0.7605, "step": 343 }, { "epoch": 0.04, "learning_rate": 0.00019995663762534805, "loss": 0.7031, "step": 344 }, { "epoch": 0.04, "learning_rate": 0.00019995554687143616, "loss": 0.7524, "step": 345 }, { "epoch": 0.04, "learning_rate": 0.00019995444257182708, "loss": 0.6828, "step": 346 }, { "epoch": 0.04, "learning_rate": 0.00019995332472667047, "loss": 0.645, "step": 347 }, { "epoch": 0.04, "learning_rate": 0.0001999521933361178, "loss": 0.6334, "step": 348 }, { "epoch": 0.04, "learning_rate": 0.00019995104840032238, "loss": 0.6931, "step": 349 }, { "epoch": 0.04, "learning_rate": 0.0001999498899194394, "loss": 0.7439, "step": 350 }, { "epoch": 0.04, "learning_rate": 0.00019994871789362584, "loss": 0.6747, "step": 351 }, { "epoch": 0.04, "learning_rate": 0.0001999475323230405, "loss": 0.698, "step": 352 }, { "epoch": 0.04, "learning_rate": 0.00019994633320784413, "loss": 0.7182, "step": 353 }, { "epoch": 0.04, "learning_rate": 0.00019994512054819912, "loss": 0.6275, "step": 354 }, { "epoch": 0.04, "learning_rate": 0.00019994389434426987, "loss": 0.7275, "step": 355 }, { "epoch": 0.04, "learning_rate": 0.0001999426545962226, "loss": 0.6177, "step": 356 }, { "epoch": 0.04, "learning_rate": 0.0001999414013042252, "loss": 0.7316, "step": 357 }, { "epoch": 0.04, "learning_rate": 0.0001999401344684476, "loss": 0.7488, "step": 358 }, { "epoch": 0.04, "learning_rate": 0.00019993885408906145, "loss": 0.6801, "step": 359 }, { "epoch": 0.04, "learning_rate": 0.00019993756016624024, "loss": 0.6955, "step": 360 }, { "epoch": 0.04, "learning_rate": 0.00019993625270015933, "loss": 0.6636, "step": 361 }, { "epoch": 0.04, "learning_rate": 0.00019993493169099592, "loss": 0.7255, "step": 362 }, { "epoch": 0.04, "learning_rate": 0.00019993359713892908, "loss": 0.6432, "step": 363 }, { "epoch": 0.04, "learning_rate": 0.00019993224904413958, "loss": 0.7182, "step": 364 }, { "epoch": 0.04, "learning_rate": 0.0001999308874068101, "loss": 0.7522, "step": 365 }, { "epoch": 0.04, "learning_rate": 0.00019992951222712527, "loss": 0.7633, "step": 366 }, { "epoch": 0.04, "learning_rate": 0.00019992812350527137, "loss": 0.7535, "step": 367 }, { "epoch": 0.04, "learning_rate": 0.00019992672124143662, "loss": 0.7125, "step": 368 }, { "epoch": 0.04, "learning_rate": 0.00019992530543581102, "loss": 0.7948, "step": 369 }, { "epoch": 0.04, "learning_rate": 0.00019992387608858646, "loss": 0.7442, "step": 370 }, { "epoch": 0.04, "learning_rate": 0.00019992243319995665, "loss": 0.7059, "step": 371 }, { "epoch": 0.04, "learning_rate": 0.00019992097677011712, "loss": 0.6887, "step": 372 }, { "epoch": 0.04, "learning_rate": 0.00019991950679926524, "loss": 0.7325, "step": 373 }, { "epoch": 0.04, "learning_rate": 0.00019991802328760022, "loss": 0.7474, "step": 374 }, { "epoch": 0.04, "learning_rate": 0.0001999165262353231, "loss": 0.7128, "step": 375 }, { "epoch": 0.04, "learning_rate": 0.00019991501564263674, "loss": 0.7067, "step": 376 }, { "epoch": 0.04, "learning_rate": 0.00019991349150974585, "loss": 0.7511, "step": 377 }, { "epoch": 0.04, "learning_rate": 0.000199911953836857, "loss": 0.7164, "step": 378 }, { "epoch": 0.04, "learning_rate": 0.00019991040262417857, "loss": 0.7067, "step": 379 }, { "epoch": 0.04, "learning_rate": 0.00019990883787192077, "loss": 0.7185, "step": 380 }, { "epoch": 0.04, "learning_rate": 0.00019990725958029564, "loss": 0.7612, "step": 381 }, { "epoch": 0.04, "learning_rate": 0.00019990566774951706, "loss": 0.6974, "step": 382 }, { "epoch": 0.04, "learning_rate": 0.0001999040623798008, "loss": 0.6824, "step": 383 }, { "epoch": 0.04, "learning_rate": 0.00019990244347136432, "loss": 0.6644, "step": 384 }, { "epoch": 0.04, "learning_rate": 0.00019990081102442712, "loss": 0.6808, "step": 385 }, { "epoch": 0.04, "learning_rate": 0.00019989916503921034, "loss": 0.7419, "step": 386 }, { "epoch": 0.04, "learning_rate": 0.00019989750551593712, "loss": 0.6889, "step": 387 }, { "epoch": 0.04, "learning_rate": 0.0001998958324548323, "loss": 0.7186, "step": 388 }, { "epoch": 0.04, "learning_rate": 0.00019989414585612258, "loss": 0.6781, "step": 389 }, { "epoch": 0.04, "learning_rate": 0.00019989244572003658, "loss": 0.7318, "step": 390 }, { "epoch": 0.04, "learning_rate": 0.00019989073204680467, "loss": 0.6751, "step": 391 }, { "epoch": 0.04, "learning_rate": 0.0001998890048366591, "loss": 0.766, "step": 392 }, { "epoch": 0.04, "learning_rate": 0.0001998872640898339, "loss": 0.7055, "step": 393 }, { "epoch": 0.04, "learning_rate": 0.000199885509806565, "loss": 0.7034, "step": 394 }, { "epoch": 0.04, "learning_rate": 0.00019988374198709016, "loss": 0.6496, "step": 395 }, { "epoch": 0.05, "learning_rate": 0.0001998819606316489, "loss": 0.6554, "step": 396 }, { "epoch": 0.05, "learning_rate": 0.00019988016574048266, "loss": 0.6756, "step": 397 }, { "epoch": 0.05, "learning_rate": 0.00019987835731383467, "loss": 0.732, "step": 398 }, { "epoch": 0.05, "learning_rate": 0.00019987653535194998, "loss": 0.7026, "step": 399 }, { "epoch": 0.05, "learning_rate": 0.00019987469985507553, "loss": 0.6752, "step": 400 }, { "epoch": 0.05, "learning_rate": 0.00019987285082346005, "loss": 0.6729, "step": 401 }, { "epoch": 0.05, "learning_rate": 0.00019987098825735412, "loss": 0.693, "step": 402 }, { "epoch": 0.05, "learning_rate": 0.0001998691121570101, "loss": 0.6494, "step": 403 }, { "epoch": 0.05, "learning_rate": 0.0001998672225226823, "loss": 0.669, "step": 404 }, { "epoch": 0.05, "learning_rate": 0.0001998653193546268, "loss": 0.692, "step": 405 }, { "epoch": 0.05, "learning_rate": 0.00019986340265310147, "loss": 0.7303, "step": 406 }, { "epoch": 0.05, "learning_rate": 0.00019986147241836605, "loss": 0.7372, "step": 407 }, { "epoch": 0.05, "learning_rate": 0.00019985952865068216, "loss": 0.6224, "step": 408 }, { "epoch": 0.05, "learning_rate": 0.0001998575713503132, "loss": 0.6677, "step": 409 }, { "epoch": 0.05, "learning_rate": 0.0001998556005175244, "loss": 0.6783, "step": 410 }, { "epoch": 0.05, "learning_rate": 0.00019985361615258287, "loss": 0.7357, "step": 411 }, { "epoch": 0.05, "learning_rate": 0.0001998516182557575, "loss": 0.7206, "step": 412 }, { "epoch": 0.05, "learning_rate": 0.00019984960682731907, "loss": 0.672, "step": 413 }, { "epoch": 0.05, "learning_rate": 0.00019984758186754014, "loss": 0.687, "step": 414 }, { "epoch": 0.05, "learning_rate": 0.00019984554337669513, "loss": 0.7123, "step": 415 }, { "epoch": 0.05, "learning_rate": 0.00019984349135506027, "loss": 0.6826, "step": 416 }, { "epoch": 0.05, "learning_rate": 0.00019984142580291368, "loss": 0.7343, "step": 417 }, { "epoch": 0.05, "learning_rate": 0.00019983934672053525, "loss": 0.6705, "step": 418 }, { "epoch": 0.05, "learning_rate": 0.00019983725410820677, "loss": 0.6797, "step": 419 }, { "epoch": 0.05, "learning_rate": 0.00019983514796621178, "loss": 0.7025, "step": 420 }, { "epoch": 0.05, "learning_rate": 0.00019983302829483575, "loss": 0.7427, "step": 421 }, { "epoch": 0.05, "learning_rate": 0.00019983089509436589, "loss": 0.6882, "step": 422 }, { "epoch": 0.05, "learning_rate": 0.00019982874836509126, "loss": 0.6923, "step": 423 }, { "epoch": 0.05, "learning_rate": 0.00019982658810730283, "loss": 0.7128, "step": 424 }, { "epoch": 0.05, "learning_rate": 0.00019982441432129334, "loss": 0.7191, "step": 425 }, { "epoch": 0.05, "learning_rate": 0.0001998222270073574, "loss": 0.7117, "step": 426 }, { "epoch": 0.05, "learning_rate": 0.0001998200261657914, "loss": 0.7754, "step": 427 }, { "epoch": 0.05, "learning_rate": 0.00019981781179689354, "loss": 0.6957, "step": 428 }, { "epoch": 0.05, "learning_rate": 0.000199815583900964, "loss": 0.6595, "step": 429 }, { "epoch": 0.05, "learning_rate": 0.00019981334247830463, "loss": 0.6977, "step": 430 }, { "epoch": 0.05, "learning_rate": 0.00019981108752921924, "loss": 0.6631, "step": 431 }, { "epoch": 0.05, "learning_rate": 0.00019980881905401336, "loss": 0.6981, "step": 432 }, { "epoch": 0.05, "learning_rate": 0.00019980653705299446, "loss": 0.6981, "step": 433 }, { "epoch": 0.05, "learning_rate": 0.00019980424152647171, "loss": 0.747, "step": 434 }, { "epoch": 0.05, "learning_rate": 0.00019980193247475628, "loss": 0.6993, "step": 435 }, { "epoch": 0.05, "learning_rate": 0.00019979960989816104, "loss": 0.7171, "step": 436 }, { "epoch": 0.05, "learning_rate": 0.00019979727379700076, "loss": 0.6882, "step": 437 }, { "epoch": 0.05, "learning_rate": 0.000199794924171592, "loss": 0.7085, "step": 438 }, { "epoch": 0.05, "learning_rate": 0.00019979256102225316, "loss": 0.6876, "step": 439 }, { "epoch": 0.05, "learning_rate": 0.00019979018434930455, "loss": 0.6769, "step": 440 }, { "epoch": 0.05, "learning_rate": 0.00019978779415306822, "loss": 0.7362, "step": 441 }, { "epoch": 0.05, "learning_rate": 0.00019978539043386803, "loss": 0.7144, "step": 442 }, { "epoch": 0.05, "learning_rate": 0.0001997829731920298, "loss": 0.6396, "step": 443 }, { "epoch": 0.05, "learning_rate": 0.00019978054242788108, "loss": 0.7016, "step": 444 }, { "epoch": 0.05, "learning_rate": 0.00019977809814175127, "loss": 0.7393, "step": 445 }, { "epoch": 0.05, "learning_rate": 0.00019977564033397163, "loss": 0.639, "step": 446 }, { "epoch": 0.05, "learning_rate": 0.00019977316900487524, "loss": 0.6987, "step": 447 }, { "epoch": 0.05, "learning_rate": 0.00019977068415479696, "loss": 0.7098, "step": 448 }, { "epoch": 0.05, "learning_rate": 0.00019976818578407358, "loss": 0.6645, "step": 449 }, { "epoch": 0.05, "learning_rate": 0.00019976567389304366, "loss": 0.7033, "step": 450 }, { "epoch": 0.05, "learning_rate": 0.0001997631484820476, "loss": 0.72, "step": 451 }, { "epoch": 0.05, "learning_rate": 0.00019976060955142764, "loss": 0.7009, "step": 452 }, { "epoch": 0.05, "learning_rate": 0.00019975805710152787, "loss": 0.7107, "step": 453 }, { "epoch": 0.05, "learning_rate": 0.0001997554911326941, "loss": 0.7628, "step": 454 }, { "epoch": 0.05, "learning_rate": 0.0001997529116452742, "loss": 0.7107, "step": 455 }, { "epoch": 0.05, "learning_rate": 0.00019975031863961765, "loss": 0.6465, "step": 456 }, { "epoch": 0.05, "learning_rate": 0.00019974771211607586, "loss": 0.7002, "step": 457 }, { "epoch": 0.05, "learning_rate": 0.00019974509207500206, "loss": 0.758, "step": 458 }, { "epoch": 0.05, "learning_rate": 0.00019974245851675127, "loss": 0.7378, "step": 459 }, { "epoch": 0.05, "learning_rate": 0.0001997398114416805, "loss": 0.7141, "step": 460 }, { "epoch": 0.05, "learning_rate": 0.00019973715085014833, "loss": 0.7103, "step": 461 }, { "epoch": 0.05, "learning_rate": 0.00019973447674251544, "loss": 0.7204, "step": 462 }, { "epoch": 0.05, "learning_rate": 0.00019973178911914414, "loss": 0.6908, "step": 463 }, { "epoch": 0.05, "learning_rate": 0.00019972908798039865, "loss": 0.6952, "step": 464 }, { "epoch": 0.05, "learning_rate": 0.00019972637332664507, "loss": 0.7316, "step": 465 }, { "epoch": 0.05, "learning_rate": 0.00019972364515825127, "loss": 0.7026, "step": 466 }, { "epoch": 0.05, "learning_rate": 0.00019972090347558693, "loss": 0.7349, "step": 467 }, { "epoch": 0.05, "learning_rate": 0.0001997181482790236, "loss": 0.6927, "step": 468 }, { "epoch": 0.05, "learning_rate": 0.00019971537956893468, "loss": 0.7065, "step": 469 }, { "epoch": 0.05, "learning_rate": 0.00019971259734569537, "loss": 0.5994, "step": 470 }, { "epoch": 0.05, "learning_rate": 0.0001997098016096827, "loss": 0.7561, "step": 471 }, { "epoch": 0.05, "learning_rate": 0.00019970699236127555, "loss": 0.7264, "step": 472 }, { "epoch": 0.05, "learning_rate": 0.00019970416960085464, "loss": 0.6991, "step": 473 }, { "epoch": 0.05, "learning_rate": 0.00019970133332880246, "loss": 0.7075, "step": 474 }, { "epoch": 0.05, "learning_rate": 0.0001996984835455034, "loss": 0.7303, "step": 475 }, { "epoch": 0.05, "learning_rate": 0.00019969562025134362, "loss": 0.739, "step": 476 }, { "epoch": 0.05, "learning_rate": 0.00019969274344671121, "loss": 0.6716, "step": 477 }, { "epoch": 0.05, "learning_rate": 0.000199689853131996, "loss": 0.6822, "step": 478 }, { "epoch": 0.05, "learning_rate": 0.00019968694930758968, "loss": 0.7357, "step": 479 }, { "epoch": 0.05, "learning_rate": 0.00019968403197388572, "loss": 0.7244, "step": 480 }, { "epoch": 0.05, "learning_rate": 0.00019968110113127954, "loss": 0.7168, "step": 481 }, { "epoch": 0.05, "learning_rate": 0.00019967815678016826, "loss": 0.6738, "step": 482 }, { "epoch": 0.05, "learning_rate": 0.00019967519892095093, "loss": 0.6947, "step": 483 }, { "epoch": 0.06, "learning_rate": 0.00019967222755402838, "loss": 0.7482, "step": 484 }, { "epoch": 0.06, "learning_rate": 0.00019966924267980326, "loss": 0.6991, "step": 485 }, { "epoch": 0.06, "learning_rate": 0.00019966624429868012, "loss": 0.6858, "step": 486 }, { "epoch": 0.06, "learning_rate": 0.0001996632324110652, "loss": 0.6668, "step": 487 }, { "epoch": 0.06, "learning_rate": 0.00019966020701736681, "loss": 0.6884, "step": 488 }, { "epoch": 0.06, "learning_rate": 0.00019965716811799482, "loss": 0.7056, "step": 489 }, { "epoch": 0.06, "learning_rate": 0.00019965411571336108, "loss": 0.6942, "step": 490 }, { "epoch": 0.06, "learning_rate": 0.00019965104980387927, "loss": 0.7278, "step": 491 }, { "epoch": 0.06, "learning_rate": 0.00019964797038996487, "loss": 0.7203, "step": 492 }, { "epoch": 0.06, "learning_rate": 0.00019964487747203515, "loss": 0.7222, "step": 493 }, { "epoch": 0.06, "learning_rate": 0.00019964177105050932, "loss": 0.6691, "step": 494 }, { "epoch": 0.06, "learning_rate": 0.0001996386511258083, "loss": 0.6949, "step": 495 }, { "epoch": 0.06, "learning_rate": 0.00019963551769835492, "loss": 0.7039, "step": 496 }, { "epoch": 0.06, "learning_rate": 0.0001996323707685738, "loss": 0.7211, "step": 497 }, { "epoch": 0.06, "learning_rate": 0.00019962921033689143, "loss": 0.7138, "step": 498 }, { "epoch": 0.06, "learning_rate": 0.00019962603640373607, "loss": 0.6815, "step": 499 }, { "epoch": 0.06, "learning_rate": 0.00019962284896953784, "loss": 0.7122, "step": 500 }, { "epoch": 0.06, "learning_rate": 0.00019961964803472872, "loss": 0.6799, "step": 501 }, { "epoch": 0.06, "learning_rate": 0.0001996164335997425, "loss": 0.6672, "step": 502 }, { "epoch": 0.06, "learning_rate": 0.0001996132056650147, "loss": 0.6827, "step": 503 }, { "epoch": 0.06, "learning_rate": 0.0001996099642309829, "loss": 0.756, "step": 504 }, { "epoch": 0.06, "learning_rate": 0.00019960670929808626, "loss": 0.6732, "step": 505 }, { "epoch": 0.06, "learning_rate": 0.00019960344086676597, "loss": 0.6443, "step": 506 }, { "epoch": 0.06, "learning_rate": 0.0001996001589374649, "loss": 0.7405, "step": 507 }, { "epoch": 0.06, "learning_rate": 0.0001995968635106278, "loss": 0.7329, "step": 508 }, { "epoch": 0.06, "learning_rate": 0.00019959355458670124, "loss": 0.7647, "step": 509 }, { "epoch": 0.06, "learning_rate": 0.0001995902321661337, "loss": 0.7204, "step": 510 }, { "epoch": 0.06, "learning_rate": 0.00019958689624937538, "loss": 0.7329, "step": 511 }, { "epoch": 0.06, "learning_rate": 0.0001995835468368784, "loss": 0.7223, "step": 512 }, { "epoch": 0.06, "learning_rate": 0.00019958018392909663, "loss": 0.7016, "step": 513 }, { "epoch": 0.06, "learning_rate": 0.00019957680752648579, "loss": 0.767, "step": 514 }, { "epoch": 0.06, "learning_rate": 0.00019957341762950344, "loss": 0.7097, "step": 515 }, { "epoch": 0.06, "learning_rate": 0.00019957001423860903, "loss": 0.7762, "step": 516 }, { "epoch": 0.06, "learning_rate": 0.00019956659735426372, "loss": 0.7228, "step": 517 }, { "epoch": 0.06, "learning_rate": 0.00019956316697693053, "loss": 0.6283, "step": 518 }, { "epoch": 0.06, "learning_rate": 0.0001995597231070744, "loss": 0.7202, "step": 519 }, { "epoch": 0.06, "learning_rate": 0.00019955626574516203, "loss": 0.664, "step": 520 }, { "epoch": 0.06, "learning_rate": 0.0001995527948916619, "loss": 0.6332, "step": 521 }, { "epoch": 0.06, "learning_rate": 0.00019954931054704442, "loss": 0.6496, "step": 522 }, { "epoch": 0.06, "learning_rate": 0.00019954581271178174, "loss": 0.7112, "step": 523 }, { "epoch": 0.06, "learning_rate": 0.0001995423013863479, "loss": 0.7058, "step": 524 }, { "epoch": 0.06, "learning_rate": 0.00019953877657121876, "loss": 0.7347, "step": 525 }, { "epoch": 0.06, "learning_rate": 0.00019953523826687195, "loss": 0.7406, "step": 526 }, { "epoch": 0.06, "learning_rate": 0.00019953168647378702, "loss": 0.7073, "step": 527 }, { "epoch": 0.06, "learning_rate": 0.00019952812119244527, "loss": 0.6958, "step": 528 }, { "epoch": 0.06, "learning_rate": 0.00019952454242332983, "loss": 0.7219, "step": 529 }, { "epoch": 0.06, "learning_rate": 0.00019952095016692573, "loss": 0.655, "step": 530 }, { "epoch": 0.06, "learning_rate": 0.0001995173444237198, "loss": 0.7067, "step": 531 }, { "epoch": 0.06, "learning_rate": 0.00019951372519420063, "loss": 0.7006, "step": 532 }, { "epoch": 0.06, "learning_rate": 0.0001995100924788587, "loss": 0.7376, "step": 533 }, { "epoch": 0.06, "learning_rate": 0.0001995064462781863, "loss": 0.6477, "step": 534 }, { "epoch": 0.06, "learning_rate": 0.00019950278659267758, "loss": 0.7203, "step": 535 }, { "epoch": 0.06, "learning_rate": 0.00019949911342282848, "loss": 0.6979, "step": 536 }, { "epoch": 0.06, "learning_rate": 0.00019949542676913677, "loss": 0.7027, "step": 537 }, { "epoch": 0.06, "learning_rate": 0.00019949172663210208, "loss": 0.7231, "step": 538 }, { "epoch": 0.06, "learning_rate": 0.0001994880130122258, "loss": 0.7012, "step": 539 }, { "epoch": 0.06, "learning_rate": 0.0001994842859100112, "loss": 0.681, "step": 540 }, { "epoch": 0.06, "learning_rate": 0.00019948054532596338, "loss": 0.6357, "step": 541 }, { "epoch": 0.06, "learning_rate": 0.00019947679126058928, "loss": 0.7454, "step": 542 }, { "epoch": 0.06, "learning_rate": 0.00019947302371439758, "loss": 0.7188, "step": 543 }, { "epoch": 0.06, "learning_rate": 0.00019946924268789888, "loss": 0.7198, "step": 544 }, { "epoch": 0.06, "learning_rate": 0.00019946544818160559, "loss": 0.6949, "step": 545 }, { "epoch": 0.06, "learning_rate": 0.0001994616401960319, "loss": 0.6952, "step": 546 }, { "epoch": 0.06, "learning_rate": 0.00019945781873169388, "loss": 0.7129, "step": 547 }, { "epoch": 0.06, "learning_rate": 0.0001994539837891094, "loss": 0.7108, "step": 548 }, { "epoch": 0.06, "learning_rate": 0.00019945013536879812, "loss": 0.662, "step": 549 }, { "epoch": 0.06, "learning_rate": 0.00019944627347128163, "loss": 0.7127, "step": 550 }, { "epoch": 0.06, "learning_rate": 0.0001994423980970833, "loss": 0.7003, "step": 551 }, { "epoch": 0.06, "learning_rate": 0.0001994385092467282, "loss": 0.7108, "step": 552 }, { "epoch": 0.06, "learning_rate": 0.00019943460692074344, "loss": 0.7492, "step": 553 }, { "epoch": 0.06, "learning_rate": 0.00019943069111965777, "loss": 0.71, "step": 554 }, { "epoch": 0.06, "learning_rate": 0.00019942676184400194, "loss": 0.7658, "step": 555 }, { "epoch": 0.06, "learning_rate": 0.00019942281909430837, "loss": 0.6969, "step": 556 }, { "epoch": 0.06, "learning_rate": 0.0001994188628711114, "loss": 0.7619, "step": 557 }, { "epoch": 0.06, "learning_rate": 0.00019941489317494714, "loss": 0.7334, "step": 558 }, { "epoch": 0.06, "learning_rate": 0.00019941091000635357, "loss": 0.7116, "step": 559 }, { "epoch": 0.06, "learning_rate": 0.0001994069133658705, "loss": 0.771, "step": 560 }, { "epoch": 0.06, "learning_rate": 0.00019940290325403946, "loss": 0.7646, "step": 561 }, { "epoch": 0.06, "learning_rate": 0.00019939887967140402, "loss": 0.7284, "step": 562 }, { "epoch": 0.06, "learning_rate": 0.00019939484261850932, "loss": 0.678, "step": 563 }, { "epoch": 0.06, "learning_rate": 0.00019939079209590251, "loss": 0.7179, "step": 564 }, { "epoch": 0.06, "learning_rate": 0.00019938672810413253, "loss": 0.6749, "step": 565 }, { "epoch": 0.06, "learning_rate": 0.00019938265064375007, "loss": 0.7112, "step": 566 }, { "epoch": 0.06, "learning_rate": 0.0001993785597153077, "loss": 0.7427, "step": 567 }, { "epoch": 0.06, "learning_rate": 0.00019937445531935984, "loss": 0.6675, "step": 568 }, { "epoch": 0.06, "learning_rate": 0.00019937033745646269, "loss": 0.7042, "step": 569 }, { "epoch": 0.06, "learning_rate": 0.0001993662061271743, "loss": 0.7084, "step": 570 }, { "epoch": 0.06, "learning_rate": 0.00019936206133205453, "loss": 0.7114, "step": 571 }, { "epoch": 0.07, "learning_rate": 0.00019935790307166505, "loss": 0.7183, "step": 572 }, { "epoch": 0.07, "learning_rate": 0.00019935373134656942, "loss": 0.6791, "step": 573 }, { "epoch": 0.07, "learning_rate": 0.00019934954615733296, "loss": 0.6434, "step": 574 }, { "epoch": 0.07, "learning_rate": 0.00019934534750452282, "loss": 0.6828, "step": 575 }, { "epoch": 0.07, "learning_rate": 0.000199341135388708, "loss": 0.7138, "step": 576 }, { "epoch": 0.07, "learning_rate": 0.00019933690981045933, "loss": 0.7029, "step": 577 }, { "epoch": 0.07, "learning_rate": 0.00019933267077034943, "loss": 0.6928, "step": 578 }, { "epoch": 0.07, "learning_rate": 0.00019932841826895276, "loss": 0.7029, "step": 579 }, { "epoch": 0.07, "learning_rate": 0.00019932415230684562, "loss": 0.7284, "step": 580 }, { "epoch": 0.07, "learning_rate": 0.00019931987288460611, "loss": 0.6909, "step": 581 }, { "epoch": 0.07, "learning_rate": 0.00019931558000281418, "loss": 0.7077, "step": 582 }, { "epoch": 0.07, "learning_rate": 0.00019931127366205157, "loss": 0.7021, "step": 583 }, { "epoch": 0.07, "learning_rate": 0.0001993069538629019, "loss": 0.7443, "step": 584 }, { "epoch": 0.07, "learning_rate": 0.00019930262060595055, "loss": 0.697, "step": 585 }, { "epoch": 0.07, "learning_rate": 0.00019929827389178476, "loss": 0.7507, "step": 586 }, { "epoch": 0.07, "learning_rate": 0.00019929391372099352, "loss": 0.7056, "step": 587 }, { "epoch": 0.07, "learning_rate": 0.0001992895400941678, "loss": 0.6908, "step": 588 }, { "epoch": 0.07, "learning_rate": 0.0001992851530119003, "loss": 0.7237, "step": 589 }, { "epoch": 0.07, "learning_rate": 0.00019928075247478545, "loss": 0.7061, "step": 590 }, { "epoch": 0.07, "learning_rate": 0.0001992763384834197, "loss": 0.7365, "step": 591 }, { "epoch": 0.07, "learning_rate": 0.00019927191103840118, "loss": 0.6567, "step": 592 }, { "epoch": 0.07, "learning_rate": 0.0001992674701403299, "loss": 0.7157, "step": 593 }, { "epoch": 0.07, "learning_rate": 0.00019926301578980767, "loss": 0.7278, "step": 594 }, { "epoch": 0.07, "learning_rate": 0.00019925854798743807, "loss": 0.6712, "step": 595 }, { "epoch": 0.07, "learning_rate": 0.00019925406673382666, "loss": 0.719, "step": 596 }, { "epoch": 0.07, "learning_rate": 0.0001992495720295807, "loss": 0.7068, "step": 597 }, { "epoch": 0.07, "learning_rate": 0.00019924506387530928, "loss": 0.6893, "step": 598 }, { "epoch": 0.07, "learning_rate": 0.00019924054227162335, "loss": 0.6646, "step": 599 }, { "epoch": 0.07, "learning_rate": 0.00019923600721913562, "loss": 0.6961, "step": 600 }, { "epoch": 0.07, "learning_rate": 0.00019923145871846072, "loss": 0.649, "step": 601 }, { "epoch": 0.07, "learning_rate": 0.00019922689677021505, "loss": 0.7457, "step": 602 }, { "epoch": 0.07, "learning_rate": 0.0001992223213750168, "loss": 0.6621, "step": 603 }, { "epoch": 0.07, "learning_rate": 0.00019921773253348603, "loss": 0.6899, "step": 604 }, { "epoch": 0.07, "learning_rate": 0.00019921313024624462, "loss": 0.6915, "step": 605 }, { "epoch": 0.07, "learning_rate": 0.00019920851451391623, "loss": 0.7495, "step": 606 }, { "epoch": 0.07, "learning_rate": 0.0001992038853371264, "loss": 0.6636, "step": 607 }, { "epoch": 0.07, "learning_rate": 0.00019919924271650244, "loss": 0.6816, "step": 608 }, { "epoch": 0.07, "learning_rate": 0.00019919458665267355, "loss": 0.7286, "step": 609 }, { "epoch": 0.07, "learning_rate": 0.00019918991714627064, "loss": 0.6749, "step": 610 }, { "epoch": 0.07, "learning_rate": 0.00019918523419792657, "loss": 0.7527, "step": 611 }, { "epoch": 0.07, "learning_rate": 0.0001991805378082759, "loss": 0.7104, "step": 612 }, { "epoch": 0.07, "learning_rate": 0.0001991758279779551, "loss": 0.7325, "step": 613 }, { "epoch": 0.07, "learning_rate": 0.00019917110470760245, "loss": 0.7432, "step": 614 }, { "epoch": 0.07, "learning_rate": 0.000199166367997858, "loss": 0.682, "step": 615 }, { "epoch": 0.07, "learning_rate": 0.00019916161784936374, "loss": 0.6975, "step": 616 }, { "epoch": 0.07, "learning_rate": 0.00019915685426276326, "loss": 0.6333, "step": 617 }, { "epoch": 0.07, "learning_rate": 0.00019915207723870224, "loss": 0.7066, "step": 618 }, { "epoch": 0.07, "learning_rate": 0.00019914728677782793, "loss": 0.6604, "step": 619 }, { "epoch": 0.07, "learning_rate": 0.00019914248288078966, "loss": 0.6962, "step": 620 }, { "epoch": 0.07, "learning_rate": 0.0001991376655482383, "loss": 0.7311, "step": 621 }, { "epoch": 0.07, "learning_rate": 0.00019913283478082677, "loss": 0.7164, "step": 622 }, { "epoch": 0.07, "learning_rate": 0.00019912799057920965, "loss": 0.6733, "step": 623 }, { "epoch": 0.07, "learning_rate": 0.0001991231329440435, "loss": 0.6226, "step": 624 }, { "epoch": 0.07, "learning_rate": 0.00019911826187598658, "loss": 0.7026, "step": 625 }, { "epoch": 0.07, "learning_rate": 0.00019911337737569897, "loss": 0.7385, "step": 626 }, { "epoch": 0.07, "learning_rate": 0.00019910847944384262, "loss": 0.7586, "step": 627 }, { "epoch": 0.07, "learning_rate": 0.00019910356808108132, "loss": 0.7296, "step": 628 }, { "epoch": 0.07, "learning_rate": 0.00019909864328808058, "loss": 0.7261, "step": 629 }, { "epoch": 0.07, "learning_rate": 0.00019909370506550786, "loss": 0.6936, "step": 630 }, { "epoch": 0.07, "learning_rate": 0.00019908875341403235, "loss": 0.7406, "step": 631 }, { "epoch": 0.07, "learning_rate": 0.00019908378833432506, "loss": 0.7343, "step": 632 }, { "epoch": 0.07, "learning_rate": 0.00019907880982705887, "loss": 0.7671, "step": 633 }, { "epoch": 0.07, "learning_rate": 0.00019907381789290845, "loss": 0.7342, "step": 634 }, { "epoch": 0.07, "learning_rate": 0.00019906881253255025, "loss": 0.6824, "step": 635 }, { "epoch": 0.07, "learning_rate": 0.00019906379374666266, "loss": 0.7244, "step": 636 }, { "epoch": 0.07, "learning_rate": 0.00019905876153592577, "loss": 0.7523, "step": 637 }, { "epoch": 0.07, "learning_rate": 0.00019905371590102155, "loss": 0.7386, "step": 638 }, { "epoch": 0.07, "learning_rate": 0.00019904865684263373, "loss": 0.696, "step": 639 }, { "epoch": 0.07, "learning_rate": 0.00019904358436144791, "loss": 0.6657, "step": 640 }, { "epoch": 0.07, "learning_rate": 0.00019903849845815153, "loss": 0.692, "step": 641 }, { "epoch": 0.07, "learning_rate": 0.0001990333991334338, "loss": 0.7006, "step": 642 }, { "epoch": 0.07, "learning_rate": 0.0001990282863879858, "loss": 0.6973, "step": 643 }, { "epoch": 0.07, "learning_rate": 0.00019902316022250033, "loss": 0.7257, "step": 644 }, { "epoch": 0.07, "learning_rate": 0.0001990180206376721, "loss": 0.6101, "step": 645 }, { "epoch": 0.07, "learning_rate": 0.00019901286763419763, "loss": 0.7215, "step": 646 }, { "epoch": 0.07, "learning_rate": 0.00019900770121277522, "loss": 0.7173, "step": 647 }, { "epoch": 0.07, "learning_rate": 0.000199002521374105, "loss": 0.7321, "step": 648 }, { "epoch": 0.07, "learning_rate": 0.00019899732811888899, "loss": 0.749, "step": 649 }, { "epoch": 0.07, "learning_rate": 0.00019899212144783087, "loss": 0.6963, "step": 650 }, { "epoch": 0.07, "learning_rate": 0.00019898690136163633, "loss": 0.6759, "step": 651 }, { "epoch": 0.07, "learning_rate": 0.0001989816678610127, "loss": 0.6507, "step": 652 }, { "epoch": 0.07, "learning_rate": 0.00019897642094666927, "loss": 0.7407, "step": 653 }, { "epoch": 0.07, "learning_rate": 0.00019897116061931704, "loss": 0.7402, "step": 654 }, { "epoch": 0.07, "learning_rate": 0.0001989658868796689, "loss": 0.7149, "step": 655 }, { "epoch": 0.07, "learning_rate": 0.00019896059972843952, "loss": 0.698, "step": 656 }, { "epoch": 0.07, "learning_rate": 0.00019895529916634543, "loss": 0.731, "step": 657 }, { "epoch": 0.07, "learning_rate": 0.00019894998519410492, "loss": 0.6905, "step": 658 }, { "epoch": 0.07, "learning_rate": 0.00019894465781243814, "loss": 0.7396, "step": 659 }, { "epoch": 0.08, "learning_rate": 0.00019893931702206702, "loss": 0.7324, "step": 660 }, { "epoch": 0.08, "learning_rate": 0.00019893396282371536, "loss": 0.6946, "step": 661 }, { "epoch": 0.08, "learning_rate": 0.0001989285952181087, "loss": 0.7127, "step": 662 }, { "epoch": 0.08, "learning_rate": 0.00019892321420597448, "loss": 0.6903, "step": 663 }, { "epoch": 0.08, "learning_rate": 0.00019891781978804193, "loss": 0.7428, "step": 664 }, { "epoch": 0.08, "learning_rate": 0.00019891241196504206, "loss": 0.675, "step": 665 }, { "epoch": 0.08, "learning_rate": 0.00019890699073770772, "loss": 0.6411, "step": 666 }, { "epoch": 0.08, "learning_rate": 0.00019890155610677358, "loss": 0.7018, "step": 667 }, { "epoch": 0.08, "learning_rate": 0.00019889610807297616, "loss": 0.7384, "step": 668 }, { "epoch": 0.08, "learning_rate": 0.00019889064663705373, "loss": 0.7023, "step": 669 }, { "epoch": 0.08, "learning_rate": 0.00019888517179974643, "loss": 0.7082, "step": 670 }, { "epoch": 0.08, "learning_rate": 0.00019887968356179615, "loss": 0.7309, "step": 671 }, { "epoch": 0.08, "learning_rate": 0.0001988741819239467, "loss": 0.6472, "step": 672 }, { "epoch": 0.08, "learning_rate": 0.00019886866688694358, "loss": 0.7156, "step": 673 }, { "epoch": 0.08, "learning_rate": 0.00019886313845153425, "loss": 0.7146, "step": 674 }, { "epoch": 0.08, "learning_rate": 0.00019885759661846788, "loss": 0.7125, "step": 675 }, { "epoch": 0.08, "learning_rate": 0.00019885204138849545, "loss": 0.7334, "step": 676 }, { "epoch": 0.08, "learning_rate": 0.00019884647276236983, "loss": 0.6858, "step": 677 }, { "epoch": 0.08, "learning_rate": 0.00019884089074084563, "loss": 0.7089, "step": 678 }, { "epoch": 0.08, "learning_rate": 0.00019883529532467933, "loss": 0.6977, "step": 679 }, { "epoch": 0.08, "learning_rate": 0.00019882968651462922, "loss": 0.7291, "step": 680 }, { "epoch": 0.08, "learning_rate": 0.00019882406431145534, "loss": 0.7182, "step": 681 }, { "epoch": 0.08, "learning_rate": 0.00019881842871591964, "loss": 0.7137, "step": 682 }, { "epoch": 0.08, "learning_rate": 0.00019881277972878586, "loss": 0.7569, "step": 683 }, { "epoch": 0.08, "learning_rate": 0.00019880711735081945, "loss": 0.7297, "step": 684 }, { "epoch": 0.08, "learning_rate": 0.00019880144158278783, "loss": 0.7781, "step": 685 }, { "epoch": 0.08, "learning_rate": 0.0001987957524254602, "loss": 0.8181, "step": 686 }, { "epoch": 0.08, "learning_rate": 0.0001987900498796074, "loss": 0.7083, "step": 687 }, { "epoch": 0.08, "learning_rate": 0.0001987843339460024, "loss": 0.7067, "step": 688 }, { "epoch": 0.08, "learning_rate": 0.00019877860462541965, "loss": 0.661, "step": 689 }, { "epoch": 0.08, "learning_rate": 0.00019877286191863567, "loss": 0.6525, "step": 690 }, { "epoch": 0.08, "learning_rate": 0.00019876710582642862, "loss": 0.7106, "step": 691 }, { "epoch": 0.08, "learning_rate": 0.00019876133634957866, "loss": 0.6237, "step": 692 }, { "epoch": 0.08, "learning_rate": 0.00019875555348886754, "loss": 0.7499, "step": 693 }, { "epoch": 0.08, "learning_rate": 0.00019874975724507897, "loss": 0.7449, "step": 694 }, { "epoch": 0.08, "learning_rate": 0.0001987439476189985, "loss": 0.6704, "step": 695 }, { "epoch": 0.08, "learning_rate": 0.00019873812461141337, "loss": 0.7885, "step": 696 }, { "epoch": 0.08, "learning_rate": 0.00019873228822311272, "loss": 0.7233, "step": 697 }, { "epoch": 0.08, "learning_rate": 0.00019872643845488748, "loss": 0.7269, "step": 698 }, { "epoch": 0.08, "learning_rate": 0.0001987205753075304, "loss": 0.7093, "step": 699 }, { "epoch": 0.08, "learning_rate": 0.000198714698781836, "loss": 0.7574, "step": 700 }, { "epoch": 0.08, "learning_rate": 0.0001987088088786007, "loss": 0.6926, "step": 701 }, { "epoch": 0.08, "learning_rate": 0.00019870290559862269, "loss": 0.743, "step": 702 }, { "epoch": 0.08, "learning_rate": 0.0001986969889427019, "loss": 0.6394, "step": 703 }, { "epoch": 0.08, "learning_rate": 0.00019869105891164019, "loss": 0.7214, "step": 704 }, { "epoch": 0.08, "learning_rate": 0.00019868511550624117, "loss": 0.7415, "step": 705 }, { "epoch": 0.08, "learning_rate": 0.0001986791587273103, "loss": 0.6679, "step": 706 }, { "epoch": 0.08, "learning_rate": 0.00019867318857565475, "loss": 0.742, "step": 707 }, { "epoch": 0.08, "learning_rate": 0.00019866720505208366, "loss": 0.7219, "step": 708 }, { "epoch": 0.08, "learning_rate": 0.00019866120815740786, "loss": 0.6902, "step": 709 }, { "epoch": 0.08, "learning_rate": 0.00019865519789244004, "loss": 0.6488, "step": 710 }, { "epoch": 0.08, "learning_rate": 0.0001986491742579947, "loss": 0.7506, "step": 711 }, { "epoch": 0.08, "learning_rate": 0.00019864313725488812, "loss": 0.6926, "step": 712 }, { "epoch": 0.08, "learning_rate": 0.00019863708688393846, "loss": 0.6186, "step": 713 }, { "epoch": 0.08, "learning_rate": 0.0001986310231459656, "loss": 0.7056, "step": 714 }, { "epoch": 0.08, "learning_rate": 0.00019862494604179135, "loss": 0.6953, "step": 715 }, { "epoch": 0.08, "learning_rate": 0.0001986188555722392, "loss": 0.6682, "step": 716 }, { "epoch": 0.08, "learning_rate": 0.00019861275173813455, "loss": 0.6765, "step": 717 }, { "epoch": 0.08, "learning_rate": 0.00019860663454030454, "loss": 0.6674, "step": 718 }, { "epoch": 0.08, "learning_rate": 0.00019860050397957818, "loss": 0.7088, "step": 719 }, { "epoch": 0.08, "learning_rate": 0.00019859436005678624, "loss": 0.7298, "step": 720 }, { "epoch": 0.08, "learning_rate": 0.00019858820277276137, "loss": 0.7767, "step": 721 }, { "epoch": 0.08, "learning_rate": 0.00019858203212833798, "loss": 0.7706, "step": 722 }, { "epoch": 0.08, "learning_rate": 0.00019857584812435229, "loss": 0.7011, "step": 723 }, { "epoch": 0.08, "learning_rate": 0.0001985696507616423, "loss": 0.6868, "step": 724 }, { "epoch": 0.08, "learning_rate": 0.00019856344004104791, "loss": 0.6909, "step": 725 }, { "epoch": 0.08, "learning_rate": 0.00019855721596341076, "loss": 0.7567, "step": 726 }, { "epoch": 0.08, "learning_rate": 0.00019855097852957437, "loss": 0.668, "step": 727 }, { "epoch": 0.08, "learning_rate": 0.00019854472774038392, "loss": 0.7099, "step": 728 }, { "epoch": 0.08, "learning_rate": 0.00019853846359668657, "loss": 0.7303, "step": 729 }, { "epoch": 0.08, "learning_rate": 0.00019853218609933117, "loss": 0.7199, "step": 730 }, { "epoch": 0.08, "learning_rate": 0.0001985258952491685, "loss": 0.7397, "step": 731 }, { "epoch": 0.08, "learning_rate": 0.000198519591047051, "loss": 0.715, "step": 732 }, { "epoch": 0.08, "learning_rate": 0.0001985132734938331, "loss": 0.7009, "step": 733 }, { "epoch": 0.08, "learning_rate": 0.00019850694259037081, "loss": 0.6843, "step": 734 }, { "epoch": 0.08, "learning_rate": 0.0001985005983375222, "loss": 0.605, "step": 735 }, { "epoch": 0.08, "learning_rate": 0.0001984942407361469, "loss": 0.7231, "step": 736 }, { "epoch": 0.08, "learning_rate": 0.00019848786978710658, "loss": 0.7202, "step": 737 }, { "epoch": 0.08, "learning_rate": 0.00019848148549126457, "loss": 0.7288, "step": 738 }, { "epoch": 0.08, "learning_rate": 0.00019847508784948605, "loss": 0.6606, "step": 739 }, { "epoch": 0.08, "learning_rate": 0.00019846867686263803, "loss": 0.7426, "step": 740 }, { "epoch": 0.08, "learning_rate": 0.00019846225253158925, "loss": 0.633, "step": 741 }, { "epoch": 0.08, "learning_rate": 0.0001984558148572104, "loss": 0.7274, "step": 742 }, { "epoch": 0.08, "learning_rate": 0.00019844936384037386, "loss": 0.7356, "step": 743 }, { "epoch": 0.08, "learning_rate": 0.00019844289948195385, "loss": 0.7298, "step": 744 }, { "epoch": 0.08, "learning_rate": 0.0001984364217828264, "loss": 0.6984, "step": 745 }, { "epoch": 0.08, "learning_rate": 0.00019842993074386934, "loss": 0.7472, "step": 746 }, { "epoch": 0.08, "learning_rate": 0.00019842342636596235, "loss": 0.763, "step": 747 }, { "epoch": 0.09, "learning_rate": 0.00019841690864998688, "loss": 0.695, "step": 748 }, { "epoch": 0.09, "learning_rate": 0.00019841037759682614, "loss": 0.6521, "step": 749 }, { "epoch": 0.09, "learning_rate": 0.00019840383320736526, "loss": 0.7062, "step": 750 }, { "epoch": 0.09, "learning_rate": 0.0001983972754824911, "loss": 0.6473, "step": 751 }, { "epoch": 0.09, "learning_rate": 0.00019839070442309234, "loss": 0.7513, "step": 752 }, { "epoch": 0.09, "learning_rate": 0.00019838412003005945, "loss": 0.6158, "step": 753 }, { "epoch": 0.09, "learning_rate": 0.0001983775223042848, "loss": 0.7244, "step": 754 }, { "epoch": 0.09, "learning_rate": 0.0001983709112466624, "loss": 0.6509, "step": 755 }, { "epoch": 0.09, "learning_rate": 0.0001983642868580882, "loss": 0.7097, "step": 756 }, { "epoch": 0.09, "learning_rate": 0.00019835764913945998, "loss": 0.7008, "step": 757 }, { "epoch": 0.09, "learning_rate": 0.00019835099809167717, "loss": 0.7138, "step": 758 }, { "epoch": 0.09, "learning_rate": 0.00019834433371564115, "loss": 0.7447, "step": 759 }, { "epoch": 0.09, "learning_rate": 0.00019833765601225508, "loss": 0.7134, "step": 760 }, { "epoch": 0.09, "learning_rate": 0.00019833096498242386, "loss": 0.6859, "step": 761 }, { "epoch": 0.09, "learning_rate": 0.00019832426062705425, "loss": 0.6749, "step": 762 }, { "epoch": 0.09, "learning_rate": 0.00019831754294705482, "loss": 0.7314, "step": 763 }, { "epoch": 0.09, "learning_rate": 0.00019831081194333593, "loss": 0.7003, "step": 764 }, { "epoch": 0.09, "learning_rate": 0.0001983040676168097, "loss": 0.7027, "step": 765 }, { "epoch": 0.09, "learning_rate": 0.0001982973099683902, "loss": 0.6361, "step": 766 }, { "epoch": 0.09, "learning_rate": 0.0001982905389989931, "loss": 0.6237, "step": 767 }, { "epoch": 0.09, "learning_rate": 0.00019828375470953608, "loss": 0.6462, "step": 768 }, { "epoch": 0.09, "learning_rate": 0.0001982769571009384, "loss": 0.7198, "step": 769 }, { "epoch": 0.09, "learning_rate": 0.0001982701461741214, "loss": 0.7271, "step": 770 }, { "epoch": 0.09, "learning_rate": 0.000198263321930008, "loss": 0.7158, "step": 771 }, { "epoch": 0.09, "learning_rate": 0.000198256484369523, "loss": 0.6965, "step": 772 }, { "epoch": 0.09, "learning_rate": 0.00019824963349359304, "loss": 0.7, "step": 773 }, { "epoch": 0.09, "learning_rate": 0.0001982427693031465, "loss": 0.6625, "step": 774 }, { "epoch": 0.09, "learning_rate": 0.00019823589179911362, "loss": 0.7142, "step": 775 }, { "epoch": 0.09, "learning_rate": 0.00019822900098242637, "loss": 0.6679, "step": 776 }, { "epoch": 0.09, "learning_rate": 0.00019822209685401863, "loss": 0.6272, "step": 777 }, { "epoch": 0.09, "learning_rate": 0.00019821517941482603, "loss": 0.7297, "step": 778 }, { "epoch": 0.09, "learning_rate": 0.00019820824866578597, "loss": 0.7245, "step": 779 }, { "epoch": 0.09, "learning_rate": 0.00019820130460783771, "loss": 0.6415, "step": 780 }, { "epoch": 0.09, "learning_rate": 0.00019819434724192226, "loss": 0.7485, "step": 781 }, { "epoch": 0.09, "learning_rate": 0.0001981873765689825, "loss": 0.6912, "step": 782 }, { "epoch": 0.09, "learning_rate": 0.00019818039258996304, "loss": 0.6917, "step": 783 }, { "epoch": 0.09, "learning_rate": 0.00019817339530581033, "loss": 0.7086, "step": 784 }, { "epoch": 0.09, "learning_rate": 0.0001981663847174727, "loss": 0.7026, "step": 785 }, { "epoch": 0.09, "learning_rate": 0.0001981593608259001, "loss": 0.6738, "step": 786 }, { "epoch": 0.09, "learning_rate": 0.00019815232363204444, "loss": 0.7226, "step": 787 }, { "epoch": 0.09, "learning_rate": 0.00019814527313685937, "loss": 0.7263, "step": 788 }, { "epoch": 0.09, "learning_rate": 0.00019813820934130036, "loss": 0.7032, "step": 789 }, { "epoch": 0.09, "learning_rate": 0.00019813113224632467, "loss": 0.6949, "step": 790 }, { "epoch": 0.09, "learning_rate": 0.00019812404185289137, "loss": 0.7113, "step": 791 }, { "epoch": 0.09, "learning_rate": 0.00019811693816196134, "loss": 0.6917, "step": 792 }, { "epoch": 0.09, "learning_rate": 0.00019810982117449724, "loss": 0.6602, "step": 793 }, { "epoch": 0.09, "learning_rate": 0.00019810269089146353, "loss": 0.7113, "step": 794 }, { "epoch": 0.09, "learning_rate": 0.00019809554731382652, "loss": 0.6263, "step": 795 }, { "epoch": 0.09, "learning_rate": 0.00019808839044255428, "loss": 0.7024, "step": 796 }, { "epoch": 0.09, "learning_rate": 0.00019808122027861668, "loss": 0.731, "step": 797 }, { "epoch": 0.09, "learning_rate": 0.0001980740368229854, "loss": 0.6686, "step": 798 }, { "epoch": 0.09, "learning_rate": 0.00019806684007663393, "loss": 0.6409, "step": 799 }, { "epoch": 0.09, "learning_rate": 0.0001980596300405375, "loss": 0.6373, "step": 800 }, { "epoch": 0.09, "learning_rate": 0.00019805240671567331, "loss": 0.6751, "step": 801 }, { "epoch": 0.09, "learning_rate": 0.00019804517010302012, "loss": 0.7339, "step": 802 }, { "epoch": 0.09, "learning_rate": 0.00019803792020355873, "loss": 0.6788, "step": 803 }, { "epoch": 0.09, "learning_rate": 0.0001980306570182715, "loss": 0.6758, "step": 804 }, { "epoch": 0.09, "learning_rate": 0.00019802338054814283, "loss": 0.6872, "step": 805 }, { "epoch": 0.09, "learning_rate": 0.00019801609079415875, "loss": 0.7672, "step": 806 }, { "epoch": 0.09, "learning_rate": 0.00019800878775730715, "loss": 0.6942, "step": 807 }, { "epoch": 0.09, "learning_rate": 0.00019800147143857771, "loss": 0.7169, "step": 808 }, { "epoch": 0.09, "learning_rate": 0.00019799414183896196, "loss": 0.6644, "step": 809 }, { "epoch": 0.09, "learning_rate": 0.00019798679895945316, "loss": 0.678, "step": 810 }, { "epoch": 0.09, "learning_rate": 0.00019797944280104635, "loss": 0.741, "step": 811 }, { "epoch": 0.09, "learning_rate": 0.00019797207336473853, "loss": 0.6919, "step": 812 }, { "epoch": 0.09, "learning_rate": 0.00019796469065152828, "loss": 0.7481, "step": 813 }, { "epoch": 0.09, "learning_rate": 0.00019795729466241612, "loss": 0.6399, "step": 814 }, { "epoch": 0.09, "learning_rate": 0.00019794988539840436, "loss": 0.6361, "step": 815 }, { "epoch": 0.09, "learning_rate": 0.00019794246286049702, "loss": 0.7021, "step": 816 }, { "epoch": 0.09, "learning_rate": 0.00019793502704970007, "loss": 0.6398, "step": 817 }, { "epoch": 0.09, "learning_rate": 0.00019792757796702112, "loss": 0.7032, "step": 818 }, { "epoch": 0.09, "learning_rate": 0.00019792011561346965, "loss": 0.6662, "step": 819 }, { "epoch": 0.09, "learning_rate": 0.00019791263999005695, "loss": 0.693, "step": 820 }, { "epoch": 0.09, "learning_rate": 0.00019790515109779615, "loss": 0.6842, "step": 821 }, { "epoch": 0.09, "learning_rate": 0.00019789764893770207, "loss": 0.7145, "step": 822 }, { "epoch": 0.09, "learning_rate": 0.00019789013351079136, "loss": 0.6715, "step": 823 }, { "epoch": 0.09, "learning_rate": 0.00019788260481808253, "loss": 0.7985, "step": 824 }, { "epoch": 0.09, "learning_rate": 0.00019787506286059582, "loss": 0.6962, "step": 825 }, { "epoch": 0.09, "learning_rate": 0.00019786750763935333, "loss": 0.6799, "step": 826 }, { "epoch": 0.09, "learning_rate": 0.0001978599391553789, "loss": 0.7207, "step": 827 }, { "epoch": 0.09, "learning_rate": 0.00019785235740969815, "loss": 0.6164, "step": 828 }, { "epoch": 0.09, "learning_rate": 0.00019784476240333865, "loss": 0.6582, "step": 829 }, { "epoch": 0.09, "learning_rate": 0.00019783715413732955, "loss": 0.6454, "step": 830 }, { "epoch": 0.09, "learning_rate": 0.00019782953261270194, "loss": 0.733, "step": 831 }, { "epoch": 0.09, "learning_rate": 0.00019782189783048865, "loss": 0.6112, "step": 832 }, { "epoch": 0.09, "learning_rate": 0.00019781424979172435, "loss": 0.663, "step": 833 }, { "epoch": 0.09, "learning_rate": 0.00019780658849744546, "loss": 0.6783, "step": 834 }, { "epoch": 0.09, "learning_rate": 0.00019779891394869025, "loss": 0.6964, "step": 835 }, { "epoch": 0.1, "learning_rate": 0.0001977912261464987, "loss": 0.6857, "step": 836 }, { "epoch": 0.1, "learning_rate": 0.0001977835250919127, "loss": 0.718, "step": 837 }, { "epoch": 0.1, "learning_rate": 0.00019777581078597582, "loss": 0.7423, "step": 838 }, { "epoch": 0.1, "learning_rate": 0.0001977680832297335, "loss": 0.7089, "step": 839 }, { "epoch": 0.1, "learning_rate": 0.000197760342424233, "loss": 0.6428, "step": 840 }, { "epoch": 0.1, "learning_rate": 0.00019775258837052327, "loss": 0.6665, "step": 841 }, { "epoch": 0.1, "learning_rate": 0.00019774482106965513, "loss": 0.7494, "step": 842 }, { "epoch": 0.1, "learning_rate": 0.00019773704052268118, "loss": 0.7063, "step": 843 }, { "epoch": 0.1, "learning_rate": 0.00019772924673065588, "loss": 0.7191, "step": 844 }, { "epoch": 0.1, "learning_rate": 0.00019772143969463532, "loss": 0.7552, "step": 845 }, { "epoch": 0.1, "learning_rate": 0.0001977136194156776, "loss": 0.6679, "step": 846 }, { "epoch": 0.1, "learning_rate": 0.00019770578589484243, "loss": 0.7013, "step": 847 }, { "epoch": 0.1, "learning_rate": 0.0001976979391331914, "loss": 0.7073, "step": 848 }, { "epoch": 0.1, "learning_rate": 0.0001976900791317879, "loss": 0.6567, "step": 849 }, { "epoch": 0.1, "learning_rate": 0.00019768220589169702, "loss": 0.6605, "step": 850 }, { "epoch": 0.1, "learning_rate": 0.00019767431941398585, "loss": 0.6971, "step": 851 }, { "epoch": 0.1, "learning_rate": 0.00019766641969972304, "loss": 0.6859, "step": 852 }, { "epoch": 0.1, "learning_rate": 0.00019765850674997916, "loss": 0.6907, "step": 853 }, { "epoch": 0.1, "learning_rate": 0.0001976505805658266, "loss": 0.6489, "step": 854 }, { "epoch": 0.1, "learning_rate": 0.0001976426411483394, "loss": 0.6955, "step": 855 }, { "epoch": 0.1, "learning_rate": 0.00019763468849859359, "loss": 0.6841, "step": 856 }, { "epoch": 0.1, "learning_rate": 0.00019762672261766683, "loss": 0.6757, "step": 857 }, { "epoch": 0.1, "learning_rate": 0.00019761874350663865, "loss": 0.7069, "step": 858 }, { "epoch": 0.1, "learning_rate": 0.00019761075116659036, "loss": 0.7011, "step": 859 }, { "epoch": 0.1, "learning_rate": 0.00019760274559860506, "loss": 0.6355, "step": 860 }, { "epoch": 0.1, "learning_rate": 0.00019759472680376763, "loss": 0.7045, "step": 861 }, { "epoch": 0.1, "learning_rate": 0.00019758669478316473, "loss": 0.7035, "step": 862 }, { "epoch": 0.1, "learning_rate": 0.0001975786495378849, "loss": 0.7071, "step": 863 }, { "epoch": 0.1, "learning_rate": 0.00019757059106901838, "loss": 0.7199, "step": 864 }, { "epoch": 0.1, "learning_rate": 0.0001975625193776572, "loss": 0.701, "step": 865 }, { "epoch": 0.1, "learning_rate": 0.0001975544344648953, "loss": 0.6315, "step": 866 }, { "epoch": 0.1, "learning_rate": 0.00019754633633182821, "loss": 0.6323, "step": 867 }, { "epoch": 0.1, "learning_rate": 0.00019753822497955347, "loss": 0.7229, "step": 868 }, { "epoch": 0.1, "learning_rate": 0.00019753010040917025, "loss": 0.7083, "step": 869 }, { "epoch": 0.1, "learning_rate": 0.00019752196262177955, "loss": 0.6712, "step": 870 }, { "epoch": 0.1, "learning_rate": 0.00019751381161848424, "loss": 0.706, "step": 871 }, { "epoch": 0.1, "learning_rate": 0.0001975056474003889, "loss": 0.6746, "step": 872 }, { "epoch": 0.1, "learning_rate": 0.0001974974699685999, "loss": 0.6428, "step": 873 }, { "epoch": 0.1, "learning_rate": 0.00019748927932422542, "loss": 0.6786, "step": 874 }, { "epoch": 0.1, "learning_rate": 0.00019748107546837547, "loss": 0.7754, "step": 875 }, { "epoch": 0.1, "learning_rate": 0.00019747285840216182, "loss": 0.716, "step": 876 }, { "epoch": 0.1, "learning_rate": 0.00019746462812669796, "loss": 0.7021, "step": 877 }, { "epoch": 0.1, "learning_rate": 0.0001974563846430993, "loss": 0.7326, "step": 878 }, { "epoch": 0.1, "learning_rate": 0.00019744812795248292, "loss": 0.6779, "step": 879 }, { "epoch": 0.1, "learning_rate": 0.00019743985805596777, "loss": 0.675, "step": 880 }, { "epoch": 0.1, "learning_rate": 0.00019743157495467456, "loss": 0.7256, "step": 881 }, { "epoch": 0.1, "learning_rate": 0.0001974232786497258, "loss": 0.6729, "step": 882 }, { "epoch": 0.1, "learning_rate": 0.0001974149691422458, "loss": 0.6986, "step": 883 }, { "epoch": 0.1, "learning_rate": 0.0001974066464333606, "loss": 0.7747, "step": 884 }, { "epoch": 0.1, "learning_rate": 0.0001973983105241981, "loss": 0.6811, "step": 885 }, { "epoch": 0.1, "learning_rate": 0.00019738996141588792, "loss": 0.7142, "step": 886 }, { "epoch": 0.1, "learning_rate": 0.00019738159910956158, "loss": 0.697, "step": 887 }, { "epoch": 0.1, "learning_rate": 0.00019737322360635225, "loss": 0.7201, "step": 888 }, { "epoch": 0.1, "learning_rate": 0.00019736483490739496, "loss": 0.7345, "step": 889 }, { "epoch": 0.1, "learning_rate": 0.00019735643301382658, "loss": 0.7458, "step": 890 }, { "epoch": 0.1, "learning_rate": 0.00019734801792678565, "loss": 0.6765, "step": 891 }, { "epoch": 0.1, "learning_rate": 0.0001973395896474126, "loss": 0.6422, "step": 892 }, { "epoch": 0.1, "learning_rate": 0.00019733114817684956, "loss": 0.7133, "step": 893 }, { "epoch": 0.1, "learning_rate": 0.00019732269351624052, "loss": 0.7025, "step": 894 }, { "epoch": 0.1, "learning_rate": 0.00019731422566673126, "loss": 0.7506, "step": 895 }, { "epoch": 0.1, "learning_rate": 0.0001973057446294693, "loss": 0.7096, "step": 896 }, { "epoch": 0.1, "learning_rate": 0.00019729725040560397, "loss": 0.6589, "step": 897 }, { "epoch": 0.1, "learning_rate": 0.00019728874299628632, "loss": 0.7377, "step": 898 }, { "epoch": 0.1, "learning_rate": 0.00019728022240266934, "loss": 0.6324, "step": 899 }, { "epoch": 0.1, "learning_rate": 0.00019727168862590768, "loss": 0.6184, "step": 900 }, { "epoch": 0.1, "learning_rate": 0.00019726314166715783, "loss": 0.6999, "step": 901 }, { "epoch": 0.1, "learning_rate": 0.000197254581527578, "loss": 0.7044, "step": 902 }, { "epoch": 0.1, "learning_rate": 0.0001972460082083283, "loss": 0.6841, "step": 903 }, { "epoch": 0.1, "learning_rate": 0.00019723742171057053, "loss": 0.7491, "step": 904 }, { "epoch": 0.1, "learning_rate": 0.00019722882203546832, "loss": 0.6843, "step": 905 }, { "epoch": 0.1, "learning_rate": 0.00019722020918418705, "loss": 0.7038, "step": 906 }, { "epoch": 0.1, "learning_rate": 0.00019721158315789392, "loss": 0.6584, "step": 907 }, { "epoch": 0.1, "learning_rate": 0.00019720294395775793, "loss": 0.6978, "step": 908 }, { "epoch": 0.1, "learning_rate": 0.00019719429158494983, "loss": 0.6539, "step": 909 }, { "epoch": 0.1, "learning_rate": 0.00019718562604064213, "loss": 0.757, "step": 910 }, { "epoch": 0.1, "learning_rate": 0.0001971769473260092, "loss": 0.7197, "step": 911 }, { "epoch": 0.1, "learning_rate": 0.00019716825544222714, "loss": 0.6616, "step": 912 }, { "epoch": 0.1, "learning_rate": 0.00019715955039047387, "loss": 0.6842, "step": 913 }, { "epoch": 0.1, "learning_rate": 0.00019715083217192904, "loss": 0.685, "step": 914 }, { "epoch": 0.1, "learning_rate": 0.0001971421007877741, "loss": 0.752, "step": 915 }, { "epoch": 0.1, "learning_rate": 0.0001971333562391924, "loss": 0.6851, "step": 916 }, { "epoch": 0.1, "learning_rate": 0.0001971245985273689, "loss": 0.6688, "step": 917 }, { "epoch": 0.1, "learning_rate": 0.0001971158276534904, "loss": 0.7532, "step": 918 }, { "epoch": 0.1, "learning_rate": 0.0001971070436187456, "loss": 0.6701, "step": 919 }, { "epoch": 0.1, "learning_rate": 0.00019709824642432478, "loss": 0.6763, "step": 920 }, { "epoch": 0.1, "learning_rate": 0.00019708943607142017, "loss": 0.7615, "step": 921 }, { "epoch": 0.1, "learning_rate": 0.00019708061256122573, "loss": 0.7776, "step": 922 }, { "epoch": 0.1, "learning_rate": 0.00019707177589493716, "loss": 0.6828, "step": 923 }, { "epoch": 0.11, "learning_rate": 0.00019706292607375202, "loss": 0.6882, "step": 924 }, { "epoch": 0.11, "learning_rate": 0.00019705406309886958, "loss": 0.7442, "step": 925 }, { "epoch": 0.11, "learning_rate": 0.00019704518697149096, "loss": 0.706, "step": 926 }, { "epoch": 0.11, "learning_rate": 0.000197036297692819, "loss": 0.7193, "step": 927 }, { "epoch": 0.11, "learning_rate": 0.00019702739526405836, "loss": 0.679, "step": 928 }, { "epoch": 0.11, "learning_rate": 0.00019701847968641546, "loss": 0.7161, "step": 929 }, { "epoch": 0.11, "learning_rate": 0.00019700955096109852, "loss": 0.656, "step": 930 }, { "epoch": 0.11, "learning_rate": 0.00019700060908931757, "loss": 0.6491, "step": 931 }, { "epoch": 0.11, "learning_rate": 0.00019699165407228436, "loss": 0.6932, "step": 932 }, { "epoch": 0.11, "learning_rate": 0.0001969826859112124, "loss": 0.6852, "step": 933 }, { "epoch": 0.11, "learning_rate": 0.00019697370460731713, "loss": 0.625, "step": 934 }, { "epoch": 0.11, "learning_rate": 0.0001969647101618156, "loss": 0.7349, "step": 935 }, { "epoch": 0.11, "learning_rate": 0.00019695570257592673, "loss": 0.7413, "step": 936 }, { "epoch": 0.11, "learning_rate": 0.0001969466818508712, "loss": 0.7474, "step": 937 }, { "epoch": 0.11, "learning_rate": 0.00019693764798787148, "loss": 0.7039, "step": 938 }, { "epoch": 0.11, "learning_rate": 0.00019692860098815182, "loss": 0.5602, "step": 939 }, { "epoch": 0.11, "learning_rate": 0.00019691954085293824, "loss": 0.6562, "step": 940 }, { "epoch": 0.11, "learning_rate": 0.00019691046758345853, "loss": 0.7097, "step": 941 }, { "epoch": 0.11, "learning_rate": 0.00019690138118094228, "loss": 0.7377, "step": 942 }, { "epoch": 0.11, "learning_rate": 0.00019689228164662087, "loss": 0.6975, "step": 943 }, { "epoch": 0.11, "learning_rate": 0.00019688316898172742, "loss": 0.6406, "step": 944 }, { "epoch": 0.11, "learning_rate": 0.00019687404318749689, "loss": 0.702, "step": 945 }, { "epoch": 0.11, "learning_rate": 0.00019686490426516594, "loss": 0.6268, "step": 946 }, { "epoch": 0.11, "learning_rate": 0.0001968557522159731, "loss": 0.6943, "step": 947 }, { "epoch": 0.11, "learning_rate": 0.00019684658704115856, "loss": 0.6836, "step": 948 }, { "epoch": 0.11, "learning_rate": 0.0001968374087419644, "loss": 0.7417, "step": 949 }, { "epoch": 0.11, "learning_rate": 0.00019682821731963442, "loss": 0.7122, "step": 950 }, { "epoch": 0.11, "learning_rate": 0.00019681901277541429, "loss": 0.6447, "step": 951 }, { "epoch": 0.11, "learning_rate": 0.00019680979511055128, "loss": 0.7076, "step": 952 }, { "epoch": 0.11, "learning_rate": 0.00019680056432629458, "loss": 0.6726, "step": 953 }, { "epoch": 0.11, "learning_rate": 0.00019679132042389516, "loss": 0.6278, "step": 954 }, { "epoch": 0.11, "learning_rate": 0.00019678206340460568, "loss": 0.6932, "step": 955 }, { "epoch": 0.11, "learning_rate": 0.00019677279326968066, "loss": 0.6391, "step": 956 }, { "epoch": 0.11, "learning_rate": 0.00019676351002037633, "loss": 0.7113, "step": 957 }, { "epoch": 0.11, "learning_rate": 0.00019675421365795073, "loss": 0.6565, "step": 958 }, { "epoch": 0.11, "learning_rate": 0.0001967449041836637, "loss": 0.6985, "step": 959 }, { "epoch": 0.11, "learning_rate": 0.00019673558159877686, "loss": 0.6692, "step": 960 }, { "epoch": 0.11, "learning_rate": 0.0001967262459045535, "loss": 0.6711, "step": 961 }, { "epoch": 0.11, "learning_rate": 0.00019671689710225882, "loss": 0.7311, "step": 962 }, { "epoch": 0.11, "learning_rate": 0.00019670753519315977, "loss": 0.7255, "step": 963 }, { "epoch": 0.11, "learning_rate": 0.000196698160178525, "loss": 0.6845, "step": 964 }, { "epoch": 0.11, "learning_rate": 0.00019668877205962498, "loss": 0.726, "step": 965 }, { "epoch": 0.11, "learning_rate": 0.000196679370837732, "loss": 0.6777, "step": 966 }, { "epoch": 0.11, "learning_rate": 0.0001966699565141201, "loss": 0.7452, "step": 967 }, { "epoch": 0.11, "learning_rate": 0.00019666052909006498, "loss": 0.6359, "step": 968 }, { "epoch": 0.11, "learning_rate": 0.00019665108856684437, "loss": 0.7545, "step": 969 }, { "epoch": 0.11, "learning_rate": 0.0001966416349457375, "loss": 0.6422, "step": 970 }, { "epoch": 0.11, "learning_rate": 0.00019663216822802558, "loss": 0.6773, "step": 971 }, { "epoch": 0.11, "learning_rate": 0.00019662268841499146, "loss": 0.7604, "step": 972 }, { "epoch": 0.11, "learning_rate": 0.00019661319550791983, "loss": 0.6829, "step": 973 }, { "epoch": 0.11, "learning_rate": 0.00019660368950809716, "loss": 0.7628, "step": 974 }, { "epoch": 0.11, "learning_rate": 0.00019659417041681163, "loss": 0.696, "step": 975 }, { "epoch": 0.11, "learning_rate": 0.00019658463823535332, "loss": 0.6522, "step": 976 }, { "epoch": 0.11, "learning_rate": 0.00019657509296501396, "loss": 0.6778, "step": 977 }, { "epoch": 0.11, "learning_rate": 0.00019656553460708706, "loss": 0.7031, "step": 978 }, { "epoch": 0.11, "learning_rate": 0.000196555963162868, "loss": 0.6921, "step": 979 }, { "epoch": 0.11, "learning_rate": 0.0001965463786336539, "loss": 0.6866, "step": 980 }, { "epoch": 0.11, "learning_rate": 0.0001965367810207435, "loss": 0.6678, "step": 981 }, { "epoch": 0.11, "learning_rate": 0.00019652717032543756, "loss": 0.7159, "step": 982 }, { "epoch": 0.11, "learning_rate": 0.00019651754654903848, "loss": 0.6462, "step": 983 }, { "epoch": 0.11, "learning_rate": 0.00019650790969285043, "loss": 0.746, "step": 984 }, { "epoch": 0.11, "learning_rate": 0.00019649825975817938, "loss": 0.7147, "step": 985 }, { "epoch": 0.11, "learning_rate": 0.00019648859674633302, "loss": 0.6692, "step": 986 }, { "epoch": 0.11, "learning_rate": 0.0001964789206586209, "loss": 0.7218, "step": 987 }, { "epoch": 0.11, "learning_rate": 0.0001964692314963543, "loss": 0.6652, "step": 988 }, { "epoch": 0.11, "learning_rate": 0.0001964595292608462, "loss": 0.6723, "step": 989 }, { "epoch": 0.11, "learning_rate": 0.0001964498139534115, "loss": 0.7292, "step": 990 }, { "epoch": 0.11, "learning_rate": 0.00019644008557536676, "loss": 0.6524, "step": 991 }, { "epoch": 0.11, "learning_rate": 0.00019643034412803034, "loss": 0.7271, "step": 992 }, { "epoch": 0.11, "learning_rate": 0.00019642058961272238, "loss": 0.6607, "step": 993 }, { "epoch": 0.11, "learning_rate": 0.00019641082203076477, "loss": 0.7019, "step": 994 }, { "epoch": 0.11, "learning_rate": 0.00019640104138348124, "loss": 0.7026, "step": 995 }, { "epoch": 0.11, "learning_rate": 0.00019639124767219715, "loss": 0.5955, "step": 996 }, { "epoch": 0.11, "learning_rate": 0.00019638144089823977, "loss": 0.6011, "step": 997 }, { "epoch": 0.11, "learning_rate": 0.0001963716210629381, "loss": 0.769, "step": 998 }, { "epoch": 0.11, "learning_rate": 0.00019636178816762284, "loss": 0.7042, "step": 999 }, { "epoch": 0.11, "learning_rate": 0.00019635194221362658, "loss": 0.6937, "step": 1000 }, { "epoch": 0.11, "learning_rate": 0.0001963420832022836, "loss": 0.723, "step": 1001 }, { "epoch": 0.11, "learning_rate": 0.0001963322111349299, "loss": 0.7038, "step": 1002 }, { "epoch": 0.11, "learning_rate": 0.00019632232601290338, "loss": 0.6946, "step": 1003 }, { "epoch": 0.11, "learning_rate": 0.00019631242783754363, "loss": 0.7523, "step": 1004 }, { "epoch": 0.11, "learning_rate": 0.00019630251661019205, "loss": 0.6944, "step": 1005 }, { "epoch": 0.11, "learning_rate": 0.00019629259233219174, "loss": 0.6578, "step": 1006 }, { "epoch": 0.11, "learning_rate": 0.00019628265500488764, "loss": 0.7113, "step": 1007 }, { "epoch": 0.11, "learning_rate": 0.00019627270462962642, "loss": 0.7089, "step": 1008 }, { "epoch": 0.11, "learning_rate": 0.0001962627412077565, "loss": 0.6293, "step": 1009 }, { "epoch": 0.11, "learning_rate": 0.0001962527647406281, "loss": 0.7133, "step": 1010 }, { "epoch": 0.11, "learning_rate": 0.00019624277522959328, "loss": 0.7483, "step": 1011 }, { "epoch": 0.12, "learning_rate": 0.00019623277267600574, "loss": 0.7367, "step": 1012 }, { "epoch": 0.12, "learning_rate": 0.00019622275708122092, "loss": 0.696, "step": 1013 }, { "epoch": 0.12, "learning_rate": 0.00019621272844659623, "loss": 0.7297, "step": 1014 }, { "epoch": 0.12, "learning_rate": 0.00019620268677349065, "loss": 0.7183, "step": 1015 }, { "epoch": 0.12, "learning_rate": 0.00019619263206326502, "loss": 0.6788, "step": 1016 }, { "epoch": 0.12, "learning_rate": 0.00019618256431728194, "loss": 0.742, "step": 1017 }, { "epoch": 0.12, "learning_rate": 0.00019617248353690568, "loss": 0.7559, "step": 1018 }, { "epoch": 0.12, "learning_rate": 0.0001961623897235025, "loss": 0.6509, "step": 1019 }, { "epoch": 0.12, "learning_rate": 0.0001961522828784402, "loss": 0.7066, "step": 1020 }, { "epoch": 0.12, "learning_rate": 0.0001961421630030884, "loss": 0.6735, "step": 1021 }, { "epoch": 0.12, "learning_rate": 0.00019613203009881863, "loss": 0.7344, "step": 1022 }, { "epoch": 0.12, "learning_rate": 0.00019612188416700396, "loss": 0.734, "step": 1023 }, { "epoch": 0.12, "learning_rate": 0.0001961117252090194, "loss": 0.7583, "step": 1024 }, { "epoch": 0.12, "learning_rate": 0.00019610155322624163, "loss": 0.7108, "step": 1025 }, { "epoch": 0.12, "learning_rate": 0.00019609136822004914, "loss": 0.7187, "step": 1026 }, { "epoch": 0.12, "learning_rate": 0.0001960811701918222, "loss": 0.7239, "step": 1027 }, { "epoch": 0.12, "learning_rate": 0.0001960709591429428, "loss": 0.7187, "step": 1028 }, { "epoch": 0.12, "learning_rate": 0.00019606073507479464, "loss": 0.681, "step": 1029 }, { "epoch": 0.12, "learning_rate": 0.0001960504979887634, "loss": 0.6863, "step": 1030 }, { "epoch": 0.12, "learning_rate": 0.0001960402478862363, "loss": 0.6412, "step": 1031 }, { "epoch": 0.12, "learning_rate": 0.00019602998476860237, "loss": 0.7164, "step": 1032 }, { "epoch": 0.12, "learning_rate": 0.00019601970863725252, "loss": 0.7055, "step": 1033 }, { "epoch": 0.12, "learning_rate": 0.0001960094194935793, "loss": 0.7106, "step": 1034 }, { "epoch": 0.12, "learning_rate": 0.00019599911733897705, "loss": 0.6968, "step": 1035 }, { "epoch": 0.12, "learning_rate": 0.00019598880217484195, "loss": 0.7385, "step": 1036 }, { "epoch": 0.12, "learning_rate": 0.00019597847400257184, "loss": 0.6883, "step": 1037 }, { "epoch": 0.12, "learning_rate": 0.00019596813282356633, "loss": 0.6169, "step": 1038 }, { "epoch": 0.12, "learning_rate": 0.0001959577786392269, "loss": 0.7001, "step": 1039 }, { "epoch": 0.12, "learning_rate": 0.00019594741145095667, "loss": 0.6765, "step": 1040 }, { "epoch": 0.12, "learning_rate": 0.0001959370312601606, "loss": 0.6715, "step": 1041 }, { "epoch": 0.12, "learning_rate": 0.00019592663806824537, "loss": 0.7373, "step": 1042 }, { "epoch": 0.12, "learning_rate": 0.00019591623187661944, "loss": 0.6637, "step": 1043 }, { "epoch": 0.12, "learning_rate": 0.00019590581268669302, "loss": 0.7491, "step": 1044 }, { "epoch": 0.12, "learning_rate": 0.00019589538049987807, "loss": 0.6881, "step": 1045 }, { "epoch": 0.12, "learning_rate": 0.0001958849353175884, "loss": 0.7217, "step": 1046 }, { "epoch": 0.12, "learning_rate": 0.00019587447714123948, "loss": 0.6977, "step": 1047 }, { "epoch": 0.12, "learning_rate": 0.00019586400597224851, "loss": 0.6894, "step": 1048 }, { "epoch": 0.12, "learning_rate": 0.00019585352181203462, "loss": 0.6081, "step": 1049 }, { "epoch": 0.12, "learning_rate": 0.0001958430246620185, "loss": 0.6362, "step": 1050 }, { "epoch": 0.12, "learning_rate": 0.00019583251452362274, "loss": 0.6809, "step": 1051 }, { "epoch": 0.12, "learning_rate": 0.00019582199139827169, "loss": 0.6764, "step": 1052 }, { "epoch": 0.12, "learning_rate": 0.0001958114552873913, "loss": 0.6509, "step": 1053 }, { "epoch": 0.12, "learning_rate": 0.00019580090619240948, "loss": 0.7078, "step": 1054 }, { "epoch": 0.12, "learning_rate": 0.0001957903441147558, "loss": 0.6962, "step": 1055 }, { "epoch": 0.12, "learning_rate": 0.0001957797690558616, "loss": 0.7175, "step": 1056 }, { "epoch": 0.12, "learning_rate": 0.00019576918101715996, "loss": 0.6452, "step": 1057 }, { "epoch": 0.12, "learning_rate": 0.0001957585800000858, "loss": 0.7093, "step": 1058 }, { "epoch": 0.12, "learning_rate": 0.0001957479660060757, "loss": 0.6649, "step": 1059 }, { "epoch": 0.12, "learning_rate": 0.000195737339036568, "loss": 0.5816, "step": 1060 }, { "epoch": 0.12, "learning_rate": 0.00019572669909300288, "loss": 0.6877, "step": 1061 }, { "epoch": 0.12, "learning_rate": 0.00019571604617682223, "loss": 0.6527, "step": 1062 }, { "epoch": 0.12, "learning_rate": 0.0001957053802894697, "loss": 0.671, "step": 1063 }, { "epoch": 0.12, "learning_rate": 0.00019569470143239074, "loss": 0.6724, "step": 1064 }, { "epoch": 0.12, "learning_rate": 0.0001956840096070325, "loss": 0.6739, "step": 1065 }, { "epoch": 0.12, "learning_rate": 0.00019567330481484385, "loss": 0.7096, "step": 1066 }, { "epoch": 0.12, "learning_rate": 0.00019566258705727552, "loss": 0.6615, "step": 1067 }, { "epoch": 0.12, "learning_rate": 0.00019565185633577996, "loss": 0.7385, "step": 1068 }, { "epoch": 0.12, "learning_rate": 0.00019564111265181136, "loss": 0.6538, "step": 1069 }, { "epoch": 0.12, "learning_rate": 0.00019563035600682563, "loss": 0.7284, "step": 1070 }, { "epoch": 0.12, "learning_rate": 0.0001956195864022806, "loss": 0.7233, "step": 1071 }, { "epoch": 0.12, "learning_rate": 0.0001956088038396356, "loss": 0.6898, "step": 1072 }, { "epoch": 0.12, "learning_rate": 0.0001955980083203519, "loss": 0.6839, "step": 1073 }, { "epoch": 0.12, "learning_rate": 0.0001955871998458925, "loss": 0.6846, "step": 1074 }, { "epoch": 0.12, "learning_rate": 0.0001955763784177221, "loss": 0.6491, "step": 1075 }, { "epoch": 0.12, "learning_rate": 0.00019556554403730726, "loss": 0.735, "step": 1076 }, { "epoch": 0.12, "learning_rate": 0.00019555469670611616, "loss": 0.6949, "step": 1077 }, { "epoch": 0.12, "learning_rate": 0.00019554383642561877, "loss": 0.7073, "step": 1078 }, { "epoch": 0.12, "learning_rate": 0.00019553296319728693, "loss": 0.7571, "step": 1079 }, { "epoch": 0.12, "learning_rate": 0.00019552207702259412, "loss": 0.6941, "step": 1080 }, { "epoch": 0.12, "learning_rate": 0.00019551117790301555, "loss": 0.727, "step": 1081 }, { "epoch": 0.12, "learning_rate": 0.00019550026584002833, "loss": 0.726, "step": 1082 }, { "epoch": 0.12, "learning_rate": 0.0001954893408351112, "loss": 0.6805, "step": 1083 }, { "epoch": 0.12, "learning_rate": 0.00019547840288974464, "loss": 0.6833, "step": 1084 }, { "epoch": 0.12, "learning_rate": 0.00019546745200541094, "loss": 0.7303, "step": 1085 }, { "epoch": 0.12, "learning_rate": 0.00019545648818359418, "loss": 0.7199, "step": 1086 }, { "epoch": 0.12, "learning_rate": 0.00019544551142578013, "loss": 0.6412, "step": 1087 }, { "epoch": 0.12, "learning_rate": 0.00019543452173345632, "loss": 0.7781, "step": 1088 }, { "epoch": 0.12, "learning_rate": 0.00019542351910811203, "loss": 0.6798, "step": 1089 }, { "epoch": 0.12, "learning_rate": 0.00019541250355123834, "loss": 0.7262, "step": 1090 }, { "epoch": 0.12, "learning_rate": 0.00019540147506432799, "loss": 0.6349, "step": 1091 }, { "epoch": 0.12, "learning_rate": 0.0001953904336488756, "loss": 0.6932, "step": 1092 }, { "epoch": 0.12, "learning_rate": 0.00019537937930637743, "loss": 0.743, "step": 1093 }, { "epoch": 0.12, "learning_rate": 0.00019536831203833152, "loss": 0.6538, "step": 1094 }, { "epoch": 0.12, "learning_rate": 0.00019535723184623774, "loss": 0.6926, "step": 1095 }, { "epoch": 0.12, "learning_rate": 0.00019534613873159758, "loss": 0.692, "step": 1096 }, { "epoch": 0.12, "learning_rate": 0.00019533503269591438, "loss": 0.7323, "step": 1097 }, { "epoch": 0.12, "learning_rate": 0.00019532391374069318, "loss": 0.6259, "step": 1098 }, { "epoch": 0.12, "learning_rate": 0.0001953127818674408, "loss": 0.661, "step": 1099 }, { "epoch": 0.13, "learning_rate": 0.0001953016370776658, "loss": 0.7499, "step": 1100 }, { "epoch": 0.13, "learning_rate": 0.0001952904793728785, "loss": 0.7056, "step": 1101 }, { "epoch": 0.13, "learning_rate": 0.00019527930875459096, "loss": 0.684, "step": 1102 }, { "epoch": 0.13, "learning_rate": 0.00019526812522431696, "loss": 0.7359, "step": 1103 }, { "epoch": 0.13, "learning_rate": 0.00019525692878357212, "loss": 0.6833, "step": 1104 }, { "epoch": 0.13, "learning_rate": 0.0001952457194338737, "loss": 0.7161, "step": 1105 }, { "epoch": 0.13, "learning_rate": 0.00019523449717674077, "loss": 0.7089, "step": 1106 }, { "epoch": 0.13, "learning_rate": 0.00019522326201369415, "loss": 0.7344, "step": 1107 }, { "epoch": 0.13, "learning_rate": 0.00019521201394625637, "loss": 0.6684, "step": 1108 }, { "epoch": 0.13, "learning_rate": 0.00019520075297595177, "loss": 0.6966, "step": 1109 }, { "epoch": 0.13, "learning_rate": 0.0001951894791043064, "loss": 0.6747, "step": 1110 }, { "epoch": 0.13, "learning_rate": 0.00019517819233284806, "loss": 0.648, "step": 1111 }, { "epoch": 0.13, "learning_rate": 0.0001951668926631063, "loss": 0.6719, "step": 1112 }, { "epoch": 0.13, "learning_rate": 0.0001951555800966124, "loss": 0.7436, "step": 1113 }, { "epoch": 0.13, "learning_rate": 0.00019514425463489947, "loss": 0.5662, "step": 1114 }, { "epoch": 0.13, "learning_rate": 0.00019513291627950224, "loss": 0.7054, "step": 1115 }, { "epoch": 0.13, "learning_rate": 0.0001951215650319573, "loss": 0.6672, "step": 1116 }, { "epoch": 0.13, "learning_rate": 0.00019511020089380286, "loss": 0.7757, "step": 1117 }, { "epoch": 0.13, "learning_rate": 0.00019509882386657904, "loss": 0.7304, "step": 1118 }, { "epoch": 0.13, "learning_rate": 0.0001950874339518276, "loss": 0.6585, "step": 1119 }, { "epoch": 0.13, "learning_rate": 0.00019507603115109204, "loss": 0.6893, "step": 1120 }, { "epoch": 0.13, "learning_rate": 0.0001950646154659177, "loss": 0.6628, "step": 1121 }, { "epoch": 0.13, "learning_rate": 0.00019505318689785152, "loss": 0.7798, "step": 1122 }, { "epoch": 0.13, "learning_rate": 0.00019504174544844233, "loss": 0.6663, "step": 1123 }, { "epoch": 0.13, "learning_rate": 0.0001950302911192406, "loss": 0.7474, "step": 1124 }, { "epoch": 0.13, "learning_rate": 0.00019501882391179863, "loss": 0.7243, "step": 1125 }, { "epoch": 0.13, "learning_rate": 0.0001950073438276704, "loss": 0.6817, "step": 1126 }, { "epoch": 0.13, "learning_rate": 0.00019499585086841164, "loss": 0.7285, "step": 1127 }, { "epoch": 0.13, "learning_rate": 0.0001949843450355799, "loss": 0.6238, "step": 1128 }, { "epoch": 0.13, "learning_rate": 0.0001949728263307344, "loss": 0.7012, "step": 1129 }, { "epoch": 0.13, "learning_rate": 0.00019496129475543605, "loss": 0.6729, "step": 1130 }, { "epoch": 0.13, "learning_rate": 0.00019494975031124768, "loss": 0.5952, "step": 1131 }, { "epoch": 0.13, "learning_rate": 0.00019493819299973373, "loss": 0.7188, "step": 1132 }, { "epoch": 0.13, "learning_rate": 0.00019492662282246035, "loss": 0.6668, "step": 1133 }, { "epoch": 0.13, "learning_rate": 0.00019491503978099557, "loss": 0.7128, "step": 1134 }, { "epoch": 0.13, "learning_rate": 0.0001949034438769091, "loss": 0.6608, "step": 1135 }, { "epoch": 0.13, "learning_rate": 0.0001948918351117723, "loss": 0.7101, "step": 1136 }, { "epoch": 0.13, "learning_rate": 0.00019488021348715846, "loss": 0.6301, "step": 1137 }, { "epoch": 0.13, "learning_rate": 0.00019486857900464247, "loss": 0.6787, "step": 1138 }, { "epoch": 0.13, "learning_rate": 0.00019485693166580094, "loss": 0.7204, "step": 1139 }, { "epoch": 0.13, "learning_rate": 0.00019484527147221238, "loss": 0.7109, "step": 1140 }, { "epoch": 0.13, "learning_rate": 0.0001948335984254569, "loss": 0.6666, "step": 1141 }, { "epoch": 0.13, "learning_rate": 0.00019482191252711642, "loss": 0.6964, "step": 1142 }, { "epoch": 0.13, "learning_rate": 0.00019481021377877454, "loss": 0.723, "step": 1143 }, { "epoch": 0.13, "learning_rate": 0.00019479850218201666, "loss": 0.7299, "step": 1144 }, { "epoch": 0.13, "learning_rate": 0.00019478677773842996, "loss": 0.6745, "step": 1145 }, { "epoch": 0.13, "learning_rate": 0.00019477504044960323, "loss": 0.6974, "step": 1146 }, { "epoch": 0.13, "learning_rate": 0.0001947632903171271, "loss": 0.7498, "step": 1147 }, { "epoch": 0.13, "learning_rate": 0.0001947515273425939, "loss": 0.7436, "step": 1148 }, { "epoch": 0.13, "learning_rate": 0.00019473975152759773, "loss": 0.6986, "step": 1149 }, { "epoch": 0.13, "learning_rate": 0.00019472796287373445, "loss": 0.7066, "step": 1150 }, { "epoch": 0.13, "learning_rate": 0.00019471616138260156, "loss": 0.6549, "step": 1151 }, { "epoch": 0.13, "learning_rate": 0.0001947043470557984, "loss": 0.7048, "step": 1152 }, { "epoch": 0.13, "learning_rate": 0.00019469251989492602, "loss": 0.6919, "step": 1153 }, { "epoch": 0.13, "learning_rate": 0.00019468067990158718, "loss": 0.699, "step": 1154 }, { "epoch": 0.13, "learning_rate": 0.00019466882707738645, "loss": 0.6953, "step": 1155 }, { "epoch": 0.13, "learning_rate": 0.00019465696142393005, "loss": 0.6709, "step": 1156 }, { "epoch": 0.13, "learning_rate": 0.00019464508294282596, "loss": 0.6844, "step": 1157 }, { "epoch": 0.13, "learning_rate": 0.00019463319163568398, "loss": 0.7057, "step": 1158 }, { "epoch": 0.13, "learning_rate": 0.00019462128750411556, "loss": 0.8218, "step": 1159 }, { "epoch": 0.13, "learning_rate": 0.0001946093705497339, "loss": 0.7247, "step": 1160 }, { "epoch": 0.13, "learning_rate": 0.00019459744077415396, "loss": 0.7798, "step": 1161 }, { "epoch": 0.13, "learning_rate": 0.00019458549817899244, "loss": 0.6953, "step": 1162 }, { "epoch": 0.13, "learning_rate": 0.00019457354276586775, "loss": 0.7602, "step": 1163 }, { "epoch": 0.13, "learning_rate": 0.00019456157453640006, "loss": 0.6737, "step": 1164 }, { "epoch": 0.13, "learning_rate": 0.0001945495934922113, "loss": 0.6224, "step": 1165 }, { "epoch": 0.13, "learning_rate": 0.00019453759963492507, "loss": 0.685, "step": 1166 }, { "epoch": 0.13, "learning_rate": 0.00019452559296616675, "loss": 0.7398, "step": 1167 }, { "epoch": 0.13, "learning_rate": 0.00019451357348756348, "loss": 0.6784, "step": 1168 }, { "epoch": 0.13, "learning_rate": 0.00019450154120074405, "loss": 0.6658, "step": 1169 }, { "epoch": 0.13, "learning_rate": 0.00019448949610733908, "loss": 0.6812, "step": 1170 }, { "epoch": 0.13, "learning_rate": 0.0001944774382089809, "loss": 0.7472, "step": 1171 }, { "epoch": 0.13, "learning_rate": 0.00019446536750730356, "loss": 0.6482, "step": 1172 }, { "epoch": 0.13, "learning_rate": 0.00019445328400394282, "loss": 0.6905, "step": 1173 }, { "epoch": 0.13, "learning_rate": 0.00019444118770053622, "loss": 0.6654, "step": 1174 }, { "epoch": 0.13, "learning_rate": 0.000194429078598723, "loss": 0.7369, "step": 1175 }, { "epoch": 0.13, "learning_rate": 0.00019441695670014417, "loss": 0.6923, "step": 1176 }, { "epoch": 0.13, "learning_rate": 0.00019440482200644245, "loss": 0.7233, "step": 1177 }, { "epoch": 0.13, "learning_rate": 0.0001943926745192623, "loss": 0.71, "step": 1178 }, { "epoch": 0.13, "learning_rate": 0.00019438051424024996, "loss": 0.7275, "step": 1179 }, { "epoch": 0.13, "learning_rate": 0.00019436834117105323, "loss": 0.7185, "step": 1180 }, { "epoch": 0.13, "learning_rate": 0.00019435615531332193, "loss": 0.77, "step": 1181 }, { "epoch": 0.13, "learning_rate": 0.00019434395666870734, "loss": 0.7174, "step": 1182 }, { "epoch": 0.13, "learning_rate": 0.00019433174523886262, "loss": 0.7277, "step": 1183 }, { "epoch": 0.13, "learning_rate": 0.00019431952102544263, "loss": 0.702, "step": 1184 }, { "epoch": 0.13, "learning_rate": 0.000194307284030104, "loss": 0.7185, "step": 1185 }, { "epoch": 0.13, "learning_rate": 0.000194295034254505, "loss": 0.6447, "step": 1186 }, { "epoch": 0.13, "learning_rate": 0.00019428277170030568, "loss": 0.6511, "step": 1187 }, { "epoch": 0.14, "learning_rate": 0.00019427049636916785, "loss": 0.6899, "step": 1188 }, { "epoch": 0.14, "learning_rate": 0.00019425820826275505, "loss": 0.6495, "step": 1189 }, { "epoch": 0.14, "learning_rate": 0.00019424590738273246, "loss": 0.7041, "step": 1190 }, { "epoch": 0.14, "learning_rate": 0.00019423359373076717, "loss": 0.6985, "step": 1191 }, { "epoch": 0.14, "learning_rate": 0.00019422126730852778, "loss": 0.6996, "step": 1192 }, { "epoch": 0.14, "learning_rate": 0.00019420892811768483, "loss": 0.6446, "step": 1193 }, { "epoch": 0.14, "learning_rate": 0.0001941965761599104, "loss": 0.6849, "step": 1194 }, { "epoch": 0.14, "learning_rate": 0.00019418421143687847, "loss": 0.737, "step": 1195 }, { "epoch": 0.14, "learning_rate": 0.00019417183395026465, "loss": 0.651, "step": 1196 }, { "epoch": 0.14, "learning_rate": 0.00019415944370174628, "loss": 0.7019, "step": 1197 }, { "epoch": 0.14, "learning_rate": 0.00019414704069300247, "loss": 0.6418, "step": 1198 }, { "epoch": 0.14, "learning_rate": 0.000194134624925714, "loss": 0.6787, "step": 1199 }, { "epoch": 0.14, "learning_rate": 0.0001941221964015635, "loss": 0.7638, "step": 1200 }, { "epoch": 0.14, "learning_rate": 0.0001941097551222352, "loss": 0.6823, "step": 1201 }, { "epoch": 0.14, "learning_rate": 0.0001940973010894151, "loss": 0.6462, "step": 1202 }, { "epoch": 0.14, "learning_rate": 0.00019408483430479096, "loss": 0.6997, "step": 1203 }, { "epoch": 0.14, "learning_rate": 0.00019407235477005222, "loss": 0.7144, "step": 1204 }, { "epoch": 0.14, "learning_rate": 0.00019405986248689013, "loss": 0.7264, "step": 1205 }, { "epoch": 0.14, "learning_rate": 0.00019404735745699752, "loss": 0.6902, "step": 1206 }, { "epoch": 0.14, "learning_rate": 0.0001940348396820691, "loss": 0.6775, "step": 1207 }, { "epoch": 0.14, "learning_rate": 0.0001940223091638012, "loss": 0.6183, "step": 1208 }, { "epoch": 0.14, "learning_rate": 0.00019400976590389196, "loss": 0.7183, "step": 1209 }, { "epoch": 0.14, "learning_rate": 0.0001939972099040412, "loss": 0.6723, "step": 1210 }, { "epoch": 0.14, "learning_rate": 0.00019398464116595046, "loss": 0.7113, "step": 1211 }, { "epoch": 0.14, "learning_rate": 0.00019397205969132303, "loss": 0.7111, "step": 1212 }, { "epoch": 0.14, "learning_rate": 0.00019395946548186391, "loss": 0.6909, "step": 1213 }, { "epoch": 0.14, "learning_rate": 0.00019394685853927986, "loss": 0.7116, "step": 1214 }, { "epoch": 0.14, "learning_rate": 0.0001939342388652793, "loss": 0.7091, "step": 1215 }, { "epoch": 0.14, "learning_rate": 0.00019392160646157242, "loss": 0.6473, "step": 1216 }, { "epoch": 0.14, "learning_rate": 0.00019390896132987116, "loss": 0.7079, "step": 1217 }, { "epoch": 0.14, "learning_rate": 0.00019389630347188913, "loss": 0.7017, "step": 1218 }, { "epoch": 0.14, "learning_rate": 0.00019388363288934163, "loss": 0.6799, "step": 1219 }, { "epoch": 0.14, "learning_rate": 0.00019387094958394586, "loss": 0.6711, "step": 1220 }, { "epoch": 0.14, "learning_rate": 0.00019385825355742054, "loss": 0.6392, "step": 1221 }, { "epoch": 0.14, "learning_rate": 0.00019384554481148623, "loss": 0.6806, "step": 1222 }, { "epoch": 0.14, "learning_rate": 0.00019383282334786516, "loss": 0.5819, "step": 1223 }, { "epoch": 0.14, "learning_rate": 0.00019382008916828136, "loss": 0.7409, "step": 1224 }, { "epoch": 0.14, "learning_rate": 0.00019380734227446048, "loss": 0.6877, "step": 1225 }, { "epoch": 0.14, "learning_rate": 0.00019379458266812995, "loss": 0.6592, "step": 1226 }, { "epoch": 0.14, "learning_rate": 0.00019378181035101895, "loss": 0.6755, "step": 1227 }, { "epoch": 0.14, "learning_rate": 0.0001937690253248583, "loss": 0.7017, "step": 1228 }, { "epoch": 0.14, "learning_rate": 0.00019375622759138064, "loss": 0.6997, "step": 1229 }, { "epoch": 0.14, "learning_rate": 0.00019374341715232022, "loss": 0.7002, "step": 1230 }, { "epoch": 0.14, "learning_rate": 0.00019373059400941317, "loss": 0.6558, "step": 1231 }, { "epoch": 0.14, "learning_rate": 0.00019371775816439714, "loss": 0.7142, "step": 1232 }, { "epoch": 0.14, "learning_rate": 0.00019370490961901168, "loss": 0.6857, "step": 1233 }, { "epoch": 0.14, "learning_rate": 0.000193692048374998, "loss": 0.6862, "step": 1234 }, { "epoch": 0.14, "learning_rate": 0.00019367917443409893, "loss": 0.6955, "step": 1235 }, { "epoch": 0.14, "learning_rate": 0.0001936662877980592, "loss": 0.6398, "step": 1236 }, { "epoch": 0.14, "learning_rate": 0.00019365338846862512, "loss": 0.7179, "step": 1237 }, { "epoch": 0.14, "learning_rate": 0.00019364047644754485, "loss": 0.7182, "step": 1238 }, { "epoch": 0.14, "learning_rate": 0.0001936275517365681, "loss": 0.7625, "step": 1239 }, { "epoch": 0.14, "learning_rate": 0.00019361461433744639, "loss": 0.6922, "step": 1240 }, { "epoch": 0.14, "learning_rate": 0.00019360166425193303, "loss": 0.6912, "step": 1241 }, { "epoch": 0.14, "learning_rate": 0.0001935887014817829, "loss": 0.7634, "step": 1242 }, { "epoch": 0.14, "learning_rate": 0.00019357572602875275, "loss": 0.7372, "step": 1243 }, { "epoch": 0.14, "learning_rate": 0.00019356273789460096, "loss": 0.6881, "step": 1244 }, { "epoch": 0.14, "learning_rate": 0.00019354973708108763, "loss": 0.7376, "step": 1245 }, { "epoch": 0.14, "learning_rate": 0.0001935367235899746, "loss": 0.6973, "step": 1246 }, { "epoch": 0.14, "learning_rate": 0.0001935236974230254, "loss": 0.7079, "step": 1247 }, { "epoch": 0.14, "learning_rate": 0.00019351065858200532, "loss": 0.6952, "step": 1248 }, { "epoch": 0.14, "learning_rate": 0.00019349760706868137, "loss": 0.7117, "step": 1249 }, { "epoch": 0.14, "learning_rate": 0.0001934845428848222, "loss": 0.683, "step": 1250 }, { "epoch": 0.14, "learning_rate": 0.0001934714660321983, "loss": 0.6619, "step": 1251 }, { "epoch": 0.14, "learning_rate": 0.00019345837651258175, "loss": 0.6618, "step": 1252 }, { "epoch": 0.14, "learning_rate": 0.00019344527432774643, "loss": 0.6517, "step": 1253 }, { "epoch": 0.14, "learning_rate": 0.0001934321594794679, "loss": 0.6773, "step": 1254 }, { "epoch": 0.14, "learning_rate": 0.00019341903196952348, "loss": 0.699, "step": 1255 }, { "epoch": 0.14, "learning_rate": 0.00019340589179969215, "loss": 0.701, "step": 1256 }, { "epoch": 0.14, "learning_rate": 0.00019339273897175463, "loss": 0.5936, "step": 1257 }, { "epoch": 0.14, "learning_rate": 0.00019337957348749334, "loss": 0.6399, "step": 1258 }, { "epoch": 0.14, "learning_rate": 0.00019336639534869244, "loss": 0.6755, "step": 1259 }, { "epoch": 0.14, "learning_rate": 0.00019335320455713783, "loss": 0.7122, "step": 1260 }, { "epoch": 0.14, "learning_rate": 0.00019334000111461704, "loss": 0.6773, "step": 1261 }, { "epoch": 0.14, "learning_rate": 0.00019332678502291938, "loss": 0.7037, "step": 1262 }, { "epoch": 0.14, "learning_rate": 0.00019331355628383586, "loss": 0.7121, "step": 1263 }, { "epoch": 0.14, "learning_rate": 0.0001933003148991592, "loss": 0.7669, "step": 1264 }, { "epoch": 0.14, "learning_rate": 0.0001932870608706838, "loss": 0.6958, "step": 1265 }, { "epoch": 0.14, "learning_rate": 0.00019327379420020592, "loss": 0.6976, "step": 1266 }, { "epoch": 0.14, "learning_rate": 0.00019326051488952333, "loss": 0.6623, "step": 1267 }, { "epoch": 0.14, "learning_rate": 0.00019324722294043558, "loss": 0.7187, "step": 1268 }, { "epoch": 0.14, "learning_rate": 0.00019323391835474401, "loss": 0.7511, "step": 1269 }, { "epoch": 0.14, "learning_rate": 0.00019322060113425167, "loss": 0.7479, "step": 1270 }, { "epoch": 0.14, "learning_rate": 0.00019320727128076316, "loss": 0.6805, "step": 1271 }, { "epoch": 0.14, "learning_rate": 0.00019319392879608497, "loss": 0.7079, "step": 1272 }, { "epoch": 0.14, "learning_rate": 0.00019318057368202524, "loss": 0.7383, "step": 1273 }, { "epoch": 0.14, "learning_rate": 0.00019316720594039378, "loss": 0.6709, "step": 1274 }, { "epoch": 0.14, "learning_rate": 0.00019315382557300219, "loss": 0.6527, "step": 1275 }, { "epoch": 0.15, "learning_rate": 0.00019314043258166375, "loss": 0.6809, "step": 1276 }, { "epoch": 0.15, "learning_rate": 0.00019312702696819335, "loss": 0.7467, "step": 1277 }, { "epoch": 0.15, "learning_rate": 0.0001931136087344078, "loss": 0.6912, "step": 1278 }, { "epoch": 0.15, "learning_rate": 0.0001931001778821254, "loss": 0.7658, "step": 1279 }, { "epoch": 0.15, "learning_rate": 0.00019308673441316635, "loss": 0.6747, "step": 1280 }, { "epoch": 0.15, "learning_rate": 0.0001930732783293524, "loss": 0.7312, "step": 1281 }, { "epoch": 0.15, "learning_rate": 0.00019305980963250715, "loss": 0.688, "step": 1282 }, { "epoch": 0.15, "learning_rate": 0.00019304632832445575, "loss": 0.7011, "step": 1283 }, { "epoch": 0.15, "learning_rate": 0.0001930328344070252, "loss": 0.7312, "step": 1284 }, { "epoch": 0.15, "learning_rate": 0.0001930193278820442, "loss": 0.623, "step": 1285 }, { "epoch": 0.15, "learning_rate": 0.00019300580875134308, "loss": 0.6685, "step": 1286 }, { "epoch": 0.15, "learning_rate": 0.00019299227701675387, "loss": 0.729, "step": 1287 }, { "epoch": 0.15, "learning_rate": 0.0001929787326801104, "loss": 0.6755, "step": 1288 }, { "epoch": 0.15, "learning_rate": 0.00019296517574324818, "loss": 0.6865, "step": 1289 }, { "epoch": 0.15, "learning_rate": 0.00019295160620800433, "loss": 0.6421, "step": 1290 }, { "epoch": 0.15, "learning_rate": 0.00019293802407621785, "loss": 0.7125, "step": 1291 }, { "epoch": 0.15, "learning_rate": 0.00019292442934972932, "loss": 0.7429, "step": 1292 }, { "epoch": 0.15, "learning_rate": 0.00019291082203038102, "loss": 0.7327, "step": 1293 }, { "epoch": 0.15, "learning_rate": 0.00019289720212001702, "loss": 0.7041, "step": 1294 }, { "epoch": 0.15, "learning_rate": 0.00019288356962048303, "loss": 0.649, "step": 1295 }, { "epoch": 0.15, "learning_rate": 0.00019286992453362652, "loss": 0.7489, "step": 1296 }, { "epoch": 0.15, "learning_rate": 0.00019285626686129658, "loss": 0.7132, "step": 1297 }, { "epoch": 0.15, "learning_rate": 0.00019284259660534413, "loss": 0.731, "step": 1298 }, { "epoch": 0.15, "learning_rate": 0.00019282891376762163, "loss": 0.6693, "step": 1299 }, { "epoch": 0.15, "learning_rate": 0.00019281521834998343, "loss": 0.7307, "step": 1300 }, { "epoch": 0.15, "learning_rate": 0.00019280151035428543, "loss": 0.7452, "step": 1301 }, { "epoch": 0.15, "learning_rate": 0.00019278778978238536, "loss": 0.6838, "step": 1302 }, { "epoch": 0.15, "learning_rate": 0.00019277405663614257, "loss": 0.6986, "step": 1303 }, { "epoch": 0.15, "learning_rate": 0.0001927603109174181, "loss": 0.7114, "step": 1304 }, { "epoch": 0.15, "learning_rate": 0.00019274655262807477, "loss": 0.6771, "step": 1305 }, { "epoch": 0.15, "learning_rate": 0.00019273278176997708, "loss": 0.6949, "step": 1306 }, { "epoch": 0.15, "learning_rate": 0.00019271899834499116, "loss": 0.7402, "step": 1307 }, { "epoch": 0.15, "learning_rate": 0.00019270520235498497, "loss": 0.684, "step": 1308 }, { "epoch": 0.15, "learning_rate": 0.00019269139380182805, "loss": 0.6615, "step": 1309 }, { "epoch": 0.15, "learning_rate": 0.00019267757268739172, "loss": 0.7118, "step": 1310 }, { "epoch": 0.15, "learning_rate": 0.000192663739013549, "loss": 0.7515, "step": 1311 }, { "epoch": 0.15, "learning_rate": 0.00019264989278217453, "loss": 0.7621, "step": 1312 }, { "epoch": 0.15, "learning_rate": 0.00019263603399514477, "loss": 0.6476, "step": 1313 }, { "epoch": 0.15, "learning_rate": 0.00019262216265433782, "loss": 0.7359, "step": 1314 }, { "epoch": 0.15, "learning_rate": 0.00019260827876163344, "loss": 0.7213, "step": 1315 }, { "epoch": 0.15, "learning_rate": 0.0001925943823189132, "loss": 0.721, "step": 1316 }, { "epoch": 0.15, "learning_rate": 0.00019258047332806023, "loss": 0.671, "step": 1317 }, { "epoch": 0.15, "learning_rate": 0.00019256655179095952, "loss": 0.7457, "step": 1318 }, { "epoch": 0.15, "learning_rate": 0.00019255261770949762, "loss": 0.7294, "step": 1319 }, { "epoch": 0.15, "learning_rate": 0.00019253867108556287, "loss": 0.7467, "step": 1320 }, { "epoch": 0.15, "learning_rate": 0.00019252471192104524, "loss": 0.6643, "step": 1321 }, { "epoch": 0.15, "learning_rate": 0.0001925107402178365, "loss": 0.6609, "step": 1322 }, { "epoch": 0.15, "learning_rate": 0.00019249675597782999, "loss": 0.7567, "step": 1323 }, { "epoch": 0.15, "learning_rate": 0.00019248275920292086, "loss": 0.7339, "step": 1324 }, { "epoch": 0.15, "learning_rate": 0.00019246874989500587, "loss": 0.698, "step": 1325 }, { "epoch": 0.15, "learning_rate": 0.00019245472805598358, "loss": 0.6841, "step": 1326 }, { "epoch": 0.15, "learning_rate": 0.00019244069368775412, "loss": 0.6669, "step": 1327 }, { "epoch": 0.15, "learning_rate": 0.00019242664679221946, "loss": 0.6632, "step": 1328 }, { "epoch": 0.15, "learning_rate": 0.00019241258737128316, "loss": 0.6618, "step": 1329 }, { "epoch": 0.15, "learning_rate": 0.00019239851542685052, "loss": 0.752, "step": 1330 }, { "epoch": 0.15, "learning_rate": 0.00019238443096082853, "loss": 0.6392, "step": 1331 }, { "epoch": 0.15, "learning_rate": 0.0001923703339751259, "loss": 0.7301, "step": 1332 }, { "epoch": 0.15, "learning_rate": 0.00019235622447165293, "loss": 0.7107, "step": 1333 }, { "epoch": 0.15, "learning_rate": 0.0001923421024523218, "loss": 0.686, "step": 1334 }, { "epoch": 0.15, "learning_rate": 0.00019232796791904627, "loss": 0.7159, "step": 1335 }, { "epoch": 0.15, "learning_rate": 0.00019231382087374176, "loss": 0.7055, "step": 1336 }, { "epoch": 0.15, "learning_rate": 0.00019229966131832546, "loss": 0.7003, "step": 1337 }, { "epoch": 0.15, "learning_rate": 0.00019228548925471627, "loss": 0.6904, "step": 1338 }, { "epoch": 0.15, "learning_rate": 0.0001922713046848347, "loss": 0.7939, "step": 1339 }, { "epoch": 0.15, "learning_rate": 0.00019225710761060303, "loss": 0.7441, "step": 1340 }, { "epoch": 0.15, "learning_rate": 0.0001922428980339452, "loss": 0.6443, "step": 1341 }, { "epoch": 0.15, "learning_rate": 0.00019222867595678684, "loss": 0.6877, "step": 1342 }, { "epoch": 0.15, "learning_rate": 0.00019221444138105533, "loss": 0.7091, "step": 1343 }, { "epoch": 0.15, "learning_rate": 0.00019220019430867967, "loss": 0.7134, "step": 1344 }, { "epoch": 0.15, "learning_rate": 0.00019218593474159057, "loss": 0.6772, "step": 1345 }, { "epoch": 0.15, "learning_rate": 0.00019217166268172044, "loss": 0.6949, "step": 1346 }, { "epoch": 0.15, "learning_rate": 0.00019215737813100346, "loss": 0.7336, "step": 1347 }, { "epoch": 0.15, "learning_rate": 0.00019214308109137535, "loss": 0.7522, "step": 1348 }, { "epoch": 0.15, "learning_rate": 0.00019212877156477365, "loss": 0.7179, "step": 1349 }, { "epoch": 0.15, "learning_rate": 0.00019211444955313754, "loss": 0.7522, "step": 1350 }, { "epoch": 0.15, "learning_rate": 0.00019210011505840788, "loss": 0.693, "step": 1351 }, { "epoch": 0.15, "learning_rate": 0.00019208576808252726, "loss": 0.7069, "step": 1352 }, { "epoch": 0.15, "learning_rate": 0.00019207140862743995, "loss": 0.6303, "step": 1353 }, { "epoch": 0.15, "learning_rate": 0.00019205703669509188, "loss": 0.709, "step": 1354 }, { "epoch": 0.15, "learning_rate": 0.0001920426522874307, "loss": 0.6901, "step": 1355 }, { "epoch": 0.15, "learning_rate": 0.00019202825540640575, "loss": 0.6589, "step": 1356 }, { "epoch": 0.15, "learning_rate": 0.0001920138460539681, "loss": 0.647, "step": 1357 }, { "epoch": 0.15, "learning_rate": 0.00019199942423207036, "loss": 0.7542, "step": 1358 }, { "epoch": 0.15, "learning_rate": 0.00019198498994266704, "loss": 0.6647, "step": 1359 }, { "epoch": 0.15, "learning_rate": 0.00019197054318771412, "loss": 0.7148, "step": 1360 }, { "epoch": 0.15, "learning_rate": 0.0001919560839691695, "loss": 0.7107, "step": 1361 }, { "epoch": 0.15, "learning_rate": 0.00019194161228899264, "loss": 0.7523, "step": 1362 }, { "epoch": 0.15, "learning_rate": 0.00019192712814914464, "loss": 0.6803, "step": 1363 }, { "epoch": 0.16, "learning_rate": 0.00019191263155158837, "loss": 0.6894, "step": 1364 }, { "epoch": 0.16, "learning_rate": 0.0001918981224982884, "loss": 0.6986, "step": 1365 }, { "epoch": 0.16, "learning_rate": 0.00019188360099121093, "loss": 0.7109, "step": 1366 }, { "epoch": 0.16, "learning_rate": 0.00019186906703232387, "loss": 0.6698, "step": 1367 }, { "epoch": 0.16, "learning_rate": 0.00019185452062359682, "loss": 0.701, "step": 1368 }, { "epoch": 0.16, "learning_rate": 0.00019183996176700107, "loss": 0.701, "step": 1369 }, { "epoch": 0.16, "learning_rate": 0.00019182539046450962, "loss": 0.6754, "step": 1370 }, { "epoch": 0.16, "learning_rate": 0.00019181080671809713, "loss": 0.7239, "step": 1371 }, { "epoch": 0.16, "learning_rate": 0.00019179621052973993, "loss": 0.7083, "step": 1372 }, { "epoch": 0.16, "learning_rate": 0.00019178160190141605, "loss": 0.6879, "step": 1373 }, { "epoch": 0.16, "learning_rate": 0.00019176698083510523, "loss": 0.6823, "step": 1374 }, { "epoch": 0.16, "learning_rate": 0.00019175234733278886, "loss": 0.6882, "step": 1375 }, { "epoch": 0.16, "learning_rate": 0.00019173770139645005, "loss": 0.7098, "step": 1376 }, { "epoch": 0.16, "learning_rate": 0.00019172304302807357, "loss": 0.7354, "step": 1377 }, { "epoch": 0.16, "learning_rate": 0.00019170837222964586, "loss": 0.7403, "step": 1378 }, { "epoch": 0.16, "learning_rate": 0.00019169368900315506, "loss": 0.6684, "step": 1379 }, { "epoch": 0.16, "learning_rate": 0.00019167899335059105, "loss": 0.6122, "step": 1380 }, { "epoch": 0.16, "learning_rate": 0.00019166428527394534, "loss": 0.6832, "step": 1381 }, { "epoch": 0.16, "learning_rate": 0.00019164956477521106, "loss": 0.7458, "step": 1382 }, { "epoch": 0.16, "learning_rate": 0.00019163483185638316, "loss": 0.6467, "step": 1383 }, { "epoch": 0.16, "learning_rate": 0.00019162008651945817, "loss": 0.6753, "step": 1384 }, { "epoch": 0.16, "learning_rate": 0.00019160532876643434, "loss": 0.6751, "step": 1385 }, { "epoch": 0.16, "learning_rate": 0.00019159055859931164, "loss": 0.6673, "step": 1386 }, { "epoch": 0.16, "learning_rate": 0.0001915757760200916, "loss": 0.7074, "step": 1387 }, { "epoch": 0.16, "learning_rate": 0.00019156098103077757, "loss": 0.6279, "step": 1388 }, { "epoch": 0.16, "learning_rate": 0.00019154617363337454, "loss": 0.6888, "step": 1389 }, { "epoch": 0.16, "learning_rate": 0.00019153135382988913, "loss": 0.719, "step": 1390 }, { "epoch": 0.16, "learning_rate": 0.00019151652162232967, "loss": 0.7028, "step": 1391 }, { "epoch": 0.16, "learning_rate": 0.00019150167701270624, "loss": 0.6771, "step": 1392 }, { "epoch": 0.16, "learning_rate": 0.0001914868200030305, "loss": 0.7372, "step": 1393 }, { "epoch": 0.16, "learning_rate": 0.00019147195059531578, "loss": 0.7059, "step": 1394 }, { "epoch": 0.16, "learning_rate": 0.00019145706879157725, "loss": 0.6909, "step": 1395 }, { "epoch": 0.16, "learning_rate": 0.00019144217459383158, "loss": 0.7091, "step": 1396 }, { "epoch": 0.16, "learning_rate": 0.0001914272680040972, "loss": 0.7253, "step": 1397 }, { "epoch": 0.16, "learning_rate": 0.0001914123490243942, "loss": 0.7095, "step": 1398 }, { "epoch": 0.16, "learning_rate": 0.0001913974176567444, "loss": 0.6666, "step": 1399 }, { "epoch": 0.16, "learning_rate": 0.0001913824739031712, "loss": 0.6359, "step": 1400 }, { "epoch": 0.16, "learning_rate": 0.0001913675177656998, "loss": 0.7117, "step": 1401 }, { "epoch": 0.16, "learning_rate": 0.00019135254924635694, "loss": 0.7057, "step": 1402 }, { "epoch": 0.16, "learning_rate": 0.0001913375683471712, "loss": 0.6574, "step": 1403 }, { "epoch": 0.16, "learning_rate": 0.00019132257507017264, "loss": 0.7324, "step": 1404 }, { "epoch": 0.16, "learning_rate": 0.00019130756941739322, "loss": 0.6751, "step": 1405 }, { "epoch": 0.16, "learning_rate": 0.00019129255139086637, "loss": 0.6422, "step": 1406 }, { "epoch": 0.16, "learning_rate": 0.00019127752099262738, "loss": 0.602, "step": 1407 }, { "epoch": 0.16, "learning_rate": 0.00019126247822471304, "loss": 0.7522, "step": 1408 }, { "epoch": 0.16, "learning_rate": 0.00019124742308916198, "loss": 0.652, "step": 1409 }, { "epoch": 0.16, "learning_rate": 0.00019123235558801436, "loss": 0.7052, "step": 1410 }, { "epoch": 0.16, "learning_rate": 0.0001912172757233121, "loss": 0.746, "step": 1411 }, { "epoch": 0.16, "learning_rate": 0.00019120218349709885, "loss": 0.6402, "step": 1412 }, { "epoch": 0.16, "learning_rate": 0.00019118707891141982, "loss": 0.6947, "step": 1413 }, { "epoch": 0.16, "learning_rate": 0.0001911719619683219, "loss": 0.712, "step": 1414 }, { "epoch": 0.16, "learning_rate": 0.0001911568326698538, "loss": 0.7043, "step": 1415 }, { "epoch": 0.16, "learning_rate": 0.00019114169101806572, "loss": 0.6758, "step": 1416 }, { "epoch": 0.16, "learning_rate": 0.0001911265370150096, "loss": 0.7173, "step": 1417 }, { "epoch": 0.16, "learning_rate": 0.00019111137066273913, "loss": 0.7151, "step": 1418 }, { "epoch": 0.16, "learning_rate": 0.00019109619196330953, "loss": 0.7153, "step": 1419 }, { "epoch": 0.16, "learning_rate": 0.00019108100091877787, "loss": 0.735, "step": 1420 }, { "epoch": 0.16, "learning_rate": 0.00019106579753120273, "loss": 0.8014, "step": 1421 }, { "epoch": 0.16, "learning_rate": 0.00019105058180264445, "loss": 0.7148, "step": 1422 }, { "epoch": 0.16, "learning_rate": 0.00019103535373516506, "loss": 0.6267, "step": 1423 }, { "epoch": 0.16, "learning_rate": 0.00019102011333082817, "loss": 0.7303, "step": 1424 }, { "epoch": 0.16, "learning_rate": 0.00019100486059169916, "loss": 0.7976, "step": 1425 }, { "epoch": 0.16, "learning_rate": 0.000190989595519845, "loss": 0.7154, "step": 1426 }, { "epoch": 0.16, "learning_rate": 0.00019097431811733443, "loss": 0.7092, "step": 1427 }, { "epoch": 0.16, "learning_rate": 0.00019095902838623768, "loss": 0.6698, "step": 1428 }, { "epoch": 0.16, "learning_rate": 0.00019094372632862691, "loss": 0.6993, "step": 1429 }, { "epoch": 0.16, "learning_rate": 0.00019092841194657574, "loss": 0.6629, "step": 1430 }, { "epoch": 0.16, "learning_rate": 0.00019091308524215954, "loss": 0.754, "step": 1431 }, { "epoch": 0.16, "learning_rate": 0.00019089774621745535, "loss": 0.7291, "step": 1432 }, { "epoch": 0.16, "learning_rate": 0.00019088239487454188, "loss": 0.7013, "step": 1433 }, { "epoch": 0.16, "learning_rate": 0.0001908670312154995, "loss": 0.7355, "step": 1434 }, { "epoch": 0.16, "learning_rate": 0.0001908516552424102, "loss": 0.7446, "step": 1435 }, { "epoch": 0.16, "learning_rate": 0.00019083626695735778, "loss": 0.7226, "step": 1436 }, { "epoch": 0.16, "learning_rate": 0.00019082086636242756, "loss": 0.7418, "step": 1437 }, { "epoch": 0.16, "learning_rate": 0.00019080545345970658, "loss": 0.7267, "step": 1438 }, { "epoch": 0.16, "learning_rate": 0.0001907900282512836, "loss": 0.6689, "step": 1439 }, { "epoch": 0.16, "learning_rate": 0.0001907745907392489, "loss": 0.7364, "step": 1440 }, { "epoch": 0.16, "learning_rate": 0.00019075914092569468, "loss": 0.6161, "step": 1441 }, { "epoch": 0.16, "learning_rate": 0.0001907436788127145, "loss": 0.7298, "step": 1442 }, { "epoch": 0.16, "learning_rate": 0.00019072820440240386, "loss": 0.6539, "step": 1443 }, { "epoch": 0.16, "learning_rate": 0.00019071271769685976, "loss": 0.7699, "step": 1444 }, { "epoch": 0.16, "learning_rate": 0.00019069721869818088, "loss": 0.6174, "step": 1445 }, { "epoch": 0.16, "learning_rate": 0.0001906817074084677, "loss": 0.6938, "step": 1446 }, { "epoch": 0.16, "learning_rate": 0.00019066618382982217, "loss": 0.6715, "step": 1447 }, { "epoch": 0.16, "learning_rate": 0.00019065064796434806, "loss": 0.6922, "step": 1448 }, { "epoch": 0.16, "learning_rate": 0.0001906350998141507, "loss": 0.5785, "step": 1449 }, { "epoch": 0.16, "learning_rate": 0.0001906195393813372, "loss": 0.7089, "step": 1450 }, { "epoch": 0.16, "learning_rate": 0.00019060396666801621, "loss": 0.712, "step": 1451 }, { "epoch": 0.17, "learning_rate": 0.00019058838167629812, "loss": 0.7169, "step": 1452 }, { "epoch": 0.17, "learning_rate": 0.00019057278440829493, "loss": 0.6005, "step": 1453 }, { "epoch": 0.17, "learning_rate": 0.0001905571748661204, "loss": 0.6851, "step": 1454 }, { "epoch": 0.17, "learning_rate": 0.00019054155305188984, "loss": 0.739, "step": 1455 }, { "epoch": 0.17, "learning_rate": 0.00019052591896772032, "loss": 0.7201, "step": 1456 }, { "epoch": 0.17, "learning_rate": 0.0001905102726157305, "loss": 0.6278, "step": 1457 }, { "epoch": 0.17, "learning_rate": 0.0001904946139980407, "loss": 0.7202, "step": 1458 }, { "epoch": 0.17, "learning_rate": 0.00019047894311677302, "loss": 0.699, "step": 1459 }, { "epoch": 0.17, "learning_rate": 0.00019046325997405103, "loss": 0.6623, "step": 1460 }, { "epoch": 0.17, "learning_rate": 0.00019044756457200013, "loss": 0.6499, "step": 1461 }, { "epoch": 0.17, "learning_rate": 0.00019043185691274732, "loss": 0.7079, "step": 1462 }, { "epoch": 0.17, "learning_rate": 0.00019041613699842123, "loss": 0.7001, "step": 1463 }, { "epoch": 0.17, "learning_rate": 0.0001904004048311522, "loss": 0.7026, "step": 1464 }, { "epoch": 0.17, "learning_rate": 0.00019038466041307217, "loss": 0.6585, "step": 1465 }, { "epoch": 0.17, "learning_rate": 0.00019036890374631482, "loss": 0.7228, "step": 1466 }, { "epoch": 0.17, "learning_rate": 0.00019035313483301548, "loss": 0.6978, "step": 1467 }, { "epoch": 0.17, "learning_rate": 0.00019033735367531102, "loss": 0.7625, "step": 1468 }, { "epoch": 0.17, "learning_rate": 0.0001903215602753401, "loss": 0.6914, "step": 1469 }, { "epoch": 0.17, "learning_rate": 0.00019030575463524306, "loss": 0.7025, "step": 1470 }, { "epoch": 0.17, "learning_rate": 0.0001902899367571617, "loss": 0.6517, "step": 1471 }, { "epoch": 0.17, "learning_rate": 0.00019027410664323977, "loss": 0.7003, "step": 1472 }, { "epoch": 0.17, "learning_rate": 0.00019025826429562242, "loss": 0.7367, "step": 1473 }, { "epoch": 0.17, "learning_rate": 0.00019024240971645656, "loss": 0.7251, "step": 1474 }, { "epoch": 0.17, "learning_rate": 0.00019022654290789084, "loss": 0.6344, "step": 1475 }, { "epoch": 0.17, "learning_rate": 0.0001902106638720754, "loss": 0.6846, "step": 1476 }, { "epoch": 0.17, "learning_rate": 0.00019019477261116214, "loss": 0.6579, "step": 1477 }, { "epoch": 0.17, "learning_rate": 0.00019017886912730465, "loss": 0.7363, "step": 1478 }, { "epoch": 0.17, "learning_rate": 0.00019016295342265806, "loss": 0.699, "step": 1479 }, { "epoch": 0.17, "learning_rate": 0.0001901470254993793, "loss": 0.7614, "step": 1480 }, { "epoch": 0.17, "learning_rate": 0.00019013108535962677, "loss": 0.7171, "step": 1481 }, { "epoch": 0.17, "learning_rate": 0.00019011513300556075, "loss": 0.6741, "step": 1482 }, { "epoch": 0.17, "learning_rate": 0.00019009916843934296, "loss": 0.7094, "step": 1483 }, { "epoch": 0.17, "learning_rate": 0.00019008319166313693, "loss": 0.7289, "step": 1484 }, { "epoch": 0.17, "learning_rate": 0.00019006720267910777, "loss": 0.6568, "step": 1485 }, { "epoch": 0.17, "learning_rate": 0.0001900512014894223, "loss": 0.6738, "step": 1486 }, { "epoch": 0.17, "learning_rate": 0.00019003518809624888, "loss": 0.6871, "step": 1487 }, { "epoch": 0.17, "learning_rate": 0.00019001916250175764, "loss": 0.7331, "step": 1488 }, { "epoch": 0.17, "learning_rate": 0.00019000312470812035, "loss": 0.7389, "step": 1489 }, { "epoch": 0.17, "learning_rate": 0.0001899870747175104, "loss": 0.6829, "step": 1490 }, { "epoch": 0.17, "learning_rate": 0.0001899710125321028, "loss": 0.689, "step": 1491 }, { "epoch": 0.17, "learning_rate": 0.00018995493815407427, "loss": 0.7084, "step": 1492 }, { "epoch": 0.17, "learning_rate": 0.00018993885158560318, "loss": 0.7173, "step": 1493 }, { "epoch": 0.17, "learning_rate": 0.00018992275282886956, "loss": 0.6874, "step": 1494 }, { "epoch": 0.17, "learning_rate": 0.000189906641886055, "loss": 0.6509, "step": 1495 }, { "epoch": 0.17, "learning_rate": 0.00018989051875934287, "loss": 0.7362, "step": 1496 }, { "epoch": 0.17, "learning_rate": 0.0001898743834509181, "loss": 0.6119, "step": 1497 }, { "epoch": 0.17, "learning_rate": 0.0001898582359629673, "loss": 0.6503, "step": 1498 }, { "epoch": 0.17, "learning_rate": 0.00018984207629767875, "loss": 0.7112, "step": 1499 }, { "epoch": 0.17, "learning_rate": 0.00018982590445724238, "loss": 0.6765, "step": 1500 }, { "epoch": 0.17, "learning_rate": 0.0001898097204438497, "loss": 0.6787, "step": 1501 }, { "epoch": 0.17, "learning_rate": 0.00018979352425969396, "loss": 0.6833, "step": 1502 }, { "epoch": 0.17, "learning_rate": 0.00018977731590697, "loss": 0.709, "step": 1503 }, { "epoch": 0.17, "learning_rate": 0.0001897610953878744, "loss": 0.6868, "step": 1504 }, { "epoch": 0.17, "learning_rate": 0.00018974486270460517, "loss": 0.6845, "step": 1505 }, { "epoch": 0.17, "learning_rate": 0.0001897286178593623, "loss": 0.6533, "step": 1506 }, { "epoch": 0.17, "learning_rate": 0.0001897123608543471, "loss": 0.657, "step": 1507 }, { "epoch": 0.17, "learning_rate": 0.00018969609169176277, "loss": 0.669, "step": 1508 }, { "epoch": 0.17, "learning_rate": 0.000189679810373814, "loss": 0.7096, "step": 1509 }, { "epoch": 0.17, "learning_rate": 0.00018966351690270723, "loss": 0.7354, "step": 1510 }, { "epoch": 0.17, "learning_rate": 0.00018964721128065048, "loss": 0.6819, "step": 1511 }, { "epoch": 0.17, "learning_rate": 0.00018963089350985347, "loss": 0.6776, "step": 1512 }, { "epoch": 0.17, "learning_rate": 0.0001896145635925275, "loss": 0.6661, "step": 1513 }, { "epoch": 0.17, "learning_rate": 0.00018959822153088556, "loss": 0.7054, "step": 1514 }, { "epoch": 0.17, "learning_rate": 0.0001895818673271423, "loss": 0.6987, "step": 1515 }, { "epoch": 0.17, "learning_rate": 0.000189565500983514, "loss": 0.6946, "step": 1516 }, { "epoch": 0.17, "learning_rate": 0.00018954912250221856, "loss": 0.7043, "step": 1517 }, { "epoch": 0.17, "learning_rate": 0.00018953273188547558, "loss": 0.6898, "step": 1518 }, { "epoch": 0.17, "learning_rate": 0.00018951632913550626, "loss": 0.65, "step": 1519 }, { "epoch": 0.17, "learning_rate": 0.00018949991425453342, "loss": 0.6904, "step": 1520 }, { "epoch": 0.17, "learning_rate": 0.00018948348724478158, "loss": 0.7114, "step": 1521 }, { "epoch": 0.17, "learning_rate": 0.00018946704810847689, "loss": 0.728, "step": 1522 }, { "epoch": 0.17, "learning_rate": 0.00018945059684784713, "loss": 0.6842, "step": 1523 }, { "epoch": 0.17, "learning_rate": 0.00018943413346512173, "loss": 0.6965, "step": 1524 }, { "epoch": 0.17, "learning_rate": 0.00018941765796253178, "loss": 0.7758, "step": 1525 }, { "epoch": 0.17, "learning_rate": 0.00018940117034230996, "loss": 0.7252, "step": 1526 }, { "epoch": 0.17, "learning_rate": 0.00018938467060669066, "loss": 0.7544, "step": 1527 }, { "epoch": 0.17, "learning_rate": 0.00018936815875790982, "loss": 0.6519, "step": 1528 }, { "epoch": 0.17, "learning_rate": 0.00018935163479820517, "loss": 0.727, "step": 1529 }, { "epoch": 0.17, "learning_rate": 0.0001893350987298159, "loss": 0.7127, "step": 1530 }, { "epoch": 0.17, "learning_rate": 0.000189318550554983, "loss": 0.6667, "step": 1531 }, { "epoch": 0.17, "learning_rate": 0.000189301990275949, "loss": 0.6462, "step": 1532 }, { "epoch": 0.17, "learning_rate": 0.00018928541789495814, "loss": 0.7066, "step": 1533 }, { "epoch": 0.17, "learning_rate": 0.00018926883341425618, "loss": 0.7231, "step": 1534 }, { "epoch": 0.17, "learning_rate": 0.00018925223683609067, "loss": 0.6983, "step": 1535 }, { "epoch": 0.17, "learning_rate": 0.00018923562816271073, "loss": 0.7168, "step": 1536 }, { "epoch": 0.17, "learning_rate": 0.00018921900739636712, "loss": 0.7387, "step": 1537 }, { "epoch": 0.17, "learning_rate": 0.0001892023745393122, "loss": 0.655, "step": 1538 }, { "epoch": 0.17, "learning_rate": 0.00018918572959380006, "loss": 0.7105, "step": 1539 }, { "epoch": 0.18, "learning_rate": 0.00018916907256208635, "loss": 0.6659, "step": 1540 }, { "epoch": 0.18, "learning_rate": 0.00018915240344642836, "loss": 0.6918, "step": 1541 }, { "epoch": 0.18, "learning_rate": 0.00018913572224908508, "loss": 0.7169, "step": 1542 }, { "epoch": 0.18, "learning_rate": 0.0001891190289723171, "loss": 0.6692, "step": 1543 }, { "epoch": 0.18, "learning_rate": 0.00018910232361838664, "loss": 0.7264, "step": 1544 }, { "epoch": 0.18, "learning_rate": 0.00018908560618955753, "loss": 0.6898, "step": 1545 }, { "epoch": 0.18, "learning_rate": 0.00018906887668809533, "loss": 0.7034, "step": 1546 }, { "epoch": 0.18, "learning_rate": 0.00018905213511626712, "loss": 0.7023, "step": 1547 }, { "epoch": 0.18, "learning_rate": 0.00018903538147634172, "loss": 0.6716, "step": 1548 }, { "epoch": 0.18, "learning_rate": 0.0001890186157705895, "loss": 0.6808, "step": 1549 }, { "epoch": 0.18, "learning_rate": 0.00018900183800128252, "loss": 0.6611, "step": 1550 }, { "epoch": 0.18, "learning_rate": 0.00018898504817069442, "loss": 0.6648, "step": 1551 }, { "epoch": 0.18, "learning_rate": 0.00018896824628110057, "loss": 0.7282, "step": 1552 }, { "epoch": 0.18, "learning_rate": 0.00018895143233477787, "loss": 0.6845, "step": 1553 }, { "epoch": 0.18, "learning_rate": 0.0001889346063340049, "loss": 0.7534, "step": 1554 }, { "epoch": 0.18, "learning_rate": 0.0001889177682810619, "loss": 0.649, "step": 1555 }, { "epoch": 0.18, "learning_rate": 0.00018890091817823072, "loss": 0.713, "step": 1556 }, { "epoch": 0.18, "learning_rate": 0.00018888405602779482, "loss": 0.6832, "step": 1557 }, { "epoch": 0.18, "learning_rate": 0.0001888671818320393, "loss": 0.6861, "step": 1558 }, { "epoch": 0.18, "learning_rate": 0.00018885029559325092, "loss": 0.7273, "step": 1559 }, { "epoch": 0.18, "learning_rate": 0.00018883339731371804, "loss": 0.6946, "step": 1560 }, { "epoch": 0.18, "learning_rate": 0.00018881648699573073, "loss": 0.7641, "step": 1561 }, { "epoch": 0.18, "learning_rate": 0.00018879956464158055, "loss": 0.6459, "step": 1562 }, { "epoch": 0.18, "learning_rate": 0.0001887826302535608, "loss": 0.7103, "step": 1563 }, { "epoch": 0.18, "learning_rate": 0.00018876568383396637, "loss": 0.6853, "step": 1564 }, { "epoch": 0.18, "learning_rate": 0.00018874872538509382, "loss": 0.6955, "step": 1565 }, { "epoch": 0.18, "learning_rate": 0.0001887317549092413, "loss": 0.6841, "step": 1566 }, { "epoch": 0.18, "learning_rate": 0.00018871477240870862, "loss": 0.6567, "step": 1567 }, { "epoch": 0.18, "learning_rate": 0.00018869777788579713, "loss": 0.7284, "step": 1568 }, { "epoch": 0.18, "learning_rate": 0.00018868077134280995, "loss": 0.6536, "step": 1569 }, { "epoch": 0.18, "learning_rate": 0.00018866375278205172, "loss": 0.7408, "step": 1570 }, { "epoch": 0.18, "learning_rate": 0.0001886467222058288, "loss": 0.7465, "step": 1571 }, { "epoch": 0.18, "learning_rate": 0.00018862967961644905, "loss": 0.7028, "step": 1572 }, { "epoch": 0.18, "learning_rate": 0.00018861262501622213, "loss": 0.7192, "step": 1573 }, { "epoch": 0.18, "learning_rate": 0.00018859555840745914, "loss": 0.7187, "step": 1574 }, { "epoch": 0.18, "learning_rate": 0.00018857847979247293, "loss": 0.6673, "step": 1575 }, { "epoch": 0.18, "learning_rate": 0.00018856138917357798, "loss": 0.6386, "step": 1576 }, { "epoch": 0.18, "learning_rate": 0.00018854428655309033, "loss": 0.7718, "step": 1577 }, { "epoch": 0.18, "learning_rate": 0.0001885271719333277, "loss": 0.7188, "step": 1578 }, { "epoch": 0.18, "learning_rate": 0.00018851004531660937, "loss": 0.662, "step": 1579 }, { "epoch": 0.18, "learning_rate": 0.00018849290670525635, "loss": 0.7019, "step": 1580 }, { "epoch": 0.18, "learning_rate": 0.00018847575610159115, "loss": 0.6667, "step": 1581 }, { "epoch": 0.18, "learning_rate": 0.00018845859350793807, "loss": 0.6612, "step": 1582 }, { "epoch": 0.18, "learning_rate": 0.00018844141892662285, "loss": 0.6875, "step": 1583 }, { "epoch": 0.18, "learning_rate": 0.00018842423235997298, "loss": 0.663, "step": 1584 }, { "epoch": 0.18, "learning_rate": 0.00018840703381031753, "loss": 0.6379, "step": 1585 }, { "epoch": 0.18, "learning_rate": 0.00018838982327998717, "loss": 0.6677, "step": 1586 }, { "epoch": 0.18, "learning_rate": 0.00018837260077131425, "loss": 0.7397, "step": 1587 }, { "epoch": 0.18, "learning_rate": 0.00018835536628663272, "loss": 0.7019, "step": 1588 }, { "epoch": 0.18, "learning_rate": 0.00018833811982827818, "loss": 0.7422, "step": 1589 }, { "epoch": 0.18, "learning_rate": 0.00018832086139858775, "loss": 0.7119, "step": 1590 }, { "epoch": 0.18, "learning_rate": 0.0001883035909999003, "loss": 0.6617, "step": 1591 }, { "epoch": 0.18, "learning_rate": 0.00018828630863455622, "loss": 0.7265, "step": 1592 }, { "epoch": 0.18, "learning_rate": 0.00018826901430489762, "loss": 0.758, "step": 1593 }, { "epoch": 0.18, "learning_rate": 0.00018825170801326814, "loss": 0.6483, "step": 1594 }, { "epoch": 0.18, "learning_rate": 0.00018823438976201312, "loss": 0.6887, "step": 1595 }, { "epoch": 0.18, "learning_rate": 0.00018821705955347943, "loss": 0.7331, "step": 1596 }, { "epoch": 0.18, "learning_rate": 0.00018819971739001564, "loss": 0.65, "step": 1597 }, { "epoch": 0.18, "learning_rate": 0.00018818236327397192, "loss": 0.6832, "step": 1598 }, { "epoch": 0.18, "learning_rate": 0.00018816499720770004, "loss": 0.6387, "step": 1599 }, { "epoch": 0.18, "learning_rate": 0.0001881476191935534, "loss": 0.6782, "step": 1600 }, { "epoch": 0.18, "learning_rate": 0.00018813022923388703, "loss": 0.6532, "step": 1601 }, { "epoch": 0.18, "learning_rate": 0.00018811282733105755, "loss": 0.6754, "step": 1602 }, { "epoch": 0.18, "learning_rate": 0.00018809541348742322, "loss": 0.7505, "step": 1603 }, { "epoch": 0.18, "learning_rate": 0.00018807798770534395, "loss": 0.665, "step": 1604 }, { "epoch": 0.18, "learning_rate": 0.0001880605499871812, "loss": 0.6547, "step": 1605 }, { "epoch": 0.18, "learning_rate": 0.00018804310033529806, "loss": 0.648, "step": 1606 }, { "epoch": 0.18, "learning_rate": 0.00018802563875205933, "loss": 0.6676, "step": 1607 }, { "epoch": 0.18, "learning_rate": 0.00018800816523983126, "loss": 0.6421, "step": 1608 }, { "epoch": 0.18, "learning_rate": 0.00018799067980098189, "loss": 0.746, "step": 1609 }, { "epoch": 0.18, "learning_rate": 0.00018797318243788077, "loss": 0.699, "step": 1610 }, { "epoch": 0.18, "learning_rate": 0.0001879556731528991, "loss": 0.6637, "step": 1611 }, { "epoch": 0.18, "learning_rate": 0.00018793815194840968, "loss": 0.7216, "step": 1612 }, { "epoch": 0.18, "learning_rate": 0.00018792061882678694, "loss": 0.6477, "step": 1613 }, { "epoch": 0.18, "learning_rate": 0.00018790307379040692, "loss": 0.6681, "step": 1614 }, { "epoch": 0.18, "learning_rate": 0.00018788551684164725, "loss": 0.6537, "step": 1615 }, { "epoch": 0.18, "learning_rate": 0.00018786794798288727, "loss": 0.7085, "step": 1616 }, { "epoch": 0.18, "learning_rate": 0.00018785036721650778, "loss": 0.7168, "step": 1617 }, { "epoch": 0.18, "learning_rate": 0.00018783277454489133, "loss": 0.7151, "step": 1618 }, { "epoch": 0.18, "learning_rate": 0.000187815169970422, "loss": 0.7072, "step": 1619 }, { "epoch": 0.18, "learning_rate": 0.00018779755349548552, "loss": 0.7408, "step": 1620 }, { "epoch": 0.18, "learning_rate": 0.00018777992512246922, "loss": 0.6639, "step": 1621 }, { "epoch": 0.18, "learning_rate": 0.0001877622848537621, "loss": 0.6799, "step": 1622 }, { "epoch": 0.18, "learning_rate": 0.00018774463269175464, "loss": 0.7223, "step": 1623 }, { "epoch": 0.18, "learning_rate": 0.00018772696863883904, "loss": 0.6491, "step": 1624 }, { "epoch": 0.18, "learning_rate": 0.00018770929269740913, "loss": 0.6651, "step": 1625 }, { "epoch": 0.18, "learning_rate": 0.00018769160486986026, "loss": 0.7335, "step": 1626 }, { "epoch": 0.18, "learning_rate": 0.00018767390515858943, "loss": 0.7263, "step": 1627 }, { "epoch": 0.19, "learning_rate": 0.00018765619356599526, "loss": 0.7368, "step": 1628 }, { "epoch": 0.19, "learning_rate": 0.000187638470094478, "loss": 0.7324, "step": 1629 }, { "epoch": 0.19, "learning_rate": 0.00018762073474643947, "loss": 0.7252, "step": 1630 }, { "epoch": 0.19, "learning_rate": 0.00018760298752428312, "loss": 0.6847, "step": 1631 }, { "epoch": 0.19, "learning_rate": 0.00018758522843041395, "loss": 0.6528, "step": 1632 }, { "epoch": 0.19, "learning_rate": 0.0001875674574672387, "loss": 0.6815, "step": 1633 }, { "epoch": 0.19, "learning_rate": 0.00018754967463716565, "loss": 0.7897, "step": 1634 }, { "epoch": 0.19, "learning_rate": 0.0001875318799426046, "loss": 0.6729, "step": 1635 }, { "epoch": 0.19, "learning_rate": 0.0001875140733859671, "loss": 0.681, "step": 1636 }, { "epoch": 0.19, "learning_rate": 0.0001874962549696662, "loss": 0.7118, "step": 1637 }, { "epoch": 0.19, "learning_rate": 0.00018747842469611666, "loss": 0.659, "step": 1638 }, { "epoch": 0.19, "learning_rate": 0.00018746058256773475, "loss": 0.7022, "step": 1639 }, { "epoch": 0.19, "learning_rate": 0.00018744272858693835, "loss": 0.7526, "step": 1640 }, { "epoch": 0.19, "learning_rate": 0.00018742486275614707, "loss": 0.678, "step": 1641 }, { "epoch": 0.19, "learning_rate": 0.00018740698507778195, "loss": 0.6652, "step": 1642 }, { "epoch": 0.19, "learning_rate": 0.00018738909555426577, "loss": 0.7111, "step": 1643 }, { "epoch": 0.19, "learning_rate": 0.0001873711941880229, "loss": 0.6618, "step": 1644 }, { "epoch": 0.19, "learning_rate": 0.0001873532809814792, "loss": 0.6895, "step": 1645 }, { "epoch": 0.19, "learning_rate": 0.0001873353559370623, "loss": 0.6182, "step": 1646 }, { "epoch": 0.19, "learning_rate": 0.00018731741905720132, "loss": 0.6693, "step": 1647 }, { "epoch": 0.19, "learning_rate": 0.00018729947034432697, "loss": 0.7457, "step": 1648 }, { "epoch": 0.19, "learning_rate": 0.00018728150980087165, "loss": 0.7637, "step": 1649 }, { "epoch": 0.19, "learning_rate": 0.00018726353742926937, "loss": 0.624, "step": 1650 }, { "epoch": 0.19, "learning_rate": 0.0001872455532319556, "loss": 0.6473, "step": 1651 }, { "epoch": 0.19, "learning_rate": 0.00018722755721136758, "loss": 0.628, "step": 1652 }, { "epoch": 0.19, "learning_rate": 0.00018720954936994407, "loss": 0.677, "step": 1653 }, { "epoch": 0.19, "learning_rate": 0.00018719152971012542, "loss": 0.6879, "step": 1654 }, { "epoch": 0.19, "learning_rate": 0.00018717349823435363, "loss": 0.6348, "step": 1655 }, { "epoch": 0.19, "learning_rate": 0.00018715545494507222, "loss": 0.6279, "step": 1656 }, { "epoch": 0.19, "learning_rate": 0.00018713739984472643, "loss": 0.692, "step": 1657 }, { "epoch": 0.19, "learning_rate": 0.00018711933293576302, "loss": 0.7167, "step": 1658 }, { "epoch": 0.19, "learning_rate": 0.00018710125422063034, "loss": 0.676, "step": 1659 }, { "epoch": 0.19, "learning_rate": 0.0001870831637017784, "loss": 0.7833, "step": 1660 }, { "epoch": 0.19, "learning_rate": 0.00018706506138165877, "loss": 0.7813, "step": 1661 }, { "epoch": 0.19, "learning_rate": 0.00018704694726272462, "loss": 0.7451, "step": 1662 }, { "epoch": 0.19, "learning_rate": 0.00018702882134743071, "loss": 0.7662, "step": 1663 }, { "epoch": 0.19, "learning_rate": 0.00018701068363823344, "loss": 0.6541, "step": 1664 }, { "epoch": 0.19, "learning_rate": 0.0001869925341375908, "loss": 0.6975, "step": 1665 }, { "epoch": 0.19, "learning_rate": 0.00018697437284796226, "loss": 0.7249, "step": 1666 }, { "epoch": 0.19, "learning_rate": 0.0001869561997718091, "loss": 0.7363, "step": 1667 }, { "epoch": 0.19, "learning_rate": 0.00018693801491159406, "loss": 0.6935, "step": 1668 }, { "epoch": 0.19, "learning_rate": 0.00018691981826978143, "loss": 0.6923, "step": 1669 }, { "epoch": 0.19, "learning_rate": 0.00018690160984883726, "loss": 0.7786, "step": 1670 }, { "epoch": 0.19, "learning_rate": 0.00018688338965122908, "loss": 0.6309, "step": 1671 }, { "epoch": 0.19, "learning_rate": 0.00018686515767942597, "loss": 0.6518, "step": 1672 }, { "epoch": 0.19, "learning_rate": 0.00018684691393589878, "loss": 0.698, "step": 1673 }, { "epoch": 0.19, "learning_rate": 0.0001868286584231198, "loss": 0.6882, "step": 1674 }, { "epoch": 0.19, "learning_rate": 0.00018681039114356297, "loss": 0.6622, "step": 1675 }, { "epoch": 0.19, "learning_rate": 0.0001867921120997038, "loss": 0.693, "step": 1676 }, { "epoch": 0.19, "learning_rate": 0.00018677382129401947, "loss": 0.6976, "step": 1677 }, { "epoch": 0.19, "learning_rate": 0.00018675551872898865, "loss": 0.7116, "step": 1678 }, { "epoch": 0.19, "learning_rate": 0.00018673720440709165, "loss": 0.7212, "step": 1679 }, { "epoch": 0.19, "learning_rate": 0.0001867188783308104, "loss": 0.7589, "step": 1680 }, { "epoch": 0.19, "learning_rate": 0.00018670054050262842, "loss": 0.6912, "step": 1681 }, { "epoch": 0.19, "learning_rate": 0.00018668219092503075, "loss": 0.7495, "step": 1682 }, { "epoch": 0.19, "learning_rate": 0.0001866638296005041, "loss": 0.7092, "step": 1683 }, { "epoch": 0.19, "learning_rate": 0.00018664545653153676, "loss": 0.7145, "step": 1684 }, { "epoch": 0.19, "learning_rate": 0.00018662707172061854, "loss": 0.7224, "step": 1685 }, { "epoch": 0.19, "learning_rate": 0.00018660867517024098, "loss": 0.7276, "step": 1686 }, { "epoch": 0.19, "learning_rate": 0.00018659026688289706, "loss": 0.7038, "step": 1687 }, { "epoch": 0.19, "learning_rate": 0.00018657184686108144, "loss": 0.7207, "step": 1688 }, { "epoch": 0.19, "learning_rate": 0.0001865534151072904, "loss": 0.7356, "step": 1689 }, { "epoch": 0.19, "learning_rate": 0.00018653497162402166, "loss": 0.6368, "step": 1690 }, { "epoch": 0.19, "learning_rate": 0.00018651651641377474, "loss": 0.7185, "step": 1691 }, { "epoch": 0.19, "learning_rate": 0.00018649804947905055, "loss": 0.6919, "step": 1692 }, { "epoch": 0.19, "learning_rate": 0.00018647957082235174, "loss": 0.6935, "step": 1693 }, { "epoch": 0.19, "learning_rate": 0.00018646108044618247, "loss": 0.7019, "step": 1694 }, { "epoch": 0.19, "learning_rate": 0.00018644257835304846, "loss": 0.6723, "step": 1695 }, { "epoch": 0.19, "learning_rate": 0.0001864240645454571, "loss": 0.7077, "step": 1696 }, { "epoch": 0.19, "learning_rate": 0.00018640553902591733, "loss": 0.6355, "step": 1697 }, { "epoch": 0.19, "learning_rate": 0.00018638700179693968, "loss": 0.7233, "step": 1698 }, { "epoch": 0.19, "learning_rate": 0.00018636845286103623, "loss": 0.713, "step": 1699 }, { "epoch": 0.19, "learning_rate": 0.00018634989222072074, "loss": 0.6403, "step": 1700 }, { "epoch": 0.19, "learning_rate": 0.00018633131987850848, "loss": 0.6277, "step": 1701 }, { "epoch": 0.19, "learning_rate": 0.00018631273583691625, "loss": 0.6681, "step": 1702 }, { "epoch": 0.19, "learning_rate": 0.00018629414009846258, "loss": 0.6616, "step": 1703 }, { "epoch": 0.19, "learning_rate": 0.0001862755326656675, "loss": 0.6781, "step": 1704 }, { "epoch": 0.19, "learning_rate": 0.0001862569135410526, "loss": 0.7007, "step": 1705 }, { "epoch": 0.19, "learning_rate": 0.00018623828272714118, "loss": 0.6439, "step": 1706 }, { "epoch": 0.19, "learning_rate": 0.00018621964022645795, "loss": 0.7049, "step": 1707 }, { "epoch": 0.19, "learning_rate": 0.00018620098604152932, "loss": 0.6813, "step": 1708 }, { "epoch": 0.19, "learning_rate": 0.00018618232017488326, "loss": 0.6651, "step": 1709 }, { "epoch": 0.19, "learning_rate": 0.0001861636426290493, "loss": 0.7068, "step": 1710 }, { "epoch": 0.19, "learning_rate": 0.00018614495340655857, "loss": 0.6835, "step": 1711 }, { "epoch": 0.19, "learning_rate": 0.0001861262525099438, "loss": 0.6447, "step": 1712 }, { "epoch": 0.19, "learning_rate": 0.00018610753994173927, "loss": 0.6922, "step": 1713 }, { "epoch": 0.19, "learning_rate": 0.00018608881570448087, "loss": 0.7277, "step": 1714 }, { "epoch": 0.19, "learning_rate": 0.00018607007980070604, "loss": 0.6676, "step": 1715 }, { "epoch": 0.2, "learning_rate": 0.00018605133223295378, "loss": 0.6649, "step": 1716 }, { "epoch": 0.2, "learning_rate": 0.0001860325730037648, "loss": 0.646, "step": 1717 }, { "epoch": 0.2, "learning_rate": 0.00018601380211568126, "loss": 0.6765, "step": 1718 }, { "epoch": 0.2, "learning_rate": 0.0001859950195712469, "loss": 0.7469, "step": 1719 }, { "epoch": 0.2, "learning_rate": 0.00018597622537300706, "loss": 0.6999, "step": 1720 }, { "epoch": 0.2, "learning_rate": 0.0001859574195235088, "loss": 0.7143, "step": 1721 }, { "epoch": 0.2, "learning_rate": 0.0001859386020253005, "loss": 0.7089, "step": 1722 }, { "epoch": 0.2, "learning_rate": 0.00018591977288093237, "loss": 0.6608, "step": 1723 }, { "epoch": 0.2, "learning_rate": 0.00018590093209295598, "loss": 0.6555, "step": 1724 }, { "epoch": 0.2, "learning_rate": 0.00018588207966392463, "loss": 0.7077, "step": 1725 }, { "epoch": 0.2, "learning_rate": 0.00018586321559639317, "loss": 0.7315, "step": 1726 }, { "epoch": 0.2, "learning_rate": 0.00018584433989291796, "loss": 0.6629, "step": 1727 }, { "epoch": 0.2, "learning_rate": 0.00018582545255605703, "loss": 0.6848, "step": 1728 }, { "epoch": 0.2, "learning_rate": 0.0001858065535883699, "loss": 0.6547, "step": 1729 }, { "epoch": 0.2, "learning_rate": 0.00018578764299241772, "loss": 0.7039, "step": 1730 }, { "epoch": 0.2, "learning_rate": 0.0001857687207707632, "loss": 0.6769, "step": 1731 }, { "epoch": 0.2, "learning_rate": 0.0001857497869259706, "loss": 0.6799, "step": 1732 }, { "epoch": 0.2, "learning_rate": 0.00018573084146060584, "loss": 0.7263, "step": 1733 }, { "epoch": 0.2, "learning_rate": 0.00018571188437723632, "loss": 0.6742, "step": 1734 }, { "epoch": 0.2, "learning_rate": 0.00018569291567843105, "loss": 0.724, "step": 1735 }, { "epoch": 0.2, "learning_rate": 0.00018567393536676066, "loss": 0.6392, "step": 1736 }, { "epoch": 0.2, "learning_rate": 0.00018565494344479722, "loss": 0.714, "step": 1737 }, { "epoch": 0.2, "learning_rate": 0.00018563593991511454, "loss": 0.6132, "step": 1738 }, { "epoch": 0.2, "learning_rate": 0.0001856169247802879, "loss": 0.6435, "step": 1739 }, { "epoch": 0.2, "learning_rate": 0.00018559789804289416, "loss": 0.7037, "step": 1740 }, { "epoch": 0.2, "learning_rate": 0.00018557885970551182, "loss": 0.69, "step": 1741 }, { "epoch": 0.2, "learning_rate": 0.00018555980977072082, "loss": 0.7286, "step": 1742 }, { "epoch": 0.2, "learning_rate": 0.00018554074824110285, "loss": 0.7312, "step": 1743 }, { "epoch": 0.2, "learning_rate": 0.00018552167511924102, "loss": 0.6886, "step": 1744 }, { "epoch": 0.2, "learning_rate": 0.00018550259040772007, "loss": 0.6946, "step": 1745 }, { "epoch": 0.2, "learning_rate": 0.00018548349410912632, "loss": 0.7169, "step": 1746 }, { "epoch": 0.2, "learning_rate": 0.00018546438622604763, "loss": 0.6335, "step": 1747 }, { "epoch": 0.2, "learning_rate": 0.00018544526676107345, "loss": 0.6481, "step": 1748 }, { "epoch": 0.2, "learning_rate": 0.0001854261357167948, "loss": 0.7005, "step": 1749 }, { "epoch": 0.2, "learning_rate": 0.0001854069930958043, "loss": 0.7085, "step": 1750 }, { "epoch": 0.2, "learning_rate": 0.00018538783890069605, "loss": 0.6945, "step": 1751 }, { "epoch": 0.2, "learning_rate": 0.0001853686731340658, "loss": 0.693, "step": 1752 }, { "epoch": 0.2, "learning_rate": 0.00018534949579851085, "loss": 0.6796, "step": 1753 }, { "epoch": 0.2, "learning_rate": 0.00018533030689663003, "loss": 0.7433, "step": 1754 }, { "epoch": 0.2, "learning_rate": 0.00018531110643102379, "loss": 0.6899, "step": 1755 }, { "epoch": 0.2, "learning_rate": 0.00018529189440429414, "loss": 0.651, "step": 1756 }, { "epoch": 0.2, "learning_rate": 0.0001852726708190446, "loss": 0.7135, "step": 1757 }, { "epoch": 0.2, "learning_rate": 0.0001852534356778803, "loss": 0.7354, "step": 1758 }, { "epoch": 0.2, "learning_rate": 0.00018523418898340797, "loss": 0.7171, "step": 1759 }, { "epoch": 0.2, "learning_rate": 0.0001852149307382358, "loss": 0.7443, "step": 1760 }, { "epoch": 0.2, "learning_rate": 0.00018519566094497372, "loss": 0.7474, "step": 1761 }, { "epoch": 0.2, "learning_rate": 0.00018517637960623303, "loss": 0.7327, "step": 1762 }, { "epoch": 0.2, "learning_rate": 0.00018515708672462672, "loss": 0.6801, "step": 1763 }, { "epoch": 0.2, "learning_rate": 0.0001851377823027693, "loss": 0.6537, "step": 1764 }, { "epoch": 0.2, "learning_rate": 0.00018511846634327686, "loss": 0.7226, "step": 1765 }, { "epoch": 0.2, "learning_rate": 0.00018509913884876702, "loss": 0.7017, "step": 1766 }, { "epoch": 0.2, "learning_rate": 0.00018507979982185902, "loss": 0.7369, "step": 1767 }, { "epoch": 0.2, "learning_rate": 0.00018506044926517359, "loss": 0.6823, "step": 1768 }, { "epoch": 0.2, "learning_rate": 0.0001850410871813331, "loss": 0.6774, "step": 1769 }, { "epoch": 0.2, "learning_rate": 0.00018502171357296144, "loss": 0.7161, "step": 1770 }, { "epoch": 0.2, "learning_rate": 0.00018500232844268405, "loss": 0.7044, "step": 1771 }, { "epoch": 0.2, "learning_rate": 0.00018498293179312797, "loss": 0.7054, "step": 1772 }, { "epoch": 0.2, "learning_rate": 0.00018496352362692175, "loss": 0.6783, "step": 1773 }, { "epoch": 0.2, "learning_rate": 0.00018494410394669558, "loss": 0.7187, "step": 1774 }, { "epoch": 0.2, "learning_rate": 0.00018492467275508113, "loss": 0.702, "step": 1775 }, { "epoch": 0.2, "learning_rate": 0.00018490523005471163, "loss": 0.6755, "step": 1776 }, { "epoch": 0.2, "learning_rate": 0.00018488577584822196, "loss": 0.6602, "step": 1777 }, { "epoch": 0.2, "learning_rate": 0.00018486631013824844, "loss": 0.682, "step": 1778 }, { "epoch": 0.2, "learning_rate": 0.0001848468329274291, "loss": 0.6845, "step": 1779 }, { "epoch": 0.2, "learning_rate": 0.00018482734421840333, "loss": 0.6813, "step": 1780 }, { "epoch": 0.2, "learning_rate": 0.00018480784401381226, "loss": 0.679, "step": 1781 }, { "epoch": 0.2, "learning_rate": 0.0001847883323162985, "loss": 0.6955, "step": 1782 }, { "epoch": 0.2, "learning_rate": 0.00018476880912850614, "loss": 0.5997, "step": 1783 }, { "epoch": 0.2, "learning_rate": 0.00018474927445308098, "loss": 0.7515, "step": 1784 }, { "epoch": 0.2, "learning_rate": 0.00018472972829267032, "loss": 0.6878, "step": 1785 }, { "epoch": 0.2, "learning_rate": 0.00018471017064992297, "loss": 0.759, "step": 1786 }, { "epoch": 0.2, "learning_rate": 0.00018469060152748933, "loss": 0.7014, "step": 1787 }, { "epoch": 0.2, "learning_rate": 0.00018467102092802135, "loss": 0.6926, "step": 1788 }, { "epoch": 0.2, "learning_rate": 0.00018465142885417253, "loss": 0.7295, "step": 1789 }, { "epoch": 0.2, "learning_rate": 0.00018463182530859795, "loss": 0.6514, "step": 1790 }, { "epoch": 0.2, "learning_rate": 0.00018461221029395422, "loss": 0.7311, "step": 1791 }, { "epoch": 0.2, "learning_rate": 0.00018459258381289955, "loss": 0.6809, "step": 1792 }, { "epoch": 0.2, "learning_rate": 0.00018457294586809357, "loss": 0.662, "step": 1793 }, { "epoch": 0.2, "learning_rate": 0.00018455329646219765, "loss": 0.7402, "step": 1794 }, { "epoch": 0.2, "learning_rate": 0.0001845336355978746, "loss": 0.6734, "step": 1795 }, { "epoch": 0.2, "learning_rate": 0.0001845139632777888, "loss": 0.7322, "step": 1796 }, { "epoch": 0.2, "learning_rate": 0.00018449427950460617, "loss": 0.6485, "step": 1797 }, { "epoch": 0.2, "learning_rate": 0.00018447458428099426, "loss": 0.7097, "step": 1798 }, { "epoch": 0.2, "learning_rate": 0.000184454877609622, "loss": 0.7496, "step": 1799 }, { "epoch": 0.2, "learning_rate": 0.0001844351594931601, "loss": 0.687, "step": 1800 }, { "epoch": 0.2, "learning_rate": 0.00018441542993428062, "loss": 0.7363, "step": 1801 }, { "epoch": 0.2, "learning_rate": 0.00018439568893565734, "loss": 0.6761, "step": 1802 }, { "epoch": 0.2, "learning_rate": 0.00018437593649996544, "loss": 0.679, "step": 1803 }, { "epoch": 0.21, "learning_rate": 0.00018435617262988168, "loss": 0.6649, "step": 1804 }, { "epoch": 0.21, "learning_rate": 0.00018433639732808453, "loss": 0.7229, "step": 1805 }, { "epoch": 0.21, "learning_rate": 0.00018431661059725376, "loss": 0.7088, "step": 1806 }, { "epoch": 0.21, "learning_rate": 0.0001842968124400709, "loss": 0.6701, "step": 1807 }, { "epoch": 0.21, "learning_rate": 0.00018427700285921885, "loss": 0.7155, "step": 1808 }, { "epoch": 0.21, "learning_rate": 0.00018425718185738224, "loss": 0.6475, "step": 1809 }, { "epoch": 0.21, "learning_rate": 0.00018423734943724714, "loss": 0.6924, "step": 1810 }, { "epoch": 0.21, "learning_rate": 0.0001842175056015011, "loss": 0.644, "step": 1811 }, { "epoch": 0.21, "learning_rate": 0.0001841976503528334, "loss": 0.6856, "step": 1812 }, { "epoch": 0.21, "learning_rate": 0.00018417778369393477, "loss": 0.6245, "step": 1813 }, { "epoch": 0.21, "learning_rate": 0.0001841579056274974, "loss": 0.657, "step": 1814 }, { "epoch": 0.21, "learning_rate": 0.00018413801615621518, "loss": 0.7185, "step": 1815 }, { "epoch": 0.21, "learning_rate": 0.00018411811528278342, "loss": 0.6832, "step": 1816 }, { "epoch": 0.21, "learning_rate": 0.0001840982030098991, "loss": 0.6851, "step": 1817 }, { "epoch": 0.21, "learning_rate": 0.00018407827934026062, "loss": 0.6261, "step": 1818 }, { "epoch": 0.21, "learning_rate": 0.000184058344276568, "loss": 0.6538, "step": 1819 }, { "epoch": 0.21, "learning_rate": 0.0001840383978215228, "loss": 0.677, "step": 1820 }, { "epoch": 0.21, "learning_rate": 0.00018401843997782805, "loss": 0.658, "step": 1821 }, { "epoch": 0.21, "learning_rate": 0.00018399847074818847, "loss": 0.7618, "step": 1822 }, { "epoch": 0.21, "learning_rate": 0.0001839784901353102, "loss": 0.6916, "step": 1823 }, { "epoch": 0.21, "learning_rate": 0.0001839584981419009, "loss": 0.7359, "step": 1824 }, { "epoch": 0.21, "learning_rate": 0.00018393849477066988, "loss": 0.7172, "step": 1825 }, { "epoch": 0.21, "learning_rate": 0.00018391848002432797, "loss": 0.6824, "step": 1826 }, { "epoch": 0.21, "learning_rate": 0.00018389845390558745, "loss": 0.6996, "step": 1827 }, { "epoch": 0.21, "learning_rate": 0.00018387841641716223, "loss": 0.6896, "step": 1828 }, { "epoch": 0.21, "learning_rate": 0.00018385836756176774, "loss": 0.6646, "step": 1829 }, { "epoch": 0.21, "learning_rate": 0.00018383830734212096, "loss": 0.6864, "step": 1830 }, { "epoch": 0.21, "learning_rate": 0.00018381823576094035, "loss": 0.6576, "step": 1831 }, { "epoch": 0.21, "learning_rate": 0.000183798152820946, "loss": 0.6365, "step": 1832 }, { "epoch": 0.21, "learning_rate": 0.00018377805852485947, "loss": 0.6955, "step": 1833 }, { "epoch": 0.21, "learning_rate": 0.00018375795287540388, "loss": 0.6989, "step": 1834 }, { "epoch": 0.21, "learning_rate": 0.0001837378358753039, "loss": 0.6412, "step": 1835 }, { "epoch": 0.21, "learning_rate": 0.00018371770752728575, "loss": 0.6943, "step": 1836 }, { "epoch": 0.21, "learning_rate": 0.00018369756783407712, "loss": 0.672, "step": 1837 }, { "epoch": 0.21, "learning_rate": 0.00018367741679840732, "loss": 0.6686, "step": 1838 }, { "epoch": 0.21, "learning_rate": 0.00018365725442300715, "loss": 0.7138, "step": 1839 }, { "epoch": 0.21, "learning_rate": 0.000183637080710609, "loss": 0.6601, "step": 1840 }, { "epoch": 0.21, "learning_rate": 0.00018361689566394668, "loss": 0.6583, "step": 1841 }, { "epoch": 0.21, "learning_rate": 0.00018359669928575567, "loss": 0.6397, "step": 1842 }, { "epoch": 0.21, "learning_rate": 0.0001835764915787729, "loss": 0.7056, "step": 1843 }, { "epoch": 0.21, "learning_rate": 0.00018355627254573685, "loss": 0.7542, "step": 1844 }, { "epoch": 0.21, "learning_rate": 0.0001835360421893876, "loss": 0.6692, "step": 1845 }, { "epoch": 0.21, "learning_rate": 0.00018351580051246665, "loss": 0.6559, "step": 1846 }, { "epoch": 0.21, "learning_rate": 0.00018349554751771714, "loss": 0.6793, "step": 1847 }, { "epoch": 0.21, "learning_rate": 0.00018347528320788369, "loss": 0.735, "step": 1848 }, { "epoch": 0.21, "learning_rate": 0.00018345500758571242, "loss": 0.7448, "step": 1849 }, { "epoch": 0.21, "learning_rate": 0.0001834347206539511, "loss": 0.6635, "step": 1850 }, { "epoch": 0.21, "learning_rate": 0.0001834144224153489, "loss": 0.6924, "step": 1851 }, { "epoch": 0.21, "learning_rate": 0.00018339411287265661, "loss": 0.6531, "step": 1852 }, { "epoch": 0.21, "learning_rate": 0.00018337379202862652, "loss": 0.7278, "step": 1853 }, { "epoch": 0.21, "learning_rate": 0.00018335345988601241, "loss": 0.6447, "step": 1854 }, { "epoch": 0.21, "learning_rate": 0.00018333311644756973, "loss": 0.7638, "step": 1855 }, { "epoch": 0.21, "learning_rate": 0.00018331276171605526, "loss": 0.6835, "step": 1856 }, { "epoch": 0.21, "learning_rate": 0.00018329239569422749, "loss": 0.7512, "step": 1857 }, { "epoch": 0.21, "learning_rate": 0.00018327201838484633, "loss": 0.6937, "step": 1858 }, { "epoch": 0.21, "learning_rate": 0.00018325162979067328, "loss": 0.6546, "step": 1859 }, { "epoch": 0.21, "learning_rate": 0.0001832312299144713, "loss": 0.663, "step": 1860 }, { "epoch": 0.21, "learning_rate": 0.00018321081875900501, "loss": 0.6723, "step": 1861 }, { "epoch": 0.21, "learning_rate": 0.0001831903963270404, "loss": 0.7248, "step": 1862 }, { "epoch": 0.21, "learning_rate": 0.00018316996262134508, "loss": 0.7057, "step": 1863 }, { "epoch": 0.21, "learning_rate": 0.00018314951764468815, "loss": 0.6168, "step": 1864 }, { "epoch": 0.21, "learning_rate": 0.0001831290613998403, "loss": 0.6962, "step": 1865 }, { "epoch": 0.21, "learning_rate": 0.0001831085938895737, "loss": 0.6478, "step": 1866 }, { "epoch": 0.21, "learning_rate": 0.000183088115116662, "loss": 0.6788, "step": 1867 }, { "epoch": 0.21, "learning_rate": 0.00018306762508388044, "loss": 0.6446, "step": 1868 }, { "epoch": 0.21, "learning_rate": 0.00018304712379400582, "loss": 0.6829, "step": 1869 }, { "epoch": 0.21, "learning_rate": 0.00018302661124981637, "loss": 0.7004, "step": 1870 }, { "epoch": 0.21, "learning_rate": 0.00018300608745409192, "loss": 0.7014, "step": 1871 }, { "epoch": 0.21, "learning_rate": 0.0001829855524096138, "loss": 0.6894, "step": 1872 }, { "epoch": 0.21, "learning_rate": 0.00018296500611916482, "loss": 0.7142, "step": 1873 }, { "epoch": 0.21, "learning_rate": 0.0001829444485855294, "loss": 0.688, "step": 1874 }, { "epoch": 0.21, "learning_rate": 0.00018292387981149342, "loss": 0.6491, "step": 1875 }, { "epoch": 0.21, "learning_rate": 0.0001829032997998443, "loss": 0.6398, "step": 1876 }, { "epoch": 0.21, "learning_rate": 0.000182882708553371, "loss": 0.6673, "step": 1877 }, { "epoch": 0.21, "learning_rate": 0.00018286210607486398, "loss": 0.7045, "step": 1878 }, { "epoch": 0.21, "learning_rate": 0.00018284149236711525, "loss": 0.59, "step": 1879 }, { "epoch": 0.21, "learning_rate": 0.0001828208674329183, "loss": 0.675, "step": 1880 }, { "epoch": 0.21, "learning_rate": 0.00018280023127506813, "loss": 0.7515, "step": 1881 }, { "epoch": 0.21, "learning_rate": 0.00018277958389636135, "loss": 0.6835, "step": 1882 }, { "epoch": 0.21, "learning_rate": 0.00018275892529959605, "loss": 0.7128, "step": 1883 }, { "epoch": 0.21, "learning_rate": 0.00018273825548757174, "loss": 0.7168, "step": 1884 }, { "epoch": 0.21, "learning_rate": 0.00018271757446308967, "loss": 0.7923, "step": 1885 }, { "epoch": 0.21, "learning_rate": 0.00018269688222895231, "loss": 0.7588, "step": 1886 }, { "epoch": 0.21, "learning_rate": 0.00018267617878796395, "loss": 0.6765, "step": 1887 }, { "epoch": 0.21, "learning_rate": 0.0001826554641429302, "loss": 0.6963, "step": 1888 }, { "epoch": 0.21, "learning_rate": 0.00018263473829665822, "loss": 0.6954, "step": 1889 }, { "epoch": 0.21, "learning_rate": 0.00018261400125195681, "loss": 0.7383, "step": 1890 }, { "epoch": 0.21, "learning_rate": 0.00018259325301163613, "loss": 0.6789, "step": 1891 }, { "epoch": 0.22, "learning_rate": 0.0001825724935785079, "loss": 0.6764, "step": 1892 }, { "epoch": 0.22, "learning_rate": 0.00018255172295538548, "loss": 0.735, "step": 1893 }, { "epoch": 0.22, "learning_rate": 0.00018253094114508355, "loss": 0.6642, "step": 1894 }, { "epoch": 0.22, "learning_rate": 0.00018251014815041846, "loss": 0.7306, "step": 1895 }, { "epoch": 0.22, "learning_rate": 0.000182489343974208, "loss": 0.7047, "step": 1896 }, { "epoch": 0.22, "learning_rate": 0.0001824685286192715, "loss": 0.7153, "step": 1897 }, { "epoch": 0.22, "learning_rate": 0.0001824477020884298, "loss": 0.6029, "step": 1898 }, { "epoch": 0.22, "learning_rate": 0.0001824268643845052, "loss": 0.7001, "step": 1899 }, { "epoch": 0.22, "learning_rate": 0.00018240601551032163, "loss": 0.7205, "step": 1900 }, { "epoch": 0.22, "learning_rate": 0.00018238515546870448, "loss": 0.7214, "step": 1901 }, { "epoch": 0.22, "learning_rate": 0.0001823642842624806, "loss": 0.6648, "step": 1902 }, { "epoch": 0.22, "learning_rate": 0.00018234340189447843, "loss": 0.7043, "step": 1903 }, { "epoch": 0.22, "learning_rate": 0.00018232250836752788, "loss": 0.6847, "step": 1904 }, { "epoch": 0.22, "learning_rate": 0.00018230160368446033, "loss": 0.6648, "step": 1905 }, { "epoch": 0.22, "learning_rate": 0.00018228068784810884, "loss": 0.7076, "step": 1906 }, { "epoch": 0.22, "learning_rate": 0.00018225976086130776, "loss": 0.7311, "step": 1907 }, { "epoch": 0.22, "learning_rate": 0.0001822388227268931, "loss": 0.7155, "step": 1908 }, { "epoch": 0.22, "learning_rate": 0.00018221787344770236, "loss": 0.6977, "step": 1909 }, { "epoch": 0.22, "learning_rate": 0.00018219691302657449, "loss": 0.6182, "step": 1910 }, { "epoch": 0.22, "learning_rate": 0.00018217594146634997, "loss": 0.7053, "step": 1911 }, { "epoch": 0.22, "learning_rate": 0.0001821549587698709, "loss": 0.7268, "step": 1912 }, { "epoch": 0.22, "learning_rate": 0.0001821339649399807, "loss": 0.7167, "step": 1913 }, { "epoch": 0.22, "learning_rate": 0.00018211295997952443, "loss": 0.6938, "step": 1914 }, { "epoch": 0.22, "learning_rate": 0.0001820919438913486, "loss": 0.6904, "step": 1915 }, { "epoch": 0.22, "learning_rate": 0.0001820709166783013, "loss": 0.6984, "step": 1916 }, { "epoch": 0.22, "learning_rate": 0.00018204987834323207, "loss": 0.7391, "step": 1917 }, { "epoch": 0.22, "learning_rate": 0.0001820288288889919, "loss": 0.7706, "step": 1918 }, { "epoch": 0.22, "learning_rate": 0.00018200776831843346, "loss": 0.7282, "step": 1919 }, { "epoch": 0.22, "learning_rate": 0.00018198669663441072, "loss": 0.7415, "step": 1920 }, { "epoch": 0.22, "learning_rate": 0.00018196561383977935, "loss": 0.6647, "step": 1921 }, { "epoch": 0.22, "learning_rate": 0.00018194451993739635, "loss": 0.696, "step": 1922 }, { "epoch": 0.22, "learning_rate": 0.00018192341493012033, "loss": 0.7023, "step": 1923 }, { "epoch": 0.22, "learning_rate": 0.0001819022988208114, "loss": 0.7318, "step": 1924 }, { "epoch": 0.22, "learning_rate": 0.00018188117161233115, "loss": 0.7367, "step": 1925 }, { "epoch": 0.22, "learning_rate": 0.00018186003330754267, "loss": 0.6984, "step": 1926 }, { "epoch": 0.22, "learning_rate": 0.00018183888390931058, "loss": 0.6874, "step": 1927 }, { "epoch": 0.22, "learning_rate": 0.00018181772342050102, "loss": 0.7446, "step": 1928 }, { "epoch": 0.22, "learning_rate": 0.00018179655184398147, "loss": 0.7426, "step": 1929 }, { "epoch": 0.22, "learning_rate": 0.0001817753691826212, "loss": 0.6491, "step": 1930 }, { "epoch": 0.22, "learning_rate": 0.0001817541754392907, "loss": 0.6884, "step": 1931 }, { "epoch": 0.22, "learning_rate": 0.0001817329706168622, "loss": 0.7362, "step": 1932 }, { "epoch": 0.22, "learning_rate": 0.00018171175471820927, "loss": 0.7317, "step": 1933 }, { "epoch": 0.22, "learning_rate": 0.00018169052774620698, "loss": 0.7535, "step": 1934 }, { "epoch": 0.22, "learning_rate": 0.00018166928970373203, "loss": 0.7072, "step": 1935 }, { "epoch": 0.22, "learning_rate": 0.00018164804059366248, "loss": 0.6989, "step": 1936 }, { "epoch": 0.22, "learning_rate": 0.00018162678041887798, "loss": 0.6998, "step": 1937 }, { "epoch": 0.22, "learning_rate": 0.00018160550918225964, "loss": 0.7048, "step": 1938 }, { "epoch": 0.22, "learning_rate": 0.0001815842268866901, "loss": 0.6061, "step": 1939 }, { "epoch": 0.22, "learning_rate": 0.0001815629335350534, "loss": 0.6027, "step": 1940 }, { "epoch": 0.22, "learning_rate": 0.00018154162913023526, "loss": 0.7381, "step": 1941 }, { "epoch": 0.22, "learning_rate": 0.00018152031367512272, "loss": 0.6991, "step": 1942 }, { "epoch": 0.22, "learning_rate": 0.00018149898717260445, "loss": 0.6404, "step": 1943 }, { "epoch": 0.22, "learning_rate": 0.00018147764962557052, "loss": 0.7229, "step": 1944 }, { "epoch": 0.22, "learning_rate": 0.00018145630103691253, "loss": 0.7744, "step": 1945 }, { "epoch": 0.22, "learning_rate": 0.00018143494140952364, "loss": 0.6441, "step": 1946 }, { "epoch": 0.22, "learning_rate": 0.00018141357074629837, "loss": 0.7311, "step": 1947 }, { "epoch": 0.22, "learning_rate": 0.0001813921890501328, "loss": 0.6858, "step": 1948 }, { "epoch": 0.22, "learning_rate": 0.00018137079632392461, "loss": 0.7545, "step": 1949 }, { "epoch": 0.22, "learning_rate": 0.00018134939257057284, "loss": 0.6786, "step": 1950 }, { "epoch": 0.22, "learning_rate": 0.00018132797779297802, "loss": 0.8058, "step": 1951 }, { "epoch": 0.22, "learning_rate": 0.00018130655199404233, "loss": 0.7067, "step": 1952 }, { "epoch": 0.22, "learning_rate": 0.0001812851151766692, "loss": 0.7196, "step": 1953 }, { "epoch": 0.22, "learning_rate": 0.00018126366734376378, "loss": 0.7424, "step": 1954 }, { "epoch": 0.22, "learning_rate": 0.0001812422084982326, "loss": 0.701, "step": 1955 }, { "epoch": 0.22, "learning_rate": 0.0001812207386429837, "loss": 0.7422, "step": 1956 }, { "epoch": 0.22, "learning_rate": 0.0001811992577809266, "loss": 0.6949, "step": 1957 }, { "epoch": 0.22, "learning_rate": 0.00018117776591497234, "loss": 0.6463, "step": 1958 }, { "epoch": 0.22, "learning_rate": 0.00018115626304803347, "loss": 0.6675, "step": 1959 }, { "epoch": 0.22, "learning_rate": 0.00018113474918302394, "loss": 0.6877, "step": 1960 }, { "epoch": 0.22, "learning_rate": 0.00018111322432285928, "loss": 0.7521, "step": 1961 }, { "epoch": 0.22, "learning_rate": 0.00018109168847045643, "loss": 0.6993, "step": 1962 }, { "epoch": 0.22, "learning_rate": 0.00018107014162873397, "loss": 0.7184, "step": 1963 }, { "epoch": 0.22, "learning_rate": 0.00018104858380061178, "loss": 0.7218, "step": 1964 }, { "epoch": 0.22, "learning_rate": 0.00018102701498901136, "loss": 0.7359, "step": 1965 }, { "epoch": 0.22, "learning_rate": 0.0001810054351968556, "loss": 0.6771, "step": 1966 }, { "epoch": 0.22, "learning_rate": 0.00018098384442706905, "loss": 0.6734, "step": 1967 }, { "epoch": 0.22, "learning_rate": 0.00018096224268257754, "loss": 0.7279, "step": 1968 }, { "epoch": 0.22, "learning_rate": 0.00018094062996630846, "loss": 0.7038, "step": 1969 }, { "epoch": 0.22, "learning_rate": 0.00018091900628119077, "loss": 0.7578, "step": 1970 }, { "epoch": 0.22, "learning_rate": 0.0001808973716301548, "loss": 0.7438, "step": 1971 }, { "epoch": 0.22, "learning_rate": 0.00018087572601613246, "loss": 0.7425, "step": 1972 }, { "epoch": 0.22, "learning_rate": 0.00018085406944205707, "loss": 0.7354, "step": 1973 }, { "epoch": 0.22, "learning_rate": 0.0001808324019108635, "loss": 0.6921, "step": 1974 }, { "epoch": 0.22, "learning_rate": 0.00018081072342548802, "loss": 0.6775, "step": 1975 }, { "epoch": 0.22, "learning_rate": 0.00018078903398886852, "loss": 0.7091, "step": 1976 }, { "epoch": 0.22, "learning_rate": 0.0001807673336039442, "loss": 0.71, "step": 1977 }, { "epoch": 0.22, "learning_rate": 0.0001807456222736559, "loss": 0.7148, "step": 1978 }, { "epoch": 0.22, "learning_rate": 0.00018072390000094582, "loss": 0.6994, "step": 1979 }, { "epoch": 0.23, "learning_rate": 0.0001807021667887578, "loss": 0.6724, "step": 1980 }, { "epoch": 0.23, "learning_rate": 0.000180680422640037, "loss": 0.7938, "step": 1981 }, { "epoch": 0.23, "learning_rate": 0.0001806586675577301, "loss": 0.7333, "step": 1982 }, { "epoch": 0.23, "learning_rate": 0.00018063690154478536, "loss": 0.7493, "step": 1983 }, { "epoch": 0.23, "learning_rate": 0.00018061512460415237, "loss": 0.6629, "step": 1984 }, { "epoch": 0.23, "learning_rate": 0.00018059333673878234, "loss": 0.6592, "step": 1985 }, { "epoch": 0.23, "learning_rate": 0.00018057153795162785, "loss": 0.6629, "step": 1986 }, { "epoch": 0.23, "learning_rate": 0.0001805497282456431, "loss": 0.6904, "step": 1987 }, { "epoch": 0.23, "learning_rate": 0.00018052790762378357, "loss": 0.7037, "step": 1988 }, { "epoch": 0.23, "learning_rate": 0.00018050607608900642, "loss": 0.7783, "step": 1989 }, { "epoch": 0.23, "learning_rate": 0.00018048423364427015, "loss": 0.6719, "step": 1990 }, { "epoch": 0.23, "learning_rate": 0.0001804623802925348, "loss": 0.6725, "step": 1991 }, { "epoch": 0.23, "learning_rate": 0.00018044051603676185, "loss": 0.7038, "step": 1992 }, { "epoch": 0.23, "learning_rate": 0.0001804186408799143, "loss": 0.7002, "step": 1993 }, { "epoch": 0.23, "learning_rate": 0.00018039675482495665, "loss": 0.6971, "step": 1994 }, { "epoch": 0.23, "learning_rate": 0.0001803748578748548, "loss": 0.7703, "step": 1995 }, { "epoch": 0.23, "learning_rate": 0.00018035295003257615, "loss": 0.6773, "step": 1996 }, { "epoch": 0.23, "learning_rate": 0.00018033103130108964, "loss": 0.6739, "step": 1997 }, { "epoch": 0.23, "learning_rate": 0.00018030910168336556, "loss": 0.7167, "step": 1998 }, { "epoch": 0.23, "learning_rate": 0.00018028716118237583, "loss": 0.7091, "step": 1999 }, { "epoch": 0.23, "learning_rate": 0.00018026520980109372, "loss": 0.691, "step": 2000 }, { "epoch": 0.23, "learning_rate": 0.000180243247542494, "loss": 0.6996, "step": 2001 }, { "epoch": 0.23, "learning_rate": 0.00018022127440955302, "loss": 0.6794, "step": 2002 }, { "epoch": 0.23, "learning_rate": 0.0001801992904052484, "loss": 0.6657, "step": 2003 }, { "epoch": 0.23, "learning_rate": 0.00018017729553255945, "loss": 0.7081, "step": 2004 }, { "epoch": 0.23, "learning_rate": 0.0001801552897944668, "loss": 0.6732, "step": 2005 }, { "epoch": 0.23, "learning_rate": 0.00018013327319395264, "loss": 0.6832, "step": 2006 }, { "epoch": 0.23, "learning_rate": 0.00018011124573400056, "loss": 0.6644, "step": 2007 }, { "epoch": 0.23, "learning_rate": 0.00018008920741759566, "loss": 0.6896, "step": 2008 }, { "epoch": 0.23, "learning_rate": 0.00018006715824772459, "loss": 0.6565, "step": 2009 }, { "epoch": 0.23, "learning_rate": 0.0001800450982273753, "loss": 0.6662, "step": 2010 }, { "epoch": 0.23, "learning_rate": 0.00018002302735953735, "loss": 0.7397, "step": 2011 }, { "epoch": 0.23, "learning_rate": 0.0001800009456472017, "loss": 0.729, "step": 2012 }, { "epoch": 0.23, "learning_rate": 0.00017997885309336078, "loss": 0.7001, "step": 2013 }, { "epoch": 0.23, "learning_rate": 0.00017995674970100857, "loss": 0.6824, "step": 2014 }, { "epoch": 0.23, "learning_rate": 0.00017993463547314045, "loss": 0.6955, "step": 2015 }, { "epoch": 0.23, "learning_rate": 0.00017991251041275322, "loss": 0.7289, "step": 2016 }, { "epoch": 0.23, "learning_rate": 0.0001798903745228453, "loss": 0.6866, "step": 2017 }, { "epoch": 0.23, "learning_rate": 0.0001798682278064164, "loss": 0.6888, "step": 2018 }, { "epoch": 0.23, "learning_rate": 0.0001798460702664678, "loss": 0.6692, "step": 2019 }, { "epoch": 0.23, "learning_rate": 0.00017982390190600226, "loss": 0.7409, "step": 2020 }, { "epoch": 0.23, "learning_rate": 0.000179801722728024, "loss": 0.578, "step": 2021 }, { "epoch": 0.23, "learning_rate": 0.00017977953273553855, "loss": 0.7302, "step": 2022 }, { "epoch": 0.23, "learning_rate": 0.0001797573319315532, "loss": 0.7472, "step": 2023 }, { "epoch": 0.23, "learning_rate": 0.00017973512031907638, "loss": 0.7182, "step": 2024 }, { "epoch": 0.23, "learning_rate": 0.00017971289790111826, "loss": 0.7156, "step": 2025 }, { "epoch": 0.23, "learning_rate": 0.00017969066468069035, "loss": 0.7293, "step": 2026 }, { "epoch": 0.23, "learning_rate": 0.0001796684206608056, "loss": 0.7205, "step": 2027 }, { "epoch": 0.23, "learning_rate": 0.0001796461658444785, "loss": 0.6738, "step": 2028 }, { "epoch": 0.23, "learning_rate": 0.00017962390023472488, "loss": 0.6227, "step": 2029 }, { "epoch": 0.23, "learning_rate": 0.00017960162383456218, "loss": 0.7401, "step": 2030 }, { "epoch": 0.23, "learning_rate": 0.00017957933664700923, "loss": 0.6855, "step": 2031 }, { "epoch": 0.23, "learning_rate": 0.00017955703867508633, "loss": 0.6607, "step": 2032 }, { "epoch": 0.23, "learning_rate": 0.0001795347299218152, "loss": 0.6823, "step": 2033 }, { "epoch": 0.23, "learning_rate": 0.00017951241039021912, "loss": 0.701, "step": 2034 }, { "epoch": 0.23, "learning_rate": 0.0001794900800833227, "loss": 0.7473, "step": 2035 }, { "epoch": 0.23, "learning_rate": 0.00017946773900415214, "loss": 0.7717, "step": 2036 }, { "epoch": 0.23, "learning_rate": 0.00017944538715573502, "loss": 0.6823, "step": 2037 }, { "epoch": 0.23, "learning_rate": 0.00017942302454110041, "loss": 0.6168, "step": 2038 }, { "epoch": 0.23, "learning_rate": 0.0001794006511632788, "loss": 0.6876, "step": 2039 }, { "epoch": 0.23, "learning_rate": 0.00017937826702530218, "loss": 0.6725, "step": 2040 }, { "epoch": 0.23, "learning_rate": 0.000179355872130204, "loss": 0.6374, "step": 2041 }, { "epoch": 0.23, "learning_rate": 0.00017933346648101918, "loss": 0.6253, "step": 2042 }, { "epoch": 0.23, "learning_rate": 0.000179311050080784, "loss": 0.7045, "step": 2043 }, { "epoch": 0.23, "learning_rate": 0.00017928862293253633, "loss": 0.6832, "step": 2044 }, { "epoch": 0.23, "learning_rate": 0.0001792661850393154, "loss": 0.6953, "step": 2045 }, { "epoch": 0.23, "learning_rate": 0.00017924373640416192, "loss": 0.7487, "step": 2046 }, { "epoch": 0.23, "learning_rate": 0.0001792212770301181, "loss": 0.7202, "step": 2047 }, { "epoch": 0.23, "learning_rate": 0.00017919880692022756, "loss": 0.6876, "step": 2048 }, { "epoch": 0.23, "learning_rate": 0.00017917632607753538, "loss": 0.7157, "step": 2049 }, { "epoch": 0.23, "learning_rate": 0.00017915383450508814, "loss": 0.7687, "step": 2050 }, { "epoch": 0.23, "learning_rate": 0.00017913133220593376, "loss": 0.706, "step": 2051 }, { "epoch": 0.23, "learning_rate": 0.00017910881918312173, "loss": 0.6846, "step": 2052 }, { "epoch": 0.23, "learning_rate": 0.00017908629543970302, "loss": 0.6625, "step": 2053 }, { "epoch": 0.23, "learning_rate": 0.00017906376097872985, "loss": 0.7336, "step": 2054 }, { "epoch": 0.23, "learning_rate": 0.00017904121580325613, "loss": 0.673, "step": 2055 }, { "epoch": 0.23, "learning_rate": 0.0001790186599163371, "loss": 0.7012, "step": 2056 }, { "epoch": 0.23, "learning_rate": 0.0001789960933210294, "loss": 0.7389, "step": 2057 }, { "epoch": 0.23, "learning_rate": 0.00017897351602039126, "loss": 0.7093, "step": 2058 }, { "epoch": 0.23, "learning_rate": 0.00017895092801748232, "loss": 0.7093, "step": 2059 }, { "epoch": 0.23, "learning_rate": 0.0001789283293153636, "loss": 0.6722, "step": 2060 }, { "epoch": 0.23, "learning_rate": 0.0001789057199170976, "loss": 0.6796, "step": 2061 }, { "epoch": 0.23, "learning_rate": 0.0001788830998257483, "loss": 0.6703, "step": 2062 }, { "epoch": 0.23, "learning_rate": 0.00017886046904438109, "loss": 0.6693, "step": 2063 }, { "epoch": 0.23, "learning_rate": 0.00017883782757606288, "loss": 0.7487, "step": 2064 }, { "epoch": 0.23, "learning_rate": 0.00017881517542386193, "loss": 0.7506, "step": 2065 }, { "epoch": 0.23, "learning_rate": 0.00017879251259084804, "loss": 0.6646, "step": 2066 }, { "epoch": 0.23, "learning_rate": 0.0001787698390800924, "loss": 0.6341, "step": 2067 }, { "epoch": 0.24, "learning_rate": 0.00017874715489466764, "loss": 0.7129, "step": 2068 }, { "epoch": 0.24, "learning_rate": 0.00017872446003764787, "loss": 0.633, "step": 2069 }, { "epoch": 0.24, "learning_rate": 0.00017870175451210863, "loss": 0.7337, "step": 2070 }, { "epoch": 0.24, "learning_rate": 0.0001786790383211269, "loss": 0.7648, "step": 2071 }, { "epoch": 0.24, "learning_rate": 0.00017865631146778114, "loss": 0.6941, "step": 2072 }, { "epoch": 0.24, "learning_rate": 0.00017863357395515124, "loss": 0.6958, "step": 2073 }, { "epoch": 0.24, "learning_rate": 0.00017861082578631848, "loss": 0.6963, "step": 2074 }, { "epoch": 0.24, "learning_rate": 0.00017858806696436562, "loss": 0.7412, "step": 2075 }, { "epoch": 0.24, "learning_rate": 0.00017856529749237695, "loss": 0.6732, "step": 2076 }, { "epoch": 0.24, "learning_rate": 0.00017854251737343808, "loss": 0.7118, "step": 2077 }, { "epoch": 0.24, "learning_rate": 0.00017851972661063608, "loss": 0.6031, "step": 2078 }, { "epoch": 0.24, "learning_rate": 0.00017849692520705953, "loss": 0.7068, "step": 2079 }, { "epoch": 0.24, "learning_rate": 0.0001784741131657984, "loss": 0.68, "step": 2080 }, { "epoch": 0.24, "learning_rate": 0.0001784512904899441, "loss": 0.7127, "step": 2081 }, { "epoch": 0.24, "learning_rate": 0.00017842845718258956, "loss": 0.7634, "step": 2082 }, { "epoch": 0.24, "learning_rate": 0.000178405613246829, "loss": 0.6905, "step": 2083 }, { "epoch": 0.24, "learning_rate": 0.0001783827586857582, "loss": 0.7268, "step": 2084 }, { "epoch": 0.24, "learning_rate": 0.00017835989350247435, "loss": 0.6885, "step": 2085 }, { "epoch": 0.24, "learning_rate": 0.00017833701770007606, "loss": 0.6813, "step": 2086 }, { "epoch": 0.24, "learning_rate": 0.00017831413128166344, "loss": 0.6268, "step": 2087 }, { "epoch": 0.24, "learning_rate": 0.00017829123425033795, "loss": 0.7003, "step": 2088 }, { "epoch": 0.24, "learning_rate": 0.00017826832660920253, "loss": 0.6377, "step": 2089 }, { "epoch": 0.24, "learning_rate": 0.0001782454083613616, "loss": 0.6943, "step": 2090 }, { "epoch": 0.24, "learning_rate": 0.00017822247950992093, "loss": 0.7765, "step": 2091 }, { "epoch": 0.24, "learning_rate": 0.0001781995400579878, "loss": 0.7257, "step": 2092 }, { "epoch": 0.24, "learning_rate": 0.00017817659000867093, "loss": 0.7461, "step": 2093 }, { "epoch": 0.24, "learning_rate": 0.0001781536293650804, "loss": 0.6751, "step": 2094 }, { "epoch": 0.24, "learning_rate": 0.0001781306581303278, "loss": 0.7236, "step": 2095 }, { "epoch": 0.24, "learning_rate": 0.00017810767630752606, "loss": 0.7177, "step": 2096 }, { "epoch": 0.24, "learning_rate": 0.0001780846838997897, "loss": 0.7207, "step": 2097 }, { "epoch": 0.24, "learning_rate": 0.00017806168091023453, "loss": 0.6704, "step": 2098 }, { "epoch": 0.24, "learning_rate": 0.00017803866734197792, "loss": 0.6692, "step": 2099 }, { "epoch": 0.24, "learning_rate": 0.00017801564319813853, "loss": 0.683, "step": 2100 }, { "epoch": 0.24, "learning_rate": 0.00017799260848183653, "loss": 0.7176, "step": 2101 }, { "epoch": 0.24, "learning_rate": 0.0001779695631961936, "loss": 0.6798, "step": 2102 }, { "epoch": 0.24, "learning_rate": 0.0001779465073443327, "loss": 0.7715, "step": 2103 }, { "epoch": 0.24, "learning_rate": 0.00017792344092937832, "loss": 0.6468, "step": 2104 }, { "epoch": 0.24, "learning_rate": 0.00017790036395445635, "loss": 0.6322, "step": 2105 }, { "epoch": 0.24, "learning_rate": 0.0001778772764226941, "loss": 0.7219, "step": 2106 }, { "epoch": 0.24, "learning_rate": 0.00017785417833722037, "loss": 0.6952, "step": 2107 }, { "epoch": 0.24, "learning_rate": 0.00017783106970116532, "loss": 0.7014, "step": 2108 }, { "epoch": 0.24, "learning_rate": 0.00017780795051766055, "loss": 0.721, "step": 2109 }, { "epoch": 0.24, "learning_rate": 0.00017778482078983915, "loss": 0.7083, "step": 2110 }, { "epoch": 0.24, "learning_rate": 0.00017776168052083556, "loss": 0.656, "step": 2111 }, { "epoch": 0.24, "learning_rate": 0.00017773852971378576, "loss": 0.712, "step": 2112 }, { "epoch": 0.24, "learning_rate": 0.00017771536837182697, "loss": 0.6536, "step": 2113 }, { "epoch": 0.24, "learning_rate": 0.000177692196498098, "loss": 0.7351, "step": 2114 }, { "epoch": 0.24, "learning_rate": 0.00017766901409573907, "loss": 0.6652, "step": 2115 }, { "epoch": 0.24, "learning_rate": 0.00017764582116789175, "loss": 0.7185, "step": 2116 }, { "epoch": 0.24, "learning_rate": 0.0001776226177176991, "loss": 0.7044, "step": 2117 }, { "epoch": 0.24, "learning_rate": 0.00017759940374830559, "loss": 0.7097, "step": 2118 }, { "epoch": 0.24, "learning_rate": 0.0001775761792628571, "loss": 0.6922, "step": 2119 }, { "epoch": 0.24, "learning_rate": 0.00017755294426450097, "loss": 0.646, "step": 2120 }, { "epoch": 0.24, "learning_rate": 0.00017752969875638592, "loss": 0.807, "step": 2121 }, { "epoch": 0.24, "learning_rate": 0.00017750644274166212, "loss": 0.711, "step": 2122 }, { "epoch": 0.24, "learning_rate": 0.00017748317622348116, "loss": 0.6871, "step": 2123 }, { "epoch": 0.24, "learning_rate": 0.00017745989920499606, "loss": 0.6525, "step": 2124 }, { "epoch": 0.24, "learning_rate": 0.00017743661168936127, "loss": 0.7192, "step": 2125 }, { "epoch": 0.24, "learning_rate": 0.0001774133136797326, "loss": 0.6977, "step": 2126 }, { "epoch": 0.24, "learning_rate": 0.0001773900051792674, "loss": 0.62, "step": 2127 }, { "epoch": 0.24, "learning_rate": 0.00017736668619112433, "loss": 0.7334, "step": 2128 }, { "epoch": 0.24, "learning_rate": 0.00017734335671846352, "loss": 0.7071, "step": 2129 }, { "epoch": 0.24, "learning_rate": 0.0001773200167644465, "loss": 0.7287, "step": 2130 }, { "epoch": 0.24, "learning_rate": 0.00017729666633223626, "loss": 0.6882, "step": 2131 }, { "epoch": 0.24, "learning_rate": 0.00017727330542499718, "loss": 0.6772, "step": 2132 }, { "epoch": 0.24, "learning_rate": 0.00017724993404589508, "loss": 0.7125, "step": 2133 }, { "epoch": 0.24, "learning_rate": 0.00017722655219809717, "loss": 0.7488, "step": 2134 }, { "epoch": 0.24, "learning_rate": 0.00017720315988477205, "loss": 0.6988, "step": 2135 }, { "epoch": 0.24, "learning_rate": 0.00017717975710908985, "loss": 0.7094, "step": 2136 }, { "epoch": 0.24, "learning_rate": 0.00017715634387422205, "loss": 0.6673, "step": 2137 }, { "epoch": 0.24, "learning_rate": 0.00017713292018334145, "loss": 0.6649, "step": 2138 }, { "epoch": 0.24, "learning_rate": 0.00017710948603962248, "loss": 0.6809, "step": 2139 }, { "epoch": 0.24, "learning_rate": 0.0001770860414462408, "loss": 0.6979, "step": 2140 }, { "epoch": 0.24, "learning_rate": 0.0001770625864063736, "loss": 0.7366, "step": 2141 }, { "epoch": 0.24, "learning_rate": 0.00017703912092319942, "loss": 0.7078, "step": 2142 }, { "epoch": 0.24, "learning_rate": 0.00017701564499989818, "loss": 0.7689, "step": 2143 }, { "epoch": 0.24, "learning_rate": 0.00017699215863965138, "loss": 0.5963, "step": 2144 }, { "epoch": 0.24, "learning_rate": 0.00017696866184564174, "loss": 0.7244, "step": 2145 }, { "epoch": 0.24, "learning_rate": 0.00017694515462105353, "loss": 0.6017, "step": 2146 }, { "epoch": 0.24, "learning_rate": 0.00017692163696907235, "loss": 0.7179, "step": 2147 }, { "epoch": 0.24, "learning_rate": 0.00017689810889288528, "loss": 0.6722, "step": 2148 }, { "epoch": 0.24, "learning_rate": 0.00017687457039568076, "loss": 0.7686, "step": 2149 }, { "epoch": 0.24, "learning_rate": 0.00017685102148064864, "loss": 0.7252, "step": 2150 }, { "epoch": 0.24, "learning_rate": 0.00017682746215098028, "loss": 0.6819, "step": 2151 }, { "epoch": 0.24, "learning_rate": 0.0001768038924098683, "loss": 0.6931, "step": 2152 }, { "epoch": 0.24, "learning_rate": 0.00017678031226050678, "loss": 0.6934, "step": 2153 }, { "epoch": 0.24, "learning_rate": 0.00017675672170609135, "loss": 0.7655, "step": 2154 }, { "epoch": 0.24, "learning_rate": 0.0001767331207498188, "loss": 0.7163, "step": 2155 }, { "epoch": 0.25, "learning_rate": 0.0001767095093948876, "loss": 0.6694, "step": 2156 }, { "epoch": 0.25, "learning_rate": 0.0001766858876444974, "loss": 0.7041, "step": 2157 }, { "epoch": 0.25, "learning_rate": 0.00017666225550184937, "loss": 0.6941, "step": 2158 }, { "epoch": 0.25, "learning_rate": 0.00017663861297014612, "loss": 0.6921, "step": 2159 }, { "epoch": 0.25, "learning_rate": 0.00017661496005259158, "loss": 0.6532, "step": 2160 }, { "epoch": 0.25, "learning_rate": 0.0001765912967523911, "loss": 0.7339, "step": 2161 }, { "epoch": 0.25, "learning_rate": 0.00017656762307275155, "loss": 0.6773, "step": 2162 }, { "epoch": 0.25, "learning_rate": 0.00017654393901688105, "loss": 0.6577, "step": 2163 }, { "epoch": 0.25, "learning_rate": 0.0001765202445879892, "loss": 0.6991, "step": 2164 }, { "epoch": 0.25, "learning_rate": 0.00017649653978928705, "loss": 0.7113, "step": 2165 }, { "epoch": 0.25, "learning_rate": 0.00017647282462398693, "loss": 0.6598, "step": 2166 }, { "epoch": 0.25, "learning_rate": 0.00017644909909530273, "loss": 0.6832, "step": 2167 }, { "epoch": 0.25, "learning_rate": 0.00017642536320644964, "loss": 0.6578, "step": 2168 }, { "epoch": 0.25, "learning_rate": 0.0001764016169606443, "loss": 0.7333, "step": 2169 }, { "epoch": 0.25, "learning_rate": 0.00017637786036110468, "loss": 0.6829, "step": 2170 }, { "epoch": 0.25, "learning_rate": 0.00017635409341105026, "loss": 0.6694, "step": 2171 }, { "epoch": 0.25, "learning_rate": 0.00017633031611370185, "loss": 0.6724, "step": 2172 }, { "epoch": 0.25, "learning_rate": 0.0001763065284722817, "loss": 0.642, "step": 2173 }, { "epoch": 0.25, "learning_rate": 0.0001762827304900134, "loss": 0.6406, "step": 2174 }, { "epoch": 0.25, "learning_rate": 0.00017625892217012205, "loss": 0.6926, "step": 2175 }, { "epoch": 0.25, "learning_rate": 0.00017623510351583404, "loss": 0.7341, "step": 2176 }, { "epoch": 0.25, "learning_rate": 0.00017621127453037726, "loss": 0.6343, "step": 2177 }, { "epoch": 0.25, "learning_rate": 0.00017618743521698087, "loss": 0.6951, "step": 2178 }, { "epoch": 0.25, "learning_rate": 0.00017616358557887555, "loss": 0.703, "step": 2179 }, { "epoch": 0.25, "learning_rate": 0.00017613972561929335, "loss": 0.652, "step": 2180 }, { "epoch": 0.25, "learning_rate": 0.00017611585534146767, "loss": 0.7027, "step": 2181 }, { "epoch": 0.25, "learning_rate": 0.0001760919747486334, "loss": 0.6936, "step": 2182 }, { "epoch": 0.25, "learning_rate": 0.0001760680838440267, "loss": 0.7612, "step": 2183 }, { "epoch": 0.25, "learning_rate": 0.00017604418263088528, "loss": 0.6451, "step": 2184 }, { "epoch": 0.25, "learning_rate": 0.00017602027111244804, "loss": 0.6592, "step": 2185 }, { "epoch": 0.25, "learning_rate": 0.00017599634929195553, "loss": 0.6482, "step": 2186 }, { "epoch": 0.25, "learning_rate": 0.00017597241717264952, "loss": 0.7082, "step": 2187 }, { "epoch": 0.25, "learning_rate": 0.00017594847475777323, "loss": 0.7048, "step": 2188 }, { "epoch": 0.25, "learning_rate": 0.00017592452205057127, "loss": 0.7285, "step": 2189 }, { "epoch": 0.25, "learning_rate": 0.00017590055905428962, "loss": 0.6869, "step": 2190 }, { "epoch": 0.25, "learning_rate": 0.00017587658577217571, "loss": 0.6964, "step": 2191 }, { "epoch": 0.25, "learning_rate": 0.00017585260220747832, "loss": 0.6834, "step": 2192 }, { "epoch": 0.25, "learning_rate": 0.00017582860836344762, "loss": 0.7085, "step": 2193 }, { "epoch": 0.25, "learning_rate": 0.0001758046042433352, "loss": 0.6343, "step": 2194 }, { "epoch": 0.25, "learning_rate": 0.00017578058985039406, "loss": 0.6832, "step": 2195 }, { "epoch": 0.25, "learning_rate": 0.00017575656518787854, "loss": 0.6942, "step": 2196 }, { "epoch": 0.25, "learning_rate": 0.00017573253025904436, "loss": 0.6264, "step": 2197 }, { "epoch": 0.25, "learning_rate": 0.0001757084850671487, "loss": 0.6882, "step": 2198 }, { "epoch": 0.25, "learning_rate": 0.00017568442961545013, "loss": 0.717, "step": 2199 }, { "epoch": 0.25, "learning_rate": 0.00017566036390720852, "loss": 0.6498, "step": 2200 }, { "epoch": 0.25, "learning_rate": 0.00017563628794568526, "loss": 0.6857, "step": 2201 }, { "epoch": 0.25, "learning_rate": 0.00017561220173414297, "loss": 0.6957, "step": 2202 }, { "epoch": 0.25, "learning_rate": 0.00017558810527584578, "loss": 0.6998, "step": 2203 }, { "epoch": 0.25, "learning_rate": 0.0001755639985740592, "loss": 0.7495, "step": 2204 }, { "epoch": 0.25, "learning_rate": 0.00017553988163205008, "loss": 0.6751, "step": 2205 }, { "epoch": 0.25, "learning_rate": 0.0001755157544530867, "loss": 0.6736, "step": 2206 }, { "epoch": 0.25, "learning_rate": 0.00017549161704043869, "loss": 0.6796, "step": 2207 }, { "epoch": 0.25, "learning_rate": 0.00017546746939737707, "loss": 0.6869, "step": 2208 }, { "epoch": 0.25, "learning_rate": 0.0001754433115271743, "loss": 0.7659, "step": 2209 }, { "epoch": 0.25, "learning_rate": 0.00017541914343310416, "loss": 0.6909, "step": 2210 }, { "epoch": 0.25, "learning_rate": 0.00017539496511844184, "loss": 0.7273, "step": 2211 }, { "epoch": 0.25, "learning_rate": 0.00017537077658646391, "loss": 0.7275, "step": 2212 }, { "epoch": 0.25, "learning_rate": 0.0001753465778404484, "loss": 0.6792, "step": 2213 }, { "epoch": 0.25, "learning_rate": 0.00017532236888367458, "loss": 0.6279, "step": 2214 }, { "epoch": 0.25, "learning_rate": 0.00017529814971942322, "loss": 0.6467, "step": 2215 }, { "epoch": 0.25, "learning_rate": 0.00017527392035097643, "loss": 0.72, "step": 2216 }, { "epoch": 0.25, "learning_rate": 0.00017524968078161765, "loss": 0.73, "step": 2217 }, { "epoch": 0.25, "learning_rate": 0.00017522543101463185, "loss": 0.6868, "step": 2218 }, { "epoch": 0.25, "learning_rate": 0.00017520117105330525, "loss": 0.6188, "step": 2219 }, { "epoch": 0.25, "learning_rate": 0.00017517690090092548, "loss": 0.7553, "step": 2220 }, { "epoch": 0.25, "learning_rate": 0.00017515262056078153, "loss": 0.6887, "step": 2221 }, { "epoch": 0.25, "learning_rate": 0.0001751283300361639, "loss": 0.7021, "step": 2222 }, { "epoch": 0.25, "learning_rate": 0.0001751040293303643, "loss": 0.7067, "step": 2223 }, { "epoch": 0.25, "learning_rate": 0.00017507971844667593, "loss": 0.7122, "step": 2224 }, { "epoch": 0.25, "learning_rate": 0.00017505539738839332, "loss": 0.586, "step": 2225 }, { "epoch": 0.25, "learning_rate": 0.00017503106615881237, "loss": 0.6898, "step": 2226 }, { "epoch": 0.25, "learning_rate": 0.0001750067247612304, "loss": 0.6454, "step": 2227 }, { "epoch": 0.25, "learning_rate": 0.0001749823731989461, "loss": 0.729, "step": 2228 }, { "epoch": 0.25, "learning_rate": 0.00017495801147525953, "loss": 0.7104, "step": 2229 }, { "epoch": 0.25, "learning_rate": 0.0001749336395934721, "loss": 0.6811, "step": 2230 }, { "epoch": 0.25, "learning_rate": 0.0001749092575568866, "loss": 0.6732, "step": 2231 }, { "epoch": 0.25, "learning_rate": 0.00017488486536880728, "loss": 0.6803, "step": 2232 }, { "epoch": 0.25, "learning_rate": 0.00017486046303253965, "loss": 0.6839, "step": 2233 }, { "epoch": 0.25, "learning_rate": 0.00017483605055139065, "loss": 0.6791, "step": 2234 }, { "epoch": 0.25, "learning_rate": 0.00017481162792866862, "loss": 0.7592, "step": 2235 }, { "epoch": 0.25, "learning_rate": 0.00017478719516768324, "loss": 0.7097, "step": 2236 }, { "epoch": 0.25, "learning_rate": 0.0001747627522717455, "loss": 0.715, "step": 2237 }, { "epoch": 0.25, "learning_rate": 0.00017473829924416796, "loss": 0.661, "step": 2238 }, { "epoch": 0.25, "learning_rate": 0.00017471383608826436, "loss": 0.6838, "step": 2239 }, { "epoch": 0.25, "learning_rate": 0.00017468936280734982, "loss": 0.6554, "step": 2240 }, { "epoch": 0.25, "learning_rate": 0.00017466487940474097, "loss": 0.7118, "step": 2241 }, { "epoch": 0.25, "learning_rate": 0.00017464038588375572, "loss": 0.7146, "step": 2242 }, { "epoch": 0.25, "learning_rate": 0.00017461588224771334, "loss": 0.6231, "step": 2243 }, { "epoch": 0.26, "learning_rate": 0.00017459136849993451, "loss": 0.6706, "step": 2244 }, { "epoch": 0.26, "learning_rate": 0.00017456684464374126, "loss": 0.7243, "step": 2245 }, { "epoch": 0.26, "learning_rate": 0.00017454231068245703, "loss": 0.6752, "step": 2246 }, { "epoch": 0.26, "learning_rate": 0.00017451776661940653, "loss": 0.7333, "step": 2247 }, { "epoch": 0.26, "learning_rate": 0.00017449321245791594, "loss": 0.6673, "step": 2248 }, { "epoch": 0.26, "learning_rate": 0.00017446864820131277, "loss": 0.7247, "step": 2249 }, { "epoch": 0.26, "learning_rate": 0.00017444407385292586, "loss": 0.687, "step": 2250 }, { "epoch": 0.26, "learning_rate": 0.00017441948941608555, "loss": 0.652, "step": 2251 }, { "epoch": 0.26, "learning_rate": 0.00017439489489412337, "loss": 0.7039, "step": 2252 }, { "epoch": 0.26, "learning_rate": 0.00017437029029037233, "loss": 0.6996, "step": 2253 }, { "epoch": 0.26, "learning_rate": 0.00017434567560816678, "loss": 0.5904, "step": 2254 }, { "epoch": 0.26, "learning_rate": 0.00017432105085084243, "loss": 0.7248, "step": 2255 }, { "epoch": 0.26, "learning_rate": 0.00017429641602173635, "loss": 0.6987, "step": 2256 }, { "epoch": 0.26, "learning_rate": 0.00017427177112418698, "loss": 0.6063, "step": 2257 }, { "epoch": 0.26, "learning_rate": 0.00017424711616153415, "loss": 0.6548, "step": 2258 }, { "epoch": 0.26, "learning_rate": 0.000174222451137119, "loss": 0.7223, "step": 2259 }, { "epoch": 0.26, "learning_rate": 0.0001741977760542841, "loss": 0.733, "step": 2260 }, { "epoch": 0.26, "learning_rate": 0.00017417309091637338, "loss": 0.6547, "step": 2261 }, { "epoch": 0.26, "learning_rate": 0.000174148395726732, "loss": 0.6418, "step": 2262 }, { "epoch": 0.26, "learning_rate": 0.00017412369048870664, "loss": 0.6938, "step": 2263 }, { "epoch": 0.26, "learning_rate": 0.00017409897520564532, "loss": 0.6922, "step": 2264 }, { "epoch": 0.26, "learning_rate": 0.00017407424988089733, "loss": 0.6826, "step": 2265 }, { "epoch": 0.26, "learning_rate": 0.0001740495145178134, "loss": 0.6773, "step": 2266 }, { "epoch": 0.26, "learning_rate": 0.0001740247691197456, "loss": 0.6623, "step": 2267 }, { "epoch": 0.26, "learning_rate": 0.00017400001369004733, "loss": 0.7259, "step": 2268 }, { "epoch": 0.26, "learning_rate": 0.0001739752482320734, "loss": 0.6608, "step": 2269 }, { "epoch": 0.26, "learning_rate": 0.00017395047274917994, "loss": 0.6697, "step": 2270 }, { "epoch": 0.26, "learning_rate": 0.00017392568724472452, "loss": 0.6517, "step": 2271 }, { "epoch": 0.26, "learning_rate": 0.00017390089172206592, "loss": 0.72, "step": 2272 }, { "epoch": 0.26, "learning_rate": 0.0001738760861845644, "loss": 0.6651, "step": 2273 }, { "epoch": 0.26, "learning_rate": 0.00017385127063558153, "loss": 0.6788, "step": 2274 }, { "epoch": 0.26, "learning_rate": 0.00017382644507848023, "loss": 0.627, "step": 2275 }, { "epoch": 0.26, "learning_rate": 0.00017380160951662482, "loss": 0.7688, "step": 2276 }, { "epoch": 0.26, "learning_rate": 0.00017377676395338091, "loss": 0.674, "step": 2277 }, { "epoch": 0.26, "learning_rate": 0.00017375190839211553, "loss": 0.6956, "step": 2278 }, { "epoch": 0.26, "learning_rate": 0.00017372704283619706, "loss": 0.734, "step": 2279 }, { "epoch": 0.26, "learning_rate": 0.00017370216728899513, "loss": 0.6889, "step": 2280 }, { "epoch": 0.26, "learning_rate": 0.00017367728175388084, "loss": 0.6915, "step": 2281 }, { "epoch": 0.26, "learning_rate": 0.00017365238623422667, "loss": 0.6936, "step": 2282 }, { "epoch": 0.26, "learning_rate": 0.00017362748073340633, "loss": 0.6927, "step": 2283 }, { "epoch": 0.26, "learning_rate": 0.00017360256525479495, "loss": 0.665, "step": 2284 }, { "epoch": 0.26, "learning_rate": 0.000173577639801769, "loss": 0.702, "step": 2285 }, { "epoch": 0.26, "learning_rate": 0.00017355270437770636, "loss": 0.718, "step": 2286 }, { "epoch": 0.26, "learning_rate": 0.00017352775898598616, "loss": 0.7191, "step": 2287 }, { "epoch": 0.26, "learning_rate": 0.0001735028036299889, "loss": 0.7191, "step": 2288 }, { "epoch": 0.26, "learning_rate": 0.00017347783831309652, "loss": 0.7302, "step": 2289 }, { "epoch": 0.26, "learning_rate": 0.00017345286303869226, "loss": 0.6719, "step": 2290 }, { "epoch": 0.26, "learning_rate": 0.00017342787781016064, "loss": 0.7219, "step": 2291 }, { "epoch": 0.26, "learning_rate": 0.00017340288263088764, "loss": 0.6353, "step": 2292 }, { "epoch": 0.26, "learning_rate": 0.0001733778775042605, "loss": 0.6692, "step": 2293 }, { "epoch": 0.26, "learning_rate": 0.00017335286243366787, "loss": 0.7651, "step": 2294 }, { "epoch": 0.26, "learning_rate": 0.00017332783742249967, "loss": 0.6496, "step": 2295 }, { "epoch": 0.26, "learning_rate": 0.00017330280247414731, "loss": 0.7718, "step": 2296 }, { "epoch": 0.26, "learning_rate": 0.0001732777575920034, "loss": 0.7069, "step": 2297 }, { "epoch": 0.26, "learning_rate": 0.00017325270277946197, "loss": 0.6822, "step": 2298 }, { "epoch": 0.26, "learning_rate": 0.00017322763803991837, "loss": 0.7026, "step": 2299 }, { "epoch": 0.26, "learning_rate": 0.00017320256337676932, "loss": 0.6161, "step": 2300 }, { "epoch": 0.26, "learning_rate": 0.00017317747879341282, "loss": 0.6079, "step": 2301 }, { "epoch": 0.26, "learning_rate": 0.0001731523842932483, "loss": 0.6625, "step": 2302 }, { "epoch": 0.26, "learning_rate": 0.0001731272798796765, "loss": 0.6994, "step": 2303 }, { "epoch": 0.26, "learning_rate": 0.0001731021655560995, "loss": 0.5996, "step": 2304 }, { "epoch": 0.26, "learning_rate": 0.0001730770413259207, "loss": 0.6344, "step": 2305 }, { "epoch": 0.26, "learning_rate": 0.0001730519071925449, "loss": 0.679, "step": 2306 }, { "epoch": 0.26, "learning_rate": 0.00017302676315937817, "loss": 0.698, "step": 2307 }, { "epoch": 0.26, "learning_rate": 0.000173001609229828, "loss": 0.7198, "step": 2308 }, { "epoch": 0.26, "learning_rate": 0.00017297644540730317, "loss": 0.6966, "step": 2309 }, { "epoch": 0.26, "learning_rate": 0.00017295127169521376, "loss": 0.6564, "step": 2310 }, { "epoch": 0.26, "learning_rate": 0.00017292608809697132, "loss": 0.7116, "step": 2311 }, { "epoch": 0.26, "learning_rate": 0.0001729008946159886, "loss": 0.7411, "step": 2312 }, { "epoch": 0.26, "learning_rate": 0.00017287569125567977, "loss": 0.6164, "step": 2313 }, { "epoch": 0.26, "learning_rate": 0.00017285047801946033, "loss": 0.6847, "step": 2314 }, { "epoch": 0.26, "learning_rate": 0.0001728252549107471, "loss": 0.654, "step": 2315 }, { "epoch": 0.26, "learning_rate": 0.00017280002193295824, "loss": 0.6623, "step": 2316 }, { "epoch": 0.26, "learning_rate": 0.00017277477908951325, "loss": 0.69, "step": 2317 }, { "epoch": 0.26, "learning_rate": 0.00017274952638383302, "loss": 0.6618, "step": 2318 }, { "epoch": 0.26, "learning_rate": 0.00017272426381933963, "loss": 0.7572, "step": 2319 }, { "epoch": 0.26, "learning_rate": 0.0001726989913994567, "loss": 0.6788, "step": 2320 }, { "epoch": 0.26, "learning_rate": 0.000172673709127609, "loss": 0.7347, "step": 2321 }, { "epoch": 0.26, "learning_rate": 0.00017264841700722272, "loss": 0.7187, "step": 2322 }, { "epoch": 0.26, "learning_rate": 0.0001726231150417254, "loss": 0.7174, "step": 2323 }, { "epoch": 0.26, "learning_rate": 0.00017259780323454588, "loss": 0.6581, "step": 2324 }, { "epoch": 0.26, "learning_rate": 0.00017257248158911436, "loss": 0.7131, "step": 2325 }, { "epoch": 0.26, "learning_rate": 0.00017254715010886238, "loss": 0.6785, "step": 2326 }, { "epoch": 0.26, "learning_rate": 0.00017252180879722271, "loss": 0.6347, "step": 2327 }, { "epoch": 0.26, "learning_rate": 0.00017249645765762966, "loss": 0.7101, "step": 2328 }, { "epoch": 0.26, "learning_rate": 0.0001724710966935186, "loss": 0.669, "step": 2329 }, { "epoch": 0.26, "learning_rate": 0.00017244572590832647, "loss": 0.7214, "step": 2330 }, { "epoch": 0.26, "learning_rate": 0.00017242034530549148, "loss": 0.6641, "step": 2331 }, { "epoch": 0.27, "learning_rate": 0.000172394954888453, "loss": 0.7084, "step": 2332 }, { "epoch": 0.27, "learning_rate": 0.00017236955466065203, "loss": 0.7202, "step": 2333 }, { "epoch": 0.27, "learning_rate": 0.00017234414462553063, "loss": 0.6971, "step": 2334 }, { "epoch": 0.27, "learning_rate": 0.00017231872478653233, "loss": 0.6811, "step": 2335 }, { "epoch": 0.27, "learning_rate": 0.00017229329514710195, "loss": 0.6739, "step": 2336 }, { "epoch": 0.27, "learning_rate": 0.0001722678557106857, "loss": 0.6828, "step": 2337 }, { "epoch": 0.27, "learning_rate": 0.00017224240648073096, "loss": 0.6722, "step": 2338 }, { "epoch": 0.27, "learning_rate": 0.00017221694746068659, "loss": 0.7245, "step": 2339 }, { "epoch": 0.27, "learning_rate": 0.00017219147865400272, "loss": 0.7553, "step": 2340 }, { "epoch": 0.27, "learning_rate": 0.00017216600006413085, "loss": 0.6723, "step": 2341 }, { "epoch": 0.27, "learning_rate": 0.0001721405116945237, "loss": 0.6829, "step": 2342 }, { "epoch": 0.27, "learning_rate": 0.00017211501354863544, "loss": 0.6611, "step": 2343 }, { "epoch": 0.27, "learning_rate": 0.0001720895056299215, "loss": 0.6817, "step": 2344 }, { "epoch": 0.27, "learning_rate": 0.0001720639879418386, "loss": 0.6934, "step": 2345 }, { "epoch": 0.27, "learning_rate": 0.00017203846048784489, "loss": 0.6627, "step": 2346 }, { "epoch": 0.27, "learning_rate": 0.00017201292327139971, "loss": 0.7556, "step": 2347 }, { "epoch": 0.27, "learning_rate": 0.0001719873762959638, "loss": 0.6552, "step": 2348 }, { "epoch": 0.27, "learning_rate": 0.0001719618195649993, "loss": 0.7167, "step": 2349 }, { "epoch": 0.27, "learning_rate": 0.0001719362530819695, "loss": 0.712, "step": 2350 }, { "epoch": 0.27, "learning_rate": 0.00017191067685033912, "loss": 0.7666, "step": 2351 }, { "epoch": 0.27, "learning_rate": 0.0001718850908735742, "loss": 0.753, "step": 2352 }, { "epoch": 0.27, "learning_rate": 0.00017185949515514205, "loss": 0.7145, "step": 2353 }, { "epoch": 0.27, "learning_rate": 0.00017183388969851135, "loss": 0.7097, "step": 2354 }, { "epoch": 0.27, "learning_rate": 0.00017180827450715208, "loss": 0.6829, "step": 2355 }, { "epoch": 0.27, "learning_rate": 0.00017178264958453554, "loss": 0.6789, "step": 2356 }, { "epoch": 0.27, "learning_rate": 0.00017175701493413434, "loss": 0.6673, "step": 2357 }, { "epoch": 0.27, "learning_rate": 0.00017173137055942242, "loss": 0.667, "step": 2358 }, { "epoch": 0.27, "learning_rate": 0.00017170571646387504, "loss": 0.7273, "step": 2359 }, { "epoch": 0.27, "learning_rate": 0.00017168005265096877, "loss": 0.741, "step": 2360 }, { "epoch": 0.27, "learning_rate": 0.00017165437912418146, "loss": 0.704, "step": 2361 }, { "epoch": 0.27, "learning_rate": 0.00017162869588699238, "loss": 0.7532, "step": 2362 }, { "epoch": 0.27, "learning_rate": 0.00017160300294288204, "loss": 0.7263, "step": 2363 }, { "epoch": 0.27, "learning_rate": 0.0001715773002953322, "loss": 0.7078, "step": 2364 }, { "epoch": 0.27, "learning_rate": 0.0001715515879478261, "loss": 0.7089, "step": 2365 }, { "epoch": 0.27, "learning_rate": 0.00017152586590384817, "loss": 0.7162, "step": 2366 }, { "epoch": 0.27, "learning_rate": 0.0001715001341668842, "loss": 0.7303, "step": 2367 }, { "epoch": 0.27, "learning_rate": 0.00017147439274042126, "loss": 0.732, "step": 2368 }, { "epoch": 0.27, "learning_rate": 0.00017144864162794778, "loss": 0.7046, "step": 2369 }, { "epoch": 0.27, "learning_rate": 0.0001714228808329535, "loss": 0.6098, "step": 2370 }, { "epoch": 0.27, "learning_rate": 0.00017139711035892935, "loss": 0.7355, "step": 2371 }, { "epoch": 0.27, "learning_rate": 0.00017137133020936782, "loss": 0.6477, "step": 2372 }, { "epoch": 0.27, "learning_rate": 0.00017134554038776244, "loss": 0.7047, "step": 2373 }, { "epoch": 0.27, "learning_rate": 0.00017131974089760826, "loss": 0.688, "step": 2374 }, { "epoch": 0.27, "learning_rate": 0.0001712939317424015, "loss": 0.7104, "step": 2375 }, { "epoch": 0.27, "learning_rate": 0.0001712681129256398, "loss": 0.6924, "step": 2376 }, { "epoch": 0.27, "learning_rate": 0.00017124228445082194, "loss": 0.6843, "step": 2377 }, { "epoch": 0.27, "learning_rate": 0.00017121644632144827, "loss": 0.6753, "step": 2378 }, { "epoch": 0.27, "learning_rate": 0.0001711905985410202, "loss": 0.6223, "step": 2379 }, { "epoch": 0.27, "learning_rate": 0.00017116474111304058, "loss": 0.6403, "step": 2380 }, { "epoch": 0.27, "learning_rate": 0.00017113887404101354, "loss": 0.6894, "step": 2381 }, { "epoch": 0.27, "learning_rate": 0.00017111299732844453, "loss": 0.7733, "step": 2382 }, { "epoch": 0.27, "learning_rate": 0.00017108711097884026, "loss": 0.6278, "step": 2383 }, { "epoch": 0.27, "learning_rate": 0.00017106121499570878, "loss": 0.7592, "step": 2384 }, { "epoch": 0.27, "learning_rate": 0.00017103530938255947, "loss": 0.6687, "step": 2385 }, { "epoch": 0.27, "learning_rate": 0.00017100939414290296, "loss": 0.7104, "step": 2386 }, { "epoch": 0.27, "learning_rate": 0.00017098346928025123, "loss": 0.6864, "step": 2387 }, { "epoch": 0.27, "learning_rate": 0.0001709575347981175, "loss": 0.7385, "step": 2388 }, { "epoch": 0.27, "learning_rate": 0.00017093159070001636, "loss": 0.6284, "step": 2389 }, { "epoch": 0.27, "learning_rate": 0.00017090563698946373, "loss": 0.7239, "step": 2390 }, { "epoch": 0.27, "learning_rate": 0.00017087967366997674, "loss": 0.6978, "step": 2391 }, { "epoch": 0.27, "learning_rate": 0.00017085370074507386, "loss": 0.6656, "step": 2392 }, { "epoch": 0.27, "learning_rate": 0.0001708277182182749, "loss": 0.6415, "step": 2393 }, { "epoch": 0.27, "learning_rate": 0.0001708017260931009, "loss": 0.6838, "step": 2394 }, { "epoch": 0.27, "learning_rate": 0.00017077572437307426, "loss": 0.7206, "step": 2395 }, { "epoch": 0.27, "learning_rate": 0.0001707497130617187, "loss": 0.6655, "step": 2396 }, { "epoch": 0.27, "learning_rate": 0.00017072369216255913, "loss": 0.7119, "step": 2397 }, { "epoch": 0.27, "learning_rate": 0.00017069766167912188, "loss": 0.6662, "step": 2398 }, { "epoch": 0.27, "learning_rate": 0.00017067162161493447, "loss": 0.6571, "step": 2399 }, { "epoch": 0.27, "learning_rate": 0.00017064557197352586, "loss": 0.7189, "step": 2400 }, { "epoch": 0.27, "learning_rate": 0.0001706195127584262, "loss": 0.6311, "step": 2401 }, { "epoch": 0.27, "learning_rate": 0.0001705934439731669, "loss": 0.6889, "step": 2402 }, { "epoch": 0.27, "learning_rate": 0.0001705673656212808, "loss": 0.6921, "step": 2403 }, { "epoch": 0.27, "learning_rate": 0.00017054127770630193, "loss": 0.6503, "step": 2404 }, { "epoch": 0.27, "learning_rate": 0.00017051518023176567, "loss": 0.744, "step": 2405 }, { "epoch": 0.27, "learning_rate": 0.00017048907320120867, "loss": 0.6808, "step": 2406 }, { "epoch": 0.27, "learning_rate": 0.00017046295661816884, "loss": 0.7376, "step": 2407 }, { "epoch": 0.27, "learning_rate": 0.00017043683048618554, "loss": 0.7733, "step": 2408 }, { "epoch": 0.27, "learning_rate": 0.0001704106948087992, "loss": 0.7006, "step": 2409 }, { "epoch": 0.27, "learning_rate": 0.00017038454958955167, "loss": 0.7197, "step": 2410 }, { "epoch": 0.27, "learning_rate": 0.00017035839483198615, "loss": 0.7453, "step": 2411 }, { "epoch": 0.27, "learning_rate": 0.00017033223053964698, "loss": 0.6734, "step": 2412 }, { "epoch": 0.27, "learning_rate": 0.0001703060567160799, "loss": 0.7091, "step": 2413 }, { "epoch": 0.27, "learning_rate": 0.0001702798733648319, "loss": 0.6561, "step": 2414 }, { "epoch": 0.27, "learning_rate": 0.0001702536804894513, "loss": 0.6777, "step": 2415 }, { "epoch": 0.27, "learning_rate": 0.00017022747809348769, "loss": 0.6875, "step": 2416 }, { "epoch": 0.27, "learning_rate": 0.00017020126618049193, "loss": 0.6732, "step": 2417 }, { "epoch": 0.27, "learning_rate": 0.0001701750447540162, "loss": 0.6385, "step": 2418 }, { "epoch": 0.27, "learning_rate": 0.00017014881381761392, "loss": 0.6588, "step": 2419 }, { "epoch": 0.28, "learning_rate": 0.00017012257337483986, "loss": 0.6088, "step": 2420 }, { "epoch": 0.28, "learning_rate": 0.00017009632342925005, "loss": 0.7278, "step": 2421 }, { "epoch": 0.28, "learning_rate": 0.00017007006398440176, "loss": 0.761, "step": 2422 }, { "epoch": 0.28, "learning_rate": 0.0001700437950438537, "loss": 0.6765, "step": 2423 }, { "epoch": 0.28, "learning_rate": 0.00017001751661116567, "loss": 0.7016, "step": 2424 }, { "epoch": 0.28, "learning_rate": 0.00016999122868989895, "loss": 0.7087, "step": 2425 }, { "epoch": 0.28, "learning_rate": 0.00016996493128361586, "loss": 0.7209, "step": 2426 }, { "epoch": 0.28, "learning_rate": 0.00016993862439588025, "loss": 0.7356, "step": 2427 }, { "epoch": 0.28, "learning_rate": 0.00016991230803025718, "loss": 0.7002, "step": 2428 }, { "epoch": 0.28, "learning_rate": 0.00016988598219031288, "loss": 0.6929, "step": 2429 }, { "epoch": 0.28, "learning_rate": 0.00016985964687961507, "loss": 0.6878, "step": 2430 }, { "epoch": 0.28, "learning_rate": 0.0001698333021017325, "loss": 0.6452, "step": 2431 }, { "epoch": 0.28, "learning_rate": 0.00016980694786023544, "loss": 0.6783, "step": 2432 }, { "epoch": 0.28, "learning_rate": 0.00016978058415869534, "loss": 0.6875, "step": 2433 }, { "epoch": 0.28, "learning_rate": 0.0001697542110006849, "loss": 0.7088, "step": 2434 }, { "epoch": 0.28, "learning_rate": 0.00016972782838977813, "loss": 0.6565, "step": 2435 }, { "epoch": 0.28, "learning_rate": 0.00016970143632955037, "loss": 0.6872, "step": 2436 }, { "epoch": 0.28, "learning_rate": 0.00016967503482357815, "loss": 0.7441, "step": 2437 }, { "epoch": 0.28, "learning_rate": 0.00016964862387543937, "loss": 0.6544, "step": 2438 }, { "epoch": 0.28, "learning_rate": 0.00016962220348871315, "loss": 0.7532, "step": 2439 }, { "epoch": 0.28, "learning_rate": 0.0001695957736669799, "loss": 0.7075, "step": 2440 }, { "epoch": 0.28, "learning_rate": 0.00016956933441382134, "loss": 0.698, "step": 2441 }, { "epoch": 0.28, "learning_rate": 0.00016954288573282043, "loss": 0.6088, "step": 2442 }, { "epoch": 0.28, "learning_rate": 0.0001695164276275614, "loss": 0.6694, "step": 2443 }, { "epoch": 0.28, "learning_rate": 0.0001694899601016298, "loss": 0.5776, "step": 2444 }, { "epoch": 0.28, "learning_rate": 0.00016946348315861247, "loss": 0.6467, "step": 2445 }, { "epoch": 0.28, "learning_rate": 0.0001694369968020974, "loss": 0.7521, "step": 2446 }, { "epoch": 0.28, "learning_rate": 0.00016941050103567404, "loss": 0.7369, "step": 2447 }, { "epoch": 0.28, "learning_rate": 0.000169383995862933, "loss": 0.6493, "step": 2448 }, { "epoch": 0.28, "learning_rate": 0.00016935748128746612, "loss": 0.7052, "step": 2449 }, { "epoch": 0.28, "learning_rate": 0.00016933095731286668, "loss": 0.6927, "step": 2450 }, { "epoch": 0.28, "learning_rate": 0.0001693044239427291, "loss": 0.6662, "step": 2451 }, { "epoch": 0.28, "learning_rate": 0.00016927788118064905, "loss": 0.6683, "step": 2452 }, { "epoch": 0.28, "learning_rate": 0.0001692513290302236, "loss": 0.6719, "step": 2453 }, { "epoch": 0.28, "learning_rate": 0.00016922476749505098, "loss": 0.6703, "step": 2454 }, { "epoch": 0.28, "learning_rate": 0.0001691981965787308, "loss": 0.6431, "step": 2455 }, { "epoch": 0.28, "learning_rate": 0.00016917161628486382, "loss": 0.7085, "step": 2456 }, { "epoch": 0.28, "learning_rate": 0.00016914502661705214, "loss": 0.642, "step": 2457 }, { "epoch": 0.28, "learning_rate": 0.0001691184275788991, "loss": 0.705, "step": 2458 }, { "epoch": 0.28, "learning_rate": 0.00016909181917400937, "loss": 0.6296, "step": 2459 }, { "epoch": 0.28, "learning_rate": 0.0001690652014059888, "loss": 0.7052, "step": 2460 }, { "epoch": 0.28, "learning_rate": 0.00016903857427844459, "loss": 0.6958, "step": 2461 }, { "epoch": 0.28, "learning_rate": 0.00016901193779498517, "loss": 0.6746, "step": 2462 }, { "epoch": 0.28, "learning_rate": 0.00016898529195922022, "loss": 0.7047, "step": 2463 }, { "epoch": 0.28, "learning_rate": 0.00016895863677476075, "loss": 0.6758, "step": 2464 }, { "epoch": 0.28, "learning_rate": 0.00016893197224521894, "loss": 0.6624, "step": 2465 }, { "epoch": 0.28, "learning_rate": 0.00016890529837420835, "loss": 0.7298, "step": 2466 }, { "epoch": 0.28, "learning_rate": 0.00016887861516534368, "loss": 0.6598, "step": 2467 }, { "epoch": 0.28, "learning_rate": 0.00016885192262224106, "loss": 0.6605, "step": 2468 }, { "epoch": 0.28, "learning_rate": 0.0001688252207485177, "loss": 0.605, "step": 2469 }, { "epoch": 0.28, "learning_rate": 0.0001687985095477922, "loss": 0.6957, "step": 2470 }, { "epoch": 0.28, "learning_rate": 0.00016877178902368443, "loss": 0.6611, "step": 2471 }, { "epoch": 0.28, "learning_rate": 0.0001687450591798154, "loss": 0.7047, "step": 2472 }, { "epoch": 0.28, "learning_rate": 0.00016871832001980752, "loss": 0.7459, "step": 2473 }, { "epoch": 0.28, "learning_rate": 0.00016869157154728436, "loss": 0.7093, "step": 2474 }, { "epoch": 0.28, "learning_rate": 0.00016866481376587083, "loss": 0.6797, "step": 2475 }, { "epoch": 0.28, "learning_rate": 0.0001686380466791931, "loss": 0.6516, "step": 2476 }, { "epoch": 0.28, "learning_rate": 0.0001686112702908785, "loss": 0.5928, "step": 2477 }, { "epoch": 0.28, "learning_rate": 0.00016858448460455575, "loss": 0.6987, "step": 2478 }, { "epoch": 0.28, "learning_rate": 0.00016855768962385477, "loss": 0.7643, "step": 2479 }, { "epoch": 0.28, "learning_rate": 0.00016853088535240666, "loss": 0.6585, "step": 2480 }, { "epoch": 0.28, "learning_rate": 0.00016850407179384397, "loss": 0.6997, "step": 2481 }, { "epoch": 0.28, "learning_rate": 0.00016847724895180038, "loss": 0.6938, "step": 2482 }, { "epoch": 0.28, "learning_rate": 0.00016845041682991076, "loss": 0.6866, "step": 2483 }, { "epoch": 0.28, "learning_rate": 0.00016842357543181137, "loss": 0.6859, "step": 2484 }, { "epoch": 0.28, "learning_rate": 0.00016839672476113974, "loss": 0.6859, "step": 2485 }, { "epoch": 0.28, "learning_rate": 0.0001683698648215345, "loss": 0.7046, "step": 2486 }, { "epoch": 0.28, "learning_rate": 0.00016834299561663575, "loss": 0.6646, "step": 2487 }, { "epoch": 0.28, "learning_rate": 0.00016831611715008462, "loss": 0.7525, "step": 2488 }, { "epoch": 0.28, "learning_rate": 0.00016828922942552368, "loss": 0.6942, "step": 2489 }, { "epoch": 0.28, "learning_rate": 0.00016826233244659661, "loss": 0.6967, "step": 2490 }, { "epoch": 0.28, "learning_rate": 0.0001682354262169485, "loss": 0.6476, "step": 2491 }, { "epoch": 0.28, "learning_rate": 0.00016820851074022554, "loss": 0.6748, "step": 2492 }, { "epoch": 0.28, "learning_rate": 0.0001681815860200753, "loss": 0.6689, "step": 2493 }, { "epoch": 0.28, "learning_rate": 0.00016815465206014641, "loss": 0.7268, "step": 2494 }, { "epoch": 0.28, "learning_rate": 0.00016812770886408905, "loss": 0.7833, "step": 2495 }, { "epoch": 0.28, "learning_rate": 0.00016810075643555438, "loss": 0.6794, "step": 2496 }, { "epoch": 0.28, "learning_rate": 0.00016807379477819497, "loss": 0.6926, "step": 2497 }, { "epoch": 0.28, "learning_rate": 0.0001680468238956646, "loss": 0.7425, "step": 2498 }, { "epoch": 0.28, "learning_rate": 0.00016801984379161825, "loss": 0.6507, "step": 2499 }, { "epoch": 0.28, "learning_rate": 0.00016799285446971216, "loss": 0.6414, "step": 2500 }, { "epoch": 0.28, "learning_rate": 0.00016796585593360392, "loss": 0.7045, "step": 2501 }, { "epoch": 0.28, "learning_rate": 0.00016793884818695225, "loss": 0.6878, "step": 2502 }, { "epoch": 0.28, "learning_rate": 0.0001679118312334172, "loss": 0.7455, "step": 2503 }, { "epoch": 0.28, "learning_rate": 0.00016788480507665997, "loss": 0.5972, "step": 2504 }, { "epoch": 0.28, "learning_rate": 0.00016785776972034317, "loss": 0.6826, "step": 2505 }, { "epoch": 0.28, "learning_rate": 0.00016783072516813046, "loss": 0.7273, "step": 2506 }, { "epoch": 0.28, "learning_rate": 0.00016780367142368686, "loss": 0.6786, "step": 2507 }, { "epoch": 0.29, "learning_rate": 0.00016777660849067868, "loss": 0.6572, "step": 2508 }, { "epoch": 0.29, "learning_rate": 0.00016774953637277334, "loss": 0.689, "step": 2509 }, { "epoch": 0.29, "learning_rate": 0.00016772245507363964, "loss": 0.6667, "step": 2510 }, { "epoch": 0.29, "learning_rate": 0.0001676953645969475, "loss": 0.6334, "step": 2511 }, { "epoch": 0.29, "learning_rate": 0.0001676682649463682, "loss": 0.6064, "step": 2512 }, { "epoch": 0.29, "learning_rate": 0.0001676411561255742, "loss": 0.7131, "step": 2513 }, { "epoch": 0.29, "learning_rate": 0.00016761403813823913, "loss": 0.7593, "step": 2514 }, { "epoch": 0.29, "learning_rate": 0.00016758691098803805, "loss": 0.6514, "step": 2515 }, { "epoch": 0.29, "learning_rate": 0.00016755977467864714, "loss": 0.6778, "step": 2516 }, { "epoch": 0.29, "learning_rate": 0.0001675326292137438, "loss": 0.7079, "step": 2517 }, { "epoch": 0.29, "learning_rate": 0.0001675054745970067, "loss": 0.7239, "step": 2518 }, { "epoch": 0.29, "learning_rate": 0.0001674783108321158, "loss": 0.6712, "step": 2519 }, { "epoch": 0.29, "learning_rate": 0.00016745113792275223, "loss": 0.6826, "step": 2520 }, { "epoch": 0.29, "learning_rate": 0.0001674239558725984, "loss": 0.6571, "step": 2521 }, { "epoch": 0.29, "learning_rate": 0.00016739676468533797, "loss": 0.6822, "step": 2522 }, { "epoch": 0.29, "learning_rate": 0.00016736956436465573, "loss": 0.7098, "step": 2523 }, { "epoch": 0.29, "learning_rate": 0.00016734235491423788, "loss": 0.7114, "step": 2524 }, { "epoch": 0.29, "learning_rate": 0.0001673151363377717, "loss": 0.6652, "step": 2525 }, { "epoch": 0.29, "learning_rate": 0.00016728790863894586, "loss": 0.689, "step": 2526 }, { "epoch": 0.29, "learning_rate": 0.00016726067182145008, "loss": 0.6583, "step": 2527 }, { "epoch": 0.29, "learning_rate": 0.00016723342588897554, "loss": 0.7338, "step": 2528 }, { "epoch": 0.29, "learning_rate": 0.0001672061708452144, "loss": 0.6736, "step": 2529 }, { "epoch": 0.29, "learning_rate": 0.00016717890669386027, "loss": 0.7327, "step": 2530 }, { "epoch": 0.29, "learning_rate": 0.0001671516334386079, "loss": 0.7045, "step": 2531 }, { "epoch": 0.29, "learning_rate": 0.00016712435108315327, "loss": 0.7039, "step": 2532 }, { "epoch": 0.29, "learning_rate": 0.00016709705963119365, "loss": 0.7479, "step": 2533 }, { "epoch": 0.29, "learning_rate": 0.00016706975908642742, "loss": 0.7392, "step": 2534 }, { "epoch": 0.29, "learning_rate": 0.00016704244945255433, "loss": 0.6987, "step": 2535 }, { "epoch": 0.29, "learning_rate": 0.00016701513073327532, "loss": 0.6692, "step": 2536 }, { "epoch": 0.29, "learning_rate": 0.00016698780293229252, "loss": 0.7095, "step": 2537 }, { "epoch": 0.29, "learning_rate": 0.0001669604660533093, "loss": 0.6975, "step": 2538 }, { "epoch": 0.29, "learning_rate": 0.00016693312010003034, "loss": 0.6866, "step": 2539 }, { "epoch": 0.29, "learning_rate": 0.0001669057650761614, "loss": 0.717, "step": 2540 }, { "epoch": 0.29, "learning_rate": 0.00016687840098540961, "loss": 0.6837, "step": 2541 }, { "epoch": 0.29, "learning_rate": 0.0001668510278314833, "loss": 0.6486, "step": 2542 }, { "epoch": 0.29, "learning_rate": 0.00016682364561809197, "loss": 0.6598, "step": 2543 }, { "epoch": 0.29, "learning_rate": 0.00016679625434894634, "loss": 0.7316, "step": 2544 }, { "epoch": 0.29, "learning_rate": 0.00016676885402775848, "loss": 0.7196, "step": 2545 }, { "epoch": 0.29, "learning_rate": 0.00016674144465824155, "loss": 0.7083, "step": 2546 }, { "epoch": 0.29, "learning_rate": 0.00016671402624411004, "loss": 0.6901, "step": 2547 }, { "epoch": 0.29, "learning_rate": 0.00016668659878907955, "loss": 0.5847, "step": 2548 }, { "epoch": 0.29, "learning_rate": 0.000166659162296867, "loss": 0.6506, "step": 2549 }, { "epoch": 0.29, "learning_rate": 0.00016663171677119056, "loss": 0.6718, "step": 2550 }, { "epoch": 0.29, "learning_rate": 0.0001666042622157695, "loss": 0.7556, "step": 2551 }, { "epoch": 0.29, "learning_rate": 0.00016657679863432438, "loss": 0.6584, "step": 2552 }, { "epoch": 0.29, "learning_rate": 0.0001665493260305771, "loss": 0.7158, "step": 2553 }, { "epoch": 0.29, "learning_rate": 0.0001665218444082505, "loss": 0.6195, "step": 2554 }, { "epoch": 0.29, "learning_rate": 0.00016649435377106894, "loss": 0.703, "step": 2555 }, { "epoch": 0.29, "learning_rate": 0.00016646685412275786, "loss": 0.677, "step": 2556 }, { "epoch": 0.29, "learning_rate": 0.00016643934546704388, "loss": 0.7167, "step": 2557 }, { "epoch": 0.29, "learning_rate": 0.00016641182780765496, "loss": 0.6421, "step": 2558 }, { "epoch": 0.29, "learning_rate": 0.00016638430114832015, "loss": 0.642, "step": 2559 }, { "epoch": 0.29, "learning_rate": 0.00016635676549276983, "loss": 0.6559, "step": 2560 }, { "epoch": 0.29, "learning_rate": 0.00016632922084473556, "loss": 0.7806, "step": 2561 }, { "epoch": 0.29, "learning_rate": 0.00016630166720795012, "loss": 0.7242, "step": 2562 }, { "epoch": 0.29, "learning_rate": 0.00016627410458614744, "loss": 0.7436, "step": 2563 }, { "epoch": 0.29, "learning_rate": 0.00016624653298306282, "loss": 0.71, "step": 2564 }, { "epoch": 0.29, "learning_rate": 0.0001662189524024326, "loss": 0.6303, "step": 2565 }, { "epoch": 0.29, "learning_rate": 0.00016619136284799448, "loss": 0.6529, "step": 2566 }, { "epoch": 0.29, "learning_rate": 0.00016616376432348733, "loss": 0.7232, "step": 2567 }, { "epoch": 0.29, "learning_rate": 0.00016613615683265116, "loss": 0.6971, "step": 2568 }, { "epoch": 0.29, "learning_rate": 0.0001661085403792273, "loss": 0.6867, "step": 2569 }, { "epoch": 0.29, "learning_rate": 0.00016608091496695825, "loss": 0.6597, "step": 2570 }, { "epoch": 0.29, "learning_rate": 0.00016605328059958775, "loss": 0.6955, "step": 2571 }, { "epoch": 0.29, "learning_rate": 0.0001660256372808607, "loss": 0.6932, "step": 2572 }, { "epoch": 0.29, "learning_rate": 0.00016599798501452327, "loss": 0.6924, "step": 2573 }, { "epoch": 0.29, "learning_rate": 0.00016597032380432278, "loss": 0.6743, "step": 2574 }, { "epoch": 0.29, "learning_rate": 0.00016594265365400785, "loss": 0.6888, "step": 2575 }, { "epoch": 0.29, "learning_rate": 0.00016591497456732826, "loss": 0.6752, "step": 2576 }, { "epoch": 0.29, "learning_rate": 0.00016588728654803493, "loss": 0.7148, "step": 2577 }, { "epoch": 0.29, "learning_rate": 0.00016585958959988018, "loss": 0.6961, "step": 2578 }, { "epoch": 0.29, "learning_rate": 0.00016583188372661732, "loss": 0.712, "step": 2579 }, { "epoch": 0.29, "learning_rate": 0.00016580416893200104, "loss": 0.7219, "step": 2580 }, { "epoch": 0.29, "learning_rate": 0.0001657764452197871, "loss": 0.6416, "step": 2581 }, { "epoch": 0.29, "learning_rate": 0.00016574871259373262, "loss": 0.658, "step": 2582 }, { "epoch": 0.29, "learning_rate": 0.00016572097105759578, "loss": 0.6967, "step": 2583 }, { "epoch": 0.29, "learning_rate": 0.0001656932206151361, "loss": 0.6743, "step": 2584 }, { "epoch": 0.29, "learning_rate": 0.0001656654612701142, "loss": 0.6234, "step": 2585 }, { "epoch": 0.29, "learning_rate": 0.00016563769302629195, "loss": 0.7108, "step": 2586 }, { "epoch": 0.29, "learning_rate": 0.00016560991588743243, "loss": 0.7008, "step": 2587 }, { "epoch": 0.29, "learning_rate": 0.00016558212985729994, "loss": 0.7304, "step": 2588 }, { "epoch": 0.29, "learning_rate": 0.00016555433493965996, "loss": 0.6925, "step": 2589 }, { "epoch": 0.29, "learning_rate": 0.00016552653113827915, "loss": 0.6905, "step": 2590 }, { "epoch": 0.29, "learning_rate": 0.00016549871845692542, "loss": 0.6421, "step": 2591 }, { "epoch": 0.29, "learning_rate": 0.00016547089689936784, "loss": 0.7065, "step": 2592 }, { "epoch": 0.29, "learning_rate": 0.0001654430664693768, "loss": 0.7099, "step": 2593 }, { "epoch": 0.29, "learning_rate": 0.00016541522717072372, "loss": 0.6845, "step": 2594 }, { "epoch": 0.29, "learning_rate": 0.00016538737900718132, "loss": 0.7239, "step": 2595 }, { "epoch": 0.3, "learning_rate": 0.00016535952198252357, "loss": 0.6103, "step": 2596 }, { "epoch": 0.3, "learning_rate": 0.00016533165610052545, "loss": 0.687, "step": 2597 }, { "epoch": 0.3, "learning_rate": 0.00016530378136496335, "loss": 0.6971, "step": 2598 }, { "epoch": 0.3, "learning_rate": 0.00016527589777961478, "loss": 0.6475, "step": 2599 }, { "epoch": 0.3, "learning_rate": 0.0001652480053482584, "loss": 0.6398, "step": 2600 }, { "epoch": 0.3, "learning_rate": 0.00016522010407467414, "loss": 0.6978, "step": 2601 }, { "epoch": 0.3, "learning_rate": 0.00016519219396264316, "loss": 0.7031, "step": 2602 }, { "epoch": 0.3, "learning_rate": 0.00016516427501594766, "loss": 0.7142, "step": 2603 }, { "epoch": 0.3, "learning_rate": 0.00016513634723837117, "loss": 0.703, "step": 2604 }, { "epoch": 0.3, "learning_rate": 0.00016510841063369845, "loss": 0.7242, "step": 2605 }, { "epoch": 0.3, "learning_rate": 0.0001650804652057153, "loss": 0.7222, "step": 2606 }, { "epoch": 0.3, "learning_rate": 0.00016505251095820888, "loss": 0.6873, "step": 2607 }, { "epoch": 0.3, "learning_rate": 0.0001650245478949674, "loss": 0.6893, "step": 2608 }, { "epoch": 0.3, "learning_rate": 0.00016499657601978037, "loss": 0.7062, "step": 2609 }, { "epoch": 0.3, "learning_rate": 0.00016496859533643852, "loss": 0.6662, "step": 2610 }, { "epoch": 0.3, "learning_rate": 0.0001649406058487336, "loss": 0.7087, "step": 2611 }, { "epoch": 0.3, "learning_rate": 0.00016491260756045875, "loss": 0.672, "step": 2612 }, { "epoch": 0.3, "learning_rate": 0.00016488460047540818, "loss": 0.7532, "step": 2613 }, { "epoch": 0.3, "learning_rate": 0.00016485658459737738, "loss": 0.7048, "step": 2614 }, { "epoch": 0.3, "learning_rate": 0.00016482855993016292, "loss": 0.7229, "step": 2615 }, { "epoch": 0.3, "learning_rate": 0.00016480052647756268, "loss": 0.7213, "step": 2616 }, { "epoch": 0.3, "learning_rate": 0.00016477248424337564, "loss": 0.7597, "step": 2617 }, { "epoch": 0.3, "learning_rate": 0.00016474443323140204, "loss": 0.7351, "step": 2618 }, { "epoch": 0.3, "learning_rate": 0.00016471637344544324, "loss": 0.7067, "step": 2619 }, { "epoch": 0.3, "learning_rate": 0.0001646883048893018, "loss": 0.6735, "step": 2620 }, { "epoch": 0.3, "learning_rate": 0.00016466022756678157, "loss": 0.6383, "step": 2621 }, { "epoch": 0.3, "learning_rate": 0.00016463214148168745, "loss": 0.6793, "step": 2622 }, { "epoch": 0.3, "learning_rate": 0.00016460404663782563, "loss": 0.664, "step": 2623 }, { "epoch": 0.3, "learning_rate": 0.00016457594303900344, "loss": 0.6626, "step": 2624 }, { "epoch": 0.3, "learning_rate": 0.00016454783068902933, "loss": 0.7371, "step": 2625 }, { "epoch": 0.3, "learning_rate": 0.00016451970959171307, "loss": 0.6955, "step": 2626 }, { "epoch": 0.3, "learning_rate": 0.00016449157975086557, "loss": 0.6586, "step": 2627 }, { "epoch": 0.3, "learning_rate": 0.0001644634411702989, "loss": 0.7221, "step": 2628 }, { "epoch": 0.3, "learning_rate": 0.00016443529385382622, "loss": 0.6776, "step": 2629 }, { "epoch": 0.3, "learning_rate": 0.00016440713780526217, "loss": 0.6965, "step": 2630 }, { "epoch": 0.3, "learning_rate": 0.0001643789730284222, "loss": 0.6801, "step": 2631 }, { "epoch": 0.3, "learning_rate": 0.00016435079952712317, "loss": 0.6795, "step": 2632 }, { "epoch": 0.3, "learning_rate": 0.00016432261730518316, "loss": 0.7002, "step": 2633 }, { "epoch": 0.3, "learning_rate": 0.00016429442636642125, "loss": 0.7485, "step": 2634 }, { "epoch": 0.3, "learning_rate": 0.00016426622671465783, "loss": 0.7406, "step": 2635 }, { "epoch": 0.3, "learning_rate": 0.00016423801835371444, "loss": 0.6065, "step": 2636 }, { "epoch": 0.3, "learning_rate": 0.0001642098012874138, "loss": 0.6332, "step": 2637 }, { "epoch": 0.3, "learning_rate": 0.00016418157551957978, "loss": 0.6834, "step": 2638 }, { "epoch": 0.3, "learning_rate": 0.0001641533410540375, "loss": 0.6991, "step": 2639 }, { "epoch": 0.3, "learning_rate": 0.00016412509789461322, "loss": 0.6689, "step": 2640 }, { "epoch": 0.3, "learning_rate": 0.0001640968460451343, "loss": 0.6897, "step": 2641 }, { "epoch": 0.3, "learning_rate": 0.00016406858550942945, "loss": 0.711, "step": 2642 }, { "epoch": 0.3, "learning_rate": 0.0001640403162913284, "loss": 0.6905, "step": 2643 }, { "epoch": 0.3, "learning_rate": 0.00016401203839466213, "loss": 0.7047, "step": 2644 }, { "epoch": 0.3, "learning_rate": 0.00016398375182326278, "loss": 0.7192, "step": 2645 }, { "epoch": 0.3, "learning_rate": 0.00016395545658096365, "loss": 0.7057, "step": 2646 }, { "epoch": 0.3, "learning_rate": 0.00016392715267159926, "loss": 0.6795, "step": 2647 }, { "epoch": 0.3, "learning_rate": 0.00016389884009900528, "loss": 0.6445, "step": 2648 }, { "epoch": 0.3, "learning_rate": 0.0001638705188670185, "loss": 0.7248, "step": 2649 }, { "epoch": 0.3, "learning_rate": 0.000163842188979477, "loss": 0.7027, "step": 2650 }, { "epoch": 0.3, "learning_rate": 0.00016381385044021994, "loss": 0.7378, "step": 2651 }, { "epoch": 0.3, "learning_rate": 0.00016378550325308767, "loss": 0.7144, "step": 2652 }, { "epoch": 0.3, "learning_rate": 0.00016375714742192175, "loss": 0.6772, "step": 2653 }, { "epoch": 0.3, "learning_rate": 0.00016372878295056487, "loss": 0.755, "step": 2654 }, { "epoch": 0.3, "learning_rate": 0.00016370040984286087, "loss": 0.7309, "step": 2655 }, { "epoch": 0.3, "learning_rate": 0.00016367202810265485, "loss": 0.5871, "step": 2656 }, { "epoch": 0.3, "learning_rate": 0.00016364363773379296, "loss": 0.6976, "step": 2657 }, { "epoch": 0.3, "learning_rate": 0.00016361523874012265, "loss": 0.7166, "step": 2658 }, { "epoch": 0.3, "learning_rate": 0.00016358683112549245, "loss": 0.7041, "step": 2659 }, { "epoch": 0.3, "learning_rate": 0.00016355841489375207, "loss": 0.7263, "step": 2660 }, { "epoch": 0.3, "learning_rate": 0.0001635299900487524, "loss": 0.6951, "step": 2661 }, { "epoch": 0.3, "learning_rate": 0.0001635015565943455, "loss": 0.6904, "step": 2662 }, { "epoch": 0.3, "learning_rate": 0.00016347311453438455, "loss": 0.7119, "step": 2663 }, { "epoch": 0.3, "learning_rate": 0.00016344466387272405, "loss": 0.762, "step": 2664 }, { "epoch": 0.3, "learning_rate": 0.00016341620461321946, "loss": 0.6483, "step": 2665 }, { "epoch": 0.3, "learning_rate": 0.0001633877367597275, "loss": 0.7175, "step": 2666 }, { "epoch": 0.3, "learning_rate": 0.0001633592603161061, "loss": 0.6629, "step": 2667 }, { "epoch": 0.3, "learning_rate": 0.00016333077528621427, "loss": 0.6685, "step": 2668 }, { "epoch": 0.3, "learning_rate": 0.00016330228167391224, "loss": 0.7221, "step": 2669 }, { "epoch": 0.3, "learning_rate": 0.0001632737794830614, "loss": 0.6657, "step": 2670 }, { "epoch": 0.3, "learning_rate": 0.00016324526871752427, "loss": 0.7255, "step": 2671 }, { "epoch": 0.3, "learning_rate": 0.00016321674938116453, "loss": 0.7211, "step": 2672 }, { "epoch": 0.3, "learning_rate": 0.00016318822147784706, "loss": 0.6243, "step": 2673 }, { "epoch": 0.3, "learning_rate": 0.00016315968501143791, "loss": 0.6851, "step": 2674 }, { "epoch": 0.3, "learning_rate": 0.0001631311399858042, "loss": 0.6778, "step": 2675 }, { "epoch": 0.3, "learning_rate": 0.00016310258640481434, "loss": 0.685, "step": 2676 }, { "epoch": 0.3, "learning_rate": 0.0001630740242723378, "loss": 0.7035, "step": 2677 }, { "epoch": 0.3, "learning_rate": 0.0001630454535922452, "loss": 0.6756, "step": 2678 }, { "epoch": 0.3, "learning_rate": 0.00016301687436840847, "loss": 0.6704, "step": 2679 }, { "epoch": 0.3, "learning_rate": 0.00016298828660470048, "loss": 0.709, "step": 2680 }, { "epoch": 0.3, "learning_rate": 0.00016295969030499539, "loss": 0.6356, "step": 2681 }, { "epoch": 0.3, "learning_rate": 0.0001629310854731685, "loss": 0.6211, "step": 2682 }, { "epoch": 0.3, "learning_rate": 0.0001629024721130963, "loss": 0.6148, "step": 2683 }, { "epoch": 0.31, "learning_rate": 0.0001628738502286563, "loss": 0.6639, "step": 2684 }, { "epoch": 0.31, "learning_rate": 0.0001628452198237273, "loss": 0.6884, "step": 2685 }, { "epoch": 0.31, "learning_rate": 0.00016281658090218926, "loss": 0.6469, "step": 2686 }, { "epoch": 0.31, "learning_rate": 0.0001627879334679232, "loss": 0.6501, "step": 2687 }, { "epoch": 0.31, "learning_rate": 0.00016275927752481132, "loss": 0.646, "step": 2688 }, { "epoch": 0.31, "learning_rate": 0.00016273061307673706, "loss": 0.6955, "step": 2689 }, { "epoch": 0.31, "learning_rate": 0.0001627019401275849, "loss": 0.7876, "step": 2690 }, { "epoch": 0.31, "learning_rate": 0.00016267325868124052, "loss": 0.6999, "step": 2691 }, { "epoch": 0.31, "learning_rate": 0.00016264456874159075, "loss": 0.7242, "step": 2692 }, { "epoch": 0.31, "learning_rate": 0.00016261587031252361, "loss": 0.6964, "step": 2693 }, { "epoch": 0.31, "learning_rate": 0.00016258716339792817, "loss": 0.6052, "step": 2694 }, { "epoch": 0.31, "learning_rate": 0.00016255844800169473, "loss": 0.7035, "step": 2695 }, { "epoch": 0.31, "learning_rate": 0.00016252972412771476, "loss": 0.6499, "step": 2696 }, { "epoch": 0.31, "learning_rate": 0.0001625009917798808, "loss": 0.6407, "step": 2697 }, { "epoch": 0.31, "learning_rate": 0.00016247225096208655, "loss": 0.6843, "step": 2698 }, { "epoch": 0.31, "learning_rate": 0.00016244350167822697, "loss": 0.734, "step": 2699 }, { "epoch": 0.31, "learning_rate": 0.000162414743932198, "loss": 0.7138, "step": 2700 }, { "epoch": 0.31, "learning_rate": 0.00016238597772789688, "loss": 0.7024, "step": 2701 }, { "epoch": 0.31, "learning_rate": 0.00016235720306922188, "loss": 0.6803, "step": 2702 }, { "epoch": 0.31, "learning_rate": 0.00016232841996007246, "loss": 0.7416, "step": 2703 }, { "epoch": 0.31, "learning_rate": 0.00016229962840434925, "loss": 0.6865, "step": 2704 }, { "epoch": 0.31, "learning_rate": 0.00016227082840595397, "loss": 0.719, "step": 2705 }, { "epoch": 0.31, "learning_rate": 0.00016224201996878956, "loss": 0.6672, "step": 2706 }, { "epoch": 0.31, "learning_rate": 0.00016221320309676003, "loss": 0.6591, "step": 2707 }, { "epoch": 0.31, "learning_rate": 0.00016218437779377058, "loss": 0.6733, "step": 2708 }, { "epoch": 0.31, "learning_rate": 0.0001621555440637275, "loss": 0.7187, "step": 2709 }, { "epoch": 0.31, "learning_rate": 0.0001621267019105383, "loss": 0.6674, "step": 2710 }, { "epoch": 0.31, "learning_rate": 0.00016209785133811154, "loss": 0.7908, "step": 2711 }, { "epoch": 0.31, "learning_rate": 0.00016206899235035702, "loss": 0.7115, "step": 2712 }, { "epoch": 0.31, "learning_rate": 0.0001620401249511856, "loss": 0.6707, "step": 2713 }, { "epoch": 0.31, "learning_rate": 0.0001620112491445093, "loss": 0.6708, "step": 2714 }, { "epoch": 0.31, "learning_rate": 0.0001619823649342413, "loss": 0.6922, "step": 2715 }, { "epoch": 0.31, "learning_rate": 0.00016195347232429597, "loss": 0.6966, "step": 2716 }, { "epoch": 0.31, "learning_rate": 0.00016192457131858863, "loss": 0.6555, "step": 2717 }, { "epoch": 0.31, "learning_rate": 0.00016189566192103598, "loss": 0.6754, "step": 2718 }, { "epoch": 0.31, "learning_rate": 0.00016186674413555565, "loss": 0.6765, "step": 2719 }, { "epoch": 0.31, "learning_rate": 0.00016183781796606656, "loss": 0.6375, "step": 2720 }, { "epoch": 0.31, "learning_rate": 0.0001618088834164887, "loss": 0.728, "step": 2721 }, { "epoch": 0.31, "learning_rate": 0.00016177994049074314, "loss": 0.6896, "step": 2722 }, { "epoch": 0.31, "learning_rate": 0.00016175098919275223, "loss": 0.6791, "step": 2723 }, { "epoch": 0.31, "learning_rate": 0.00016172202952643934, "loss": 0.7159, "step": 2724 }, { "epoch": 0.31, "learning_rate": 0.00016169306149572897, "loss": 0.7371, "step": 2725 }, { "epoch": 0.31, "learning_rate": 0.00016166408510454678, "loss": 0.6291, "step": 2726 }, { "epoch": 0.31, "learning_rate": 0.00016163510035681962, "loss": 0.7317, "step": 2727 }, { "epoch": 0.31, "learning_rate": 0.0001616061072564754, "loss": 0.6938, "step": 2728 }, { "epoch": 0.31, "learning_rate": 0.0001615771058074432, "loss": 0.7291, "step": 2729 }, { "epoch": 0.31, "learning_rate": 0.00016154809601365318, "loss": 0.6831, "step": 2730 }, { "epoch": 0.31, "learning_rate": 0.0001615190778790367, "loss": 0.7165, "step": 2731 }, { "epoch": 0.31, "learning_rate": 0.0001614900514075262, "loss": 0.6767, "step": 2732 }, { "epoch": 0.31, "learning_rate": 0.00016146101660305525, "loss": 0.674, "step": 2733 }, { "epoch": 0.31, "learning_rate": 0.00016143197346955862, "loss": 0.6469, "step": 2734 }, { "epoch": 0.31, "learning_rate": 0.0001614029220109721, "loss": 0.7141, "step": 2735 }, { "epoch": 0.31, "learning_rate": 0.00016137386223123268, "loss": 0.7056, "step": 2736 }, { "epoch": 0.31, "learning_rate": 0.00016134479413427844, "loss": 0.6751, "step": 2737 }, { "epoch": 0.31, "learning_rate": 0.0001613157177240487, "loss": 0.67, "step": 2738 }, { "epoch": 0.31, "learning_rate": 0.00016128663300448367, "loss": 0.7151, "step": 2739 }, { "epoch": 0.31, "learning_rate": 0.00016125753997952495, "loss": 0.7123, "step": 2740 }, { "epoch": 0.31, "learning_rate": 0.0001612284386531151, "loss": 0.6743, "step": 2741 }, { "epoch": 0.31, "learning_rate": 0.00016119932902919782, "loss": 0.6629, "step": 2742 }, { "epoch": 0.31, "learning_rate": 0.000161170211111718, "loss": 0.7434, "step": 2743 }, { "epoch": 0.31, "learning_rate": 0.00016114108490462164, "loss": 0.7706, "step": 2744 }, { "epoch": 0.31, "learning_rate": 0.0001611119504118558, "loss": 0.588, "step": 2745 }, { "epoch": 0.31, "learning_rate": 0.0001610828076373687, "loss": 0.7061, "step": 2746 }, { "epoch": 0.31, "learning_rate": 0.00016105365658510977, "loss": 0.7202, "step": 2747 }, { "epoch": 0.31, "learning_rate": 0.0001610244972590294, "loss": 0.6648, "step": 2748 }, { "epoch": 0.31, "learning_rate": 0.00016099532966307916, "loss": 0.6862, "step": 2749 }, { "epoch": 0.31, "learning_rate": 0.00016096615380121185, "loss": 0.7333, "step": 2750 }, { "epoch": 0.31, "learning_rate": 0.0001609369696773812, "loss": 0.6455, "step": 2751 }, { "epoch": 0.31, "learning_rate": 0.00016090777729554226, "loss": 0.621, "step": 2752 }, { "epoch": 0.31, "learning_rate": 0.00016087857665965106, "loss": 0.7134, "step": 2753 }, { "epoch": 0.31, "learning_rate": 0.00016084936777366476, "loss": 0.751, "step": 2754 }, { "epoch": 0.31, "learning_rate": 0.0001608201506415417, "loss": 0.6866, "step": 2755 }, { "epoch": 0.31, "learning_rate": 0.00016079092526724128, "loss": 0.6677, "step": 2756 }, { "epoch": 0.31, "learning_rate": 0.00016076169165472407, "loss": 0.6439, "step": 2757 }, { "epoch": 0.31, "learning_rate": 0.0001607324498079517, "loss": 0.681, "step": 2758 }, { "epoch": 0.31, "learning_rate": 0.000160703199730887, "loss": 0.6229, "step": 2759 }, { "epoch": 0.31, "learning_rate": 0.00016067394142749378, "loss": 0.6529, "step": 2760 }, { "epoch": 0.31, "learning_rate": 0.00016064467490173708, "loss": 0.7371, "step": 2761 }, { "epoch": 0.31, "learning_rate": 0.000160615400157583, "loss": 0.6679, "step": 2762 }, { "epoch": 0.31, "learning_rate": 0.00016058611719899882, "loss": 0.6924, "step": 2763 }, { "epoch": 0.31, "learning_rate": 0.00016055682602995287, "loss": 0.7042, "step": 2764 }, { "epoch": 0.31, "learning_rate": 0.00016052752665441454, "loss": 0.7383, "step": 2765 }, { "epoch": 0.31, "learning_rate": 0.00016049821907635446, "loss": 0.6417, "step": 2766 }, { "epoch": 0.31, "learning_rate": 0.00016046890329974437, "loss": 0.652, "step": 2767 }, { "epoch": 0.31, "learning_rate": 0.0001604395793285569, "loss": 0.6994, "step": 2768 }, { "epoch": 0.31, "learning_rate": 0.0001604102471667661, "loss": 0.6233, "step": 2769 }, { "epoch": 0.31, "learning_rate": 0.00016038090681834695, "loss": 0.6858, "step": 2770 }, { "epoch": 0.31, "learning_rate": 0.00016035155828727552, "loss": 0.6974, "step": 2771 }, { "epoch": 0.32, "learning_rate": 0.0001603222015775291, "loss": 0.6041, "step": 2772 }, { "epoch": 0.32, "learning_rate": 0.000160292836693086, "loss": 0.6883, "step": 2773 }, { "epoch": 0.32, "learning_rate": 0.00016026346363792567, "loss": 0.7147, "step": 2774 }, { "epoch": 0.32, "learning_rate": 0.00016023408241602863, "loss": 0.7521, "step": 2775 }, { "epoch": 0.32, "learning_rate": 0.00016020469303137662, "loss": 0.6661, "step": 2776 }, { "epoch": 0.32, "learning_rate": 0.00016017529548795233, "loss": 0.6988, "step": 2777 }, { "epoch": 0.32, "learning_rate": 0.0001601458897897397, "loss": 0.6644, "step": 2778 }, { "epoch": 0.32, "learning_rate": 0.00016011647594072368, "loss": 0.6718, "step": 2779 }, { "epoch": 0.32, "learning_rate": 0.00016008705394489033, "loss": 0.6765, "step": 2780 }, { "epoch": 0.32, "learning_rate": 0.00016005762380622688, "loss": 0.7063, "step": 2781 }, { "epoch": 0.32, "learning_rate": 0.00016002818552872156, "loss": 0.6444, "step": 2782 }, { "epoch": 0.32, "learning_rate": 0.0001599987391163638, "loss": 0.6663, "step": 2783 }, { "epoch": 0.32, "learning_rate": 0.00015996928457314414, "loss": 0.6904, "step": 2784 }, { "epoch": 0.32, "learning_rate": 0.00015993982190305408, "loss": 0.6869, "step": 2785 }, { "epoch": 0.32, "learning_rate": 0.0001599103511100864, "loss": 0.7053, "step": 2786 }, { "epoch": 0.32, "learning_rate": 0.00015988087219823488, "loss": 0.7045, "step": 2787 }, { "epoch": 0.32, "learning_rate": 0.00015985138517149442, "loss": 0.65, "step": 2788 }, { "epoch": 0.32, "learning_rate": 0.00015982189003386097, "loss": 0.7114, "step": 2789 }, { "epoch": 0.32, "learning_rate": 0.0001597923867893317, "loss": 0.6451, "step": 2790 }, { "epoch": 0.32, "learning_rate": 0.0001597628754419048, "loss": 0.6789, "step": 2791 }, { "epoch": 0.32, "learning_rate": 0.00015973335599557952, "loss": 0.6739, "step": 2792 }, { "epoch": 0.32, "learning_rate": 0.00015970382845435625, "loss": 0.7037, "step": 2793 }, { "epoch": 0.32, "learning_rate": 0.00015967429282223654, "loss": 0.706, "step": 2794 }, { "epoch": 0.32, "learning_rate": 0.00015964474910322294, "loss": 0.7013, "step": 2795 }, { "epoch": 0.32, "learning_rate": 0.00015961519730131913, "loss": 0.6791, "step": 2796 }, { "epoch": 0.32, "learning_rate": 0.0001595856374205299, "loss": 0.6622, "step": 2797 }, { "epoch": 0.32, "learning_rate": 0.0001595560694648611, "loss": 0.6522, "step": 2798 }, { "epoch": 0.32, "learning_rate": 0.00015952649343831972, "loss": 0.6664, "step": 2799 }, { "epoch": 0.32, "learning_rate": 0.00015949690934491381, "loss": 0.6771, "step": 2800 }, { "epoch": 0.32, "learning_rate": 0.00015946731718865256, "loss": 0.5938, "step": 2801 }, { "epoch": 0.32, "learning_rate": 0.00015943771697354614, "loss": 0.7018, "step": 2802 }, { "epoch": 0.32, "learning_rate": 0.00015940810870360595, "loss": 0.6464, "step": 2803 }, { "epoch": 0.32, "learning_rate": 0.00015937849238284444, "loss": 0.6218, "step": 2804 }, { "epoch": 0.32, "learning_rate": 0.00015934886801527505, "loss": 0.6719, "step": 2805 }, { "epoch": 0.32, "learning_rate": 0.00015931923560491245, "loss": 0.7244, "step": 2806 }, { "epoch": 0.32, "learning_rate": 0.00015928959515577233, "loss": 0.6768, "step": 2807 }, { "epoch": 0.32, "learning_rate": 0.00015925994667187148, "loss": 0.7252, "step": 2808 }, { "epoch": 0.32, "learning_rate": 0.00015923029015722776, "loss": 0.7016, "step": 2809 }, { "epoch": 0.32, "learning_rate": 0.0001592006256158602, "loss": 0.6671, "step": 2810 }, { "epoch": 0.32, "learning_rate": 0.00015917095305178876, "loss": 0.7999, "step": 2811 }, { "epoch": 0.32, "learning_rate": 0.00015914127246903468, "loss": 0.6997, "step": 2812 }, { "epoch": 0.32, "learning_rate": 0.00015911158387162014, "loss": 0.6377, "step": 2813 }, { "epoch": 0.32, "learning_rate": 0.00015908188726356843, "loss": 0.7032, "step": 2814 }, { "epoch": 0.32, "learning_rate": 0.00015905218264890403, "loss": 0.6742, "step": 2815 }, { "epoch": 0.32, "learning_rate": 0.00015902247003165234, "loss": 0.7495, "step": 2816 }, { "epoch": 0.32, "learning_rate": 0.00015899274941583996, "loss": 0.7298, "step": 2817 }, { "epoch": 0.32, "learning_rate": 0.0001589630208054946, "loss": 0.7061, "step": 2818 }, { "epoch": 0.32, "learning_rate": 0.00015893328420464492, "loss": 0.6404, "step": 2819 }, { "epoch": 0.32, "learning_rate": 0.0001589035396173208, "loss": 0.6795, "step": 2820 }, { "epoch": 0.32, "learning_rate": 0.00015887378704755313, "loss": 0.6482, "step": 2821 }, { "epoch": 0.32, "learning_rate": 0.00015884402649937387, "loss": 0.6277, "step": 2822 }, { "epoch": 0.32, "learning_rate": 0.0001588142579768161, "loss": 0.7105, "step": 2823 }, { "epoch": 0.32, "learning_rate": 0.000158784481483914, "loss": 0.6174, "step": 2824 }, { "epoch": 0.32, "learning_rate": 0.00015875469702470273, "loss": 0.66, "step": 2825 }, { "epoch": 0.32, "learning_rate": 0.00015872490460321865, "loss": 0.7025, "step": 2826 }, { "epoch": 0.32, "learning_rate": 0.00015869510422349912, "loss": 0.6853, "step": 2827 }, { "epoch": 0.32, "learning_rate": 0.00015866529588958264, "loss": 0.6951, "step": 2828 }, { "epoch": 0.32, "learning_rate": 0.0001586354796055087, "loss": 0.6629, "step": 2829 }, { "epoch": 0.32, "learning_rate": 0.00015860565537531793, "loss": 0.6653, "step": 2830 }, { "epoch": 0.32, "learning_rate": 0.00015857582320305208, "loss": 0.7191, "step": 2831 }, { "epoch": 0.32, "learning_rate": 0.00015854598309275386, "loss": 0.6675, "step": 2832 }, { "epoch": 0.32, "learning_rate": 0.00015851613504846713, "loss": 0.6726, "step": 2833 }, { "epoch": 0.32, "learning_rate": 0.00015848627907423686, "loss": 0.6783, "step": 2834 }, { "epoch": 0.32, "learning_rate": 0.00015845641517410903, "loss": 0.6739, "step": 2835 }, { "epoch": 0.32, "learning_rate": 0.00015842654335213068, "loss": 0.7132, "step": 2836 }, { "epoch": 0.32, "learning_rate": 0.00015839666361234996, "loss": 0.6553, "step": 2837 }, { "epoch": 0.32, "learning_rate": 0.00015836677595881612, "loss": 0.7182, "step": 2838 }, { "epoch": 0.32, "learning_rate": 0.0001583368803955794, "loss": 0.7076, "step": 2839 }, { "epoch": 0.32, "learning_rate": 0.00015830697692669125, "loss": 0.7165, "step": 2840 }, { "epoch": 0.32, "learning_rate": 0.00015827706555620404, "loss": 0.7556, "step": 2841 }, { "epoch": 0.32, "learning_rate": 0.00015824714628817125, "loss": 0.6922, "step": 2842 }, { "epoch": 0.32, "learning_rate": 0.00015821721912664757, "loss": 0.6086, "step": 2843 }, { "epoch": 0.32, "learning_rate": 0.0001581872840756885, "loss": 0.7222, "step": 2844 }, { "epoch": 0.32, "learning_rate": 0.00015815734113935087, "loss": 0.6332, "step": 2845 }, { "epoch": 0.32, "learning_rate": 0.00015812739032169238, "loss": 0.6673, "step": 2846 }, { "epoch": 0.32, "learning_rate": 0.00015809743162677195, "loss": 0.6906, "step": 2847 }, { "epoch": 0.32, "learning_rate": 0.00015806746505864946, "loss": 0.7178, "step": 2848 }, { "epoch": 0.32, "learning_rate": 0.00015803749062138592, "loss": 0.5944, "step": 2849 }, { "epoch": 0.32, "learning_rate": 0.00015800750831904334, "loss": 0.6716, "step": 2850 }, { "epoch": 0.32, "learning_rate": 0.0001579775181556849, "loss": 0.6755, "step": 2851 }, { "epoch": 0.32, "learning_rate": 0.0001579475201353747, "loss": 0.6925, "step": 2852 }, { "epoch": 0.32, "learning_rate": 0.00015791751426217807, "loss": 0.6359, "step": 2853 }, { "epoch": 0.32, "learning_rate": 0.00015788750054016127, "loss": 0.6798, "step": 2854 }, { "epoch": 0.32, "learning_rate": 0.00015785747897339173, "loss": 0.5933, "step": 2855 }, { "epoch": 0.32, "learning_rate": 0.0001578274495659378, "loss": 0.7445, "step": 2856 }, { "epoch": 0.32, "learning_rate": 0.00015779741232186905, "loss": 0.6557, "step": 2857 }, { "epoch": 0.32, "learning_rate": 0.00015776736724525608, "loss": 0.7646, "step": 2858 }, { "epoch": 0.32, "learning_rate": 0.0001577373143401704, "loss": 0.6979, "step": 2859 }, { "epoch": 0.33, "learning_rate": 0.00015770725361068482, "loss": 0.6651, "step": 2860 }, { "epoch": 0.33, "learning_rate": 0.00015767718506087299, "loss": 0.7115, "step": 2861 }, { "epoch": 0.33, "learning_rate": 0.00015764710869480973, "loss": 0.6798, "step": 2862 }, { "epoch": 0.33, "learning_rate": 0.00015761702451657096, "loss": 0.6964, "step": 2863 }, { "epoch": 0.33, "learning_rate": 0.00015758693253023357, "loss": 0.6922, "step": 2864 }, { "epoch": 0.33, "learning_rate": 0.00015755683273987553, "loss": 0.7081, "step": 2865 }, { "epoch": 0.33, "learning_rate": 0.00015752672514957592, "loss": 0.6979, "step": 2866 }, { "epoch": 0.33, "learning_rate": 0.0001574966097634148, "loss": 0.6662, "step": 2867 }, { "epoch": 0.33, "learning_rate": 0.00015746648658547332, "loss": 0.678, "step": 2868 }, { "epoch": 0.33, "learning_rate": 0.0001574363556198337, "loss": 0.6851, "step": 2869 }, { "epoch": 0.33, "learning_rate": 0.00015740621687057924, "loss": 0.7068, "step": 2870 }, { "epoch": 0.33, "learning_rate": 0.0001573760703417942, "loss": 0.724, "step": 2871 }, { "epoch": 0.33, "learning_rate": 0.000157345916037564, "loss": 0.7402, "step": 2872 }, { "epoch": 0.33, "learning_rate": 0.00015731575396197504, "loss": 0.7077, "step": 2873 }, { "epoch": 0.33, "learning_rate": 0.0001572855841191148, "loss": 0.7247, "step": 2874 }, { "epoch": 0.33, "learning_rate": 0.00015725540651307182, "loss": 0.6885, "step": 2875 }, { "epoch": 0.33, "learning_rate": 0.0001572252211479357, "loss": 0.7152, "step": 2876 }, { "epoch": 0.33, "learning_rate": 0.00015719502802779704, "loss": 0.6782, "step": 2877 }, { "epoch": 0.33, "learning_rate": 0.00015716482715674753, "loss": 0.6744, "step": 2878 }, { "epoch": 0.33, "learning_rate": 0.00015713461853888, "loss": 0.6711, "step": 2879 }, { "epoch": 0.33, "learning_rate": 0.0001571044021782881, "loss": 0.6869, "step": 2880 }, { "epoch": 0.33, "learning_rate": 0.00015707417807906676, "loss": 0.6536, "step": 2881 }, { "epoch": 0.33, "learning_rate": 0.00015704394624531184, "loss": 0.6836, "step": 2882 }, { "epoch": 0.33, "learning_rate": 0.00015701370668112026, "loss": 0.7168, "step": 2883 }, { "epoch": 0.33, "learning_rate": 0.00015698345939059002, "loss": 0.6529, "step": 2884 }, { "epoch": 0.33, "learning_rate": 0.00015695320437782016, "loss": 0.7148, "step": 2885 }, { "epoch": 0.33, "learning_rate": 0.00015692294164691071, "loss": 0.7138, "step": 2886 }, { "epoch": 0.33, "learning_rate": 0.00015689267120196285, "loss": 0.6834, "step": 2887 }, { "epoch": 0.33, "learning_rate": 0.00015686239304707868, "loss": 0.723, "step": 2888 }, { "epoch": 0.33, "learning_rate": 0.00015683210718636146, "loss": 0.7009, "step": 2889 }, { "epoch": 0.33, "learning_rate": 0.00015680181362391545, "loss": 0.68, "step": 2890 }, { "epoch": 0.33, "learning_rate": 0.0001567715123638459, "loss": 0.7477, "step": 2891 }, { "epoch": 0.33, "learning_rate": 0.00015674120341025919, "loss": 0.5988, "step": 2892 }, { "epoch": 0.33, "learning_rate": 0.0001567108867672627, "loss": 0.7085, "step": 2893 }, { "epoch": 0.33, "learning_rate": 0.00015668056243896484, "loss": 0.6686, "step": 2894 }, { "epoch": 0.33, "learning_rate": 0.00015665023042947516, "loss": 0.6893, "step": 2895 }, { "epoch": 0.33, "learning_rate": 0.00015661989074290404, "loss": 0.6751, "step": 2896 }, { "epoch": 0.33, "learning_rate": 0.0001565895433833631, "loss": 0.675, "step": 2897 }, { "epoch": 0.33, "learning_rate": 0.00015655918835496494, "loss": 0.7332, "step": 2898 }, { "epoch": 0.33, "learning_rate": 0.00015652882566182314, "loss": 0.6756, "step": 2899 }, { "epoch": 0.33, "learning_rate": 0.00015649845530805241, "loss": 0.7286, "step": 2900 }, { "epoch": 0.33, "learning_rate": 0.00015646807729776847, "loss": 0.6678, "step": 2901 }, { "epoch": 0.33, "learning_rate": 0.00015643769163508803, "loss": 0.6897, "step": 2902 }, { "epoch": 0.33, "learning_rate": 0.00015640729832412886, "loss": 0.6735, "step": 2903 }, { "epoch": 0.33, "learning_rate": 0.0001563768973690098, "loss": 0.6681, "step": 2904 }, { "epoch": 0.33, "learning_rate": 0.0001563464887738507, "loss": 0.6364, "step": 2905 }, { "epoch": 0.33, "learning_rate": 0.00015631607254277245, "loss": 0.7053, "step": 2906 }, { "epoch": 0.33, "learning_rate": 0.00015628564867989697, "loss": 0.7483, "step": 2907 }, { "epoch": 0.33, "learning_rate": 0.00015625521718934718, "loss": 0.6641, "step": 2908 }, { "epoch": 0.33, "learning_rate": 0.00015622477807524716, "loss": 0.6956, "step": 2909 }, { "epoch": 0.33, "learning_rate": 0.00015619433134172184, "loss": 0.6859, "step": 2910 }, { "epoch": 0.33, "learning_rate": 0.00015616387699289735, "loss": 0.7038, "step": 2911 }, { "epoch": 0.33, "learning_rate": 0.00015613341503290074, "loss": 0.6638, "step": 2912 }, { "epoch": 0.33, "learning_rate": 0.0001561029454658601, "loss": 0.7024, "step": 2913 }, { "epoch": 0.33, "learning_rate": 0.00015607246829590462, "loss": 0.6792, "step": 2914 }, { "epoch": 0.33, "learning_rate": 0.00015604198352716452, "loss": 0.6819, "step": 2915 }, { "epoch": 0.33, "learning_rate": 0.00015601149116377093, "loss": 0.7193, "step": 2916 }, { "epoch": 0.33, "learning_rate": 0.00015598099120985617, "loss": 0.6371, "step": 2917 }, { "epoch": 0.33, "learning_rate": 0.00015595048366955343, "loss": 0.6786, "step": 2918 }, { "epoch": 0.33, "learning_rate": 0.00015591996854699705, "loss": 0.6913, "step": 2919 }, { "epoch": 0.33, "learning_rate": 0.00015588944584632236, "loss": 0.7219, "step": 2920 }, { "epoch": 0.33, "learning_rate": 0.00015585891557166567, "loss": 0.6983, "step": 2921 }, { "epoch": 0.33, "learning_rate": 0.0001558283777271644, "loss": 0.6722, "step": 2922 }, { "epoch": 0.33, "learning_rate": 0.00015579783231695697, "loss": 0.6977, "step": 2923 }, { "epoch": 0.33, "learning_rate": 0.00015576727934518277, "loss": 0.7052, "step": 2924 }, { "epoch": 0.33, "learning_rate": 0.00015573671881598223, "loss": 0.6854, "step": 2925 }, { "epoch": 0.33, "learning_rate": 0.00015570615073349687, "loss": 0.6327, "step": 2926 }, { "epoch": 0.33, "learning_rate": 0.0001556755751018692, "loss": 0.6229, "step": 2927 }, { "epoch": 0.33, "learning_rate": 0.00015564499192524274, "loss": 0.6717, "step": 2928 }, { "epoch": 0.33, "learning_rate": 0.00015561440120776202, "loss": 0.6748, "step": 2929 }, { "epoch": 0.33, "learning_rate": 0.00015558380295357257, "loss": 0.6986, "step": 2930 }, { "epoch": 0.33, "learning_rate": 0.00015555319716682107, "loss": 0.7139, "step": 2931 }, { "epoch": 0.33, "learning_rate": 0.00015552258385165504, "loss": 0.667, "step": 2932 }, { "epoch": 0.33, "learning_rate": 0.0001554919630122232, "loss": 0.6945, "step": 2933 }, { "epoch": 0.33, "learning_rate": 0.0001554613346526751, "loss": 0.6501, "step": 2934 }, { "epoch": 0.33, "learning_rate": 0.0001554306987771615, "loss": 0.6413, "step": 2935 }, { "epoch": 0.33, "learning_rate": 0.0001554000553898341, "loss": 0.6863, "step": 2936 }, { "epoch": 0.33, "learning_rate": 0.0001553694044948455, "loss": 0.6374, "step": 2937 }, { "epoch": 0.33, "learning_rate": 0.0001553387460963495, "loss": 0.7043, "step": 2938 }, { "epoch": 0.33, "learning_rate": 0.00015530808019850083, "loss": 0.7485, "step": 2939 }, { "epoch": 0.33, "learning_rate": 0.0001552774068054552, "loss": 0.6486, "step": 2940 }, { "epoch": 0.33, "learning_rate": 0.0001552467259213695, "loss": 0.7063, "step": 2941 }, { "epoch": 0.33, "learning_rate": 0.00015521603755040139, "loss": 0.6725, "step": 2942 }, { "epoch": 0.33, "learning_rate": 0.00015518534169670976, "loss": 0.7072, "step": 2943 }, { "epoch": 0.33, "learning_rate": 0.00015515463836445435, "loss": 0.6283, "step": 2944 }, { "epoch": 0.33, "learning_rate": 0.00015512392755779605, "loss": 0.7009, "step": 2945 }, { "epoch": 0.33, "learning_rate": 0.00015509320928089673, "loss": 0.7266, "step": 2946 }, { "epoch": 0.33, "learning_rate": 0.00015506248353791912, "loss": 0.6612, "step": 2947 }, { "epoch": 0.34, "learning_rate": 0.0001550317503330272, "loss": 0.7026, "step": 2948 }, { "epoch": 0.34, "learning_rate": 0.00015500100967038587, "loss": 0.6807, "step": 2949 }, { "epoch": 0.34, "learning_rate": 0.00015497026155416089, "loss": 0.6911, "step": 2950 }, { "epoch": 0.34, "learning_rate": 0.00015493950598851925, "loss": 0.6901, "step": 2951 }, { "epoch": 0.34, "learning_rate": 0.00015490874297762884, "loss": 0.6786, "step": 2952 }, { "epoch": 0.34, "learning_rate": 0.0001548779725256586, "loss": 0.6547, "step": 2953 }, { "epoch": 0.34, "learning_rate": 0.00015484719463677843, "loss": 0.6247, "step": 2954 }, { "epoch": 0.34, "learning_rate": 0.00015481640931515927, "loss": 0.6403, "step": 2955 }, { "epoch": 0.34, "learning_rate": 0.00015478561656497304, "loss": 0.7687, "step": 2956 }, { "epoch": 0.34, "learning_rate": 0.00015475481639039274, "loss": 0.7123, "step": 2957 }, { "epoch": 0.34, "learning_rate": 0.0001547240087955923, "loss": 0.6815, "step": 2958 }, { "epoch": 0.34, "learning_rate": 0.00015469319378474662, "loss": 0.7261, "step": 2959 }, { "epoch": 0.34, "learning_rate": 0.00015466237136203175, "loss": 0.671, "step": 2960 }, { "epoch": 0.34, "learning_rate": 0.00015463154153162463, "loss": 0.6713, "step": 2961 }, { "epoch": 0.34, "learning_rate": 0.0001546007042977032, "loss": 0.679, "step": 2962 }, { "epoch": 0.34, "learning_rate": 0.00015456985966444647, "loss": 0.7192, "step": 2963 }, { "epoch": 0.34, "learning_rate": 0.00015453900763603444, "loss": 0.6898, "step": 2964 }, { "epoch": 0.34, "learning_rate": 0.00015450814821664803, "loss": 0.732, "step": 2965 }, { "epoch": 0.34, "learning_rate": 0.0001544772814104693, "loss": 0.6337, "step": 2966 }, { "epoch": 0.34, "learning_rate": 0.00015444640722168113, "loss": 0.672, "step": 2967 }, { "epoch": 0.34, "learning_rate": 0.0001544155256544676, "loss": 0.7137, "step": 2968 }, { "epoch": 0.34, "learning_rate": 0.00015438463671301364, "loss": 0.6824, "step": 2969 }, { "epoch": 0.34, "learning_rate": 0.00015435374040150527, "loss": 0.6594, "step": 2970 }, { "epoch": 0.34, "learning_rate": 0.00015432283672412944, "loss": 0.745, "step": 2971 }, { "epoch": 0.34, "learning_rate": 0.00015429192568507417, "loss": 0.6457, "step": 2972 }, { "epoch": 0.34, "learning_rate": 0.00015426100728852833, "loss": 0.7303, "step": 2973 }, { "epoch": 0.34, "learning_rate": 0.00015423008153868205, "loss": 0.6931, "step": 2974 }, { "epoch": 0.34, "learning_rate": 0.00015419914843972621, "loss": 0.6557, "step": 2975 }, { "epoch": 0.34, "learning_rate": 0.00015416820799585282, "loss": 0.7137, "step": 2976 }, { "epoch": 0.34, "learning_rate": 0.00015413726021125474, "loss": 0.6996, "step": 2977 }, { "epoch": 0.34, "learning_rate": 0.00015410630509012606, "loss": 0.7427, "step": 2978 }, { "epoch": 0.34, "learning_rate": 0.00015407534263666168, "loss": 0.6806, "step": 2979 }, { "epoch": 0.34, "learning_rate": 0.00015404437285505753, "loss": 0.6881, "step": 2980 }, { "epoch": 0.34, "learning_rate": 0.00015401339574951057, "loss": 0.6238, "step": 2981 }, { "epoch": 0.34, "learning_rate": 0.0001539824113242187, "loss": 0.7694, "step": 2982 }, { "epoch": 0.34, "learning_rate": 0.0001539514195833809, "loss": 0.6552, "step": 2983 }, { "epoch": 0.34, "learning_rate": 0.00015392042053119699, "loss": 0.7016, "step": 2984 }, { "epoch": 0.34, "learning_rate": 0.00015388941417186796, "loss": 0.6627, "step": 2985 }, { "epoch": 0.34, "learning_rate": 0.0001538584005095957, "loss": 0.7332, "step": 2986 }, { "epoch": 0.34, "learning_rate": 0.00015382737954858306, "loss": 0.6481, "step": 2987 }, { "epoch": 0.34, "learning_rate": 0.0001537963512930339, "loss": 0.6715, "step": 2988 }, { "epoch": 0.34, "learning_rate": 0.00015376531574715316, "loss": 0.6854, "step": 2989 }, { "epoch": 0.34, "learning_rate": 0.0001537342729151466, "loss": 0.6638, "step": 2990 }, { "epoch": 0.34, "learning_rate": 0.00015370322280122115, "loss": 0.6632, "step": 2991 }, { "epoch": 0.34, "learning_rate": 0.00015367216540958456, "loss": 0.6796, "step": 2992 }, { "epoch": 0.34, "learning_rate": 0.00015364110074444568, "loss": 0.6819, "step": 2993 }, { "epoch": 0.34, "learning_rate": 0.00015361002881001426, "loss": 0.641, "step": 2994 }, { "epoch": 0.34, "learning_rate": 0.00015357894961050113, "loss": 0.6871, "step": 2995 }, { "epoch": 0.34, "learning_rate": 0.00015354786315011806, "loss": 0.7091, "step": 2996 }, { "epoch": 0.34, "learning_rate": 0.00015351676943307774, "loss": 0.6357, "step": 2997 }, { "epoch": 0.34, "learning_rate": 0.000153485668463594, "loss": 0.6762, "step": 2998 }, { "epoch": 0.34, "learning_rate": 0.00015345456024588145, "loss": 0.6774, "step": 2999 }, { "epoch": 0.34, "learning_rate": 0.00015342344478415587, "loss": 0.6262, "step": 3000 }, { "epoch": 0.34, "learning_rate": 0.00015339232208263392, "loss": 0.6787, "step": 3001 }, { "epoch": 0.34, "learning_rate": 0.0001533611921455332, "loss": 0.7018, "step": 3002 }, { "epoch": 0.34, "learning_rate": 0.00015333005497707248, "loss": 0.7639, "step": 3003 }, { "epoch": 0.34, "learning_rate": 0.0001532989105814713, "loss": 0.7158, "step": 3004 }, { "epoch": 0.34, "learning_rate": 0.00015326775896295022, "loss": 0.6971, "step": 3005 }, { "epoch": 0.34, "learning_rate": 0.00015323660012573086, "loss": 0.7253, "step": 3006 }, { "epoch": 0.34, "learning_rate": 0.00015320543407403584, "loss": 0.6759, "step": 3007 }, { "epoch": 0.34, "learning_rate": 0.00015317426081208865, "loss": 0.7133, "step": 3008 }, { "epoch": 0.34, "learning_rate": 0.00015314308034411375, "loss": 0.7578, "step": 3009 }, { "epoch": 0.34, "learning_rate": 0.00015311189267433673, "loss": 0.6871, "step": 3010 }, { "epoch": 0.34, "learning_rate": 0.00015308069780698398, "loss": 0.7138, "step": 3011 }, { "epoch": 0.34, "learning_rate": 0.000153049495746283, "loss": 0.7171, "step": 3012 }, { "epoch": 0.34, "learning_rate": 0.00015301828649646212, "loss": 0.7452, "step": 3013 }, { "epoch": 0.34, "learning_rate": 0.00015298707006175083, "loss": 0.6196, "step": 3014 }, { "epoch": 0.34, "learning_rate": 0.00015295584644637943, "loss": 0.6989, "step": 3015 }, { "epoch": 0.34, "learning_rate": 0.00015292461565457927, "loss": 0.7255, "step": 3016 }, { "epoch": 0.34, "learning_rate": 0.00015289337769058267, "loss": 0.6746, "step": 3017 }, { "epoch": 0.34, "learning_rate": 0.00015286213255862293, "loss": 0.6696, "step": 3018 }, { "epoch": 0.34, "learning_rate": 0.00015283088026293425, "loss": 0.7061, "step": 3019 }, { "epoch": 0.34, "learning_rate": 0.00015279962080775192, "loss": 0.7507, "step": 3020 }, { "epoch": 0.34, "learning_rate": 0.0001527683541973121, "loss": 0.7256, "step": 3021 }, { "epoch": 0.34, "learning_rate": 0.0001527370804358519, "loss": 0.6567, "step": 3022 }, { "epoch": 0.34, "learning_rate": 0.00015270579952760956, "loss": 0.7014, "step": 3023 }, { "epoch": 0.34, "learning_rate": 0.00015267451147682408, "loss": 0.6826, "step": 3024 }, { "epoch": 0.34, "learning_rate": 0.0001526432162877356, "loss": 0.6701, "step": 3025 }, { "epoch": 0.34, "learning_rate": 0.00015261191396458515, "loss": 0.7309, "step": 3026 }, { "epoch": 0.34, "learning_rate": 0.00015258060451161468, "loss": 0.7056, "step": 3027 }, { "epoch": 0.34, "learning_rate": 0.00015254928793306723, "loss": 0.7261, "step": 3028 }, { "epoch": 0.34, "learning_rate": 0.0001525179642331867, "loss": 0.6856, "step": 3029 }, { "epoch": 0.34, "learning_rate": 0.00015248663341621796, "loss": 0.6483, "step": 3030 }, { "epoch": 0.34, "learning_rate": 0.00015245529548640695, "loss": 0.7192, "step": 3031 }, { "epoch": 0.34, "learning_rate": 0.00015242395044800041, "loss": 0.758, "step": 3032 }, { "epoch": 0.34, "learning_rate": 0.00015239259830524625, "loss": 0.7629, "step": 3033 }, { "epoch": 0.34, "learning_rate": 0.0001523612390623931, "loss": 0.6702, "step": 3034 }, { "epoch": 0.34, "learning_rate": 0.00015232987272369074, "loss": 0.7019, "step": 3035 }, { "epoch": 0.35, "learning_rate": 0.00015229849929338985, "loss": 0.7433, "step": 3036 }, { "epoch": 0.35, "learning_rate": 0.00015226711877574207, "loss": 0.7143, "step": 3037 }, { "epoch": 0.35, "learning_rate": 0.00015223573117499996, "loss": 0.6925, "step": 3038 }, { "epoch": 0.35, "learning_rate": 0.00015220433649541714, "loss": 0.6496, "step": 3039 }, { "epoch": 0.35, "learning_rate": 0.00015217293474124811, "loss": 0.6202, "step": 3040 }, { "epoch": 0.35, "learning_rate": 0.0001521415259167483, "loss": 0.7238, "step": 3041 }, { "epoch": 0.35, "learning_rate": 0.0001521101100261742, "loss": 0.7399, "step": 3042 }, { "epoch": 0.35, "learning_rate": 0.00015207868707378322, "loss": 0.6929, "step": 3043 }, { "epoch": 0.35, "learning_rate": 0.00015204725706383364, "loss": 0.6793, "step": 3044 }, { "epoch": 0.35, "learning_rate": 0.00015201582000058482, "loss": 0.6295, "step": 3045 }, { "epoch": 0.35, "learning_rate": 0.00015198437588829702, "loss": 0.7501, "step": 3046 }, { "epoch": 0.35, "learning_rate": 0.00015195292473123146, "loss": 0.7664, "step": 3047 }, { "epoch": 0.35, "learning_rate": 0.00015192146653365026, "loss": 0.6596, "step": 3048 }, { "epoch": 0.35, "learning_rate": 0.00015189000129981663, "loss": 0.7056, "step": 3049 }, { "epoch": 0.35, "learning_rate": 0.00015185852903399459, "loss": 0.6871, "step": 3050 }, { "epoch": 0.35, "learning_rate": 0.0001518270497404492, "loss": 0.6806, "step": 3051 }, { "epoch": 0.35, "learning_rate": 0.00015179556342344644, "loss": 0.6523, "step": 3052 }, { "epoch": 0.35, "learning_rate": 0.00015176407008725325, "loss": 0.6586, "step": 3053 }, { "epoch": 0.35, "learning_rate": 0.0001517325697361375, "loss": 0.6439, "step": 3054 }, { "epoch": 0.35, "learning_rate": 0.00015170106237436806, "loss": 0.6745, "step": 3055 }, { "epoch": 0.35, "learning_rate": 0.00015166954800621473, "loss": 0.7176, "step": 3056 }, { "epoch": 0.35, "learning_rate": 0.0001516380266359482, "loss": 0.6843, "step": 3057 }, { "epoch": 0.35, "learning_rate": 0.00015160649826784017, "loss": 0.6735, "step": 3058 }, { "epoch": 0.35, "learning_rate": 0.0001515749629061633, "loss": 0.7335, "step": 3059 }, { "epoch": 0.35, "learning_rate": 0.0001515434205551912, "loss": 0.7135, "step": 3060 }, { "epoch": 0.35, "learning_rate": 0.00015151187121919835, "loss": 0.6916, "step": 3061 }, { "epoch": 0.35, "learning_rate": 0.0001514803149024602, "loss": 0.6362, "step": 3062 }, { "epoch": 0.35, "learning_rate": 0.0001514487516092533, "loss": 0.6572, "step": 3063 }, { "epoch": 0.35, "learning_rate": 0.00015141718134385488, "loss": 0.6855, "step": 3064 }, { "epoch": 0.35, "learning_rate": 0.00015138560411054333, "loss": 0.6736, "step": 3065 }, { "epoch": 0.35, "learning_rate": 0.0001513540199135979, "loss": 0.6791, "step": 3066 }, { "epoch": 0.35, "learning_rate": 0.00015132242875729877, "loss": 0.6098, "step": 3067 }, { "epoch": 0.35, "learning_rate": 0.00015129083064592712, "loss": 0.5994, "step": 3068 }, { "epoch": 0.35, "learning_rate": 0.000151259225583765, "loss": 0.6189, "step": 3069 }, { "epoch": 0.35, "learning_rate": 0.00015122761357509544, "loss": 0.6693, "step": 3070 }, { "epoch": 0.35, "learning_rate": 0.00015119599462420246, "loss": 0.6456, "step": 3071 }, { "epoch": 0.35, "learning_rate": 0.00015116436873537095, "loss": 0.6864, "step": 3072 }, { "epoch": 0.35, "learning_rate": 0.00015113273591288673, "loss": 0.6947, "step": 3073 }, { "epoch": 0.35, "learning_rate": 0.00015110109616103663, "loss": 0.7329, "step": 3074 }, { "epoch": 0.35, "learning_rate": 0.00015106944948410837, "loss": 0.6611, "step": 3075 }, { "epoch": 0.35, "learning_rate": 0.0001510377958863906, "loss": 0.6487, "step": 3076 }, { "epoch": 0.35, "learning_rate": 0.00015100613537217297, "loss": 0.6854, "step": 3077 }, { "epoch": 0.35, "learning_rate": 0.00015097446794574596, "loss": 0.6797, "step": 3078 }, { "epoch": 0.35, "learning_rate": 0.0001509427936114011, "loss": 0.648, "step": 3079 }, { "epoch": 0.35, "learning_rate": 0.0001509111123734308, "loss": 0.7196, "step": 3080 }, { "epoch": 0.35, "learning_rate": 0.0001508794242361284, "loss": 0.7151, "step": 3081 }, { "epoch": 0.35, "learning_rate": 0.00015084772920378821, "loss": 0.7798, "step": 3082 }, { "epoch": 0.35, "learning_rate": 0.00015081602728070546, "loss": 0.6989, "step": 3083 }, { "epoch": 0.35, "learning_rate": 0.00015078431847117627, "loss": 0.7115, "step": 3084 }, { "epoch": 0.35, "learning_rate": 0.0001507526027794977, "loss": 0.7553, "step": 3085 }, { "epoch": 0.35, "learning_rate": 0.0001507208802099679, "loss": 0.6793, "step": 3086 }, { "epoch": 0.35, "learning_rate": 0.0001506891507668857, "loss": 0.719, "step": 3087 }, { "epoch": 0.35, "learning_rate": 0.00015065741445455103, "loss": 0.6742, "step": 3088 }, { "epoch": 0.35, "learning_rate": 0.00015062567127726472, "loss": 0.7028, "step": 3089 }, { "epoch": 0.35, "learning_rate": 0.0001505939212393285, "loss": 0.6627, "step": 3090 }, { "epoch": 0.35, "learning_rate": 0.00015056216434504503, "loss": 0.7432, "step": 3091 }, { "epoch": 0.35, "learning_rate": 0.00015053040059871795, "loss": 0.6415, "step": 3092 }, { "epoch": 0.35, "learning_rate": 0.00015049863000465177, "loss": 0.6476, "step": 3093 }, { "epoch": 0.35, "learning_rate": 0.00015046685256715197, "loss": 0.6967, "step": 3094 }, { "epoch": 0.35, "learning_rate": 0.00015043506829052493, "loss": 0.7201, "step": 3095 }, { "epoch": 0.35, "learning_rate": 0.00015040327717907797, "loss": 0.7149, "step": 3096 }, { "epoch": 0.35, "learning_rate": 0.00015037147923711934, "loss": 0.6687, "step": 3097 }, { "epoch": 0.35, "learning_rate": 0.00015033967446895815, "loss": 0.6894, "step": 3098 }, { "epoch": 0.35, "learning_rate": 0.00015030786287890458, "loss": 0.6611, "step": 3099 }, { "epoch": 0.35, "learning_rate": 0.00015027604447126963, "loss": 0.6417, "step": 3100 }, { "epoch": 0.35, "learning_rate": 0.0001502442192503652, "loss": 0.7065, "step": 3101 }, { "epoch": 0.35, "learning_rate": 0.00015021238722050416, "loss": 0.633, "step": 3102 }, { "epoch": 0.35, "learning_rate": 0.00015018054838600032, "loss": 0.6776, "step": 3103 }, { "epoch": 0.35, "learning_rate": 0.00015014870275116844, "loss": 0.6298, "step": 3104 }, { "epoch": 0.35, "learning_rate": 0.00015011685032032405, "loss": 0.6448, "step": 3105 }, { "epoch": 0.35, "learning_rate": 0.00015008499109778377, "loss": 0.7033, "step": 3106 }, { "epoch": 0.35, "learning_rate": 0.00015005312508786501, "loss": 0.7361, "step": 3107 }, { "epoch": 0.35, "learning_rate": 0.00015002125229488623, "loss": 0.6852, "step": 3108 }, { "epoch": 0.35, "learning_rate": 0.00014998937272316676, "loss": 0.6681, "step": 3109 }, { "epoch": 0.35, "learning_rate": 0.00014995748637702672, "loss": 0.7337, "step": 3110 }, { "epoch": 0.35, "learning_rate": 0.0001499255932607874, "loss": 0.7652, "step": 3111 }, { "epoch": 0.35, "learning_rate": 0.00014989369337877075, "loss": 0.6604, "step": 3112 }, { "epoch": 0.35, "learning_rate": 0.0001498617867352998, "loss": 0.7033, "step": 3113 }, { "epoch": 0.35, "learning_rate": 0.00014982987333469846, "loss": 0.7227, "step": 3114 }, { "epoch": 0.35, "learning_rate": 0.00014979795318129154, "loss": 0.7247, "step": 3115 }, { "epoch": 0.35, "learning_rate": 0.00014976602627940472, "loss": 0.708, "step": 3116 }, { "epoch": 0.35, "learning_rate": 0.00014973409263336474, "loss": 0.731, "step": 3117 }, { "epoch": 0.35, "learning_rate": 0.00014970215224749907, "loss": 0.6372, "step": 3118 }, { "epoch": 0.35, "learning_rate": 0.00014967020512613623, "loss": 0.7037, "step": 3119 }, { "epoch": 0.35, "learning_rate": 0.0001496382512736056, "loss": 0.6954, "step": 3120 }, { "epoch": 0.35, "learning_rate": 0.00014960629069423744, "loss": 0.692, "step": 3121 }, { "epoch": 0.35, "learning_rate": 0.00014957432339236302, "loss": 0.7039, "step": 3122 }, { "epoch": 0.35, "learning_rate": 0.0001495423493723144, "loss": 0.7417, "step": 3123 }, { "epoch": 0.36, "learning_rate": 0.00014951036863842466, "loss": 0.6667, "step": 3124 }, { "epoch": 0.36, "learning_rate": 0.0001494783811950277, "loss": 0.6996, "step": 3125 }, { "epoch": 0.36, "learning_rate": 0.0001494463870464584, "loss": 0.7565, "step": 3126 }, { "epoch": 0.36, "learning_rate": 0.00014941438619705253, "loss": 0.6452, "step": 3127 }, { "epoch": 0.36, "learning_rate": 0.0001493823786511467, "loss": 0.5877, "step": 3128 }, { "epoch": 0.36, "learning_rate": 0.00014935036441307851, "loss": 0.7289, "step": 3129 }, { "epoch": 0.36, "learning_rate": 0.00014931834348718646, "loss": 0.6873, "step": 3130 }, { "epoch": 0.36, "learning_rate": 0.0001492863158778099, "loss": 0.6763, "step": 3131 }, { "epoch": 0.36, "learning_rate": 0.0001492542815892892, "loss": 0.65, "step": 3132 }, { "epoch": 0.36, "learning_rate": 0.0001492222406259654, "loss": 0.6445, "step": 3133 }, { "epoch": 0.36, "learning_rate": 0.0001491901929921808, "loss": 0.7203, "step": 3134 }, { "epoch": 0.36, "learning_rate": 0.00014915813869227827, "loss": 0.6724, "step": 3135 }, { "epoch": 0.36, "learning_rate": 0.00014912607773060174, "loss": 0.7128, "step": 3136 }, { "epoch": 0.36, "learning_rate": 0.0001490940101114961, "loss": 0.7242, "step": 3137 }, { "epoch": 0.36, "learning_rate": 0.00014906193583930696, "loss": 0.7238, "step": 3138 }, { "epoch": 0.36, "learning_rate": 0.00014902985491838097, "loss": 0.6953, "step": 3139 }, { "epoch": 0.36, "learning_rate": 0.0001489977673530657, "loss": 0.692, "step": 3140 }, { "epoch": 0.36, "learning_rate": 0.0001489656731477095, "loss": 0.6857, "step": 3141 }, { "epoch": 0.36, "learning_rate": 0.00014893357230666172, "loss": 0.6983, "step": 3142 }, { "epoch": 0.36, "learning_rate": 0.00014890146483427258, "loss": 0.6719, "step": 3143 }, { "epoch": 0.36, "learning_rate": 0.00014886935073489316, "loss": 0.6658, "step": 3144 }, { "epoch": 0.36, "learning_rate": 0.0001488372300128755, "loss": 0.6745, "step": 3145 }, { "epoch": 0.36, "learning_rate": 0.00014880510267257252, "loss": 0.6755, "step": 3146 }, { "epoch": 0.36, "learning_rate": 0.00014877296871833803, "loss": 0.7207, "step": 3147 }, { "epoch": 0.36, "learning_rate": 0.0001487408281545267, "loss": 0.617, "step": 3148 }, { "epoch": 0.36, "learning_rate": 0.00014870868098549418, "loss": 0.7012, "step": 3149 }, { "epoch": 0.36, "learning_rate": 0.0001486765272155969, "loss": 0.6501, "step": 3150 }, { "epoch": 0.36, "learning_rate": 0.0001486443668491923, "loss": 0.6661, "step": 3151 }, { "epoch": 0.36, "learning_rate": 0.00014861219989063863, "loss": 0.6842, "step": 3152 }, { "epoch": 0.36, "learning_rate": 0.00014858002634429512, "loss": 0.6938, "step": 3153 }, { "epoch": 0.36, "learning_rate": 0.00014854784621452175, "loss": 0.7239, "step": 3154 }, { "epoch": 0.36, "learning_rate": 0.00014851565950567958, "loss": 0.7069, "step": 3155 }, { "epoch": 0.36, "learning_rate": 0.00014848346622213038, "loss": 0.6801, "step": 3156 }, { "epoch": 0.36, "learning_rate": 0.00014845126636823698, "loss": 0.6848, "step": 3157 }, { "epoch": 0.36, "learning_rate": 0.00014841905994836293, "loss": 0.6535, "step": 3158 }, { "epoch": 0.36, "learning_rate": 0.00014838684696687283, "loss": 0.6189, "step": 3159 }, { "epoch": 0.36, "learning_rate": 0.00014835462742813203, "loss": 0.6929, "step": 3160 }, { "epoch": 0.36, "learning_rate": 0.00014832240133650683, "loss": 0.6416, "step": 3161 }, { "epoch": 0.36, "learning_rate": 0.00014829016869636447, "loss": 0.6835, "step": 3162 }, { "epoch": 0.36, "learning_rate": 0.00014825792951207302, "loss": 0.6592, "step": 3163 }, { "epoch": 0.36, "learning_rate": 0.0001482256837880014, "loss": 0.6706, "step": 3164 }, { "epoch": 0.36, "learning_rate": 0.0001481934315285195, "loss": 0.6903, "step": 3165 }, { "epoch": 0.36, "learning_rate": 0.00014816117273799807, "loss": 0.6527, "step": 3166 }, { "epoch": 0.36, "learning_rate": 0.00014812890742080866, "loss": 0.6754, "step": 3167 }, { "epoch": 0.36, "learning_rate": 0.00014809663558132389, "loss": 0.7009, "step": 3168 }, { "epoch": 0.36, "learning_rate": 0.00014806435722391703, "loss": 0.6045, "step": 3169 }, { "epoch": 0.36, "learning_rate": 0.00014803207235296242, "loss": 0.6109, "step": 3170 }, { "epoch": 0.36, "learning_rate": 0.0001479997809728352, "loss": 0.6347, "step": 3171 }, { "epoch": 0.36, "learning_rate": 0.00014796748308791143, "loss": 0.7328, "step": 3172 }, { "epoch": 0.36, "learning_rate": 0.00014793517870256796, "loss": 0.7054, "step": 3173 }, { "epoch": 0.36, "learning_rate": 0.00014790286782118267, "loss": 0.7723, "step": 3174 }, { "epoch": 0.36, "learning_rate": 0.00014787055044813424, "loss": 0.6902, "step": 3175 }, { "epoch": 0.36, "learning_rate": 0.00014783822658780214, "loss": 0.7435, "step": 3176 }, { "epoch": 0.36, "learning_rate": 0.00014780589624456688, "loss": 0.6803, "step": 3177 }, { "epoch": 0.36, "learning_rate": 0.0001477735594228098, "loss": 0.6984, "step": 3178 }, { "epoch": 0.36, "learning_rate": 0.00014774121612691303, "loss": 0.6599, "step": 3179 }, { "epoch": 0.36, "learning_rate": 0.0001477088663612597, "loss": 0.6898, "step": 3180 }, { "epoch": 0.36, "learning_rate": 0.00014767651013023372, "loss": 0.7192, "step": 3181 }, { "epoch": 0.36, "learning_rate": 0.00014764414743821992, "loss": 0.7189, "step": 3182 }, { "epoch": 0.36, "learning_rate": 0.00014761177828960406, "loss": 0.6734, "step": 3183 }, { "epoch": 0.36, "learning_rate": 0.00014757940268877266, "loss": 0.6297, "step": 3184 }, { "epoch": 0.36, "learning_rate": 0.00014754702064011317, "loss": 0.7497, "step": 3185 }, { "epoch": 0.36, "learning_rate": 0.00014751463214801393, "loss": 0.6398, "step": 3186 }, { "epoch": 0.36, "learning_rate": 0.00014748223721686415, "loss": 0.6933, "step": 3187 }, { "epoch": 0.36, "learning_rate": 0.00014744983585105386, "loss": 0.7384, "step": 3188 }, { "epoch": 0.36, "learning_rate": 0.00014741742805497404, "loss": 0.6842, "step": 3189 }, { "epoch": 0.36, "learning_rate": 0.0001473850138330165, "loss": 0.7037, "step": 3190 }, { "epoch": 0.36, "learning_rate": 0.00014735259318957394, "loss": 0.6951, "step": 3191 }, { "epoch": 0.36, "learning_rate": 0.00014732016612903988, "loss": 0.6813, "step": 3192 }, { "epoch": 0.36, "learning_rate": 0.00014728773265580873, "loss": 0.6577, "step": 3193 }, { "epoch": 0.36, "learning_rate": 0.00014725529277427585, "loss": 0.6456, "step": 3194 }, { "epoch": 0.36, "learning_rate": 0.00014722284648883735, "loss": 0.7229, "step": 3195 }, { "epoch": 0.36, "learning_rate": 0.00014719039380389027, "loss": 0.6911, "step": 3196 }, { "epoch": 0.36, "learning_rate": 0.00014715793472383252, "loss": 0.7107, "step": 3197 }, { "epoch": 0.36, "learning_rate": 0.00014712546925306285, "loss": 0.6966, "step": 3198 }, { "epoch": 0.36, "learning_rate": 0.00014709299739598092, "loss": 0.7117, "step": 3199 }, { "epoch": 0.36, "learning_rate": 0.0001470605191569872, "loss": 0.6231, "step": 3200 }, { "epoch": 0.36, "learning_rate": 0.00014702803454048305, "loss": 0.7003, "step": 3201 }, { "epoch": 0.36, "learning_rate": 0.00014699554355087065, "loss": 0.677, "step": 3202 }, { "epoch": 0.36, "learning_rate": 0.00014696304619255318, "loss": 0.7117, "step": 3203 }, { "epoch": 0.36, "learning_rate": 0.00014693054246993454, "loss": 0.6719, "step": 3204 }, { "epoch": 0.36, "learning_rate": 0.00014689803238741956, "loss": 0.6113, "step": 3205 }, { "epoch": 0.36, "learning_rate": 0.0001468655159494139, "loss": 0.6352, "step": 3206 }, { "epoch": 0.36, "learning_rate": 0.00014683299316032412, "loss": 0.6445, "step": 3207 }, { "epoch": 0.36, "learning_rate": 0.0001468004640245576, "loss": 0.6745, "step": 3208 }, { "epoch": 0.36, "learning_rate": 0.00014676792854652256, "loss": 0.7546, "step": 3209 }, { "epoch": 0.36, "learning_rate": 0.0001467353867306282, "loss": 0.7166, "step": 3210 }, { "epoch": 0.36, "learning_rate": 0.00014670283858128446, "loss": 0.7067, "step": 3211 }, { "epoch": 0.37, "learning_rate": 0.00014667028410290212, "loss": 0.6392, "step": 3212 }, { "epoch": 0.37, "learning_rate": 0.00014663772329989296, "loss": 0.7387, "step": 3213 }, { "epoch": 0.37, "learning_rate": 0.0001466051561766695, "loss": 0.6863, "step": 3214 }, { "epoch": 0.37, "learning_rate": 0.00014657258273764512, "loss": 0.6917, "step": 3215 }, { "epoch": 0.37, "learning_rate": 0.0001465400029872341, "loss": 0.759, "step": 3216 }, { "epoch": 0.37, "learning_rate": 0.00014650741692985155, "loss": 0.6814, "step": 3217 }, { "epoch": 0.37, "learning_rate": 0.00014647482456991344, "loss": 0.6838, "step": 3218 }, { "epoch": 0.37, "learning_rate": 0.0001464422259118366, "loss": 0.6856, "step": 3219 }, { "epoch": 0.37, "learning_rate": 0.00014640962096003875, "loss": 0.622, "step": 3220 }, { "epoch": 0.37, "learning_rate": 0.00014637700971893833, "loss": 0.6598, "step": 3221 }, { "epoch": 0.37, "learning_rate": 0.00014634439219295478, "loss": 0.7216, "step": 3222 }, { "epoch": 0.37, "learning_rate": 0.00014631176838650838, "loss": 0.6843, "step": 3223 }, { "epoch": 0.37, "learning_rate": 0.00014627913830402015, "loss": 0.7173, "step": 3224 }, { "epoch": 0.37, "learning_rate": 0.00014624650194991202, "loss": 0.6851, "step": 3225 }, { "epoch": 0.37, "learning_rate": 0.00014621385932860683, "loss": 0.6724, "step": 3226 }, { "epoch": 0.37, "learning_rate": 0.0001461812104445282, "loss": 0.6839, "step": 3227 }, { "epoch": 0.37, "learning_rate": 0.0001461485553021006, "loss": 0.7444, "step": 3228 }, { "epoch": 0.37, "learning_rate": 0.0001461158939057494, "loss": 0.7412, "step": 3229 }, { "epoch": 0.37, "learning_rate": 0.00014608322625990074, "loss": 0.6696, "step": 3230 }, { "epoch": 0.37, "learning_rate": 0.00014605055236898166, "loss": 0.6158, "step": 3231 }, { "epoch": 0.37, "learning_rate": 0.00014601787223742004, "loss": 0.7267, "step": 3232 }, { "epoch": 0.37, "learning_rate": 0.00014598518586964458, "loss": 0.6807, "step": 3233 }, { "epoch": 0.37, "learning_rate": 0.0001459524932700849, "loss": 0.6776, "step": 3234 }, { "epoch": 0.37, "learning_rate": 0.00014591979444317135, "loss": 0.6601, "step": 3235 }, { "epoch": 0.37, "learning_rate": 0.00014588708939333522, "loss": 0.6602, "step": 3236 }, { "epoch": 0.37, "learning_rate": 0.0001458543781250086, "loss": 0.718, "step": 3237 }, { "epoch": 0.37, "learning_rate": 0.00014582166064262443, "loss": 0.7288, "step": 3238 }, { "epoch": 0.37, "learning_rate": 0.00014578893695061645, "loss": 0.6536, "step": 3239 }, { "epoch": 0.37, "learning_rate": 0.00014575620705341934, "loss": 0.6476, "step": 3240 }, { "epoch": 0.37, "learning_rate": 0.00014572347095546855, "loss": 0.706, "step": 3241 }, { "epoch": 0.37, "learning_rate": 0.00014569072866120038, "loss": 0.7128, "step": 3242 }, { "epoch": 0.37, "learning_rate": 0.00014565798017505198, "loss": 0.6654, "step": 3243 }, { "epoch": 0.37, "learning_rate": 0.0001456252255014613, "loss": 0.7129, "step": 3244 }, { "epoch": 0.37, "learning_rate": 0.00014559246464486723, "loss": 0.7407, "step": 3245 }, { "epoch": 0.37, "learning_rate": 0.00014555969760970939, "loss": 0.6658, "step": 3246 }, { "epoch": 0.37, "learning_rate": 0.00014552692440042826, "loss": 0.7609, "step": 3247 }, { "epoch": 0.37, "learning_rate": 0.0001454941450214652, "loss": 0.7221, "step": 3248 }, { "epoch": 0.37, "learning_rate": 0.00014546135947726235, "loss": 0.6583, "step": 3249 }, { "epoch": 0.37, "learning_rate": 0.00014542856777226274, "loss": 0.7095, "step": 3250 }, { "epoch": 0.37, "learning_rate": 0.0001453957699109102, "loss": 0.6557, "step": 3251 }, { "epoch": 0.37, "learning_rate": 0.00014536296589764944, "loss": 0.7134, "step": 3252 }, { "epoch": 0.37, "learning_rate": 0.00014533015573692595, "loss": 0.6279, "step": 3253 }, { "epoch": 0.37, "learning_rate": 0.00014529733943318605, "loss": 0.6552, "step": 3254 }, { "epoch": 0.37, "learning_rate": 0.0001452645169908769, "loss": 0.7512, "step": 3255 }, { "epoch": 0.37, "learning_rate": 0.00014523168841444657, "loss": 0.6841, "step": 3256 }, { "epoch": 0.37, "learning_rate": 0.00014519885370834385, "loss": 0.7156, "step": 3257 }, { "epoch": 0.37, "learning_rate": 0.00014516601287701842, "loss": 0.7021, "step": 3258 }, { "epoch": 0.37, "learning_rate": 0.00014513316592492076, "loss": 0.7507, "step": 3259 }, { "epoch": 0.37, "learning_rate": 0.00014510031285650224, "loss": 0.7315, "step": 3260 }, { "epoch": 0.37, "learning_rate": 0.00014506745367621495, "loss": 0.6393, "step": 3261 }, { "epoch": 0.37, "learning_rate": 0.00014503458838851192, "loss": 0.7433, "step": 3262 }, { "epoch": 0.37, "learning_rate": 0.000145001716997847, "loss": 0.6185, "step": 3263 }, { "epoch": 0.37, "learning_rate": 0.00014496883950867475, "loss": 0.7748, "step": 3264 }, { "epoch": 0.37, "learning_rate": 0.00014493595592545067, "loss": 0.6537, "step": 3265 }, { "epoch": 0.37, "learning_rate": 0.00014490306625263109, "loss": 0.5943, "step": 3266 }, { "epoch": 0.37, "learning_rate": 0.00014487017049467303, "loss": 0.7083, "step": 3267 }, { "epoch": 0.37, "learning_rate": 0.00014483726865603452, "loss": 0.7349, "step": 3268 }, { "epoch": 0.37, "learning_rate": 0.0001448043607411743, "loss": 0.6866, "step": 3269 }, { "epoch": 0.37, "learning_rate": 0.00014477144675455197, "loss": 0.6297, "step": 3270 }, { "epoch": 0.37, "learning_rate": 0.0001447385267006279, "loss": 0.6686, "step": 3271 }, { "epoch": 0.37, "learning_rate": 0.00014470560058386337, "loss": 0.7178, "step": 3272 }, { "epoch": 0.37, "learning_rate": 0.0001446726684087204, "loss": 0.6569, "step": 3273 }, { "epoch": 0.37, "learning_rate": 0.0001446397301796619, "loss": 0.6428, "step": 3274 }, { "epoch": 0.37, "learning_rate": 0.00014460678590115153, "loss": 0.678, "step": 3275 }, { "epoch": 0.37, "learning_rate": 0.00014457383557765386, "loss": 0.6573, "step": 3276 }, { "epoch": 0.37, "learning_rate": 0.00014454087921363416, "loss": 0.685, "step": 3277 }, { "epoch": 0.37, "learning_rate": 0.00014450791681355863, "loss": 0.679, "step": 3278 }, { "epoch": 0.37, "learning_rate": 0.00014447494838189422, "loss": 0.6529, "step": 3279 }, { "epoch": 0.37, "learning_rate": 0.00014444197392310875, "loss": 0.648, "step": 3280 }, { "epoch": 0.37, "learning_rate": 0.00014440899344167078, "loss": 0.7275, "step": 3281 }, { "epoch": 0.37, "learning_rate": 0.00014437600694204981, "loss": 0.6841, "step": 3282 }, { "epoch": 0.37, "learning_rate": 0.000144343014428716, "loss": 0.7401, "step": 3283 }, { "epoch": 0.37, "learning_rate": 0.0001443100159061404, "loss": 0.7067, "step": 3284 }, { "epoch": 0.37, "learning_rate": 0.00014427701137879493, "loss": 0.6647, "step": 3285 }, { "epoch": 0.37, "learning_rate": 0.0001442440008511523, "loss": 0.6209, "step": 3286 }, { "epoch": 0.37, "learning_rate": 0.0001442109843276859, "loss": 0.6876, "step": 3287 }, { "epoch": 0.37, "learning_rate": 0.0001441779618128701, "loss": 0.6801, "step": 3288 }, { "epoch": 0.37, "learning_rate": 0.00014414493331118004, "loss": 0.6656, "step": 3289 }, { "epoch": 0.37, "learning_rate": 0.0001441118988270916, "loss": 0.6848, "step": 3290 }, { "epoch": 0.37, "learning_rate": 0.00014407885836508158, "loss": 0.6753, "step": 3291 }, { "epoch": 0.37, "learning_rate": 0.00014404581192962743, "loss": 0.6873, "step": 3292 }, { "epoch": 0.37, "learning_rate": 0.0001440127595252076, "loss": 0.6804, "step": 3293 }, { "epoch": 0.37, "learning_rate": 0.00014397970115630128, "loss": 0.6986, "step": 3294 }, { "epoch": 0.37, "learning_rate": 0.00014394663682738837, "loss": 0.7396, "step": 3295 }, { "epoch": 0.37, "learning_rate": 0.0001439135665429497, "loss": 0.7032, "step": 3296 }, { "epoch": 0.37, "learning_rate": 0.00014388049030746687, "loss": 0.7086, "step": 3297 }, { "epoch": 0.37, "learning_rate": 0.00014384740812542225, "loss": 0.6433, "step": 3298 }, { "epoch": 0.37, "learning_rate": 0.000143814320001299, "loss": 0.7697, "step": 3299 }, { "epoch": 0.38, "learning_rate": 0.00014378122593958125, "loss": 0.7288, "step": 3300 }, { "epoch": 0.38, "learning_rate": 0.00014374812594475372, "loss": 0.6357, "step": 3301 }, { "epoch": 0.38, "learning_rate": 0.0001437150200213021, "loss": 0.7244, "step": 3302 }, { "epoch": 0.38, "learning_rate": 0.00014368190817371274, "loss": 0.7097, "step": 3303 }, { "epoch": 0.38, "learning_rate": 0.00014364879040647293, "loss": 0.6397, "step": 3304 }, { "epoch": 0.38, "learning_rate": 0.00014361566672407066, "loss": 0.6763, "step": 3305 }, { "epoch": 0.38, "learning_rate": 0.00014358253713099475, "loss": 0.7178, "step": 3306 }, { "epoch": 0.38, "learning_rate": 0.00014354940163173485, "loss": 0.7151, "step": 3307 }, { "epoch": 0.38, "learning_rate": 0.0001435162602307814, "loss": 0.7046, "step": 3308 }, { "epoch": 0.38, "learning_rate": 0.0001434831129326256, "loss": 0.6914, "step": 3309 }, { "epoch": 0.38, "learning_rate": 0.0001434499597417595, "loss": 0.6422, "step": 3310 }, { "epoch": 0.38, "learning_rate": 0.00014341680066267597, "loss": 0.6226, "step": 3311 }, { "epoch": 0.38, "learning_rate": 0.00014338363569986852, "loss": 0.8043, "step": 3312 }, { "epoch": 0.38, "learning_rate": 0.00014335046485783169, "loss": 0.7256, "step": 3313 }, { "epoch": 0.38, "learning_rate": 0.00014331728814106064, "loss": 0.6689, "step": 3314 }, { "epoch": 0.38, "learning_rate": 0.0001432841055540514, "loss": 0.6993, "step": 3315 }, { "epoch": 0.38, "learning_rate": 0.00014325091710130078, "loss": 0.6783, "step": 3316 }, { "epoch": 0.38, "learning_rate": 0.00014321772278730641, "loss": 0.7094, "step": 3317 }, { "epoch": 0.38, "learning_rate": 0.00014318452261656664, "loss": 0.7022, "step": 3318 }, { "epoch": 0.38, "learning_rate": 0.00014315131659358072, "loss": 0.6948, "step": 3319 }, { "epoch": 0.38, "learning_rate": 0.0001431181047228486, "loss": 0.7108, "step": 3320 }, { "epoch": 0.38, "learning_rate": 0.00014308488700887109, "loss": 0.6388, "step": 3321 }, { "epoch": 0.38, "learning_rate": 0.00014305166345614972, "loss": 0.6989, "step": 3322 }, { "epoch": 0.38, "learning_rate": 0.0001430184340691869, "loss": 0.6994, "step": 3323 }, { "epoch": 0.38, "learning_rate": 0.00014298519885248573, "loss": 0.6287, "step": 3324 }, { "epoch": 0.38, "learning_rate": 0.00014295195781055019, "loss": 0.6238, "step": 3325 }, { "epoch": 0.38, "learning_rate": 0.00014291871094788503, "loss": 0.698, "step": 3326 }, { "epoch": 0.38, "learning_rate": 0.00014288545826899573, "loss": 0.6939, "step": 3327 }, { "epoch": 0.38, "learning_rate": 0.00014285219977838864, "loss": 0.7319, "step": 3328 }, { "epoch": 0.38, "learning_rate": 0.00014281893548057084, "loss": 0.7018, "step": 3329 }, { "epoch": 0.38, "learning_rate": 0.0001427856653800502, "loss": 0.7682, "step": 3330 }, { "epoch": 0.38, "learning_rate": 0.00014275238948133543, "loss": 0.7014, "step": 3331 }, { "epoch": 0.38, "learning_rate": 0.00014271910778893593, "loss": 0.6193, "step": 3332 }, { "epoch": 0.38, "learning_rate": 0.000142685820307362, "loss": 0.6679, "step": 3333 }, { "epoch": 0.38, "learning_rate": 0.00014265252704112464, "loss": 0.7101, "step": 3334 }, { "epoch": 0.38, "learning_rate": 0.00014261922799473564, "loss": 0.6844, "step": 3335 }, { "epoch": 0.38, "learning_rate": 0.00014258592317270764, "loss": 0.6187, "step": 3336 }, { "epoch": 0.38, "learning_rate": 0.00014255261257955398, "loss": 0.6676, "step": 3337 }, { "epoch": 0.38, "learning_rate": 0.00014251929621978885, "loss": 0.6359, "step": 3338 }, { "epoch": 0.38, "learning_rate": 0.00014248597409792719, "loss": 0.686, "step": 3339 }, { "epoch": 0.38, "learning_rate": 0.00014245264621848467, "loss": 0.7127, "step": 3340 }, { "epoch": 0.38, "learning_rate": 0.0001424193125859778, "loss": 0.7195, "step": 3341 }, { "epoch": 0.38, "learning_rate": 0.00014238597320492393, "loss": 0.6629, "step": 3342 }, { "epoch": 0.38, "learning_rate": 0.00014235262807984106, "loss": 0.6504, "step": 3343 }, { "epoch": 0.38, "learning_rate": 0.00014231927721524803, "loss": 0.6774, "step": 3344 }, { "epoch": 0.38, "learning_rate": 0.0001422859206156645, "loss": 0.6456, "step": 3345 }, { "epoch": 0.38, "learning_rate": 0.00014225255828561082, "loss": 0.7609, "step": 3346 }, { "epoch": 0.38, "learning_rate": 0.00014221919022960818, "loss": 0.7273, "step": 3347 }, { "epoch": 0.38, "learning_rate": 0.0001421858164521785, "loss": 0.6705, "step": 3348 }, { "epoch": 0.38, "learning_rate": 0.00014215243695784452, "loss": 0.5798, "step": 3349 }, { "epoch": 0.38, "learning_rate": 0.00014211905175112976, "loss": 0.6591, "step": 3350 }, { "epoch": 0.38, "learning_rate": 0.00014208566083655845, "loss": 0.6498, "step": 3351 }, { "epoch": 0.38, "learning_rate": 0.00014205226421865565, "loss": 0.6391, "step": 3352 }, { "epoch": 0.38, "learning_rate": 0.0001420188619019472, "loss": 0.7164, "step": 3353 }, { "epoch": 0.38, "learning_rate": 0.00014198545389095967, "loss": 0.6988, "step": 3354 }, { "epoch": 0.38, "learning_rate": 0.00014195204019022039, "loss": 0.6646, "step": 3355 }, { "epoch": 0.38, "learning_rate": 0.00014191862080425752, "loss": 0.6877, "step": 3356 }, { "epoch": 0.38, "learning_rate": 0.0001418851957376, "loss": 0.7302, "step": 3357 }, { "epoch": 0.38, "learning_rate": 0.00014185176499477743, "loss": 0.75, "step": 3358 }, { "epoch": 0.38, "learning_rate": 0.0001418183285803203, "loss": 0.7515, "step": 3359 }, { "epoch": 0.38, "learning_rate": 0.00014178488649875976, "loss": 0.6402, "step": 3360 }, { "epoch": 0.38, "learning_rate": 0.00014175143875462786, "loss": 0.7098, "step": 3361 }, { "epoch": 0.38, "learning_rate": 0.00014171798535245731, "loss": 0.6702, "step": 3362 }, { "epoch": 0.38, "learning_rate": 0.00014168452629678165, "loss": 0.6605, "step": 3363 }, { "epoch": 0.38, "learning_rate": 0.00014165106159213514, "loss": 0.6931, "step": 3364 }, { "epoch": 0.38, "learning_rate": 0.0001416175912430528, "loss": 0.6947, "step": 3365 }, { "epoch": 0.38, "learning_rate": 0.00014158411525407044, "loss": 0.6875, "step": 3366 }, { "epoch": 0.38, "learning_rate": 0.00014155063362972467, "loss": 0.7005, "step": 3367 }, { "epoch": 0.38, "learning_rate": 0.00014151714637455283, "loss": 0.6818, "step": 3368 }, { "epoch": 0.38, "learning_rate": 0.00014148365349309297, "loss": 0.6976, "step": 3369 }, { "epoch": 0.38, "learning_rate": 0.000141450154989884, "loss": 0.6893, "step": 3370 }, { "epoch": 0.38, "learning_rate": 0.0001414166508694655, "loss": 0.7216, "step": 3371 }, { "epoch": 0.38, "learning_rate": 0.00014138314113637786, "loss": 0.6984, "step": 3372 }, { "epoch": 0.38, "learning_rate": 0.00014134962579516228, "loss": 0.6165, "step": 3373 }, { "epoch": 0.38, "learning_rate": 0.00014131610485036063, "loss": 0.6672, "step": 3374 }, { "epoch": 0.38, "learning_rate": 0.00014128257830651556, "loss": 0.6953, "step": 3375 }, { "epoch": 0.38, "learning_rate": 0.0001412490461681705, "loss": 0.6553, "step": 3376 }, { "epoch": 0.38, "learning_rate": 0.00014121550843986967, "loss": 0.7104, "step": 3377 }, { "epoch": 0.38, "learning_rate": 0.00014118196512615794, "loss": 0.7081, "step": 3378 }, { "epoch": 0.38, "learning_rate": 0.0001411484162315811, "loss": 0.6911, "step": 3379 }, { "epoch": 0.38, "learning_rate": 0.00014111486176068548, "loss": 0.635, "step": 3380 }, { "epoch": 0.38, "learning_rate": 0.0001410813017180184, "loss": 0.6394, "step": 3381 }, { "epoch": 0.38, "learning_rate": 0.00014104773610812776, "loss": 0.6714, "step": 3382 }, { "epoch": 0.38, "learning_rate": 0.0001410141649355623, "loss": 0.6905, "step": 3383 }, { "epoch": 0.38, "learning_rate": 0.0001409805882048715, "loss": 0.6542, "step": 3384 }, { "epoch": 0.38, "learning_rate": 0.0001409470059206056, "loss": 0.6516, "step": 3385 }, { "epoch": 0.38, "learning_rate": 0.0001409134180873155, "loss": 0.6899, "step": 3386 }, { "epoch": 0.38, "learning_rate": 0.000140879824709553, "loss": 0.6824, "step": 3387 }, { "epoch": 0.39, "learning_rate": 0.00014084622579187058, "loss": 0.6651, "step": 3388 }, { "epoch": 0.39, "learning_rate": 0.00014081262133882144, "loss": 0.6703, "step": 3389 }, { "epoch": 0.39, "learning_rate": 0.0001407790113549596, "loss": 0.6863, "step": 3390 }, { "epoch": 0.39, "learning_rate": 0.00014074539584483974, "loss": 0.6592, "step": 3391 }, { "epoch": 0.39, "learning_rate": 0.0001407117748130174, "loss": 0.7382, "step": 3392 }, { "epoch": 0.39, "learning_rate": 0.00014067814826404873, "loss": 0.6328, "step": 3393 }, { "epoch": 0.39, "learning_rate": 0.0001406445162024908, "loss": 0.7332, "step": 3394 }, { "epoch": 0.39, "learning_rate": 0.00014061087863290124, "loss": 0.6766, "step": 3395 }, { "epoch": 0.39, "learning_rate": 0.0001405772355598386, "loss": 0.7012, "step": 3396 }, { "epoch": 0.39, "learning_rate": 0.00014054358698786204, "loss": 0.6866, "step": 3397 }, { "epoch": 0.39, "learning_rate": 0.0001405099329215316, "loss": 0.6641, "step": 3398 }, { "epoch": 0.39, "learning_rate": 0.00014047627336540784, "loss": 0.7029, "step": 3399 }, { "epoch": 0.39, "learning_rate": 0.00014044260832405233, "loss": 0.7163, "step": 3400 }, { "epoch": 0.39, "learning_rate": 0.00014040893780202724, "loss": 0.6165, "step": 3401 }, { "epoch": 0.39, "learning_rate": 0.0001403752618038955, "loss": 0.6468, "step": 3402 }, { "epoch": 0.39, "learning_rate": 0.00014034158033422077, "loss": 0.6852, "step": 3403 }, { "epoch": 0.39, "learning_rate": 0.00014030789339756748, "loss": 0.6589, "step": 3404 }, { "epoch": 0.39, "learning_rate": 0.00014027420099850085, "loss": 0.7007, "step": 3405 }, { "epoch": 0.39, "learning_rate": 0.00014024050314158663, "loss": 0.6632, "step": 3406 }, { "epoch": 0.39, "learning_rate": 0.00014020679983139158, "loss": 0.5725, "step": 3407 }, { "epoch": 0.39, "learning_rate": 0.00014017309107248308, "loss": 0.7249, "step": 3408 }, { "epoch": 0.39, "learning_rate": 0.0001401393768694292, "loss": 0.6882, "step": 3409 }, { "epoch": 0.39, "learning_rate": 0.00014010565722679877, "loss": 0.6959, "step": 3410 }, { "epoch": 0.39, "learning_rate": 0.00014007193214916148, "loss": 0.6782, "step": 3411 }, { "epoch": 0.39, "learning_rate": 0.00014003820164108758, "loss": 0.736, "step": 3412 }, { "epoch": 0.39, "learning_rate": 0.0001400044657071482, "loss": 0.7064, "step": 3413 }, { "epoch": 0.39, "learning_rate": 0.00013997072435191504, "loss": 0.7152, "step": 3414 }, { "epoch": 0.39, "learning_rate": 0.0001399369775799607, "loss": 0.6771, "step": 3415 }, { "epoch": 0.39, "learning_rate": 0.00013990322539585842, "loss": 0.6729, "step": 3416 }, { "epoch": 0.39, "learning_rate": 0.00013986946780418226, "loss": 0.6638, "step": 3417 }, { "epoch": 0.39, "learning_rate": 0.00013983570480950686, "loss": 0.6279, "step": 3418 }, { "epoch": 0.39, "learning_rate": 0.00013980193641640782, "loss": 0.6559, "step": 3419 }, { "epoch": 0.39, "learning_rate": 0.00013976816262946122, "loss": 0.6764, "step": 3420 }, { "epoch": 0.39, "learning_rate": 0.00013973438345324404, "loss": 0.7102, "step": 3421 }, { "epoch": 0.39, "learning_rate": 0.0001397005988923339, "loss": 0.7274, "step": 3422 }, { "epoch": 0.39, "learning_rate": 0.00013966680895130925, "loss": 0.7318, "step": 3423 }, { "epoch": 0.39, "learning_rate": 0.00013963301363474916, "loss": 0.7008, "step": 3424 }, { "epoch": 0.39, "learning_rate": 0.00013959921294723354, "loss": 0.6577, "step": 3425 }, { "epoch": 0.39, "learning_rate": 0.00013956540689334285, "loss": 0.6827, "step": 3426 }, { "epoch": 0.39, "learning_rate": 0.0001395315954776585, "loss": 0.718, "step": 3427 }, { "epoch": 0.39, "learning_rate": 0.0001394977787047625, "loss": 0.6919, "step": 3428 }, { "epoch": 0.39, "learning_rate": 0.00013946395657923758, "loss": 0.651, "step": 3429 }, { "epoch": 0.39, "learning_rate": 0.0001394301291056672, "loss": 0.6507, "step": 3430 }, { "epoch": 0.39, "learning_rate": 0.00013939629628863563, "loss": 0.6756, "step": 3431 }, { "epoch": 0.39, "learning_rate": 0.00013936245813272772, "loss": 0.6334, "step": 3432 }, { "epoch": 0.39, "learning_rate": 0.0001393286146425292, "loss": 0.6941, "step": 3433 }, { "epoch": 0.39, "learning_rate": 0.00013929476582262638, "loss": 0.6747, "step": 3434 }, { "epoch": 0.39, "learning_rate": 0.0001392609116776064, "loss": 0.6477, "step": 3435 }, { "epoch": 0.39, "learning_rate": 0.00013922705221205707, "loss": 0.6706, "step": 3436 }, { "epoch": 0.39, "learning_rate": 0.00013919318743056694, "loss": 0.6174, "step": 3437 }, { "epoch": 0.39, "learning_rate": 0.00013915931733772522, "loss": 0.6666, "step": 3438 }, { "epoch": 0.39, "learning_rate": 0.00013912544193812196, "loss": 0.6324, "step": 3439 }, { "epoch": 0.39, "learning_rate": 0.0001390915612363478, "loss": 0.6512, "step": 3440 }, { "epoch": 0.39, "learning_rate": 0.0001390576752369942, "loss": 0.7226, "step": 3441 }, { "epoch": 0.39, "learning_rate": 0.0001390237839446533, "loss": 0.6538, "step": 3442 }, { "epoch": 0.39, "learning_rate": 0.00013898988736391792, "loss": 0.6508, "step": 3443 }, { "epoch": 0.39, "learning_rate": 0.00013895598549938166, "loss": 0.6887, "step": 3444 }, { "epoch": 0.39, "learning_rate": 0.00013892207835563875, "loss": 0.6751, "step": 3445 }, { "epoch": 0.39, "learning_rate": 0.00013888816593728427, "loss": 0.7586, "step": 3446 }, { "epoch": 0.39, "learning_rate": 0.0001388542482489139, "loss": 0.6294, "step": 3447 }, { "epoch": 0.39, "learning_rate": 0.00013882032529512406, "loss": 0.7008, "step": 3448 }, { "epoch": 0.39, "learning_rate": 0.0001387863970805119, "loss": 0.7557, "step": 3449 }, { "epoch": 0.39, "learning_rate": 0.0001387524636096753, "loss": 0.6969, "step": 3450 }, { "epoch": 0.39, "learning_rate": 0.0001387185248872128, "loss": 0.6715, "step": 3451 }, { "epoch": 0.39, "learning_rate": 0.0001386845809177237, "loss": 0.7477, "step": 3452 }, { "epoch": 0.39, "learning_rate": 0.00013865063170580798, "loss": 0.7055, "step": 3453 }, { "epoch": 0.39, "learning_rate": 0.00013861667725606635, "loss": 0.729, "step": 3454 }, { "epoch": 0.39, "learning_rate": 0.00013858271757310022, "loss": 0.6883, "step": 3455 }, { "epoch": 0.39, "learning_rate": 0.0001385487526615117, "loss": 0.6644, "step": 3456 }, { "epoch": 0.39, "learning_rate": 0.00013851478252590365, "loss": 0.599, "step": 3457 }, { "epoch": 0.39, "learning_rate": 0.00013848080717087958, "loss": 0.6605, "step": 3458 }, { "epoch": 0.39, "learning_rate": 0.00013844682660104377, "loss": 0.74, "step": 3459 }, { "epoch": 0.39, "learning_rate": 0.0001384128408210011, "loss": 0.6983, "step": 3460 }, { "epoch": 0.39, "learning_rate": 0.0001383788498353573, "loss": 0.6847, "step": 3461 }, { "epoch": 0.39, "learning_rate": 0.00013834485364871873, "loss": 0.6751, "step": 3462 }, { "epoch": 0.39, "learning_rate": 0.0001383108522656924, "loss": 0.6857, "step": 3463 }, { "epoch": 0.39, "learning_rate": 0.00013827684569088614, "loss": 0.7, "step": 3464 }, { "epoch": 0.39, "learning_rate": 0.00013824283392890839, "loss": 0.6456, "step": 3465 }, { "epoch": 0.39, "learning_rate": 0.00013820881698436836, "loss": 0.606, "step": 3466 }, { "epoch": 0.39, "learning_rate": 0.0001381747948618759, "loss": 0.6539, "step": 3467 }, { "epoch": 0.39, "learning_rate": 0.00013814076756604165, "loss": 0.7006, "step": 3468 }, { "epoch": 0.39, "learning_rate": 0.00013810673510147682, "loss": 0.6878, "step": 3469 }, { "epoch": 0.39, "learning_rate": 0.00013807269747279346, "loss": 0.6783, "step": 3470 }, { "epoch": 0.39, "learning_rate": 0.00013803865468460419, "loss": 0.6165, "step": 3471 }, { "epoch": 0.39, "learning_rate": 0.00013800460674152245, "loss": 0.6407, "step": 3472 }, { "epoch": 0.39, "learning_rate": 0.00013797055364816232, "loss": 0.6645, "step": 3473 }, { "epoch": 0.39, "learning_rate": 0.0001379364954091385, "loss": 0.6969, "step": 3474 }, { "epoch": 0.39, "learning_rate": 0.0001379024320290666, "loss": 0.7155, "step": 3475 }, { "epoch": 0.4, "learning_rate": 0.0001378683635125627, "loss": 0.6761, "step": 3476 }, { "epoch": 0.4, "learning_rate": 0.00013783428986424365, "loss": 0.7355, "step": 3477 }, { "epoch": 0.4, "learning_rate": 0.0001378002110887271, "loss": 0.688, "step": 3478 }, { "epoch": 0.4, "learning_rate": 0.00013776612719063126, "loss": 0.712, "step": 3479 }, { "epoch": 0.4, "learning_rate": 0.0001377320381745751, "loss": 0.6385, "step": 3480 }, { "epoch": 0.4, "learning_rate": 0.00013769794404517826, "loss": 0.6368, "step": 3481 }, { "epoch": 0.4, "learning_rate": 0.00013766384480706108, "loss": 0.6524, "step": 3482 }, { "epoch": 0.4, "learning_rate": 0.0001376297404648446, "loss": 0.6753, "step": 3483 }, { "epoch": 0.4, "learning_rate": 0.00013759563102315055, "loss": 0.7734, "step": 3484 }, { "epoch": 0.4, "learning_rate": 0.00013756151648660134, "loss": 0.7519, "step": 3485 }, { "epoch": 0.4, "learning_rate": 0.00013752739685982007, "loss": 0.6762, "step": 3486 }, { "epoch": 0.4, "learning_rate": 0.00013749327214743055, "loss": 0.7223, "step": 3487 }, { "epoch": 0.4, "learning_rate": 0.00013745914235405727, "loss": 0.7135, "step": 3488 }, { "epoch": 0.4, "learning_rate": 0.00013742500748432538, "loss": 0.6931, "step": 3489 }, { "epoch": 0.4, "learning_rate": 0.00013739086754286078, "loss": 0.7251, "step": 3490 }, { "epoch": 0.4, "learning_rate": 0.00013735672253428996, "loss": 0.6701, "step": 3491 }, { "epoch": 0.4, "learning_rate": 0.0001373225724632402, "loss": 0.6562, "step": 3492 }, { "epoch": 0.4, "learning_rate": 0.00013728841733433943, "loss": 0.7248, "step": 3493 }, { "epoch": 0.4, "learning_rate": 0.00013725425715221625, "loss": 0.7288, "step": 3494 }, { "epoch": 0.4, "learning_rate": 0.00013722009192149992, "loss": 0.6812, "step": 3495 }, { "epoch": 0.4, "learning_rate": 0.00013718592164682045, "loss": 0.6846, "step": 3496 }, { "epoch": 0.4, "learning_rate": 0.0001371517463328085, "loss": 0.6988, "step": 3497 }, { "epoch": 0.4, "learning_rate": 0.0001371175659840954, "loss": 0.6741, "step": 3498 }, { "epoch": 0.4, "learning_rate": 0.00013708338060531322, "loss": 0.6568, "step": 3499 }, { "epoch": 0.4, "learning_rate": 0.00013704919020109457, "loss": 0.7035, "step": 3500 }, { "epoch": 0.4, "learning_rate": 0.0001370149947760729, "loss": 0.6954, "step": 3501 }, { "epoch": 0.4, "learning_rate": 0.00013698079433488233, "loss": 0.7093, "step": 3502 }, { "epoch": 0.4, "learning_rate": 0.00013694658888215754, "loss": 0.7267, "step": 3503 }, { "epoch": 0.4, "learning_rate": 0.00013691237842253394, "loss": 0.6965, "step": 3504 }, { "epoch": 0.4, "learning_rate": 0.00013687816296064772, "loss": 0.686, "step": 3505 }, { "epoch": 0.4, "learning_rate": 0.00013684394250113559, "loss": 0.6587, "step": 3506 }, { "epoch": 0.4, "learning_rate": 0.00013680971704863504, "loss": 0.6928, "step": 3507 }, { "epoch": 0.4, "learning_rate": 0.00013677548660778415, "loss": 0.7118, "step": 3508 }, { "epoch": 0.4, "learning_rate": 0.00013674125118322186, "loss": 0.7254, "step": 3509 }, { "epoch": 0.4, "learning_rate": 0.00013670701077958755, "loss": 0.7046, "step": 3510 }, { "epoch": 0.4, "learning_rate": 0.00013667276540152144, "loss": 0.69, "step": 3511 }, { "epoch": 0.4, "learning_rate": 0.00013663851505366428, "loss": 0.667, "step": 3512 }, { "epoch": 0.4, "learning_rate": 0.00013660425974065774, "loss": 0.6295, "step": 3513 }, { "epoch": 0.4, "learning_rate": 0.00013656999946714388, "loss": 0.6946, "step": 3514 }, { "epoch": 0.4, "learning_rate": 0.00013653573423776555, "loss": 0.7178, "step": 3515 }, { "epoch": 0.4, "learning_rate": 0.0001365014640571664, "loss": 0.5978, "step": 3516 }, { "epoch": 0.4, "learning_rate": 0.00013646718892999047, "loss": 0.7127, "step": 3517 }, { "epoch": 0.4, "learning_rate": 0.00013643290886088276, "loss": 0.7469, "step": 3518 }, { "epoch": 0.4, "learning_rate": 0.00013639862385448872, "loss": 0.6958, "step": 3519 }, { "epoch": 0.4, "learning_rate": 0.00013636433391545462, "loss": 0.6108, "step": 3520 }, { "epoch": 0.4, "learning_rate": 0.00013633003904842732, "loss": 0.7253, "step": 3521 }, { "epoch": 0.4, "learning_rate": 0.00013629573925805436, "loss": 0.6695, "step": 3522 }, { "epoch": 0.4, "learning_rate": 0.00013626143454898392, "loss": 0.6929, "step": 3523 }, { "epoch": 0.4, "learning_rate": 0.00013622712492586492, "loss": 0.6145, "step": 3524 }, { "epoch": 0.4, "learning_rate": 0.00013619281039334692, "loss": 0.6646, "step": 3525 }, { "epoch": 0.4, "learning_rate": 0.00013615849095608006, "loss": 0.7097, "step": 3526 }, { "epoch": 0.4, "learning_rate": 0.00013612416661871533, "loss": 0.6909, "step": 3527 }, { "epoch": 0.4, "learning_rate": 0.00013608983738590413, "loss": 0.6758, "step": 3528 }, { "epoch": 0.4, "learning_rate": 0.00013605550326229872, "loss": 0.7687, "step": 3529 }, { "epoch": 0.4, "learning_rate": 0.00013602116425255202, "loss": 0.6513, "step": 3530 }, { "epoch": 0.4, "learning_rate": 0.0001359868203613175, "loss": 0.6862, "step": 3531 }, { "epoch": 0.4, "learning_rate": 0.00013595247159324934, "loss": 0.6201, "step": 3532 }, { "epoch": 0.4, "learning_rate": 0.0001359181179530024, "loss": 0.6633, "step": 3533 }, { "epoch": 0.4, "learning_rate": 0.00013588375944523223, "loss": 0.6438, "step": 3534 }, { "epoch": 0.4, "learning_rate": 0.00013584939607459495, "loss": 0.6405, "step": 3535 }, { "epoch": 0.4, "learning_rate": 0.00013581502784574742, "loss": 0.6747, "step": 3536 }, { "epoch": 0.4, "learning_rate": 0.0001357806547633471, "loss": 0.7128, "step": 3537 }, { "epoch": 0.4, "learning_rate": 0.00013574627683205214, "loss": 0.6869, "step": 3538 }, { "epoch": 0.4, "learning_rate": 0.00013571189405652136, "loss": 0.6971, "step": 3539 }, { "epoch": 0.4, "learning_rate": 0.0001356775064414142, "loss": 0.718, "step": 3540 }, { "epoch": 0.4, "learning_rate": 0.00013564311399139075, "loss": 0.7187, "step": 3541 }, { "epoch": 0.4, "learning_rate": 0.00013560871671111183, "loss": 0.7139, "step": 3542 }, { "epoch": 0.4, "learning_rate": 0.00013557431460523887, "loss": 0.6954, "step": 3543 }, { "epoch": 0.4, "learning_rate": 0.00013553990767843388, "loss": 0.7085, "step": 3544 }, { "epoch": 0.4, "learning_rate": 0.00013550549593535963, "loss": 0.7164, "step": 3545 }, { "epoch": 0.4, "learning_rate": 0.0001354710793806795, "loss": 0.7127, "step": 3546 }, { "epoch": 0.4, "learning_rate": 0.00013543665801905757, "loss": 0.6472, "step": 3547 }, { "epoch": 0.4, "learning_rate": 0.00013540223185515846, "loss": 0.6902, "step": 3548 }, { "epoch": 0.4, "learning_rate": 0.00013536780089364752, "loss": 0.6499, "step": 3549 }, { "epoch": 0.4, "learning_rate": 0.0001353333651391908, "loss": 0.6349, "step": 3550 }, { "epoch": 0.4, "learning_rate": 0.00013529892459645482, "loss": 0.6213, "step": 3551 }, { "epoch": 0.4, "learning_rate": 0.00013526447927010698, "loss": 0.6325, "step": 3552 }, { "epoch": 0.4, "learning_rate": 0.0001352300291648152, "loss": 0.6915, "step": 3553 }, { "epoch": 0.4, "learning_rate": 0.00013519557428524797, "loss": 0.7329, "step": 3554 }, { "epoch": 0.4, "learning_rate": 0.0001351611146360746, "loss": 0.6533, "step": 3555 }, { "epoch": 0.4, "learning_rate": 0.00013512665022196498, "loss": 0.7419, "step": 3556 }, { "epoch": 0.4, "learning_rate": 0.00013509218104758959, "loss": 0.642, "step": 3557 }, { "epoch": 0.4, "learning_rate": 0.00013505770711761956, "loss": 0.6513, "step": 3558 }, { "epoch": 0.4, "learning_rate": 0.0001350232284367268, "loss": 0.7367, "step": 3559 }, { "epoch": 0.4, "learning_rate": 0.00013498874500958368, "loss": 0.7011, "step": 3560 }, { "epoch": 0.4, "learning_rate": 0.00013495425684086334, "loss": 0.6686, "step": 3561 }, { "epoch": 0.4, "learning_rate": 0.0001349197639352395, "loss": 0.6789, "step": 3562 }, { "epoch": 0.4, "learning_rate": 0.00013488526629738655, "loss": 0.6839, "step": 3563 }, { "epoch": 0.41, "learning_rate": 0.00013485076393197955, "loss": 0.6463, "step": 3564 }, { "epoch": 0.41, "learning_rate": 0.0001348162568436941, "loss": 0.6794, "step": 3565 }, { "epoch": 0.41, "learning_rate": 0.00013478174503720654, "loss": 0.6959, "step": 3566 }, { "epoch": 0.41, "learning_rate": 0.0001347472285171938, "loss": 0.6388, "step": 3567 }, { "epoch": 0.41, "learning_rate": 0.00013471270728833347, "loss": 0.5999, "step": 3568 }, { "epoch": 0.41, "learning_rate": 0.0001346781813553038, "loss": 0.6783, "step": 3569 }, { "epoch": 0.41, "learning_rate": 0.0001346436507227836, "loss": 0.6225, "step": 3570 }, { "epoch": 0.41, "learning_rate": 0.0001346091153954524, "loss": 0.6609, "step": 3571 }, { "epoch": 0.41, "learning_rate": 0.00013457457537799025, "loss": 0.7231, "step": 3572 }, { "epoch": 0.41, "learning_rate": 0.00013454003067507806, "loss": 0.7263, "step": 3573 }, { "epoch": 0.41, "learning_rate": 0.00013450548129139713, "loss": 0.6859, "step": 3574 }, { "epoch": 0.41, "learning_rate": 0.00013447092723162954, "loss": 0.6728, "step": 3575 }, { "epoch": 0.41, "learning_rate": 0.00013443636850045794, "loss": 0.7135, "step": 3576 }, { "epoch": 0.41, "learning_rate": 0.0001344018051025656, "loss": 0.6514, "step": 3577 }, { "epoch": 0.41, "learning_rate": 0.0001343672370426365, "loss": 0.7069, "step": 3578 }, { "epoch": 0.41, "learning_rate": 0.0001343326643253552, "loss": 0.7484, "step": 3579 }, { "epoch": 0.41, "learning_rate": 0.0001342980869554069, "loss": 0.6928, "step": 3580 }, { "epoch": 0.41, "learning_rate": 0.00013426350493747744, "loss": 0.6817, "step": 3581 }, { "epoch": 0.41, "learning_rate": 0.00013422891827625326, "loss": 0.661, "step": 3582 }, { "epoch": 0.41, "learning_rate": 0.0001341943269764214, "loss": 0.6825, "step": 3583 }, { "epoch": 0.41, "learning_rate": 0.0001341597310426697, "loss": 0.7066, "step": 3584 }, { "epoch": 0.41, "learning_rate": 0.0001341251304796864, "loss": 0.7074, "step": 3585 }, { "epoch": 0.41, "learning_rate": 0.0001340905252921605, "loss": 0.7262, "step": 3586 }, { "epoch": 0.41, "learning_rate": 0.00013405591548478163, "loss": 0.6624, "step": 3587 }, { "epoch": 0.41, "learning_rate": 0.00013402130106223993, "loss": 0.7039, "step": 3588 }, { "epoch": 0.41, "learning_rate": 0.00013398668202922636, "loss": 0.6784, "step": 3589 }, { "epoch": 0.41, "learning_rate": 0.00013395205839043234, "loss": 0.6829, "step": 3590 }, { "epoch": 0.41, "learning_rate": 0.00013391743015054994, "loss": 0.7352, "step": 3591 }, { "epoch": 0.41, "learning_rate": 0.00013388279731427191, "loss": 0.6476, "step": 3592 }, { "epoch": 0.41, "learning_rate": 0.0001338481598862916, "loss": 0.6923, "step": 3593 }, { "epoch": 0.41, "learning_rate": 0.000133813517871303, "loss": 0.646, "step": 3594 }, { "epoch": 0.41, "learning_rate": 0.00013377887127400065, "loss": 0.6991, "step": 3595 }, { "epoch": 0.41, "learning_rate": 0.00013374422009907984, "loss": 0.7243, "step": 3596 }, { "epoch": 0.41, "learning_rate": 0.0001337095643512363, "loss": 0.6552, "step": 3597 }, { "epoch": 0.41, "learning_rate": 0.00013367490403516655, "loss": 0.6594, "step": 3598 }, { "epoch": 0.41, "learning_rate": 0.00013364023915556764, "loss": 0.7681, "step": 3599 }, { "epoch": 0.41, "learning_rate": 0.00013360556971713723, "loss": 0.7046, "step": 3600 }, { "epoch": 0.41, "learning_rate": 0.00013357089572457365, "loss": 0.675, "step": 3601 }, { "epoch": 0.41, "learning_rate": 0.00013353621718257584, "loss": 0.7279, "step": 3602 }, { "epoch": 0.41, "learning_rate": 0.00013350153409584333, "loss": 0.7332, "step": 3603 }, { "epoch": 0.41, "learning_rate": 0.00013346684646907625, "loss": 0.7382, "step": 3604 }, { "epoch": 0.41, "learning_rate": 0.0001334321543069754, "loss": 0.6027, "step": 3605 }, { "epoch": 0.41, "learning_rate": 0.00013339745761424215, "loss": 0.651, "step": 3606 }, { "epoch": 0.41, "learning_rate": 0.0001333627563955785, "loss": 0.6791, "step": 3607 }, { "epoch": 0.41, "learning_rate": 0.00013332805065568708, "loss": 0.6306, "step": 3608 }, { "epoch": 0.41, "learning_rate": 0.00013329334039927107, "loss": 0.6569, "step": 3609 }, { "epoch": 0.41, "learning_rate": 0.00013325862563103437, "loss": 0.7216, "step": 3610 }, { "epoch": 0.41, "learning_rate": 0.0001332239063556814, "loss": 0.7013, "step": 3611 }, { "epoch": 0.41, "learning_rate": 0.00013318918257791717, "loss": 0.6679, "step": 3612 }, { "epoch": 0.41, "learning_rate": 0.00013315445430244743, "loss": 0.7831, "step": 3613 }, { "epoch": 0.41, "learning_rate": 0.00013311972153397844, "loss": 0.7066, "step": 3614 }, { "epoch": 0.41, "learning_rate": 0.00013308498427721702, "loss": 0.68, "step": 3615 }, { "epoch": 0.41, "learning_rate": 0.00013305024253687075, "loss": 0.6744, "step": 3616 }, { "epoch": 0.41, "learning_rate": 0.0001330154963176477, "loss": 0.7172, "step": 3617 }, { "epoch": 0.41, "learning_rate": 0.0001329807456242566, "loss": 0.6666, "step": 3618 }, { "epoch": 0.41, "learning_rate": 0.00013294599046140672, "loss": 0.6794, "step": 3619 }, { "epoch": 0.41, "learning_rate": 0.00013291123083380803, "loss": 0.7016, "step": 3620 }, { "epoch": 0.41, "learning_rate": 0.00013287646674617107, "loss": 0.7104, "step": 3621 }, { "epoch": 0.41, "learning_rate": 0.00013284169820320692, "loss": 0.7288, "step": 3622 }, { "epoch": 0.41, "learning_rate": 0.00013280692520962732, "loss": 0.6502, "step": 3623 }, { "epoch": 0.41, "learning_rate": 0.00013277214777014464, "loss": 0.6661, "step": 3624 }, { "epoch": 0.41, "learning_rate": 0.0001327373658894718, "loss": 0.6399, "step": 3625 }, { "epoch": 0.41, "learning_rate": 0.00013270257957232238, "loss": 0.6887, "step": 3626 }, { "epoch": 0.41, "learning_rate": 0.0001326677888234105, "loss": 0.6913, "step": 3627 }, { "epoch": 0.41, "learning_rate": 0.0001326329936474509, "loss": 0.6927, "step": 3628 }, { "epoch": 0.41, "learning_rate": 0.00013259819404915892, "loss": 0.6908, "step": 3629 }, { "epoch": 0.41, "learning_rate": 0.00013256339003325053, "loss": 0.6514, "step": 3630 }, { "epoch": 0.41, "learning_rate": 0.00013252858160444224, "loss": 0.6836, "step": 3631 }, { "epoch": 0.41, "learning_rate": 0.0001324937687674512, "loss": 0.6138, "step": 3632 }, { "epoch": 0.41, "learning_rate": 0.0001324589515269952, "loss": 0.6847, "step": 3633 }, { "epoch": 0.41, "learning_rate": 0.0001324241298877925, "loss": 0.6978, "step": 3634 }, { "epoch": 0.41, "learning_rate": 0.00013238930385456204, "loss": 0.7077, "step": 3635 }, { "epoch": 0.41, "learning_rate": 0.0001323544734320234, "loss": 0.7441, "step": 3636 }, { "epoch": 0.41, "learning_rate": 0.0001323196386248967, "loss": 0.7059, "step": 3637 }, { "epoch": 0.41, "learning_rate": 0.00013228479943790258, "loss": 0.7046, "step": 3638 }, { "epoch": 0.41, "learning_rate": 0.00013224995587576244, "loss": 0.6529, "step": 3639 }, { "epoch": 0.41, "learning_rate": 0.0001322151079431981, "loss": 0.6629, "step": 3640 }, { "epoch": 0.41, "learning_rate": 0.00013218025564493212, "loss": 0.7024, "step": 3641 }, { "epoch": 0.41, "learning_rate": 0.00013214539898568755, "loss": 0.6631, "step": 3642 }, { "epoch": 0.41, "learning_rate": 0.0001321105379701881, "loss": 0.7004, "step": 3643 }, { "epoch": 0.41, "learning_rate": 0.000132075672603158, "loss": 0.7003, "step": 3644 }, { "epoch": 0.41, "learning_rate": 0.00013204080288932213, "loss": 0.7266, "step": 3645 }, { "epoch": 0.41, "learning_rate": 0.00013200592883340592, "loss": 0.7639, "step": 3646 }, { "epoch": 0.41, "learning_rate": 0.00013197105044013545, "loss": 0.6469, "step": 3647 }, { "epoch": 0.41, "learning_rate": 0.00013193616771423728, "loss": 0.7112, "step": 3648 }, { "epoch": 0.41, "learning_rate": 0.00013190128066043863, "loss": 0.6864, "step": 3649 }, { "epoch": 0.41, "learning_rate": 0.00013186638928346737, "loss": 0.6517, "step": 3650 }, { "epoch": 0.41, "learning_rate": 0.00013183149358805178, "loss": 0.6864, "step": 3651 }, { "epoch": 0.42, "learning_rate": 0.0001317965935789209, "loss": 0.6886, "step": 3652 }, { "epoch": 0.42, "learning_rate": 0.00013176168926080426, "loss": 0.6944, "step": 3653 }, { "epoch": 0.42, "learning_rate": 0.00013172678063843197, "loss": 0.6698, "step": 3654 }, { "epoch": 0.42, "learning_rate": 0.00013169186771653477, "loss": 0.6836, "step": 3655 }, { "epoch": 0.42, "learning_rate": 0.000131656950499844, "loss": 0.6454, "step": 3656 }, { "epoch": 0.42, "learning_rate": 0.00013162202899309145, "loss": 0.6247, "step": 3657 }, { "epoch": 0.42, "learning_rate": 0.0001315871032010097, "loss": 0.7483, "step": 3658 }, { "epoch": 0.42, "learning_rate": 0.0001315521731283317, "loss": 0.7287, "step": 3659 }, { "epoch": 0.42, "learning_rate": 0.00013151723877979113, "loss": 0.6048, "step": 3660 }, { "epoch": 0.42, "learning_rate": 0.0001314823001601222, "loss": 0.7284, "step": 3661 }, { "epoch": 0.42, "learning_rate": 0.00013144735727405962, "loss": 0.7398, "step": 3662 }, { "epoch": 0.42, "learning_rate": 0.00013141241012633884, "loss": 0.6706, "step": 3663 }, { "epoch": 0.42, "learning_rate": 0.0001313774587216958, "loss": 0.6514, "step": 3664 }, { "epoch": 0.42, "learning_rate": 0.00013134250306486695, "loss": 0.7025, "step": 3665 }, { "epoch": 0.42, "learning_rate": 0.0001313075431605894, "loss": 0.6146, "step": 3666 }, { "epoch": 0.42, "learning_rate": 0.00013127257901360086, "loss": 0.6962, "step": 3667 }, { "epoch": 0.42, "learning_rate": 0.00013123761062863953, "loss": 0.714, "step": 3668 }, { "epoch": 0.42, "learning_rate": 0.00013120263801044425, "loss": 0.6432, "step": 3669 }, { "epoch": 0.42, "learning_rate": 0.00013116766116375445, "loss": 0.7143, "step": 3670 }, { "epoch": 0.42, "learning_rate": 0.00013113268009331001, "loss": 0.7197, "step": 3671 }, { "epoch": 0.42, "learning_rate": 0.00013109769480385155, "loss": 0.7258, "step": 3672 }, { "epoch": 0.42, "learning_rate": 0.00013106270530012013, "loss": 0.7224, "step": 3673 }, { "epoch": 0.42, "learning_rate": 0.0001310277115868574, "loss": 0.6355, "step": 3674 }, { "epoch": 0.42, "learning_rate": 0.0001309927136688057, "loss": 0.7533, "step": 3675 }, { "epoch": 0.42, "learning_rate": 0.0001309577115507078, "loss": 0.7017, "step": 3676 }, { "epoch": 0.42, "learning_rate": 0.0001309227052373071, "loss": 0.6771, "step": 3677 }, { "epoch": 0.42, "learning_rate": 0.0001308876947333475, "loss": 0.669, "step": 3678 }, { "epoch": 0.42, "learning_rate": 0.0001308526800435736, "loss": 0.6246, "step": 3679 }, { "epoch": 0.42, "learning_rate": 0.00013081766117273047, "loss": 0.7101, "step": 3680 }, { "epoch": 0.42, "learning_rate": 0.00013078263812556378, "loss": 0.6288, "step": 3681 }, { "epoch": 0.42, "learning_rate": 0.00013074761090681972, "loss": 0.7252, "step": 3682 }, { "epoch": 0.42, "learning_rate": 0.00013071257952124512, "loss": 0.6713, "step": 3683 }, { "epoch": 0.42, "learning_rate": 0.00013067754397358733, "loss": 0.748, "step": 3684 }, { "epoch": 0.42, "learning_rate": 0.00013064250426859426, "loss": 0.6501, "step": 3685 }, { "epoch": 0.42, "learning_rate": 0.00013060746041101436, "loss": 0.6907, "step": 3686 }, { "epoch": 0.42, "learning_rate": 0.00013057241240559676, "loss": 0.6909, "step": 3687 }, { "epoch": 0.42, "learning_rate": 0.000130537360257091, "loss": 0.6685, "step": 3688 }, { "epoch": 0.42, "learning_rate": 0.00013050230397024723, "loss": 0.6455, "step": 3689 }, { "epoch": 0.42, "learning_rate": 0.00013046724354981624, "loss": 0.7147, "step": 3690 }, { "epoch": 0.42, "learning_rate": 0.0001304321790005493, "loss": 0.7231, "step": 3691 }, { "epoch": 0.42, "learning_rate": 0.00013039711032719828, "loss": 0.7107, "step": 3692 }, { "epoch": 0.42, "learning_rate": 0.00013036203753451556, "loss": 0.6166, "step": 3693 }, { "epoch": 0.42, "learning_rate": 0.0001303269606272541, "loss": 0.6658, "step": 3694 }, { "epoch": 0.42, "learning_rate": 0.00013029187961016744, "loss": 0.7125, "step": 3695 }, { "epoch": 0.42, "learning_rate": 0.00013025679448800968, "loss": 0.6841, "step": 3696 }, { "epoch": 0.42, "learning_rate": 0.0001302217052655354, "loss": 0.7028, "step": 3697 }, { "epoch": 0.42, "learning_rate": 0.00013018661194749985, "loss": 0.7268, "step": 3698 }, { "epoch": 0.42, "learning_rate": 0.00013015151453865876, "loss": 0.7219, "step": 3699 }, { "epoch": 0.42, "learning_rate": 0.00013011641304376846, "loss": 0.6399, "step": 3700 }, { "epoch": 0.42, "learning_rate": 0.00013008130746758578, "loss": 0.6451, "step": 3701 }, { "epoch": 0.42, "learning_rate": 0.0001300461978148681, "loss": 0.7102, "step": 3702 }, { "epoch": 0.42, "learning_rate": 0.00013001108409037342, "loss": 0.7041, "step": 3703 }, { "epoch": 0.42, "learning_rate": 0.00012997596629886027, "loss": 0.6567, "step": 3704 }, { "epoch": 0.42, "learning_rate": 0.00012994084444508766, "loss": 0.6994, "step": 3705 }, { "epoch": 0.42, "learning_rate": 0.00012990571853381522, "loss": 0.6621, "step": 3706 }, { "epoch": 0.42, "learning_rate": 0.0001298705885698032, "loss": 0.6525, "step": 3707 }, { "epoch": 0.42, "learning_rate": 0.0001298354545578122, "loss": 0.674, "step": 3708 }, { "epoch": 0.42, "learning_rate": 0.00012980031650260357, "loss": 0.6362, "step": 3709 }, { "epoch": 0.42, "learning_rate": 0.00012976517440893906, "loss": 0.6972, "step": 3710 }, { "epoch": 0.42, "learning_rate": 0.00012973002828158104, "loss": 0.6425, "step": 3711 }, { "epoch": 0.42, "learning_rate": 0.00012969487812529242, "loss": 0.7281, "step": 3712 }, { "epoch": 0.42, "learning_rate": 0.0001296597239448367, "loss": 0.7096, "step": 3713 }, { "epoch": 0.42, "learning_rate": 0.0001296245657449778, "loss": 0.6893, "step": 3714 }, { "epoch": 0.42, "learning_rate": 0.0001295894035304803, "loss": 0.6546, "step": 3715 }, { "epoch": 0.42, "learning_rate": 0.0001295542373061093, "loss": 0.7076, "step": 3716 }, { "epoch": 0.42, "learning_rate": 0.0001295190670766304, "loss": 0.6763, "step": 3717 }, { "epoch": 0.42, "learning_rate": 0.00012948389284680978, "loss": 0.6836, "step": 3718 }, { "epoch": 0.42, "learning_rate": 0.00012944871462141415, "loss": 0.6677, "step": 3719 }, { "epoch": 0.42, "learning_rate": 0.00012941353240521078, "loss": 0.6723, "step": 3720 }, { "epoch": 0.42, "learning_rate": 0.00012937834620296748, "loss": 0.6579, "step": 3721 }, { "epoch": 0.42, "learning_rate": 0.0001293431560194525, "loss": 0.731, "step": 3722 }, { "epoch": 0.42, "learning_rate": 0.00012930796185943485, "loss": 0.6557, "step": 3723 }, { "epoch": 0.42, "learning_rate": 0.00012927276372768382, "loss": 0.7003, "step": 3724 }, { "epoch": 0.42, "learning_rate": 0.00012923756162896941, "loss": 0.7377, "step": 3725 }, { "epoch": 0.42, "learning_rate": 0.00012920235556806216, "loss": 0.7016, "step": 3726 }, { "epoch": 0.42, "learning_rate": 0.00012916714554973306, "loss": 0.6647, "step": 3727 }, { "epoch": 0.42, "learning_rate": 0.00012913193157875364, "loss": 0.699, "step": 3728 }, { "epoch": 0.42, "learning_rate": 0.000129096713659896, "loss": 0.6598, "step": 3729 }, { "epoch": 0.42, "learning_rate": 0.00012906149179793284, "loss": 0.686, "step": 3730 }, { "epoch": 0.42, "learning_rate": 0.00012902626599763724, "loss": 0.6413, "step": 3731 }, { "epoch": 0.42, "learning_rate": 0.000128991036263783, "loss": 0.7021, "step": 3732 }, { "epoch": 0.42, "learning_rate": 0.0001289558026011443, "loss": 0.6936, "step": 3733 }, { "epoch": 0.42, "learning_rate": 0.0001289205650144959, "loss": 0.6933, "step": 3734 }, { "epoch": 0.42, "learning_rate": 0.00012888532350861312, "loss": 0.7322, "step": 3735 }, { "epoch": 0.42, "learning_rate": 0.00012885007808827178, "loss": 0.7343, "step": 3736 }, { "epoch": 0.42, "learning_rate": 0.00012881482875824827, "loss": 0.716, "step": 3737 }, { "epoch": 0.42, "learning_rate": 0.0001287795755233194, "loss": 0.6531, "step": 3738 }, { "epoch": 0.42, "learning_rate": 0.0001287443183882627, "loss": 0.7124, "step": 3739 }, { "epoch": 0.43, "learning_rate": 0.00012870905735785606, "loss": 0.724, "step": 3740 }, { "epoch": 0.43, "learning_rate": 0.00012867379243687794, "loss": 0.7167, "step": 3741 }, { "epoch": 0.43, "learning_rate": 0.00012863852363010736, "loss": 0.6813, "step": 3742 }, { "epoch": 0.43, "learning_rate": 0.00012860325094232386, "loss": 0.7235, "step": 3743 }, { "epoch": 0.43, "learning_rate": 0.0001285679743783075, "loss": 0.645, "step": 3744 }, { "epoch": 0.43, "learning_rate": 0.00012853269394283887, "loss": 0.6825, "step": 3745 }, { "epoch": 0.43, "learning_rate": 0.00012849740964069906, "loss": 0.6778, "step": 3746 }, { "epoch": 0.43, "learning_rate": 0.00012846212147666968, "loss": 0.6477, "step": 3747 }, { "epoch": 0.43, "learning_rate": 0.0001284268294555329, "loss": 0.7764, "step": 3748 }, { "epoch": 0.43, "learning_rate": 0.0001283915335820714, "loss": 0.7094, "step": 3749 }, { "epoch": 0.43, "learning_rate": 0.00012835623386106844, "loss": 0.6292, "step": 3750 }, { "epoch": 0.43, "learning_rate": 0.0001283209302973076, "loss": 0.6815, "step": 3751 }, { "epoch": 0.43, "learning_rate": 0.00012828562289557324, "loss": 0.6808, "step": 3752 }, { "epoch": 0.43, "learning_rate": 0.00012825031166065006, "loss": 0.6964, "step": 3753 }, { "epoch": 0.43, "learning_rate": 0.00012821499659732339, "loss": 0.6522, "step": 3754 }, { "epoch": 0.43, "learning_rate": 0.000128179677710379, "loss": 0.7012, "step": 3755 }, { "epoch": 0.43, "learning_rate": 0.00012814435500460317, "loss": 0.6577, "step": 3756 }, { "epoch": 0.43, "learning_rate": 0.00012810902848478279, "loss": 0.6641, "step": 3757 }, { "epoch": 0.43, "learning_rate": 0.0001280736981557052, "loss": 0.6674, "step": 3758 }, { "epoch": 0.43, "learning_rate": 0.00012803836402215825, "loss": 0.6682, "step": 3759 }, { "epoch": 0.43, "learning_rate": 0.00012800302608893035, "loss": 0.6363, "step": 3760 }, { "epoch": 0.43, "learning_rate": 0.00012796768436081036, "loss": 0.6852, "step": 3761 }, { "epoch": 0.43, "learning_rate": 0.00012793233884258773, "loss": 0.676, "step": 3762 }, { "epoch": 0.43, "learning_rate": 0.00012789698953905235, "loss": 0.61, "step": 3763 }, { "epoch": 0.43, "learning_rate": 0.0001278616364549947, "loss": 0.6851, "step": 3764 }, { "epoch": 0.43, "learning_rate": 0.0001278262795952057, "loss": 0.6815, "step": 3765 }, { "epoch": 0.43, "learning_rate": 0.0001277909189644768, "loss": 0.7098, "step": 3766 }, { "epoch": 0.43, "learning_rate": 0.00012775555456760008, "loss": 0.6865, "step": 3767 }, { "epoch": 0.43, "learning_rate": 0.00012772018640936787, "loss": 0.6507, "step": 3768 }, { "epoch": 0.43, "learning_rate": 0.00012768481449457325, "loss": 0.6395, "step": 3769 }, { "epoch": 0.43, "learning_rate": 0.00012764943882800976, "loss": 0.6885, "step": 3770 }, { "epoch": 0.43, "learning_rate": 0.0001276140594144713, "loss": 0.7304, "step": 3771 }, { "epoch": 0.43, "learning_rate": 0.0001275786762587525, "loss": 0.6591, "step": 3772 }, { "epoch": 0.43, "learning_rate": 0.00012754328936564829, "loss": 0.6852, "step": 3773 }, { "epoch": 0.43, "learning_rate": 0.00012750789873995427, "loss": 0.6797, "step": 3774 }, { "epoch": 0.43, "learning_rate": 0.0001274725043864665, "loss": 0.636, "step": 3775 }, { "epoch": 0.43, "learning_rate": 0.00012743710630998143, "loss": 0.6642, "step": 3776 }, { "epoch": 0.43, "learning_rate": 0.0001274017045152962, "loss": 0.749, "step": 3777 }, { "epoch": 0.43, "learning_rate": 0.0001273662990072083, "loss": 0.7202, "step": 3778 }, { "epoch": 0.43, "learning_rate": 0.0001273308897905158, "loss": 0.7107, "step": 3779 }, { "epoch": 0.43, "learning_rate": 0.00012729547687001733, "loss": 0.6927, "step": 3780 }, { "epoch": 0.43, "learning_rate": 0.00012726006025051185, "loss": 0.7432, "step": 3781 }, { "epoch": 0.43, "learning_rate": 0.00012722463993679897, "loss": 0.5927, "step": 3782 }, { "epoch": 0.43, "learning_rate": 0.00012718921593367875, "loss": 0.6303, "step": 3783 }, { "epoch": 0.43, "learning_rate": 0.00012715378824595174, "loss": 0.6542, "step": 3784 }, { "epoch": 0.43, "learning_rate": 0.000127118356878419, "loss": 0.6694, "step": 3785 }, { "epoch": 0.43, "learning_rate": 0.00012708292183588208, "loss": 0.6737, "step": 3786 }, { "epoch": 0.43, "learning_rate": 0.00012704748312314309, "loss": 0.6564, "step": 3787 }, { "epoch": 0.43, "learning_rate": 0.00012701204074500456, "loss": 0.6922, "step": 3788 }, { "epoch": 0.43, "learning_rate": 0.00012697659470626953, "loss": 0.7215, "step": 3789 }, { "epoch": 0.43, "learning_rate": 0.00012694114501174154, "loss": 0.7094, "step": 3790 }, { "epoch": 0.43, "learning_rate": 0.00012690569166622464, "loss": 0.7051, "step": 3791 }, { "epoch": 0.43, "learning_rate": 0.0001268702346745234, "loss": 0.7047, "step": 3792 }, { "epoch": 0.43, "learning_rate": 0.0001268347740414428, "loss": 0.6979, "step": 3793 }, { "epoch": 0.43, "learning_rate": 0.0001267993097717884, "loss": 0.6198, "step": 3794 }, { "epoch": 0.43, "learning_rate": 0.00012676384187036623, "loss": 0.6738, "step": 3795 }, { "epoch": 0.43, "learning_rate": 0.00012672837034198277, "loss": 0.6913, "step": 3796 }, { "epoch": 0.43, "learning_rate": 0.00012669289519144506, "loss": 0.7372, "step": 3797 }, { "epoch": 0.43, "learning_rate": 0.00012665741642356055, "loss": 0.7149, "step": 3798 }, { "epoch": 0.43, "learning_rate": 0.00012662193404313723, "loss": 0.7031, "step": 3799 }, { "epoch": 0.43, "learning_rate": 0.00012658644805498362, "loss": 0.6211, "step": 3800 }, { "epoch": 0.43, "learning_rate": 0.00012655095846390865, "loss": 0.7, "step": 3801 }, { "epoch": 0.43, "learning_rate": 0.00012651546527472175, "loss": 0.6277, "step": 3802 }, { "epoch": 0.43, "learning_rate": 0.0001264799684922329, "loss": 0.6607, "step": 3803 }, { "epoch": 0.43, "learning_rate": 0.00012644446812125248, "loss": 0.6652, "step": 3804 }, { "epoch": 0.43, "learning_rate": 0.00012640896416659146, "loss": 0.6837, "step": 3805 }, { "epoch": 0.43, "learning_rate": 0.00012637345663306116, "loss": 0.709, "step": 3806 }, { "epoch": 0.43, "learning_rate": 0.00012633794552547353, "loss": 0.6707, "step": 3807 }, { "epoch": 0.43, "learning_rate": 0.0001263024308486409, "loss": 0.6917, "step": 3808 }, { "epoch": 0.43, "learning_rate": 0.00012626691260737616, "loss": 0.6756, "step": 3809 }, { "epoch": 0.43, "learning_rate": 0.0001262313908064926, "loss": 0.7846, "step": 3810 }, { "epoch": 0.43, "learning_rate": 0.000126195865450804, "loss": 0.7163, "step": 3811 }, { "epoch": 0.43, "learning_rate": 0.00012616033654512475, "loss": 0.6858, "step": 3812 }, { "epoch": 0.43, "learning_rate": 0.00012612480409426958, "loss": 0.6901, "step": 3813 }, { "epoch": 0.43, "learning_rate": 0.00012608926810305372, "loss": 0.6824, "step": 3814 }, { "epoch": 0.43, "learning_rate": 0.00012605372857629299, "loss": 0.7133, "step": 3815 }, { "epoch": 0.43, "learning_rate": 0.00012601818551880354, "loss": 0.7063, "step": 3816 }, { "epoch": 0.43, "learning_rate": 0.00012598263893540208, "loss": 0.663, "step": 3817 }, { "epoch": 0.43, "learning_rate": 0.0001259470888309058, "loss": 0.6683, "step": 3818 }, { "epoch": 0.43, "learning_rate": 0.00012591153521013235, "loss": 0.6755, "step": 3819 }, { "epoch": 0.43, "learning_rate": 0.00012587597807789982, "loss": 0.6025, "step": 3820 }, { "epoch": 0.43, "learning_rate": 0.00012584041743902687, "loss": 0.728, "step": 3821 }, { "epoch": 0.43, "learning_rate": 0.00012580485329833255, "loss": 0.7023, "step": 3822 }, { "epoch": 0.43, "learning_rate": 0.00012576928566063636, "loss": 0.6541, "step": 3823 }, { "epoch": 0.43, "learning_rate": 0.00012573371453075845, "loss": 0.7489, "step": 3824 }, { "epoch": 0.43, "learning_rate": 0.0001256981399135192, "loss": 0.6965, "step": 3825 }, { "epoch": 0.43, "learning_rate": 0.00012566256181373967, "loss": 0.672, "step": 3826 }, { "epoch": 0.43, "learning_rate": 0.0001256269802362413, "loss": 0.67, "step": 3827 }, { "epoch": 0.44, "learning_rate": 0.00012559139518584592, "loss": 0.7319, "step": 3828 }, { "epoch": 0.44, "learning_rate": 0.000125555806667376, "loss": 0.7138, "step": 3829 }, { "epoch": 0.44, "learning_rate": 0.00012552021468565435, "loss": 0.6672, "step": 3830 }, { "epoch": 0.44, "learning_rate": 0.00012548461924550433, "loss": 0.6976, "step": 3831 }, { "epoch": 0.44, "learning_rate": 0.0001254490203517497, "loss": 0.6678, "step": 3832 }, { "epoch": 0.44, "learning_rate": 0.00012541341800921475, "loss": 0.682, "step": 3833 }, { "epoch": 0.44, "learning_rate": 0.00012537781222272422, "loss": 0.6538, "step": 3834 }, { "epoch": 0.44, "learning_rate": 0.00012534220299710325, "loss": 0.691, "step": 3835 }, { "epoch": 0.44, "learning_rate": 0.0001253065903371776, "loss": 0.6973, "step": 3836 }, { "epoch": 0.44, "learning_rate": 0.0001252709742477733, "loss": 0.6963, "step": 3837 }, { "epoch": 0.44, "learning_rate": 0.00012523535473371703, "loss": 0.6698, "step": 3838 }, { "epoch": 0.44, "learning_rate": 0.00012519973179983573, "loss": 0.6886, "step": 3839 }, { "epoch": 0.44, "learning_rate": 0.00012516410545095706, "loss": 0.7126, "step": 3840 }, { "epoch": 0.44, "learning_rate": 0.00012512847569190892, "loss": 0.683, "step": 3841 }, { "epoch": 0.44, "learning_rate": 0.00012509284252751974, "loss": 0.6819, "step": 3842 }, { "epoch": 0.44, "learning_rate": 0.00012505720596261847, "loss": 0.6059, "step": 3843 }, { "epoch": 0.44, "learning_rate": 0.0001250215660020345, "loss": 0.6689, "step": 3844 }, { "epoch": 0.44, "learning_rate": 0.00012498592265059762, "loss": 0.6324, "step": 3845 }, { "epoch": 0.44, "learning_rate": 0.0001249502759131381, "loss": 0.6457, "step": 3846 }, { "epoch": 0.44, "learning_rate": 0.0001249146257944867, "loss": 0.6887, "step": 3847 }, { "epoch": 0.44, "learning_rate": 0.00012487897229947466, "loss": 0.545, "step": 3848 }, { "epoch": 0.44, "learning_rate": 0.00012484331543293365, "loss": 0.6585, "step": 3849 }, { "epoch": 0.44, "learning_rate": 0.00012480765519969569, "loss": 0.7322, "step": 3850 }, { "epoch": 0.44, "learning_rate": 0.00012477199160459344, "loss": 0.6638, "step": 3851 }, { "epoch": 0.44, "learning_rate": 0.00012473632465245994, "loss": 0.6624, "step": 3852 }, { "epoch": 0.44, "learning_rate": 0.00012470065434812863, "loss": 0.6647, "step": 3853 }, { "epoch": 0.44, "learning_rate": 0.00012466498069643346, "loss": 0.6725, "step": 3854 }, { "epoch": 0.44, "learning_rate": 0.00012462930370220885, "loss": 0.6453, "step": 3855 }, { "epoch": 0.44, "learning_rate": 0.00012459362337028962, "loss": 0.7815, "step": 3856 }, { "epoch": 0.44, "learning_rate": 0.00012455793970551107, "loss": 0.6666, "step": 3857 }, { "epoch": 0.44, "learning_rate": 0.00012452225271270898, "loss": 0.7109, "step": 3858 }, { "epoch": 0.44, "learning_rate": 0.0001244865623967195, "loss": 0.6875, "step": 3859 }, { "epoch": 0.44, "learning_rate": 0.00012445086876237935, "loss": 0.7069, "step": 3860 }, { "epoch": 0.44, "learning_rate": 0.00012441517181452556, "loss": 0.719, "step": 3861 }, { "epoch": 0.44, "learning_rate": 0.00012437947155799573, "loss": 0.681, "step": 3862 }, { "epoch": 0.44, "learning_rate": 0.00012434376799762785, "loss": 0.6824, "step": 3863 }, { "epoch": 0.44, "learning_rate": 0.00012430806113826036, "loss": 0.64, "step": 3864 }, { "epoch": 0.44, "learning_rate": 0.00012427235098473214, "loss": 0.7154, "step": 3865 }, { "epoch": 0.44, "learning_rate": 0.00012423663754188263, "loss": 0.68, "step": 3866 }, { "epoch": 0.44, "learning_rate": 0.00012420092081455144, "loss": 0.7053, "step": 3867 }, { "epoch": 0.44, "learning_rate": 0.00012416520080757893, "loss": 0.7137, "step": 3868 }, { "epoch": 0.44, "learning_rate": 0.00012412947752580574, "loss": 0.6591, "step": 3869 }, { "epoch": 0.44, "learning_rate": 0.000124093750974073, "loss": 0.6706, "step": 3870 }, { "epoch": 0.44, "learning_rate": 0.00012405802115722224, "loss": 0.7068, "step": 3871 }, { "epoch": 0.44, "learning_rate": 0.0001240222880800955, "loss": 0.7242, "step": 3872 }, { "epoch": 0.44, "learning_rate": 0.0001239865517475352, "loss": 0.6077, "step": 3873 }, { "epoch": 0.44, "learning_rate": 0.00012395081216438425, "loss": 0.7164, "step": 3874 }, { "epoch": 0.44, "learning_rate": 0.00012391506933548597, "loss": 0.7587, "step": 3875 }, { "epoch": 0.44, "learning_rate": 0.00012387932326568416, "loss": 0.6709, "step": 3876 }, { "epoch": 0.44, "learning_rate": 0.00012384357395982295, "loss": 0.7188, "step": 3877 }, { "epoch": 0.44, "learning_rate": 0.0001238078214227471, "loss": 0.6837, "step": 3878 }, { "epoch": 0.44, "learning_rate": 0.00012377206565930158, "loss": 0.6393, "step": 3879 }, { "epoch": 0.44, "learning_rate": 0.00012373630667433195, "loss": 0.661, "step": 3880 }, { "epoch": 0.44, "learning_rate": 0.00012370054447268422, "loss": 0.6684, "step": 3881 }, { "epoch": 0.44, "learning_rate": 0.0001236647790592047, "loss": 0.7322, "step": 3882 }, { "epoch": 0.44, "learning_rate": 0.00012362901043874028, "loss": 0.6503, "step": 3883 }, { "epoch": 0.44, "learning_rate": 0.00012359323861613824, "loss": 0.7068, "step": 3884 }, { "epoch": 0.44, "learning_rate": 0.0001235574635962462, "loss": 0.705, "step": 3885 }, { "epoch": 0.44, "learning_rate": 0.00012352168538391233, "loss": 0.6965, "step": 3886 }, { "epoch": 0.44, "learning_rate": 0.00012348590398398522, "loss": 0.6524, "step": 3887 }, { "epoch": 0.44, "learning_rate": 0.00012345011940131383, "loss": 0.6427, "step": 3888 }, { "epoch": 0.44, "learning_rate": 0.00012341433164074763, "loss": 0.6198, "step": 3889 }, { "epoch": 0.44, "learning_rate": 0.00012337854070713642, "loss": 0.7007, "step": 3890 }, { "epoch": 0.44, "learning_rate": 0.00012334274660533048, "loss": 0.6426, "step": 3891 }, { "epoch": 0.44, "learning_rate": 0.00012330694934018063, "loss": 0.6823, "step": 3892 }, { "epoch": 0.44, "learning_rate": 0.00012327114891653792, "loss": 0.6422, "step": 3893 }, { "epoch": 0.44, "learning_rate": 0.00012323534533925393, "loss": 0.7029, "step": 3894 }, { "epoch": 0.44, "learning_rate": 0.00012319953861318075, "loss": 0.5946, "step": 3895 }, { "epoch": 0.44, "learning_rate": 0.00012316372874317068, "loss": 0.7087, "step": 3896 }, { "epoch": 0.44, "learning_rate": 0.00012312791573407665, "loss": 0.6137, "step": 3897 }, { "epoch": 0.44, "learning_rate": 0.00012309209959075195, "loss": 0.6839, "step": 3898 }, { "epoch": 0.44, "learning_rate": 0.0001230562803180502, "loss": 0.6699, "step": 3899 }, { "epoch": 0.44, "learning_rate": 0.0001230204579208256, "loss": 0.6857, "step": 3900 }, { "epoch": 0.44, "learning_rate": 0.00012298463240393272, "loss": 0.6997, "step": 3901 }, { "epoch": 0.44, "learning_rate": 0.00012294880377222649, "loss": 0.6785, "step": 3902 }, { "epoch": 0.44, "learning_rate": 0.00012291297203056233, "loss": 0.6758, "step": 3903 }, { "epoch": 0.44, "learning_rate": 0.000122877137183796, "loss": 0.7215, "step": 3904 }, { "epoch": 0.44, "learning_rate": 0.00012284129923678381, "loss": 0.7351, "step": 3905 }, { "epoch": 0.44, "learning_rate": 0.0001228054581943824, "loss": 0.6936, "step": 3906 }, { "epoch": 0.44, "learning_rate": 0.00012276961406144885, "loss": 0.7333, "step": 3907 }, { "epoch": 0.44, "learning_rate": 0.00012273376684284062, "loss": 0.6368, "step": 3908 }, { "epoch": 0.44, "learning_rate": 0.00012269791654341563, "loss": 0.6826, "step": 3909 }, { "epoch": 0.44, "learning_rate": 0.00012266206316803227, "loss": 0.6267, "step": 3910 }, { "epoch": 0.44, "learning_rate": 0.0001226262067215493, "loss": 0.7328, "step": 3911 }, { "epoch": 0.44, "learning_rate": 0.0001225903472088258, "loss": 0.7202, "step": 3912 }, { "epoch": 0.44, "learning_rate": 0.00012255448463472136, "loss": 0.6859, "step": 3913 }, { "epoch": 0.44, "learning_rate": 0.00012251861900409604, "loss": 0.7132, "step": 3914 }, { "epoch": 0.44, "learning_rate": 0.00012248275032181023, "loss": 0.66, "step": 3915 }, { "epoch": 0.45, "learning_rate": 0.0001224468785927247, "loss": 0.6719, "step": 3916 }, { "epoch": 0.45, "learning_rate": 0.00012241100382170077, "loss": 0.6595, "step": 3917 }, { "epoch": 0.45, "learning_rate": 0.00012237512601360003, "loss": 0.6796, "step": 3918 }, { "epoch": 0.45, "learning_rate": 0.00012233924517328457, "loss": 0.698, "step": 3919 }, { "epoch": 0.45, "learning_rate": 0.00012230336130561684, "loss": 0.6779, "step": 3920 }, { "epoch": 0.45, "learning_rate": 0.00012226747441545973, "loss": 0.6739, "step": 3921 }, { "epoch": 0.45, "learning_rate": 0.00012223158450767654, "loss": 0.6851, "step": 3922 }, { "epoch": 0.45, "learning_rate": 0.00012219569158713098, "loss": 0.6323, "step": 3923 }, { "epoch": 0.45, "learning_rate": 0.00012215979565868712, "loss": 0.6836, "step": 3924 }, { "epoch": 0.45, "learning_rate": 0.0001221238967272095, "loss": 0.6731, "step": 3925 }, { "epoch": 0.45, "learning_rate": 0.00012208799479756306, "loss": 0.622, "step": 3926 }, { "epoch": 0.45, "learning_rate": 0.0001220520898746131, "loss": 0.7105, "step": 3927 }, { "epoch": 0.45, "learning_rate": 0.00012201618196322535, "loss": 0.684, "step": 3928 }, { "epoch": 0.45, "learning_rate": 0.000121980271068266, "loss": 0.6508, "step": 3929 }, { "epoch": 0.45, "learning_rate": 0.00012194435719460153, "loss": 0.7037, "step": 3930 }, { "epoch": 0.45, "learning_rate": 0.00012190844034709891, "loss": 0.6159, "step": 3931 }, { "epoch": 0.45, "learning_rate": 0.00012187252053062555, "loss": 0.637, "step": 3932 }, { "epoch": 0.45, "learning_rate": 0.00012183659775004911, "loss": 0.6911, "step": 3933 }, { "epoch": 0.45, "learning_rate": 0.00012180067201023779, "loss": 0.6741, "step": 3934 }, { "epoch": 0.45, "learning_rate": 0.00012176474331606016, "loss": 0.698, "step": 3935 }, { "epoch": 0.45, "learning_rate": 0.00012172881167238514, "loss": 0.7333, "step": 3936 }, { "epoch": 0.45, "learning_rate": 0.00012169287708408212, "loss": 0.6409, "step": 3937 }, { "epoch": 0.45, "learning_rate": 0.00012165693955602086, "loss": 0.656, "step": 3938 }, { "epoch": 0.45, "learning_rate": 0.00012162099909307148, "loss": 0.6685, "step": 3939 }, { "epoch": 0.45, "learning_rate": 0.00012158505570010457, "loss": 0.6588, "step": 3940 }, { "epoch": 0.45, "learning_rate": 0.00012154910938199102, "loss": 0.7052, "step": 3941 }, { "epoch": 0.45, "learning_rate": 0.00012151316014360224, "loss": 0.7277, "step": 3942 }, { "epoch": 0.45, "learning_rate": 0.00012147720798980992, "loss": 0.6622, "step": 3943 }, { "epoch": 0.45, "learning_rate": 0.00012144125292548622, "loss": 0.7158, "step": 3944 }, { "epoch": 0.45, "learning_rate": 0.00012140529495550367, "loss": 0.6561, "step": 3945 }, { "epoch": 0.45, "learning_rate": 0.00012136933408473521, "loss": 0.6335, "step": 3946 }, { "epoch": 0.45, "learning_rate": 0.00012133337031805412, "loss": 0.7001, "step": 3947 }, { "epoch": 0.45, "learning_rate": 0.00012129740366033414, "loss": 0.6666, "step": 3948 }, { "epoch": 0.45, "learning_rate": 0.00012126143411644935, "loss": 0.6498, "step": 3949 }, { "epoch": 0.45, "learning_rate": 0.00012122546169127425, "loss": 0.7038, "step": 3950 }, { "epoch": 0.45, "learning_rate": 0.00012118948638968373, "loss": 0.7094, "step": 3951 }, { "epoch": 0.45, "learning_rate": 0.00012115350821655307, "loss": 0.6415, "step": 3952 }, { "epoch": 0.45, "learning_rate": 0.00012111752717675788, "loss": 0.6854, "step": 3953 }, { "epoch": 0.45, "learning_rate": 0.00012108154327517427, "loss": 0.6796, "step": 3954 }, { "epoch": 0.45, "learning_rate": 0.00012104555651667868, "loss": 0.6842, "step": 3955 }, { "epoch": 0.45, "learning_rate": 0.00012100956690614789, "loss": 0.715, "step": 3956 }, { "epoch": 0.45, "learning_rate": 0.00012097357444845912, "loss": 0.7013, "step": 3957 }, { "epoch": 0.45, "learning_rate": 0.00012093757914849, "loss": 0.641, "step": 3958 }, { "epoch": 0.45, "learning_rate": 0.00012090158101111848, "loss": 0.6376, "step": 3959 }, { "epoch": 0.45, "learning_rate": 0.00012086558004122297, "loss": 0.6646, "step": 3960 }, { "epoch": 0.45, "learning_rate": 0.00012082957624368216, "loss": 0.7015, "step": 3961 }, { "epoch": 0.45, "learning_rate": 0.00012079356962337522, "loss": 0.6696, "step": 3962 }, { "epoch": 0.45, "learning_rate": 0.0001207575601851817, "loss": 0.6589, "step": 3963 }, { "epoch": 0.45, "learning_rate": 0.00012072154793398143, "loss": 0.6305, "step": 3964 }, { "epoch": 0.45, "learning_rate": 0.00012068553287465474, "loss": 0.6169, "step": 3965 }, { "epoch": 0.45, "learning_rate": 0.00012064951501208229, "loss": 0.6904, "step": 3966 }, { "epoch": 0.45, "learning_rate": 0.00012061349435114504, "loss": 0.6826, "step": 3967 }, { "epoch": 0.45, "learning_rate": 0.00012057747089672451, "loss": 0.6647, "step": 3968 }, { "epoch": 0.45, "learning_rate": 0.0001205414446537025, "loss": 0.6778, "step": 3969 }, { "epoch": 0.45, "learning_rate": 0.0001205054156269611, "loss": 0.7367, "step": 3970 }, { "epoch": 0.45, "learning_rate": 0.00012046938382138291, "loss": 0.6473, "step": 3971 }, { "epoch": 0.45, "learning_rate": 0.00012043334924185088, "loss": 0.6676, "step": 3972 }, { "epoch": 0.45, "learning_rate": 0.00012039731189324828, "loss": 0.6596, "step": 3973 }, { "epoch": 0.45, "learning_rate": 0.0001203612717804588, "loss": 0.7062, "step": 3974 }, { "epoch": 0.45, "learning_rate": 0.00012032522890836654, "loss": 0.6381, "step": 3975 }, { "epoch": 0.45, "learning_rate": 0.00012028918328185585, "loss": 0.6761, "step": 3976 }, { "epoch": 0.45, "learning_rate": 0.00012025313490581162, "loss": 0.6647, "step": 3977 }, { "epoch": 0.45, "learning_rate": 0.00012021708378511896, "loss": 0.6938, "step": 3978 }, { "epoch": 0.45, "learning_rate": 0.00012018102992466342, "loss": 0.6957, "step": 3979 }, { "epoch": 0.45, "learning_rate": 0.00012014497332933097, "loss": 0.6345, "step": 3980 }, { "epoch": 0.45, "learning_rate": 0.00012010891400400784, "loss": 0.7088, "step": 3981 }, { "epoch": 0.45, "learning_rate": 0.0001200728519535807, "loss": 0.6755, "step": 3982 }, { "epoch": 0.45, "learning_rate": 0.00012003678718293663, "loss": 0.6226, "step": 3983 }, { "epoch": 0.45, "learning_rate": 0.00012000071969696298, "loss": 0.6514, "step": 3984 }, { "epoch": 0.45, "learning_rate": 0.00011996464950054753, "loss": 0.6779, "step": 3985 }, { "epoch": 0.45, "learning_rate": 0.00011992857659857841, "loss": 0.7222, "step": 3986 }, { "epoch": 0.45, "learning_rate": 0.00011989250099594411, "loss": 0.7125, "step": 3987 }, { "epoch": 0.45, "learning_rate": 0.0001198564226975335, "loss": 0.7028, "step": 3988 }, { "epoch": 0.45, "learning_rate": 0.00011982034170823585, "loss": 0.6577, "step": 3989 }, { "epoch": 0.45, "learning_rate": 0.0001197842580329407, "loss": 0.6793, "step": 3990 }, { "epoch": 0.45, "learning_rate": 0.00011974817167653798, "loss": 0.658, "step": 3991 }, { "epoch": 0.45, "learning_rate": 0.00011971208264391814, "loss": 0.6677, "step": 3992 }, { "epoch": 0.45, "learning_rate": 0.00011967599093997173, "loss": 0.6664, "step": 3993 }, { "epoch": 0.45, "learning_rate": 0.00011963989656958988, "loss": 0.6528, "step": 3994 }, { "epoch": 0.45, "learning_rate": 0.00011960379953766397, "loss": 0.6805, "step": 3995 }, { "epoch": 0.45, "learning_rate": 0.00011956769984908574, "loss": 0.6056, "step": 3996 }, { "epoch": 0.45, "learning_rate": 0.00011953159750874739, "loss": 0.6984, "step": 3997 }, { "epoch": 0.45, "learning_rate": 0.00011949549252154135, "loss": 0.7043, "step": 3998 }, { "epoch": 0.45, "learning_rate": 0.00011945938489236048, "loss": 0.7062, "step": 3999 }, { "epoch": 0.45, "learning_rate": 0.00011942327462609801, "loss": 0.7288, "step": 4000 }, { "epoch": 0.45, "learning_rate": 0.00011938716172764746, "loss": 0.721, "step": 4001 }, { "epoch": 0.45, "learning_rate": 0.00011935104620190278, "loss": 0.68, "step": 4002 }, { "epoch": 0.45, "learning_rate": 0.00011931492805375826, "loss": 0.7436, "step": 4003 }, { "epoch": 0.46, "learning_rate": 0.00011927880728810849, "loss": 0.6845, "step": 4004 }, { "epoch": 0.46, "learning_rate": 0.00011924268390984848, "loss": 0.6901, "step": 4005 }, { "epoch": 0.46, "learning_rate": 0.00011920655792387355, "loss": 0.6502, "step": 4006 }, { "epoch": 0.46, "learning_rate": 0.00011917042933507941, "loss": 0.6791, "step": 4007 }, { "epoch": 0.46, "learning_rate": 0.00011913429814836212, "loss": 0.6746, "step": 4008 }, { "epoch": 0.46, "learning_rate": 0.00011909816436861804, "loss": 0.6973, "step": 4009 }, { "epoch": 0.46, "learning_rate": 0.00011906202800074396, "loss": 0.674, "step": 4010 }, { "epoch": 0.46, "learning_rate": 0.00011902588904963694, "loss": 0.6776, "step": 4011 }, { "epoch": 0.46, "learning_rate": 0.00011898974752019448, "loss": 0.6295, "step": 4012 }, { "epoch": 0.46, "learning_rate": 0.00011895360341731434, "loss": 0.6827, "step": 4013 }, { "epoch": 0.46, "learning_rate": 0.00011891745674589465, "loss": 0.6321, "step": 4014 }, { "epoch": 0.46, "learning_rate": 0.00011888130751083398, "loss": 0.6338, "step": 4015 }, { "epoch": 0.46, "learning_rate": 0.00011884515571703107, "loss": 0.6194, "step": 4016 }, { "epoch": 0.46, "learning_rate": 0.00011880900136938522, "loss": 0.7679, "step": 4017 }, { "epoch": 0.46, "learning_rate": 0.00011877284447279588, "loss": 0.6979, "step": 4018 }, { "epoch": 0.46, "learning_rate": 0.00011873668503216298, "loss": 0.7252, "step": 4019 }, { "epoch": 0.46, "learning_rate": 0.00011870052305238675, "loss": 0.6392, "step": 4020 }, { "epoch": 0.46, "learning_rate": 0.00011866435853836772, "loss": 0.6593, "step": 4021 }, { "epoch": 0.46, "learning_rate": 0.00011862819149500681, "loss": 0.6399, "step": 4022 }, { "epoch": 0.46, "learning_rate": 0.00011859202192720534, "loss": 0.7058, "step": 4023 }, { "epoch": 0.46, "learning_rate": 0.00011855584983986483, "loss": 0.7205, "step": 4024 }, { "epoch": 0.46, "learning_rate": 0.00011851967523788725, "loss": 0.6688, "step": 4025 }, { "epoch": 0.46, "learning_rate": 0.00011848349812617492, "loss": 0.7482, "step": 4026 }, { "epoch": 0.46, "learning_rate": 0.0001184473185096304, "loss": 0.7298, "step": 4027 }, { "epoch": 0.46, "learning_rate": 0.00011841113639315666, "loss": 0.6824, "step": 4028 }, { "epoch": 0.46, "learning_rate": 0.00011837495178165706, "loss": 0.6877, "step": 4029 }, { "epoch": 0.46, "learning_rate": 0.00011833876468003517, "loss": 0.6162, "step": 4030 }, { "epoch": 0.46, "learning_rate": 0.00011830257509319498, "loss": 0.5983, "step": 4031 }, { "epoch": 0.46, "learning_rate": 0.00011826638302604081, "loss": 0.6593, "step": 4032 }, { "epoch": 0.46, "learning_rate": 0.00011823018848347733, "loss": 0.6416, "step": 4033 }, { "epoch": 0.46, "learning_rate": 0.0001181939914704095, "loss": 0.6477, "step": 4034 }, { "epoch": 0.46, "learning_rate": 0.00011815779199174264, "loss": 0.6889, "step": 4035 }, { "epoch": 0.46, "learning_rate": 0.00011812159005238239, "loss": 0.6427, "step": 4036 }, { "epoch": 0.46, "learning_rate": 0.00011808538565723478, "loss": 0.638, "step": 4037 }, { "epoch": 0.46, "learning_rate": 0.00011804917881120607, "loss": 0.7226, "step": 4038 }, { "epoch": 0.46, "learning_rate": 0.00011801296951920295, "loss": 0.6881, "step": 4039 }, { "epoch": 0.46, "learning_rate": 0.00011797675778613242, "loss": 0.7269, "step": 4040 }, { "epoch": 0.46, "learning_rate": 0.00011794054361690172, "loss": 0.7295, "step": 4041 }, { "epoch": 0.46, "learning_rate": 0.00011790432701641856, "loss": 0.6826, "step": 4042 }, { "epoch": 0.46, "learning_rate": 0.00011786810798959089, "loss": 0.7086, "step": 4043 }, { "epoch": 0.46, "learning_rate": 0.00011783188654132702, "loss": 0.699, "step": 4044 }, { "epoch": 0.46, "learning_rate": 0.00011779566267653555, "loss": 0.702, "step": 4045 }, { "epoch": 0.46, "learning_rate": 0.0001177594364001255, "loss": 0.759, "step": 4046 }, { "epoch": 0.46, "learning_rate": 0.00011772320771700607, "loss": 0.6468, "step": 4047 }, { "epoch": 0.46, "learning_rate": 0.00011768697663208693, "loss": 0.7001, "step": 4048 }, { "epoch": 0.46, "learning_rate": 0.00011765074315027802, "loss": 0.6711, "step": 4049 }, { "epoch": 0.46, "learning_rate": 0.00011761450727648955, "loss": 0.6351, "step": 4050 }, { "epoch": 0.46, "learning_rate": 0.00011757826901563214, "loss": 0.7195, "step": 4051 }, { "epoch": 0.46, "learning_rate": 0.00011754202837261672, "loss": 0.63, "step": 4052 }, { "epoch": 0.46, "learning_rate": 0.00011750578535235449, "loss": 0.7641, "step": 4053 }, { "epoch": 0.46, "learning_rate": 0.00011746953995975696, "loss": 0.6637, "step": 4054 }, { "epoch": 0.46, "learning_rate": 0.00011743329219973609, "loss": 0.6978, "step": 4055 }, { "epoch": 0.46, "learning_rate": 0.00011739704207720405, "loss": 0.6978, "step": 4056 }, { "epoch": 0.46, "learning_rate": 0.0001173607895970733, "loss": 0.7316, "step": 4057 }, { "epoch": 0.46, "learning_rate": 0.00011732453476425675, "loss": 0.6648, "step": 4058 }, { "epoch": 0.46, "learning_rate": 0.00011728827758366751, "loss": 0.6448, "step": 4059 }, { "epoch": 0.46, "learning_rate": 0.00011725201806021909, "loss": 0.7086, "step": 4060 }, { "epoch": 0.46, "learning_rate": 0.0001172157561988252, "loss": 0.7089, "step": 4061 }, { "epoch": 0.46, "learning_rate": 0.00011717949200440004, "loss": 0.6889, "step": 4062 }, { "epoch": 0.46, "learning_rate": 0.00011714322548185801, "loss": 0.7042, "step": 4063 }, { "epoch": 0.46, "learning_rate": 0.00011710695663611379, "loss": 0.6813, "step": 4064 }, { "epoch": 0.46, "learning_rate": 0.00011707068547208249, "loss": 0.7054, "step": 4065 }, { "epoch": 0.46, "learning_rate": 0.00011703441199467948, "loss": 0.7513, "step": 4066 }, { "epoch": 0.46, "learning_rate": 0.00011699813620882038, "loss": 0.7214, "step": 4067 }, { "epoch": 0.46, "learning_rate": 0.00011696185811942124, "loss": 0.6823, "step": 4068 }, { "epoch": 0.46, "learning_rate": 0.00011692557773139839, "loss": 0.6673, "step": 4069 }, { "epoch": 0.46, "learning_rate": 0.00011688929504966834, "loss": 0.6349, "step": 4070 }, { "epoch": 0.46, "learning_rate": 0.00011685301007914816, "loss": 0.7172, "step": 4071 }, { "epoch": 0.46, "learning_rate": 0.00011681672282475495, "loss": 0.6767, "step": 4072 }, { "epoch": 0.46, "learning_rate": 0.00011678043329140634, "loss": 0.6263, "step": 4073 }, { "epoch": 0.46, "learning_rate": 0.00011674414148402017, "loss": 0.6507, "step": 4074 }, { "epoch": 0.46, "learning_rate": 0.00011670784740751461, "loss": 0.6706, "step": 4075 }, { "epoch": 0.46, "learning_rate": 0.00011667155106680812, "loss": 0.6983, "step": 4076 }, { "epoch": 0.46, "learning_rate": 0.00011663525246681947, "loss": 0.569, "step": 4077 }, { "epoch": 0.46, "learning_rate": 0.00011659895161246779, "loss": 0.7117, "step": 4078 }, { "epoch": 0.46, "learning_rate": 0.0001165626485086724, "loss": 0.6858, "step": 4079 }, { "epoch": 0.46, "learning_rate": 0.00011652634316035304, "loss": 0.6595, "step": 4080 }, { "epoch": 0.46, "learning_rate": 0.0001164900355724297, "loss": 0.7146, "step": 4081 }, { "epoch": 0.46, "learning_rate": 0.0001164537257498227, "loss": 0.6586, "step": 4082 }, { "epoch": 0.46, "learning_rate": 0.00011641741369745264, "loss": 0.7018, "step": 4083 }, { "epoch": 0.46, "learning_rate": 0.00011638109942024043, "loss": 0.6952, "step": 4084 }, { "epoch": 0.46, "learning_rate": 0.00011634478292310724, "loss": 0.6845, "step": 4085 }, { "epoch": 0.46, "learning_rate": 0.00011630846421097466, "loss": 0.6687, "step": 4086 }, { "epoch": 0.46, "learning_rate": 0.00011627214328876441, "loss": 0.6775, "step": 4087 }, { "epoch": 0.46, "learning_rate": 0.00011623582016139865, "loss": 0.6253, "step": 4088 }, { "epoch": 0.46, "learning_rate": 0.0001161994948337998, "loss": 0.69, "step": 4089 }, { "epoch": 0.46, "learning_rate": 0.00011616316731089052, "loss": 0.6731, "step": 4090 }, { "epoch": 0.46, "learning_rate": 0.00011612683759759387, "loss": 0.6914, "step": 4091 }, { "epoch": 0.47, "learning_rate": 0.0001160905056988331, "loss": 0.7718, "step": 4092 }, { "epoch": 0.47, "learning_rate": 0.00011605417161953184, "loss": 0.6518, "step": 4093 }, { "epoch": 0.47, "learning_rate": 0.00011601783536461399, "loss": 0.664, "step": 4094 }, { "epoch": 0.47, "learning_rate": 0.00011598149693900371, "loss": 0.7, "step": 4095 }, { "epoch": 0.47, "learning_rate": 0.00011594515634762551, "loss": 0.6625, "step": 4096 }, { "epoch": 0.47, "learning_rate": 0.00011590881359540416, "loss": 0.6638, "step": 4097 }, { "epoch": 0.47, "learning_rate": 0.00011587246868726466, "loss": 0.6629, "step": 4098 }, { "epoch": 0.47, "learning_rate": 0.00011583612162813249, "loss": 0.6724, "step": 4099 }, { "epoch": 0.47, "learning_rate": 0.00011579977242293323, "loss": 0.6827, "step": 4100 }, { "epoch": 0.47, "learning_rate": 0.00011576342107659282, "loss": 0.6666, "step": 4101 }, { "epoch": 0.47, "learning_rate": 0.0001157270675940375, "loss": 0.7392, "step": 4102 }, { "epoch": 0.47, "learning_rate": 0.00011569071198019383, "loss": 0.6158, "step": 4103 }, { "epoch": 0.47, "learning_rate": 0.00011565435423998858, "loss": 0.6909, "step": 4104 }, { "epoch": 0.47, "learning_rate": 0.00011561799437834886, "loss": 0.6473, "step": 4105 }, { "epoch": 0.47, "learning_rate": 0.00011558163240020207, "loss": 0.6769, "step": 4106 }, { "epoch": 0.47, "learning_rate": 0.00011554526831047585, "loss": 0.6963, "step": 4107 }, { "epoch": 0.47, "learning_rate": 0.00011550890211409822, "loss": 0.686, "step": 4108 }, { "epoch": 0.47, "learning_rate": 0.00011547253381599738, "loss": 0.6621, "step": 4109 }, { "epoch": 0.47, "learning_rate": 0.00011543616342110186, "loss": 0.6508, "step": 4110 }, { "epoch": 0.47, "learning_rate": 0.00011539979093434051, "loss": 0.7068, "step": 4111 }, { "epoch": 0.47, "learning_rate": 0.00011536341636064236, "loss": 0.7491, "step": 4112 }, { "epoch": 0.47, "learning_rate": 0.00011532703970493685, "loss": 0.7219, "step": 4113 }, { "epoch": 0.47, "learning_rate": 0.00011529066097215364, "loss": 0.6665, "step": 4114 }, { "epoch": 0.47, "learning_rate": 0.00011525428016722264, "loss": 0.6885, "step": 4115 }, { "epoch": 0.47, "learning_rate": 0.0001152178972950741, "loss": 0.6758, "step": 4116 }, { "epoch": 0.47, "learning_rate": 0.00011518151236063854, "loss": 0.6969, "step": 4117 }, { "epoch": 0.47, "learning_rate": 0.00011514512536884672, "loss": 0.5979, "step": 4118 }, { "epoch": 0.47, "learning_rate": 0.00011510873632462971, "loss": 0.7506, "step": 4119 }, { "epoch": 0.47, "learning_rate": 0.00011507234523291886, "loss": 0.6512, "step": 4120 }, { "epoch": 0.47, "learning_rate": 0.00011503595209864574, "loss": 0.6816, "step": 4121 }, { "epoch": 0.47, "learning_rate": 0.00011499955692674234, "loss": 0.6824, "step": 4122 }, { "epoch": 0.47, "learning_rate": 0.00011496315972214075, "loss": 0.6365, "step": 4123 }, { "epoch": 0.47, "learning_rate": 0.00011492676048977347, "loss": 0.6487, "step": 4124 }, { "epoch": 0.47, "learning_rate": 0.00011489035923457317, "loss": 0.6844, "step": 4125 }, { "epoch": 0.47, "learning_rate": 0.0001148539559614729, "loss": 0.6493, "step": 4126 }, { "epoch": 0.47, "learning_rate": 0.00011481755067540589, "loss": 0.6368, "step": 4127 }, { "epoch": 0.47, "learning_rate": 0.00011478114338130573, "loss": 0.7221, "step": 4128 }, { "epoch": 0.47, "learning_rate": 0.00011474473408410618, "loss": 0.7035, "step": 4129 }, { "epoch": 0.47, "learning_rate": 0.00011470832278874133, "loss": 0.6305, "step": 4130 }, { "epoch": 0.47, "learning_rate": 0.00011467190950014562, "loss": 0.7182, "step": 4131 }, { "epoch": 0.47, "learning_rate": 0.00011463549422325357, "loss": 0.6313, "step": 4132 }, { "epoch": 0.47, "learning_rate": 0.00011459907696300012, "loss": 0.6134, "step": 4133 }, { "epoch": 0.47, "learning_rate": 0.00011456265772432049, "loss": 0.6785, "step": 4134 }, { "epoch": 0.47, "learning_rate": 0.00011452623651215, "loss": 0.6829, "step": 4135 }, { "epoch": 0.47, "learning_rate": 0.00011448981333142446, "loss": 0.6493, "step": 4136 }, { "epoch": 0.47, "learning_rate": 0.00011445338818707978, "loss": 0.6633, "step": 4137 }, { "epoch": 0.47, "learning_rate": 0.0001144169610840522, "loss": 0.7066, "step": 4138 }, { "epoch": 0.47, "learning_rate": 0.0001143805320272782, "loss": 0.65, "step": 4139 }, { "epoch": 0.47, "learning_rate": 0.00011434410102169462, "loss": 0.6677, "step": 4140 }, { "epoch": 0.47, "learning_rate": 0.0001143076680722384, "loss": 0.7564, "step": 4141 }, { "epoch": 0.47, "learning_rate": 0.00011427123318384687, "loss": 0.681, "step": 4142 }, { "epoch": 0.47, "learning_rate": 0.00011423479636145762, "loss": 0.6567, "step": 4143 }, { "epoch": 0.47, "learning_rate": 0.00011419835761000841, "loss": 0.7199, "step": 4144 }, { "epoch": 0.47, "learning_rate": 0.00011416191693443732, "loss": 0.6594, "step": 4145 }, { "epoch": 0.47, "learning_rate": 0.00011412547433968275, "loss": 0.6664, "step": 4146 }, { "epoch": 0.47, "learning_rate": 0.00011408902983068321, "loss": 0.7496, "step": 4147 }, { "epoch": 0.47, "learning_rate": 0.00011405258341237765, "loss": 0.7286, "step": 4148 }, { "epoch": 0.47, "learning_rate": 0.0001140161350897051, "loss": 0.6799, "step": 4149 }, { "epoch": 0.47, "learning_rate": 0.000113979684867605, "loss": 0.6941, "step": 4150 }, { "epoch": 0.47, "learning_rate": 0.00011394323275101695, "loss": 0.6314, "step": 4151 }, { "epoch": 0.47, "learning_rate": 0.00011390677874488087, "loss": 0.6516, "step": 4152 }, { "epoch": 0.47, "learning_rate": 0.00011387032285413686, "loss": 0.6641, "step": 4153 }, { "epoch": 0.47, "learning_rate": 0.00011383386508372535, "loss": 0.6063, "step": 4154 }, { "epoch": 0.47, "learning_rate": 0.000113797405438587, "loss": 0.6962, "step": 4155 }, { "epoch": 0.47, "learning_rate": 0.0001137609439236627, "loss": 0.6573, "step": 4156 }, { "epoch": 0.47, "learning_rate": 0.00011372448054389364, "loss": 0.6048, "step": 4157 }, { "epoch": 0.47, "learning_rate": 0.0001136880153042212, "loss": 0.637, "step": 4158 }, { "epoch": 0.47, "learning_rate": 0.00011365154820958706, "loss": 0.6527, "step": 4159 }, { "epoch": 0.47, "learning_rate": 0.00011361507926493317, "loss": 0.6862, "step": 4160 }, { "epoch": 0.47, "learning_rate": 0.00011357860847520165, "loss": 0.7272, "step": 4161 }, { "epoch": 0.47, "learning_rate": 0.00011354213584533495, "loss": 0.6018, "step": 4162 }, { "epoch": 0.47, "learning_rate": 0.00011350566138027576, "loss": 0.6428, "step": 4163 }, { "epoch": 0.47, "learning_rate": 0.00011346918508496696, "loss": 0.7441, "step": 4164 }, { "epoch": 0.47, "learning_rate": 0.00011343270696435173, "loss": 0.6831, "step": 4165 }, { "epoch": 0.47, "learning_rate": 0.00011339622702337347, "loss": 0.5871, "step": 4166 }, { "epoch": 0.47, "learning_rate": 0.00011335974526697586, "loss": 0.6905, "step": 4167 }, { "epoch": 0.47, "learning_rate": 0.00011332326170010279, "loss": 0.5994, "step": 4168 }, { "epoch": 0.47, "learning_rate": 0.00011328677632769841, "loss": 0.6826, "step": 4169 }, { "epoch": 0.47, "learning_rate": 0.00011325028915470715, "loss": 0.6504, "step": 4170 }, { "epoch": 0.47, "learning_rate": 0.00011321380018607361, "loss": 0.645, "step": 4171 }, { "epoch": 0.47, "learning_rate": 0.00011317730942674267, "loss": 0.6066, "step": 4172 }, { "epoch": 0.47, "learning_rate": 0.0001131408168816595, "loss": 0.7076, "step": 4173 }, { "epoch": 0.47, "learning_rate": 0.00011310432255576944, "loss": 0.7081, "step": 4174 }, { "epoch": 0.47, "learning_rate": 0.0001130678264540181, "loss": 0.5909, "step": 4175 }, { "epoch": 0.47, "learning_rate": 0.0001130313285813513, "loss": 0.6727, "step": 4176 }, { "epoch": 0.47, "learning_rate": 0.00011299482894271518, "loss": 0.6559, "step": 4177 }, { "epoch": 0.47, "learning_rate": 0.00011295832754305606, "loss": 0.6411, "step": 4178 }, { "epoch": 0.47, "learning_rate": 0.0001129218243873205, "loss": 0.7018, "step": 4179 }, { "epoch": 0.48, "learning_rate": 0.00011288531948045532, "loss": 0.6311, "step": 4180 }, { "epoch": 0.48, "learning_rate": 0.00011284881282740751, "loss": 0.675, "step": 4181 }, { "epoch": 0.48, "learning_rate": 0.00011281230443312441, "loss": 0.6891, "step": 4182 }, { "epoch": 0.48, "learning_rate": 0.00011277579430255349, "loss": 0.66, "step": 4183 }, { "epoch": 0.48, "learning_rate": 0.00011273928244064256, "loss": 0.6874, "step": 4184 }, { "epoch": 0.48, "learning_rate": 0.00011270276885233958, "loss": 0.7074, "step": 4185 }, { "epoch": 0.48, "learning_rate": 0.0001126662535425927, "loss": 0.6526, "step": 4186 }, { "epoch": 0.48, "learning_rate": 0.00011262973651635047, "loss": 0.7065, "step": 4187 }, { "epoch": 0.48, "learning_rate": 0.00011259321777856155, "loss": 0.685, "step": 4188 }, { "epoch": 0.48, "learning_rate": 0.00011255669733417482, "loss": 0.6702, "step": 4189 }, { "epoch": 0.48, "learning_rate": 0.00011252017518813947, "loss": 0.6859, "step": 4190 }, { "epoch": 0.48, "learning_rate": 0.00011248365134540489, "loss": 0.69, "step": 4191 }, { "epoch": 0.48, "learning_rate": 0.0001124471258109206, "loss": 0.6757, "step": 4192 }, { "epoch": 0.48, "learning_rate": 0.00011241059858963653, "loss": 0.6585, "step": 4193 }, { "epoch": 0.48, "learning_rate": 0.00011237406968650278, "loss": 0.6634, "step": 4194 }, { "epoch": 0.48, "learning_rate": 0.00011233753910646951, "loss": 0.6608, "step": 4195 }, { "epoch": 0.48, "learning_rate": 0.00011230100685448735, "loss": 0.6905, "step": 4196 }, { "epoch": 0.48, "learning_rate": 0.00011226447293550701, "loss": 0.6772, "step": 4197 }, { "epoch": 0.48, "learning_rate": 0.00011222793735447947, "loss": 0.6869, "step": 4198 }, { "epoch": 0.48, "learning_rate": 0.00011219140011635591, "loss": 0.6716, "step": 4199 }, { "epoch": 0.48, "learning_rate": 0.00011215486122608782, "loss": 0.6484, "step": 4200 }, { "epoch": 0.48, "learning_rate": 0.00011211832068862678, "loss": 0.6734, "step": 4201 }, { "epoch": 0.48, "learning_rate": 0.00011208177850892467, "loss": 0.683, "step": 4202 }, { "epoch": 0.48, "learning_rate": 0.00011204523469193361, "loss": 0.6687, "step": 4203 }, { "epoch": 0.48, "learning_rate": 0.00011200868924260593, "loss": 0.6968, "step": 4204 }, { "epoch": 0.48, "learning_rate": 0.00011197214216589416, "loss": 0.7188, "step": 4205 }, { "epoch": 0.48, "learning_rate": 0.000111935593466751, "loss": 0.6829, "step": 4206 }, { "epoch": 0.48, "learning_rate": 0.00011189904315012949, "loss": 0.6893, "step": 4207 }, { "epoch": 0.48, "learning_rate": 0.00011186249122098283, "loss": 0.6425, "step": 4208 }, { "epoch": 0.48, "learning_rate": 0.00011182593768426438, "loss": 0.6115, "step": 4209 }, { "epoch": 0.48, "learning_rate": 0.00011178938254492779, "loss": 0.6533, "step": 4210 }, { "epoch": 0.48, "learning_rate": 0.00011175282580792696, "loss": 0.6951, "step": 4211 }, { "epoch": 0.48, "learning_rate": 0.00011171626747821593, "loss": 0.6648, "step": 4212 }, { "epoch": 0.48, "learning_rate": 0.00011167970756074895, "loss": 0.6406, "step": 4213 }, { "epoch": 0.48, "learning_rate": 0.00011164314606048058, "loss": 0.7285, "step": 4214 }, { "epoch": 0.48, "learning_rate": 0.00011160658298236548, "loss": 0.6867, "step": 4215 }, { "epoch": 0.48, "learning_rate": 0.00011157001833135858, "loss": 0.6115, "step": 4216 }, { "epoch": 0.48, "learning_rate": 0.00011153345211241506, "loss": 0.6977, "step": 4217 }, { "epoch": 0.48, "learning_rate": 0.00011149688433049024, "loss": 0.6134, "step": 4218 }, { "epoch": 0.48, "learning_rate": 0.00011146031499053968, "loss": 0.6907, "step": 4219 }, { "epoch": 0.48, "learning_rate": 0.00011142374409751919, "loss": 0.7378, "step": 4220 }, { "epoch": 0.48, "learning_rate": 0.0001113871716563847, "loss": 0.6709, "step": 4221 }, { "epoch": 0.48, "learning_rate": 0.00011135059767209246, "loss": 0.6059, "step": 4222 }, { "epoch": 0.48, "learning_rate": 0.00011131402214959883, "loss": 0.6858, "step": 4223 }, { "epoch": 0.48, "learning_rate": 0.00011127744509386045, "loss": 0.6809, "step": 4224 }, { "epoch": 0.48, "learning_rate": 0.00011124086650983414, "loss": 0.684, "step": 4225 }, { "epoch": 0.48, "learning_rate": 0.0001112042864024769, "loss": 0.6772, "step": 4226 }, { "epoch": 0.48, "learning_rate": 0.00011116770477674603, "loss": 0.6709, "step": 4227 }, { "epoch": 0.48, "learning_rate": 0.0001111311216375989, "loss": 0.674, "step": 4228 }, { "epoch": 0.48, "learning_rate": 0.00011109453698999317, "loss": 0.6902, "step": 4229 }, { "epoch": 0.48, "learning_rate": 0.0001110579508388867, "loss": 0.6446, "step": 4230 }, { "epoch": 0.48, "learning_rate": 0.00011102136318923759, "loss": 0.6582, "step": 4231 }, { "epoch": 0.48, "learning_rate": 0.00011098477404600403, "loss": 0.6837, "step": 4232 }, { "epoch": 0.48, "learning_rate": 0.00011094818341414446, "loss": 0.6438, "step": 4233 }, { "epoch": 0.48, "learning_rate": 0.00011091159129861764, "loss": 0.7411, "step": 4234 }, { "epoch": 0.48, "learning_rate": 0.00011087499770438232, "loss": 0.6457, "step": 4235 }, { "epoch": 0.48, "learning_rate": 0.00011083840263639764, "loss": 0.626, "step": 4236 }, { "epoch": 0.48, "learning_rate": 0.00011080180609962283, "loss": 0.7098, "step": 4237 }, { "epoch": 0.48, "learning_rate": 0.00011076520809901736, "loss": 0.6999, "step": 4238 }, { "epoch": 0.48, "learning_rate": 0.00011072860863954087, "loss": 0.7319, "step": 4239 }, { "epoch": 0.48, "learning_rate": 0.00011069200772615324, "loss": 0.6735, "step": 4240 }, { "epoch": 0.48, "learning_rate": 0.00011065540536381451, "loss": 0.6877, "step": 4241 }, { "epoch": 0.48, "learning_rate": 0.00011061880155748497, "loss": 0.6554, "step": 4242 }, { "epoch": 0.48, "learning_rate": 0.00011058219631212501, "loss": 0.7807, "step": 4243 }, { "epoch": 0.48, "learning_rate": 0.00011054558963269526, "loss": 0.6408, "step": 4244 }, { "epoch": 0.48, "learning_rate": 0.00011050898152415664, "loss": 0.6755, "step": 4245 }, { "epoch": 0.48, "learning_rate": 0.0001104723719914701, "loss": 0.7395, "step": 4246 }, { "epoch": 0.48, "learning_rate": 0.00011043576103959686, "loss": 0.738, "step": 4247 }, { "epoch": 0.48, "learning_rate": 0.00011039914867349841, "loss": 0.7113, "step": 4248 }, { "epoch": 0.48, "learning_rate": 0.00011036253489813628, "loss": 0.6419, "step": 4249 }, { "epoch": 0.48, "learning_rate": 0.00011032591971847228, "loss": 0.7246, "step": 4250 }, { "epoch": 0.48, "learning_rate": 0.00011028930313946843, "loss": 0.6555, "step": 4251 }, { "epoch": 0.48, "learning_rate": 0.00011025268516608689, "loss": 0.6779, "step": 4252 }, { "epoch": 0.48, "learning_rate": 0.00011021606580329003, "loss": 0.6486, "step": 4253 }, { "epoch": 0.48, "learning_rate": 0.0001101794450560404, "loss": 0.7029, "step": 4254 }, { "epoch": 0.48, "learning_rate": 0.00011014282292930072, "loss": 0.671, "step": 4255 }, { "epoch": 0.48, "learning_rate": 0.00011010619942803395, "loss": 0.6519, "step": 4256 }, { "epoch": 0.48, "learning_rate": 0.00011006957455720321, "loss": 0.6724, "step": 4257 }, { "epoch": 0.48, "learning_rate": 0.00011003294832177178, "loss": 0.6592, "step": 4258 }, { "epoch": 0.48, "learning_rate": 0.00010999632072670314, "loss": 0.66, "step": 4259 }, { "epoch": 0.48, "learning_rate": 0.00010995969177696097, "loss": 0.719, "step": 4260 }, { "epoch": 0.48, "learning_rate": 0.0001099230614775091, "loss": 0.7767, "step": 4261 }, { "epoch": 0.48, "learning_rate": 0.00010988642983331163, "loss": 0.6791, "step": 4262 }, { "epoch": 0.48, "learning_rate": 0.00010984979684933272, "loss": 0.647, "step": 4263 }, { "epoch": 0.48, "learning_rate": 0.00010981316253053677, "loss": 0.7346, "step": 4264 }, { "epoch": 0.48, "learning_rate": 0.00010977652688188839, "loss": 0.6436, "step": 4265 }, { "epoch": 0.48, "learning_rate": 0.00010973988990835233, "loss": 0.6647, "step": 4266 }, { "epoch": 0.48, "learning_rate": 0.00010970325161489352, "loss": 0.6226, "step": 4267 }, { "epoch": 0.49, "learning_rate": 0.00010966661200647712, "loss": 0.6682, "step": 4268 }, { "epoch": 0.49, "learning_rate": 0.00010962997108806836, "loss": 0.736, "step": 4269 }, { "epoch": 0.49, "learning_rate": 0.00010959332886463276, "loss": 0.6743, "step": 4270 }, { "epoch": 0.49, "learning_rate": 0.00010955668534113597, "loss": 0.6834, "step": 4271 }, { "epoch": 0.49, "learning_rate": 0.00010952004052254381, "loss": 0.7119, "step": 4272 }, { "epoch": 0.49, "learning_rate": 0.00010948339441382228, "loss": 0.718, "step": 4273 }, { "epoch": 0.49, "learning_rate": 0.00010944674701993756, "loss": 0.623, "step": 4274 }, { "epoch": 0.49, "learning_rate": 0.000109410098345856, "loss": 0.6606, "step": 4275 }, { "epoch": 0.49, "learning_rate": 0.00010937344839654415, "loss": 0.627, "step": 4276 }, { "epoch": 0.49, "learning_rate": 0.00010933679717696868, "loss": 0.7072, "step": 4277 }, { "epoch": 0.49, "learning_rate": 0.00010930014469209647, "loss": 0.6367, "step": 4278 }, { "epoch": 0.49, "learning_rate": 0.00010926349094689459, "loss": 0.6799, "step": 4279 }, { "epoch": 0.49, "learning_rate": 0.00010922683594633021, "loss": 0.619, "step": 4280 }, { "epoch": 0.49, "learning_rate": 0.00010919017969537073, "loss": 0.7232, "step": 4281 }, { "epoch": 0.49, "learning_rate": 0.00010915352219898371, "loss": 0.6696, "step": 4282 }, { "epoch": 0.49, "learning_rate": 0.00010911686346213688, "loss": 0.6474, "step": 4283 }, { "epoch": 0.49, "learning_rate": 0.00010908020348979808, "loss": 0.7341, "step": 4284 }, { "epoch": 0.49, "learning_rate": 0.00010904354228693546, "loss": 0.672, "step": 4285 }, { "epoch": 0.49, "learning_rate": 0.00010900687985851715, "loss": 0.6299, "step": 4286 }, { "epoch": 0.49, "learning_rate": 0.00010897021620951155, "loss": 0.6942, "step": 4287 }, { "epoch": 0.49, "learning_rate": 0.00010893355134488732, "loss": 0.7419, "step": 4288 }, { "epoch": 0.49, "learning_rate": 0.00010889688526961306, "loss": 0.6346, "step": 4289 }, { "epoch": 0.49, "learning_rate": 0.00010886021798865768, "loss": 0.6851, "step": 4290 }, { "epoch": 0.49, "learning_rate": 0.00010882354950699027, "loss": 0.6736, "step": 4291 }, { "epoch": 0.49, "learning_rate": 0.00010878687982958003, "loss": 0.6896, "step": 4292 }, { "epoch": 0.49, "learning_rate": 0.0001087502089613963, "loss": 0.6914, "step": 4293 }, { "epoch": 0.49, "learning_rate": 0.00010871353690740864, "loss": 0.6148, "step": 4294 }, { "epoch": 0.49, "learning_rate": 0.00010867686367258674, "loss": 0.6111, "step": 4295 }, { "epoch": 0.49, "learning_rate": 0.00010864018926190043, "loss": 0.7044, "step": 4296 }, { "epoch": 0.49, "learning_rate": 0.00010860351368031977, "loss": 0.7143, "step": 4297 }, { "epoch": 0.49, "learning_rate": 0.00010856683693281491, "loss": 0.6693, "step": 4298 }, { "epoch": 0.49, "learning_rate": 0.00010853015902435615, "loss": 0.7157, "step": 4299 }, { "epoch": 0.49, "learning_rate": 0.00010849347995991404, "loss": 0.6717, "step": 4300 }, { "epoch": 0.49, "learning_rate": 0.00010845679974445917, "loss": 0.5939, "step": 4301 }, { "epoch": 0.49, "learning_rate": 0.00010842011838296238, "loss": 0.7295, "step": 4302 }, { "epoch": 0.49, "learning_rate": 0.00010838343588039459, "loss": 0.6818, "step": 4303 }, { "epoch": 0.49, "learning_rate": 0.00010834675224172694, "loss": 0.658, "step": 4304 }, { "epoch": 0.49, "learning_rate": 0.00010831006747193071, "loss": 0.6663, "step": 4305 }, { "epoch": 0.49, "learning_rate": 0.00010827338157597726, "loss": 0.7096, "step": 4306 }, { "epoch": 0.49, "learning_rate": 0.00010823669455883818, "loss": 0.6181, "step": 4307 }, { "epoch": 0.49, "learning_rate": 0.00010820000642548524, "loss": 0.6948, "step": 4308 }, { "epoch": 0.49, "learning_rate": 0.00010816331718089025, "loss": 0.682, "step": 4309 }, { "epoch": 0.49, "learning_rate": 0.00010812662683002528, "loss": 0.7091, "step": 4310 }, { "epoch": 0.49, "learning_rate": 0.0001080899353778625, "loss": 0.6681, "step": 4311 }, { "epoch": 0.49, "learning_rate": 0.00010805324282937417, "loss": 0.7469, "step": 4312 }, { "epoch": 0.49, "learning_rate": 0.00010801654918953283, "loss": 0.7346, "step": 4313 }, { "epoch": 0.49, "learning_rate": 0.00010797985446331112, "loss": 0.6399, "step": 4314 }, { "epoch": 0.49, "learning_rate": 0.00010794315865568172, "loss": 0.6991, "step": 4315 }, { "epoch": 0.49, "learning_rate": 0.00010790646177161763, "loss": 0.699, "step": 4316 }, { "epoch": 0.49, "learning_rate": 0.00010786976381609184, "loss": 0.6872, "step": 4317 }, { "epoch": 0.49, "learning_rate": 0.0001078330647940776, "loss": 0.7105, "step": 4318 }, { "epoch": 0.49, "learning_rate": 0.00010779636471054826, "loss": 0.6487, "step": 4319 }, { "epoch": 0.49, "learning_rate": 0.00010775966357047726, "loss": 0.6705, "step": 4320 }, { "epoch": 0.49, "learning_rate": 0.00010772296137883831, "loss": 0.6427, "step": 4321 }, { "epoch": 0.49, "learning_rate": 0.00010768625814060514, "loss": 0.7017, "step": 4322 }, { "epoch": 0.49, "learning_rate": 0.00010764955386075168, "loss": 0.6161, "step": 4323 }, { "epoch": 0.49, "learning_rate": 0.00010761284854425199, "loss": 0.7452, "step": 4324 }, { "epoch": 0.49, "learning_rate": 0.00010757614219608027, "loss": 0.6131, "step": 4325 }, { "epoch": 0.49, "learning_rate": 0.0001075394348212109, "loss": 0.7208, "step": 4326 }, { "epoch": 0.49, "learning_rate": 0.0001075027264246183, "loss": 0.6499, "step": 4327 }, { "epoch": 0.49, "learning_rate": 0.00010746601701127717, "loss": 0.7053, "step": 4328 }, { "epoch": 0.49, "learning_rate": 0.00010742930658616217, "loss": 0.6766, "step": 4329 }, { "epoch": 0.49, "learning_rate": 0.00010739259515424825, "loss": 0.6802, "step": 4330 }, { "epoch": 0.49, "learning_rate": 0.00010735588272051045, "loss": 0.6959, "step": 4331 }, { "epoch": 0.49, "learning_rate": 0.00010731916928992391, "loss": 0.7312, "step": 4332 }, { "epoch": 0.49, "learning_rate": 0.00010728245486746393, "loss": 0.606, "step": 4333 }, { "epoch": 0.49, "learning_rate": 0.00010724573945810599, "loss": 0.6377, "step": 4334 }, { "epoch": 0.49, "learning_rate": 0.00010720902306682561, "loss": 0.7069, "step": 4335 }, { "epoch": 0.49, "learning_rate": 0.00010717230569859853, "loss": 0.7367, "step": 4336 }, { "epoch": 0.49, "learning_rate": 0.00010713558735840052, "loss": 0.6424, "step": 4337 }, { "epoch": 0.49, "learning_rate": 0.00010709886805120764, "loss": 0.6565, "step": 4338 }, { "epoch": 0.49, "learning_rate": 0.00010706214778199592, "loss": 0.7154, "step": 4339 }, { "epoch": 0.49, "learning_rate": 0.00010702542655574161, "loss": 0.7227, "step": 4340 }, { "epoch": 0.49, "learning_rate": 0.00010698870437742108, "loss": 0.6958, "step": 4341 }, { "epoch": 0.49, "learning_rate": 0.0001069519812520108, "loss": 0.6728, "step": 4342 }, { "epoch": 0.49, "learning_rate": 0.00010691525718448739, "loss": 0.744, "step": 4343 }, { "epoch": 0.49, "learning_rate": 0.00010687853217982759, "loss": 0.6629, "step": 4344 }, { "epoch": 0.49, "learning_rate": 0.0001068418062430083, "loss": 0.7465, "step": 4345 }, { "epoch": 0.49, "learning_rate": 0.00010680507937900645, "loss": 0.7064, "step": 4346 }, { "epoch": 0.49, "learning_rate": 0.00010676835159279923, "loss": 0.7337, "step": 4347 }, { "epoch": 0.49, "learning_rate": 0.00010673162288936385, "loss": 0.7311, "step": 4348 }, { "epoch": 0.49, "learning_rate": 0.0001066948932736777, "loss": 0.7173, "step": 4349 }, { "epoch": 0.49, "learning_rate": 0.00010665816275071829, "loss": 0.667, "step": 4350 }, { "epoch": 0.49, "learning_rate": 0.00010662143132546319, "loss": 0.6586, "step": 4351 }, { "epoch": 0.49, "learning_rate": 0.00010658469900289016, "loss": 0.7353, "step": 4352 }, { "epoch": 0.49, "learning_rate": 0.00010654796578797709, "loss": 0.5985, "step": 4353 }, { "epoch": 0.49, "learning_rate": 0.00010651123168570194, "loss": 0.6637, "step": 4354 }, { "epoch": 0.49, "learning_rate": 0.00010647449670104279, "loss": 0.6744, "step": 4355 }, { "epoch": 0.5, "learning_rate": 0.00010643776083897795, "loss": 0.6821, "step": 4356 }, { "epoch": 0.5, "learning_rate": 0.00010640102410448562, "loss": 0.6231, "step": 4357 }, { "epoch": 0.5, "learning_rate": 0.00010636428650254437, "loss": 0.6843, "step": 4358 }, { "epoch": 0.5, "learning_rate": 0.00010632754803813278, "loss": 0.7026, "step": 4359 }, { "epoch": 0.5, "learning_rate": 0.00010629080871622947, "loss": 0.7099, "step": 4360 }, { "epoch": 0.5, "learning_rate": 0.0001062540685418133, "loss": 0.7203, "step": 4361 }, { "epoch": 0.5, "learning_rate": 0.0001062173275198632, "loss": 0.6845, "step": 4362 }, { "epoch": 0.5, "learning_rate": 0.0001061805856553582, "loss": 0.7139, "step": 4363 }, { "epoch": 0.5, "learning_rate": 0.00010614384295327741, "loss": 0.7191, "step": 4364 }, { "epoch": 0.5, "learning_rate": 0.0001061070994186002, "loss": 0.625, "step": 4365 }, { "epoch": 0.5, "learning_rate": 0.00010607035505630587, "loss": 0.6067, "step": 4366 }, { "epoch": 0.5, "learning_rate": 0.00010603360987137394, "loss": 0.6874, "step": 4367 }, { "epoch": 0.5, "learning_rate": 0.00010599686386878402, "loss": 0.7097, "step": 4368 }, { "epoch": 0.5, "learning_rate": 0.0001059601170535158, "loss": 0.6841, "step": 4369 }, { "epoch": 0.5, "learning_rate": 0.00010592336943054912, "loss": 0.6796, "step": 4370 }, { "epoch": 0.5, "learning_rate": 0.00010588662100486396, "loss": 0.6746, "step": 4371 }, { "epoch": 0.5, "learning_rate": 0.00010584987178144029, "loss": 0.644, "step": 4372 }, { "epoch": 0.5, "learning_rate": 0.00010581312176525829, "loss": 0.6879, "step": 4373 }, { "epoch": 0.5, "learning_rate": 0.00010577637096129822, "loss": 0.6575, "step": 4374 }, { "epoch": 0.5, "learning_rate": 0.00010573961937454046, "loss": 0.6876, "step": 4375 }, { "epoch": 0.5, "learning_rate": 0.0001057028670099655, "loss": 0.6512, "step": 4376 }, { "epoch": 0.5, "learning_rate": 0.00010566611387255387, "loss": 0.7263, "step": 4377 }, { "epoch": 0.5, "learning_rate": 0.00010562935996728629, "loss": 0.7513, "step": 4378 }, { "epoch": 0.5, "learning_rate": 0.00010559260529914355, "loss": 0.6794, "step": 4379 }, { "epoch": 0.5, "learning_rate": 0.00010555584987310649, "loss": 0.6448, "step": 4380 }, { "epoch": 0.5, "learning_rate": 0.00010551909369415613, "loss": 0.6202, "step": 4381 }, { "epoch": 0.5, "learning_rate": 0.00010548233676727362, "loss": 0.6402, "step": 4382 }, { "epoch": 0.5, "learning_rate": 0.00010544557909744006, "loss": 0.5925, "step": 4383 }, { "epoch": 0.5, "learning_rate": 0.0001054088206896368, "loss": 0.6827, "step": 4384 }, { "epoch": 0.5, "learning_rate": 0.00010537206154884525, "loss": 0.6702, "step": 4385 }, { "epoch": 0.5, "learning_rate": 0.00010533530168004688, "loss": 0.6442, "step": 4386 }, { "epoch": 0.5, "learning_rate": 0.00010529854108822328, "loss": 0.6971, "step": 4387 }, { "epoch": 0.5, "learning_rate": 0.00010526177977835618, "loss": 0.6606, "step": 4388 }, { "epoch": 0.5, "learning_rate": 0.00010522501775542732, "loss": 0.6862, "step": 4389 }, { "epoch": 0.5, "learning_rate": 0.00010518825502441863, "loss": 0.6579, "step": 4390 }, { "epoch": 0.5, "learning_rate": 0.00010515149159031207, "loss": 0.6398, "step": 4391 }, { "epoch": 0.5, "learning_rate": 0.00010511472745808972, "loss": 0.7121, "step": 4392 }, { "epoch": 0.5, "learning_rate": 0.00010507796263273379, "loss": 0.6164, "step": 4393 }, { "epoch": 0.5, "learning_rate": 0.00010504119711922649, "loss": 0.6926, "step": 4394 }, { "epoch": 0.5, "learning_rate": 0.00010500443092255017, "loss": 0.7217, "step": 4395 }, { "epoch": 0.5, "learning_rate": 0.00010496766404768735, "loss": 0.707, "step": 4396 }, { "epoch": 0.5, "learning_rate": 0.00010493089649962051, "loss": 0.6497, "step": 4397 }, { "epoch": 0.5, "learning_rate": 0.00010489412828333236, "loss": 0.6474, "step": 4398 }, { "epoch": 0.5, "learning_rate": 0.00010485735940380556, "loss": 0.6736, "step": 4399 }, { "epoch": 0.5, "learning_rate": 0.00010482058986602295, "loss": 0.6801, "step": 4400 }, { "epoch": 0.5, "learning_rate": 0.00010478381967496742, "loss": 0.7259, "step": 4401 }, { "epoch": 0.5, "learning_rate": 0.00010474704883562201, "loss": 0.7143, "step": 4402 }, { "epoch": 0.5, "learning_rate": 0.00010471027735296974, "loss": 0.6963, "step": 4403 }, { "epoch": 0.5, "learning_rate": 0.00010467350523199382, "loss": 0.6612, "step": 4404 }, { "epoch": 0.5, "learning_rate": 0.00010463673247767749, "loss": 0.679, "step": 4405 }, { "epoch": 0.5, "learning_rate": 0.0001045999590950041, "loss": 0.6124, "step": 4406 }, { "epoch": 0.5, "learning_rate": 0.00010456318508895705, "loss": 0.7047, "step": 4407 }, { "epoch": 0.5, "learning_rate": 0.00010452641046451993, "loss": 0.6967, "step": 4408 }, { "epoch": 0.5, "learning_rate": 0.00010448963522667621, "loss": 0.7233, "step": 4409 }, { "epoch": 0.5, "learning_rate": 0.00010445285938040967, "loss": 0.7231, "step": 4410 }, { "epoch": 0.5, "learning_rate": 0.00010441608293070402, "loss": 0.6744, "step": 4411 }, { "epoch": 0.5, "learning_rate": 0.0001043793058825431, "loss": 0.6297, "step": 4412 }, { "epoch": 0.5, "learning_rate": 0.00010434252824091089, "loss": 0.6614, "step": 4413 }, { "epoch": 0.5, "learning_rate": 0.00010430575001079133, "loss": 0.6177, "step": 4414 }, { "epoch": 0.5, "learning_rate": 0.00010426897119716852, "loss": 0.7168, "step": 4415 }, { "epoch": 0.5, "learning_rate": 0.00010423219180502664, "loss": 0.6998, "step": 4416 }, { "epoch": 0.5, "learning_rate": 0.00010419541183934991, "loss": 0.6805, "step": 4417 }, { "epoch": 0.5, "learning_rate": 0.00010415863130512267, "loss": 0.712, "step": 4418 }, { "epoch": 0.5, "learning_rate": 0.00010412185020732929, "loss": 0.6004, "step": 4419 }, { "epoch": 0.5, "learning_rate": 0.00010408506855095425, "loss": 0.6793, "step": 4420 }, { "epoch": 0.5, "learning_rate": 0.00010404828634098211, "loss": 0.6396, "step": 4421 }, { "epoch": 0.5, "learning_rate": 0.00010401150358239748, "loss": 0.6663, "step": 4422 }, { "epoch": 0.5, "learning_rate": 0.00010397472028018507, "loss": 0.7195, "step": 4423 }, { "epoch": 0.5, "learning_rate": 0.00010393793643932964, "loss": 0.6753, "step": 4424 }, { "epoch": 0.5, "learning_rate": 0.00010390115206481605, "loss": 0.6916, "step": 4425 }, { "epoch": 0.5, "learning_rate": 0.00010386436716162919, "loss": 0.7012, "step": 4426 }, { "epoch": 0.5, "learning_rate": 0.00010382758173475404, "loss": 0.653, "step": 4427 }, { "epoch": 0.5, "learning_rate": 0.00010379079578917572, "loss": 0.6311, "step": 4428 }, { "epoch": 0.5, "learning_rate": 0.00010375400932987931, "loss": 0.6453, "step": 4429 }, { "epoch": 0.5, "learning_rate": 0.00010371722236185, "loss": 0.6764, "step": 4430 }, { "epoch": 0.5, "learning_rate": 0.00010368043489007309, "loss": 0.6784, "step": 4431 }, { "epoch": 0.5, "learning_rate": 0.00010364364691953388, "loss": 0.7281, "step": 4432 }, { "epoch": 0.5, "learning_rate": 0.0001036068584552178, "loss": 0.6725, "step": 4433 }, { "epoch": 0.5, "learning_rate": 0.0001035700695021103, "loss": 0.7085, "step": 4434 }, { "epoch": 0.5, "learning_rate": 0.00010353328006519693, "loss": 0.6521, "step": 4435 }, { "epoch": 0.5, "learning_rate": 0.00010349649014946332, "loss": 0.717, "step": 4436 }, { "epoch": 0.5, "learning_rate": 0.00010345969975989506, "loss": 0.6323, "step": 4437 }, { "epoch": 0.5, "learning_rate": 0.00010342290890147797, "loss": 0.7047, "step": 4438 }, { "epoch": 0.5, "learning_rate": 0.0001033861175791978, "loss": 0.711, "step": 4439 }, { "epoch": 0.5, "learning_rate": 0.00010334932579804039, "loss": 0.7463, "step": 4440 }, { "epoch": 0.5, "learning_rate": 0.00010331253356299168, "loss": 0.7617, "step": 4441 }, { "epoch": 0.5, "learning_rate": 0.00010327574087903769, "loss": 0.6456, "step": 4442 }, { "epoch": 0.51, "learning_rate": 0.00010323894775116439, "loss": 0.6489, "step": 4443 }, { "epoch": 0.51, "learning_rate": 0.0001032021541843579, "loss": 0.6711, "step": 4444 }, { "epoch": 0.51, "learning_rate": 0.00010316536018360441, "loss": 0.6665, "step": 4445 }, { "epoch": 0.51, "learning_rate": 0.00010312856575389017, "loss": 0.6854, "step": 4446 }, { "epoch": 0.51, "learning_rate": 0.00010309177090020137, "loss": 0.6336, "step": 4447 }, { "epoch": 0.51, "learning_rate": 0.0001030549756275244, "loss": 0.6361, "step": 4448 }, { "epoch": 0.51, "learning_rate": 0.00010301817994084564, "loss": 0.6509, "step": 4449 }, { "epoch": 0.51, "learning_rate": 0.00010298138384515157, "loss": 0.7126, "step": 4450 }, { "epoch": 0.51, "learning_rate": 0.00010294458734542865, "loss": 0.6674, "step": 4451 }, { "epoch": 0.51, "learning_rate": 0.00010290779044666345, "loss": 0.6985, "step": 4452 }, { "epoch": 0.51, "learning_rate": 0.00010287099315384261, "loss": 0.6796, "step": 4453 }, { "epoch": 0.51, "learning_rate": 0.00010283419547195276, "loss": 0.6134, "step": 4454 }, { "epoch": 0.51, "learning_rate": 0.00010279739740598064, "loss": 0.7382, "step": 4455 }, { "epoch": 0.51, "learning_rate": 0.00010276059896091305, "loss": 0.6476, "step": 4456 }, { "epoch": 0.51, "learning_rate": 0.00010272380014173675, "loss": 0.7164, "step": 4457 }, { "epoch": 0.51, "learning_rate": 0.00010268700095343864, "loss": 0.6817, "step": 4458 }, { "epoch": 0.51, "learning_rate": 0.00010265020140100567, "loss": 0.6863, "step": 4459 }, { "epoch": 0.51, "learning_rate": 0.00010261340148942477, "loss": 0.6757, "step": 4460 }, { "epoch": 0.51, "learning_rate": 0.000102576601223683, "loss": 0.7457, "step": 4461 }, { "epoch": 0.51, "learning_rate": 0.00010253980060876742, "loss": 0.7058, "step": 4462 }, { "epoch": 0.51, "learning_rate": 0.0001025029996496651, "loss": 0.6731, "step": 4463 }, { "epoch": 0.51, "learning_rate": 0.00010246619835136327, "loss": 0.7158, "step": 4464 }, { "epoch": 0.51, "learning_rate": 0.00010242939671884913, "loss": 0.6969, "step": 4465 }, { "epoch": 0.51, "learning_rate": 0.00010239259475710987, "loss": 0.6447, "step": 4466 }, { "epoch": 0.51, "learning_rate": 0.00010235579247113287, "loss": 0.6858, "step": 4467 }, { "epoch": 0.51, "learning_rate": 0.00010231898986590542, "loss": 0.6167, "step": 4468 }, { "epoch": 0.51, "learning_rate": 0.00010228218694641491, "loss": 0.6506, "step": 4469 }, { "epoch": 0.51, "learning_rate": 0.0001022453837176488, "loss": 0.6629, "step": 4470 }, { "epoch": 0.51, "learning_rate": 0.00010220858018459454, "loss": 0.6799, "step": 4471 }, { "epoch": 0.51, "learning_rate": 0.00010217177635223965, "loss": 0.6392, "step": 4472 }, { "epoch": 0.51, "learning_rate": 0.00010213497222557172, "loss": 0.6774, "step": 4473 }, { "epoch": 0.51, "learning_rate": 0.00010209816780957824, "loss": 0.6929, "step": 4474 }, { "epoch": 0.51, "learning_rate": 0.00010206136310924695, "loss": 0.6266, "step": 4475 }, { "epoch": 0.51, "learning_rate": 0.00010202455812956546, "loss": 0.679, "step": 4476 }, { "epoch": 0.51, "learning_rate": 0.00010198775287552149, "loss": 0.6329, "step": 4477 }, { "epoch": 0.51, "learning_rate": 0.00010195094735210278, "loss": 0.6502, "step": 4478 }, { "epoch": 0.51, "learning_rate": 0.00010191414156429715, "loss": 0.6793, "step": 4479 }, { "epoch": 0.51, "learning_rate": 0.00010187733551709235, "loss": 0.6859, "step": 4480 }, { "epoch": 0.51, "learning_rate": 0.00010184052921547629, "loss": 0.6963, "step": 4481 }, { "epoch": 0.51, "learning_rate": 0.00010180372266443685, "loss": 0.6743, "step": 4482 }, { "epoch": 0.51, "learning_rate": 0.00010176691586896194, "loss": 0.6787, "step": 4483 }, { "epoch": 0.51, "learning_rate": 0.00010173010883403951, "loss": 0.6546, "step": 4484 }, { "epoch": 0.51, "learning_rate": 0.00010169330156465755, "loss": 0.72, "step": 4485 }, { "epoch": 0.51, "learning_rate": 0.00010165649406580406, "loss": 0.631, "step": 4486 }, { "epoch": 0.51, "learning_rate": 0.00010161968634246717, "loss": 0.7135, "step": 4487 }, { "epoch": 0.51, "learning_rate": 0.00010158287839963483, "loss": 0.6636, "step": 4488 }, { "epoch": 0.51, "learning_rate": 0.00010154607024229525, "loss": 0.7048, "step": 4489 }, { "epoch": 0.51, "learning_rate": 0.00010150926187543654, "loss": 0.6894, "step": 4490 }, { "epoch": 0.51, "learning_rate": 0.00010147245330404687, "loss": 0.6951, "step": 4491 }, { "epoch": 0.51, "learning_rate": 0.00010143564453311443, "loss": 0.6304, "step": 4492 }, { "epoch": 0.51, "learning_rate": 0.00010139883556762741, "loss": 0.7178, "step": 4493 }, { "epoch": 0.51, "learning_rate": 0.00010136202641257415, "loss": 0.7089, "step": 4494 }, { "epoch": 0.51, "learning_rate": 0.00010132521707294283, "loss": 0.6819, "step": 4495 }, { "epoch": 0.51, "learning_rate": 0.00010128840755372178, "loss": 0.6682, "step": 4496 }, { "epoch": 0.51, "learning_rate": 0.00010125159785989933, "loss": 0.6652, "step": 4497 }, { "epoch": 0.51, "learning_rate": 0.00010121478799646383, "loss": 0.7358, "step": 4498 }, { "epoch": 0.51, "learning_rate": 0.00010117797796840364, "loss": 0.6747, "step": 4499 }, { "epoch": 0.51, "learning_rate": 0.00010114116778070717, "loss": 0.6441, "step": 4500 }, { "epoch": 0.51, "learning_rate": 0.00010110435743836282, "loss": 0.7471, "step": 4501 }, { "epoch": 0.51, "learning_rate": 0.00010106754694635905, "loss": 0.7386, "step": 4502 }, { "epoch": 0.51, "learning_rate": 0.00010103073630968424, "loss": 0.656, "step": 4503 }, { "epoch": 0.51, "learning_rate": 0.00010099392553332698, "loss": 0.6682, "step": 4504 }, { "epoch": 0.51, "learning_rate": 0.00010095711462227566, "loss": 0.7221, "step": 4505 }, { "epoch": 0.51, "learning_rate": 0.00010092030358151883, "loss": 0.6907, "step": 4506 }, { "epoch": 0.51, "learning_rate": 0.00010088349241604505, "loss": 0.6454, "step": 4507 }, { "epoch": 0.51, "learning_rate": 0.00010084668113084281, "loss": 0.6704, "step": 4508 }, { "epoch": 0.51, "learning_rate": 0.00010080986973090072, "loss": 0.7198, "step": 4509 }, { "epoch": 0.51, "learning_rate": 0.00010077305822120735, "loss": 0.6151, "step": 4510 }, { "epoch": 0.51, "learning_rate": 0.00010073624660675125, "loss": 0.6727, "step": 4511 }, { "epoch": 0.51, "learning_rate": 0.00010069943489252109, "loss": 0.6278, "step": 4512 }, { "epoch": 0.51, "learning_rate": 0.00010066262308350547, "loss": 0.6439, "step": 4513 }, { "epoch": 0.51, "learning_rate": 0.00010062581118469299, "loss": 0.6458, "step": 4514 }, { "epoch": 0.51, "learning_rate": 0.00010058899920107233, "loss": 0.6045, "step": 4515 }, { "epoch": 0.51, "learning_rate": 0.00010055218713763214, "loss": 0.5839, "step": 4516 }, { "epoch": 0.51, "learning_rate": 0.0001005153749993611, "loss": 0.6399, "step": 4517 }, { "epoch": 0.51, "learning_rate": 0.00010047856279124786, "loss": 0.7046, "step": 4518 }, { "epoch": 0.51, "learning_rate": 0.0001004417505182811, "loss": 0.745, "step": 4519 }, { "epoch": 0.51, "learning_rate": 0.00010040493818544959, "loss": 0.7166, "step": 4520 }, { "epoch": 0.51, "learning_rate": 0.00010036812579774197, "loss": 0.6846, "step": 4521 }, { "epoch": 0.51, "learning_rate": 0.00010033131336014697, "loss": 0.6399, "step": 4522 }, { "epoch": 0.51, "learning_rate": 0.00010029450087765326, "loss": 0.6866, "step": 4523 }, { "epoch": 0.51, "learning_rate": 0.00010025768835524969, "loss": 0.6809, "step": 4524 }, { "epoch": 0.51, "learning_rate": 0.00010022087579792485, "loss": 0.6715, "step": 4525 }, { "epoch": 0.51, "learning_rate": 0.00010018406321066755, "loss": 0.6375, "step": 4526 }, { "epoch": 0.51, "learning_rate": 0.00010014725059846654, "loss": 0.6767, "step": 4527 }, { "epoch": 0.51, "learning_rate": 0.00010011043796631052, "loss": 0.6597, "step": 4528 }, { "epoch": 0.51, "learning_rate": 0.00010007362531918826, "loss": 0.6693, "step": 4529 }, { "epoch": 0.51, "learning_rate": 0.00010003681266208853, "loss": 0.6772, "step": 4530 }, { "epoch": 0.52, "learning_rate": 0.0001, "loss": 0.7211, "step": 4531 }, { "epoch": 0.52, "learning_rate": 9.99631873379115e-05, "loss": 0.6956, "step": 4532 }, { "epoch": 0.52, "learning_rate": 9.992637468081173e-05, "loss": 0.6512, "step": 4533 }, { "epoch": 0.52, "learning_rate": 9.98895620336895e-05, "loss": 0.6925, "step": 4534 }, { "epoch": 0.52, "learning_rate": 9.98527494015335e-05, "loss": 0.6878, "step": 4535 }, { "epoch": 0.52, "learning_rate": 9.981593678933246e-05, "loss": 0.7268, "step": 4536 }, { "epoch": 0.52, "learning_rate": 9.977912420207517e-05, "loss": 0.6755, "step": 4537 }, { "epoch": 0.52, "learning_rate": 9.974231164475034e-05, "loss": 0.6733, "step": 4538 }, { "epoch": 0.52, "learning_rate": 9.970549912234672e-05, "loss": 0.6482, "step": 4539 }, { "epoch": 0.52, "learning_rate": 9.966868663985307e-05, "loss": 0.6698, "step": 4540 }, { "epoch": 0.52, "learning_rate": 9.963187420225806e-05, "loss": 0.7549, "step": 4541 }, { "epoch": 0.52, "learning_rate": 9.959506181455045e-05, "loss": 0.6316, "step": 4542 }, { "epoch": 0.52, "learning_rate": 9.955824948171892e-05, "loss": 0.7008, "step": 4543 }, { "epoch": 0.52, "learning_rate": 9.952143720875218e-05, "loss": 0.6725, "step": 4544 }, { "epoch": 0.52, "learning_rate": 9.948462500063893e-05, "loss": 0.6727, "step": 4545 }, { "epoch": 0.52, "learning_rate": 9.94478128623679e-05, "loss": 0.636, "step": 4546 }, { "epoch": 0.52, "learning_rate": 9.94110007989277e-05, "loss": 0.6673, "step": 4547 }, { "epoch": 0.52, "learning_rate": 9.937418881530703e-05, "loss": 0.6681, "step": 4548 }, { "epoch": 0.52, "learning_rate": 9.933737691649456e-05, "loss": 0.7651, "step": 4549 }, { "epoch": 0.52, "learning_rate": 9.930056510747892e-05, "loss": 0.6558, "step": 4550 }, { "epoch": 0.52, "learning_rate": 9.926375339324878e-05, "loss": 0.6741, "step": 4551 }, { "epoch": 0.52, "learning_rate": 9.92269417787927e-05, "loss": 0.6415, "step": 4552 }, { "epoch": 0.52, "learning_rate": 9.919013026909932e-05, "loss": 0.6052, "step": 4553 }, { "epoch": 0.52, "learning_rate": 9.915331886915721e-05, "loss": 0.6138, "step": 4554 }, { "epoch": 0.52, "learning_rate": 9.911650758395497e-05, "loss": 0.6779, "step": 4555 }, { "epoch": 0.52, "learning_rate": 9.907969641848117e-05, "loss": 0.6796, "step": 4556 }, { "epoch": 0.52, "learning_rate": 9.904288537772439e-05, "loss": 0.6848, "step": 4557 }, { "epoch": 0.52, "learning_rate": 9.900607446667307e-05, "loss": 0.7123, "step": 4558 }, { "epoch": 0.52, "learning_rate": 9.896926369031578e-05, "loss": 0.716, "step": 4559 }, { "epoch": 0.52, "learning_rate": 9.893245305364098e-05, "loss": 0.6683, "step": 4560 }, { "epoch": 0.52, "learning_rate": 9.889564256163718e-05, "loss": 0.6605, "step": 4561 }, { "epoch": 0.52, "learning_rate": 9.885883221929282e-05, "loss": 0.7288, "step": 4562 }, { "epoch": 0.52, "learning_rate": 9.882202203159638e-05, "loss": 0.6446, "step": 4563 }, { "epoch": 0.52, "learning_rate": 9.87852120035362e-05, "loss": 0.7161, "step": 4564 }, { "epoch": 0.52, "learning_rate": 9.874840214010069e-05, "loss": 0.6567, "step": 4565 }, { "epoch": 0.52, "learning_rate": 9.871159244627824e-05, "loss": 0.6138, "step": 4566 }, { "epoch": 0.52, "learning_rate": 9.86747829270572e-05, "loss": 0.7097, "step": 4567 }, { "epoch": 0.52, "learning_rate": 9.863797358742589e-05, "loss": 0.5773, "step": 4568 }, { "epoch": 0.52, "learning_rate": 9.860116443237261e-05, "loss": 0.711, "step": 4569 }, { "epoch": 0.52, "learning_rate": 9.856435546688561e-05, "loss": 0.6755, "step": 4570 }, { "epoch": 0.52, "learning_rate": 9.852754669595316e-05, "loss": 0.6931, "step": 4571 }, { "epoch": 0.52, "learning_rate": 9.849073812456347e-05, "loss": 0.7025, "step": 4572 }, { "epoch": 0.52, "learning_rate": 9.845392975770475e-05, "loss": 0.6484, "step": 4573 }, { "epoch": 0.52, "learning_rate": 9.84171216003652e-05, "loss": 0.6837, "step": 4574 }, { "epoch": 0.52, "learning_rate": 9.838031365753288e-05, "loss": 0.6109, "step": 4575 }, { "epoch": 0.52, "learning_rate": 9.834350593419595e-05, "loss": 0.6964, "step": 4576 }, { "epoch": 0.52, "learning_rate": 9.830669843534247e-05, "loss": 0.6228, "step": 4577 }, { "epoch": 0.52, "learning_rate": 9.82698911659605e-05, "loss": 0.7284, "step": 4578 }, { "epoch": 0.52, "learning_rate": 9.823308413103807e-05, "loss": 0.6554, "step": 4579 }, { "epoch": 0.52, "learning_rate": 9.819627733556319e-05, "loss": 0.6832, "step": 4580 }, { "epoch": 0.52, "learning_rate": 9.815947078452372e-05, "loss": 0.7018, "step": 4581 }, { "epoch": 0.52, "learning_rate": 9.812266448290767e-05, "loss": 0.6608, "step": 4582 }, { "epoch": 0.52, "learning_rate": 9.808585843570289e-05, "loss": 0.7246, "step": 4583 }, { "epoch": 0.52, "learning_rate": 9.804905264789723e-05, "loss": 0.6598, "step": 4584 }, { "epoch": 0.52, "learning_rate": 9.801224712447852e-05, "loss": 0.7687, "step": 4585 }, { "epoch": 0.52, "learning_rate": 9.797544187043458e-05, "loss": 0.7124, "step": 4586 }, { "epoch": 0.52, "learning_rate": 9.793863689075309e-05, "loss": 0.6466, "step": 4587 }, { "epoch": 0.52, "learning_rate": 9.790183219042177e-05, "loss": 0.6502, "step": 4588 }, { "epoch": 0.52, "learning_rate": 9.786502777442832e-05, "loss": 0.6719, "step": 4589 }, { "epoch": 0.52, "learning_rate": 9.782822364776034e-05, "loss": 0.7303, "step": 4590 }, { "epoch": 0.52, "learning_rate": 9.779141981540547e-05, "loss": 0.6142, "step": 4591 }, { "epoch": 0.52, "learning_rate": 9.775461628235121e-05, "loss": 0.6405, "step": 4592 }, { "epoch": 0.52, "learning_rate": 9.771781305358511e-05, "loss": 0.6636, "step": 4593 }, { "epoch": 0.52, "learning_rate": 9.76810101340946e-05, "loss": 0.6918, "step": 4594 }, { "epoch": 0.52, "learning_rate": 9.764420752886715e-05, "loss": 0.6795, "step": 4595 }, { "epoch": 0.52, "learning_rate": 9.760740524289016e-05, "loss": 0.6257, "step": 4596 }, { "epoch": 0.52, "learning_rate": 9.757060328115094e-05, "loss": 0.6499, "step": 4597 }, { "epoch": 0.52, "learning_rate": 9.753380164863676e-05, "loss": 0.6776, "step": 4598 }, { "epoch": 0.52, "learning_rate": 9.74970003503349e-05, "loss": 0.633, "step": 4599 }, { "epoch": 0.52, "learning_rate": 9.746019939123262e-05, "loss": 0.6899, "step": 4600 }, { "epoch": 0.52, "learning_rate": 9.7423398776317e-05, "loss": 0.6327, "step": 4601 }, { "epoch": 0.52, "learning_rate": 9.738659851057523e-05, "loss": 0.6513, "step": 4602 }, { "epoch": 0.52, "learning_rate": 9.734979859899437e-05, "loss": 0.6248, "step": 4603 }, { "epoch": 0.52, "learning_rate": 9.731299904656137e-05, "loss": 0.6699, "step": 4604 }, { "epoch": 0.52, "learning_rate": 9.727619985826328e-05, "loss": 0.679, "step": 4605 }, { "epoch": 0.52, "learning_rate": 9.723940103908696e-05, "loss": 0.6994, "step": 4606 }, { "epoch": 0.52, "learning_rate": 9.720260259401934e-05, "loss": 0.6974, "step": 4607 }, { "epoch": 0.52, "learning_rate": 9.716580452804726e-05, "loss": 0.7016, "step": 4608 }, { "epoch": 0.52, "learning_rate": 9.712900684615743e-05, "loss": 0.5792, "step": 4609 }, { "epoch": 0.52, "learning_rate": 9.709220955333657e-05, "loss": 0.724, "step": 4610 }, { "epoch": 0.52, "learning_rate": 9.705541265457137e-05, "loss": 0.6961, "step": 4611 }, { "epoch": 0.52, "learning_rate": 9.701861615484845e-05, "loss": 0.64, "step": 4612 }, { "epoch": 0.52, "learning_rate": 9.698182005915436e-05, "loss": 0.6163, "step": 4613 }, { "epoch": 0.52, "learning_rate": 9.694502437247562e-05, "loss": 0.6683, "step": 4614 }, { "epoch": 0.52, "learning_rate": 9.690822909979865e-05, "loss": 0.6979, "step": 4615 }, { "epoch": 0.52, "learning_rate": 9.687143424610986e-05, "loss": 0.6974, "step": 4616 }, { "epoch": 0.52, "learning_rate": 9.68346398163956e-05, "loss": 0.6367, "step": 4617 }, { "epoch": 0.52, "learning_rate": 9.679784581564212e-05, "loss": 0.6711, "step": 4618 }, { "epoch": 0.53, "learning_rate": 9.676105224883563e-05, "loss": 0.6791, "step": 4619 }, { "epoch": 0.53, "learning_rate": 9.672425912096236e-05, "loss": 0.6344, "step": 4620 }, { "epoch": 0.53, "learning_rate": 9.668746643700834e-05, "loss": 0.6632, "step": 4621 }, { "epoch": 0.53, "learning_rate": 9.665067420195962e-05, "loss": 0.7023, "step": 4622 }, { "epoch": 0.53, "learning_rate": 9.661388242080222e-05, "loss": 0.6928, "step": 4623 }, { "epoch": 0.53, "learning_rate": 9.657709109852203e-05, "loss": 0.7541, "step": 4624 }, { "epoch": 0.53, "learning_rate": 9.654030024010496e-05, "loss": 0.6914, "step": 4625 }, { "epoch": 0.53, "learning_rate": 9.650350985053672e-05, "loss": 0.6826, "step": 4626 }, { "epoch": 0.53, "learning_rate": 9.646671993480308e-05, "loss": 0.7331, "step": 4627 }, { "epoch": 0.53, "learning_rate": 9.642993049788973e-05, "loss": 0.7138, "step": 4628 }, { "epoch": 0.53, "learning_rate": 9.639314154478223e-05, "loss": 0.7236, "step": 4629 }, { "epoch": 0.53, "learning_rate": 9.635635308046613e-05, "loss": 0.6563, "step": 4630 }, { "epoch": 0.53, "learning_rate": 9.631956510992696e-05, "loss": 0.6767, "step": 4631 }, { "epoch": 0.53, "learning_rate": 9.628277763815004e-05, "loss": 0.7033, "step": 4632 }, { "epoch": 0.53, "learning_rate": 9.624599067012072e-05, "loss": 0.6308, "step": 4633 }, { "epoch": 0.53, "learning_rate": 9.620920421082429e-05, "loss": 0.6719, "step": 4634 }, { "epoch": 0.53, "learning_rate": 9.617241826524594e-05, "loss": 0.6998, "step": 4635 }, { "epoch": 0.53, "learning_rate": 9.613563283837082e-05, "loss": 0.6324, "step": 4636 }, { "epoch": 0.53, "learning_rate": 9.609884793518397e-05, "loss": 0.6905, "step": 4637 }, { "epoch": 0.53, "learning_rate": 9.606206356067037e-05, "loss": 0.7252, "step": 4638 }, { "epoch": 0.53, "learning_rate": 9.602527971981495e-05, "loss": 0.6653, "step": 4639 }, { "epoch": 0.53, "learning_rate": 9.598849641760253e-05, "loss": 0.6416, "step": 4640 }, { "epoch": 0.53, "learning_rate": 9.595171365901791e-05, "loss": 0.6922, "step": 4641 }, { "epoch": 0.53, "learning_rate": 9.591493144904576e-05, "loss": 0.626, "step": 4642 }, { "epoch": 0.53, "learning_rate": 9.587814979267075e-05, "loss": 0.6889, "step": 4643 }, { "epoch": 0.53, "learning_rate": 9.584136869487737e-05, "loss": 0.6641, "step": 4644 }, { "epoch": 0.53, "learning_rate": 9.580458816065011e-05, "loss": 0.641, "step": 4645 }, { "epoch": 0.53, "learning_rate": 9.576780819497337e-05, "loss": 0.6287, "step": 4646 }, { "epoch": 0.53, "learning_rate": 9.57310288028315e-05, "loss": 0.661, "step": 4647 }, { "epoch": 0.53, "learning_rate": 9.569424998920872e-05, "loss": 0.6297, "step": 4648 }, { "epoch": 0.53, "learning_rate": 9.565747175908916e-05, "loss": 0.7281, "step": 4649 }, { "epoch": 0.53, "learning_rate": 9.562069411745691e-05, "loss": 0.7151, "step": 4650 }, { "epoch": 0.53, "learning_rate": 9.5583917069296e-05, "loss": 0.6618, "step": 4651 }, { "epoch": 0.53, "learning_rate": 9.554714061959035e-05, "loss": 0.6538, "step": 4652 }, { "epoch": 0.53, "learning_rate": 9.55103647733238e-05, "loss": 0.7101, "step": 4653 }, { "epoch": 0.53, "learning_rate": 9.547358953548014e-05, "loss": 0.6196, "step": 4654 }, { "epoch": 0.53, "learning_rate": 9.543681491104297e-05, "loss": 0.6994, "step": 4655 }, { "epoch": 0.53, "learning_rate": 9.540004090499593e-05, "loss": 0.7024, "step": 4656 }, { "epoch": 0.53, "learning_rate": 9.536326752232252e-05, "loss": 0.6989, "step": 4657 }, { "epoch": 0.53, "learning_rate": 9.532649476800619e-05, "loss": 0.6782, "step": 4658 }, { "epoch": 0.53, "learning_rate": 9.528972264703026e-05, "loss": 0.6632, "step": 4659 }, { "epoch": 0.53, "learning_rate": 9.525295116437803e-05, "loss": 0.6666, "step": 4660 }, { "epoch": 0.53, "learning_rate": 9.52161803250326e-05, "loss": 0.7033, "step": 4661 }, { "epoch": 0.53, "learning_rate": 9.517941013397708e-05, "loss": 0.6731, "step": 4662 }, { "epoch": 0.53, "learning_rate": 9.514264059619446e-05, "loss": 0.7438, "step": 4663 }, { "epoch": 0.53, "learning_rate": 9.510587171666765e-05, "loss": 0.6004, "step": 4664 }, { "epoch": 0.53, "learning_rate": 9.50691035003795e-05, "loss": 0.6247, "step": 4665 }, { "epoch": 0.53, "learning_rate": 9.503233595231268e-05, "loss": 0.681, "step": 4666 }, { "epoch": 0.53, "learning_rate": 9.499556907744984e-05, "loss": 0.6699, "step": 4667 }, { "epoch": 0.53, "learning_rate": 9.495880288077355e-05, "loss": 0.6915, "step": 4668 }, { "epoch": 0.53, "learning_rate": 9.492203736726623e-05, "loss": 0.702, "step": 4669 }, { "epoch": 0.53, "learning_rate": 9.488527254191026e-05, "loss": 0.6955, "step": 4670 }, { "epoch": 0.53, "learning_rate": 9.484850840968796e-05, "loss": 0.7263, "step": 4671 }, { "epoch": 0.53, "learning_rate": 9.48117449755814e-05, "loss": 0.693, "step": 4672 }, { "epoch": 0.53, "learning_rate": 9.477498224457269e-05, "loss": 0.685, "step": 4673 }, { "epoch": 0.53, "learning_rate": 9.473822022164383e-05, "loss": 0.6789, "step": 4674 }, { "epoch": 0.53, "learning_rate": 9.470145891177672e-05, "loss": 0.7067, "step": 4675 }, { "epoch": 0.53, "learning_rate": 9.466469831995313e-05, "loss": 0.7235, "step": 4676 }, { "epoch": 0.53, "learning_rate": 9.462793845115479e-05, "loss": 0.7263, "step": 4677 }, { "epoch": 0.53, "learning_rate": 9.459117931036322e-05, "loss": 0.6977, "step": 4678 }, { "epoch": 0.53, "learning_rate": 9.455442090255997e-05, "loss": 0.6518, "step": 4679 }, { "epoch": 0.53, "learning_rate": 9.451766323272642e-05, "loss": 0.645, "step": 4680 }, { "epoch": 0.53, "learning_rate": 9.448090630584387e-05, "loss": 0.6727, "step": 4681 }, { "epoch": 0.53, "learning_rate": 9.444415012689356e-05, "loss": 0.732, "step": 4682 }, { "epoch": 0.53, "learning_rate": 9.44073947008565e-05, "loss": 0.6902, "step": 4683 }, { "epoch": 0.53, "learning_rate": 9.437064003271374e-05, "loss": 0.6907, "step": 4684 }, { "epoch": 0.53, "learning_rate": 9.433388612744615e-05, "loss": 0.6428, "step": 4685 }, { "epoch": 0.53, "learning_rate": 9.429713299003452e-05, "loss": 0.6843, "step": 4686 }, { "epoch": 0.53, "learning_rate": 9.426038062545953e-05, "loss": 0.7256, "step": 4687 }, { "epoch": 0.53, "learning_rate": 9.42236290387018e-05, "loss": 0.6567, "step": 4688 }, { "epoch": 0.53, "learning_rate": 9.418687823474173e-05, "loss": 0.7047, "step": 4689 }, { "epoch": 0.53, "learning_rate": 9.415012821855974e-05, "loss": 0.702, "step": 4690 }, { "epoch": 0.53, "learning_rate": 9.411337899513607e-05, "loss": 0.6526, "step": 4691 }, { "epoch": 0.53, "learning_rate": 9.40766305694509e-05, "loss": 0.6677, "step": 4692 }, { "epoch": 0.53, "learning_rate": 9.403988294648422e-05, "loss": 0.6668, "step": 4693 }, { "epoch": 0.53, "learning_rate": 9.400313613121603e-05, "loss": 0.6965, "step": 4694 }, { "epoch": 0.53, "learning_rate": 9.396639012862609e-05, "loss": 0.6873, "step": 4695 }, { "epoch": 0.53, "learning_rate": 9.392964494369415e-05, "loss": 0.6058, "step": 4696 }, { "epoch": 0.53, "learning_rate": 9.389290058139981e-05, "loss": 0.5894, "step": 4697 }, { "epoch": 0.53, "learning_rate": 9.385615704672257e-05, "loss": 0.6592, "step": 4698 }, { "epoch": 0.53, "learning_rate": 9.381941434464181e-05, "loss": 0.6625, "step": 4699 }, { "epoch": 0.53, "learning_rate": 9.378267248013683e-05, "loss": 0.6567, "step": 4700 }, { "epoch": 0.53, "learning_rate": 9.374593145818672e-05, "loss": 0.6454, "step": 4701 }, { "epoch": 0.53, "learning_rate": 9.370919128377054e-05, "loss": 0.5962, "step": 4702 }, { "epoch": 0.53, "learning_rate": 9.367245196186724e-05, "loss": 0.6673, "step": 4703 }, { "epoch": 0.53, "learning_rate": 9.363571349745562e-05, "loss": 0.676, "step": 4704 }, { "epoch": 0.53, "learning_rate": 9.359897589551442e-05, "loss": 0.6842, "step": 4705 }, { "epoch": 0.53, "learning_rate": 9.356223916102212e-05, "loss": 0.6342, "step": 4706 }, { "epoch": 0.54, "learning_rate": 9.352550329895722e-05, "loss": 0.5961, "step": 4707 }, { "epoch": 0.54, "learning_rate": 9.348876831429808e-05, "loss": 0.7258, "step": 4708 }, { "epoch": 0.54, "learning_rate": 9.345203421202292e-05, "loss": 0.6233, "step": 4709 }, { "epoch": 0.54, "learning_rate": 9.341530099710983e-05, "loss": 0.6989, "step": 4710 }, { "epoch": 0.54, "learning_rate": 9.337856867453684e-05, "loss": 0.6992, "step": 4711 }, { "epoch": 0.54, "learning_rate": 9.334183724928174e-05, "loss": 0.7076, "step": 4712 }, { "epoch": 0.54, "learning_rate": 9.330510672632232e-05, "loss": 0.6927, "step": 4713 }, { "epoch": 0.54, "learning_rate": 9.326837711063616e-05, "loss": 0.6412, "step": 4714 }, { "epoch": 0.54, "learning_rate": 9.323164840720079e-05, "loss": 0.6768, "step": 4715 }, { "epoch": 0.54, "learning_rate": 9.319492062099356e-05, "loss": 0.6875, "step": 4716 }, { "epoch": 0.54, "learning_rate": 9.315819375699175e-05, "loss": 0.7278, "step": 4717 }, { "epoch": 0.54, "learning_rate": 9.312146782017243e-05, "loss": 0.638, "step": 4718 }, { "epoch": 0.54, "learning_rate": 9.308474281551264e-05, "loss": 0.6378, "step": 4719 }, { "epoch": 0.54, "learning_rate": 9.304801874798921e-05, "loss": 0.7297, "step": 4720 }, { "epoch": 0.54, "learning_rate": 9.301129562257893e-05, "loss": 0.6518, "step": 4721 }, { "epoch": 0.54, "learning_rate": 9.297457344425842e-05, "loss": 0.6988, "step": 4722 }, { "epoch": 0.54, "learning_rate": 9.293785221800411e-05, "loss": 0.6784, "step": 4723 }, { "epoch": 0.54, "learning_rate": 9.29011319487924e-05, "loss": 0.7205, "step": 4724 }, { "epoch": 0.54, "learning_rate": 9.286441264159949e-05, "loss": 0.7074, "step": 4725 }, { "epoch": 0.54, "learning_rate": 9.28276943014015e-05, "loss": 0.6941, "step": 4726 }, { "epoch": 0.54, "learning_rate": 9.27909769331744e-05, "loss": 0.7316, "step": 4727 }, { "epoch": 0.54, "learning_rate": 9.275426054189406e-05, "loss": 0.6789, "step": 4728 }, { "epoch": 0.54, "learning_rate": 9.271754513253609e-05, "loss": 0.7151, "step": 4729 }, { "epoch": 0.54, "learning_rate": 9.268083071007611e-05, "loss": 0.7236, "step": 4730 }, { "epoch": 0.54, "learning_rate": 9.264411727948958e-05, "loss": 0.6875, "step": 4731 }, { "epoch": 0.54, "learning_rate": 9.260740484575176e-05, "loss": 0.6854, "step": 4732 }, { "epoch": 0.54, "learning_rate": 9.257069341383784e-05, "loss": 0.6371, "step": 4733 }, { "epoch": 0.54, "learning_rate": 9.25339829887229e-05, "loss": 0.6857, "step": 4734 }, { "epoch": 0.54, "learning_rate": 9.249727357538171e-05, "loss": 0.696, "step": 4735 }, { "epoch": 0.54, "learning_rate": 9.246056517878912e-05, "loss": 0.7086, "step": 4736 }, { "epoch": 0.54, "learning_rate": 9.242385780391974e-05, "loss": 0.6843, "step": 4737 }, { "epoch": 0.54, "learning_rate": 9.238715145574803e-05, "loss": 0.6565, "step": 4738 }, { "epoch": 0.54, "learning_rate": 9.235044613924836e-05, "loss": 0.6216, "step": 4739 }, { "epoch": 0.54, "learning_rate": 9.23137418593949e-05, "loss": 0.6198, "step": 4740 }, { "epoch": 0.54, "learning_rate": 9.227703862116171e-05, "loss": 0.7006, "step": 4741 }, { "epoch": 0.54, "learning_rate": 9.224033642952275e-05, "loss": 0.665, "step": 4742 }, { "epoch": 0.54, "learning_rate": 9.220363528945177e-05, "loss": 0.6761, "step": 4743 }, { "epoch": 0.54, "learning_rate": 9.21669352059224e-05, "loss": 0.6799, "step": 4744 }, { "epoch": 0.54, "learning_rate": 9.213023618390819e-05, "loss": 0.6031, "step": 4745 }, { "epoch": 0.54, "learning_rate": 9.209353822838241e-05, "loss": 0.6855, "step": 4746 }, { "epoch": 0.54, "learning_rate": 9.205684134431828e-05, "loss": 0.7216, "step": 4747 }, { "epoch": 0.54, "learning_rate": 9.20201455366889e-05, "loss": 0.6348, "step": 4748 }, { "epoch": 0.54, "learning_rate": 9.198345081046715e-05, "loss": 0.7127, "step": 4749 }, { "epoch": 0.54, "learning_rate": 9.194675717062582e-05, "loss": 0.7001, "step": 4750 }, { "epoch": 0.54, "learning_rate": 9.191006462213756e-05, "loss": 0.7566, "step": 4751 }, { "epoch": 0.54, "learning_rate": 9.187337316997476e-05, "loss": 0.6669, "step": 4752 }, { "epoch": 0.54, "learning_rate": 9.183668281910976e-05, "loss": 0.6548, "step": 4753 }, { "epoch": 0.54, "learning_rate": 9.179999357451477e-05, "loss": 0.6987, "step": 4754 }, { "epoch": 0.54, "learning_rate": 9.176330544116182e-05, "loss": 0.7593, "step": 4755 }, { "epoch": 0.54, "learning_rate": 9.172661842402275e-05, "loss": 0.6152, "step": 4756 }, { "epoch": 0.54, "learning_rate": 9.168993252806934e-05, "loss": 0.6916, "step": 4757 }, { "epoch": 0.54, "learning_rate": 9.165324775827307e-05, "loss": 0.6662, "step": 4758 }, { "epoch": 0.54, "learning_rate": 9.161656411960542e-05, "loss": 0.6851, "step": 4759 }, { "epoch": 0.54, "learning_rate": 9.157988161703763e-05, "loss": 0.6081, "step": 4760 }, { "epoch": 0.54, "learning_rate": 9.154320025554084e-05, "loss": 0.6609, "step": 4761 }, { "epoch": 0.54, "learning_rate": 9.1506520040086e-05, "loss": 0.6712, "step": 4762 }, { "epoch": 0.54, "learning_rate": 9.146984097564386e-05, "loss": 0.7273, "step": 4763 }, { "epoch": 0.54, "learning_rate": 9.143316306718512e-05, "loss": 0.6613, "step": 4764 }, { "epoch": 0.54, "learning_rate": 9.139648631968024e-05, "loss": 0.618, "step": 4765 }, { "epoch": 0.54, "learning_rate": 9.135981073809957e-05, "loss": 0.6239, "step": 4766 }, { "epoch": 0.54, "learning_rate": 9.13231363274133e-05, "loss": 0.6223, "step": 4767 }, { "epoch": 0.54, "learning_rate": 9.128646309259141e-05, "loss": 0.6952, "step": 4768 }, { "epoch": 0.54, "learning_rate": 9.124979103860374e-05, "loss": 0.6351, "step": 4769 }, { "epoch": 0.54, "learning_rate": 9.121312017042e-05, "loss": 0.7792, "step": 4770 }, { "epoch": 0.54, "learning_rate": 9.117645049300974e-05, "loss": 0.7122, "step": 4771 }, { "epoch": 0.54, "learning_rate": 9.113978201134233e-05, "loss": 0.6777, "step": 4772 }, { "epoch": 0.54, "learning_rate": 9.110311473038695e-05, "loss": 0.7217, "step": 4773 }, { "epoch": 0.54, "learning_rate": 9.106644865511273e-05, "loss": 0.7246, "step": 4774 }, { "epoch": 0.54, "learning_rate": 9.102978379048846e-05, "loss": 0.7005, "step": 4775 }, { "epoch": 0.54, "learning_rate": 9.099312014148288e-05, "loss": 0.6401, "step": 4776 }, { "epoch": 0.54, "learning_rate": 9.095645771306457e-05, "loss": 0.6561, "step": 4777 }, { "epoch": 0.54, "learning_rate": 9.091979651020191e-05, "loss": 0.5703, "step": 4778 }, { "epoch": 0.54, "learning_rate": 9.088313653786317e-05, "loss": 0.7481, "step": 4779 }, { "epoch": 0.54, "learning_rate": 9.084647780101633e-05, "loss": 0.7226, "step": 4780 }, { "epoch": 0.54, "learning_rate": 9.08098203046293e-05, "loss": 0.5945, "step": 4781 }, { "epoch": 0.54, "learning_rate": 9.077316405366981e-05, "loss": 0.6413, "step": 4782 }, { "epoch": 0.54, "learning_rate": 9.073650905310543e-05, "loss": 0.7478, "step": 4783 }, { "epoch": 0.54, "learning_rate": 9.069985530790353e-05, "loss": 0.6621, "step": 4784 }, { "epoch": 0.54, "learning_rate": 9.066320282303134e-05, "loss": 0.7207, "step": 4785 }, { "epoch": 0.54, "learning_rate": 9.062655160345587e-05, "loss": 0.6451, "step": 4786 }, { "epoch": 0.54, "learning_rate": 9.0589901654144e-05, "loss": 0.7232, "step": 4787 }, { "epoch": 0.54, "learning_rate": 9.055325298006247e-05, "loss": 0.7056, "step": 4788 }, { "epoch": 0.54, "learning_rate": 9.051660558617775e-05, "loss": 0.6812, "step": 4789 }, { "epoch": 0.54, "learning_rate": 9.047995947745623e-05, "loss": 0.7109, "step": 4790 }, { "epoch": 0.54, "learning_rate": 9.044331465886407e-05, "loss": 0.6652, "step": 4791 }, { "epoch": 0.54, "learning_rate": 9.040667113536727e-05, "loss": 0.7019, "step": 4792 }, { "epoch": 0.54, "learning_rate": 9.037002891193166e-05, "loss": 0.7319, "step": 4793 }, { "epoch": 0.54, "learning_rate": 9.033338799352291e-05, "loss": 0.6304, "step": 4794 }, { "epoch": 0.55, "learning_rate": 9.029674838510648e-05, "loss": 0.7033, "step": 4795 }, { "epoch": 0.55, "learning_rate": 9.02601100916477e-05, "loss": 0.6291, "step": 4796 }, { "epoch": 0.55, "learning_rate": 9.022347311811164e-05, "loss": 0.6779, "step": 4797 }, { "epoch": 0.55, "learning_rate": 9.018683746946326e-05, "loss": 0.7362, "step": 4798 }, { "epoch": 0.55, "learning_rate": 9.015020315066732e-05, "loss": 0.698, "step": 4799 }, { "epoch": 0.55, "learning_rate": 9.011357016668838e-05, "loss": 0.6066, "step": 4800 }, { "epoch": 0.55, "learning_rate": 9.00769385224909e-05, "loss": 0.6528, "step": 4801 }, { "epoch": 0.55, "learning_rate": 9.004030822303908e-05, "loss": 0.6067, "step": 4802 }, { "epoch": 0.55, "learning_rate": 9.00036792732969e-05, "loss": 0.6582, "step": 4803 }, { "epoch": 0.55, "learning_rate": 8.996705167822825e-05, "loss": 0.7058, "step": 4804 }, { "epoch": 0.55, "learning_rate": 8.993042544279681e-05, "loss": 0.6992, "step": 4805 }, { "epoch": 0.55, "learning_rate": 8.989380057196605e-05, "loss": 0.6728, "step": 4806 }, { "epoch": 0.55, "learning_rate": 8.985717707069927e-05, "loss": 0.6102, "step": 4807 }, { "epoch": 0.55, "learning_rate": 8.982055494395962e-05, "loss": 0.6697, "step": 4808 }, { "epoch": 0.55, "learning_rate": 8.978393419671001e-05, "loss": 0.6764, "step": 4809 }, { "epoch": 0.55, "learning_rate": 8.974731483391314e-05, "loss": 0.6378, "step": 4810 }, { "epoch": 0.55, "learning_rate": 8.971069686053158e-05, "loss": 0.6784, "step": 4811 }, { "epoch": 0.55, "learning_rate": 8.967408028152773e-05, "loss": 0.6264, "step": 4812 }, { "epoch": 0.55, "learning_rate": 8.963746510186377e-05, "loss": 0.6695, "step": 4813 }, { "epoch": 0.55, "learning_rate": 8.960085132650164e-05, "loss": 0.608, "step": 4814 }, { "epoch": 0.55, "learning_rate": 8.956423896040315e-05, "loss": 0.6648, "step": 4815 }, { "epoch": 0.55, "learning_rate": 8.952762800852994e-05, "loss": 0.6342, "step": 4816 }, { "epoch": 0.55, "learning_rate": 8.949101847584339e-05, "loss": 0.6375, "step": 4817 }, { "epoch": 0.55, "learning_rate": 8.945441036730473e-05, "loss": 0.6515, "step": 4818 }, { "epoch": 0.55, "learning_rate": 8.941780368787504e-05, "loss": 0.6938, "step": 4819 }, { "epoch": 0.55, "learning_rate": 8.938119844251507e-05, "loss": 0.6684, "step": 4820 }, { "epoch": 0.55, "learning_rate": 8.93445946361855e-05, "loss": 0.6916, "step": 4821 }, { "epoch": 0.55, "learning_rate": 8.930799227384677e-05, "loss": 0.7086, "step": 4822 }, { "epoch": 0.55, "learning_rate": 8.927139136045913e-05, "loss": 0.69, "step": 4823 }, { "epoch": 0.55, "learning_rate": 8.923479190098263e-05, "loss": 0.7206, "step": 4824 }, { "epoch": 0.55, "learning_rate": 8.919819390037721e-05, "loss": 0.6711, "step": 4825 }, { "epoch": 0.55, "learning_rate": 8.916159736360239e-05, "loss": 0.6534, "step": 4826 }, { "epoch": 0.55, "learning_rate": 8.91250022956177e-05, "loss": 0.6687, "step": 4827 }, { "epoch": 0.55, "learning_rate": 8.908840870138239e-05, "loss": 0.6708, "step": 4828 }, { "epoch": 0.55, "learning_rate": 8.905181658585553e-05, "loss": 0.665, "step": 4829 }, { "epoch": 0.55, "learning_rate": 8.901522595399598e-05, "loss": 0.6893, "step": 4830 }, { "epoch": 0.55, "learning_rate": 8.897863681076245e-05, "loss": 0.6627, "step": 4831 }, { "epoch": 0.55, "learning_rate": 8.894204916111331e-05, "loss": 0.6595, "step": 4832 }, { "epoch": 0.55, "learning_rate": 8.890546301000684e-05, "loss": 0.7072, "step": 4833 }, { "epoch": 0.55, "learning_rate": 8.886887836240111e-05, "loss": 0.7106, "step": 4834 }, { "epoch": 0.55, "learning_rate": 8.8832295223254e-05, "loss": 0.5952, "step": 4835 }, { "epoch": 0.55, "learning_rate": 8.87957135975231e-05, "loss": 0.6867, "step": 4836 }, { "epoch": 0.55, "learning_rate": 8.87591334901659e-05, "loss": 0.7077, "step": 4837 }, { "epoch": 0.55, "learning_rate": 8.872255490613956e-05, "loss": 0.7542, "step": 4838 }, { "epoch": 0.55, "learning_rate": 8.868597785040118e-05, "loss": 0.6727, "step": 4839 }, { "epoch": 0.55, "learning_rate": 8.864940232790756e-05, "loss": 0.6726, "step": 4840 }, { "epoch": 0.55, "learning_rate": 8.861282834361531e-05, "loss": 0.7058, "step": 4841 }, { "epoch": 0.55, "learning_rate": 8.857625590248086e-05, "loss": 0.6798, "step": 4842 }, { "epoch": 0.55, "learning_rate": 8.853968500946034e-05, "loss": 0.652, "step": 4843 }, { "epoch": 0.55, "learning_rate": 8.850311566950978e-05, "loss": 0.6908, "step": 4844 }, { "epoch": 0.55, "learning_rate": 8.846654788758495e-05, "loss": 0.622, "step": 4845 }, { "epoch": 0.55, "learning_rate": 8.842998166864141e-05, "loss": 0.6318, "step": 4846 }, { "epoch": 0.55, "learning_rate": 8.839341701763453e-05, "loss": 0.6821, "step": 4847 }, { "epoch": 0.55, "learning_rate": 8.835685393951947e-05, "loss": 0.7136, "step": 4848 }, { "epoch": 0.55, "learning_rate": 8.832029243925106e-05, "loss": 0.692, "step": 4849 }, { "epoch": 0.55, "learning_rate": 8.82837325217841e-05, "loss": 0.6605, "step": 4850 }, { "epoch": 0.55, "learning_rate": 8.824717419207305e-05, "loss": 0.6549, "step": 4851 }, { "epoch": 0.55, "learning_rate": 8.82106174550722e-05, "loss": 0.6939, "step": 4852 }, { "epoch": 0.55, "learning_rate": 8.817406231573569e-05, "loss": 0.6463, "step": 4853 }, { "epoch": 0.55, "learning_rate": 8.813750877901723e-05, "loss": 0.7045, "step": 4854 }, { "epoch": 0.55, "learning_rate": 8.810095684987054e-05, "loss": 0.6245, "step": 4855 }, { "epoch": 0.55, "learning_rate": 8.806440653324902e-05, "loss": 0.6844, "step": 4856 }, { "epoch": 0.55, "learning_rate": 8.802785783410588e-05, "loss": 0.7045, "step": 4857 }, { "epoch": 0.55, "learning_rate": 8.799131075739407e-05, "loss": 0.6817, "step": 4858 }, { "epoch": 0.55, "learning_rate": 8.79547653080664e-05, "loss": 0.7143, "step": 4859 }, { "epoch": 0.55, "learning_rate": 8.791822149107534e-05, "loss": 0.6828, "step": 4860 }, { "epoch": 0.55, "learning_rate": 8.788167931137325e-05, "loss": 0.6264, "step": 4861 }, { "epoch": 0.55, "learning_rate": 8.78451387739122e-05, "loss": 0.6941, "step": 4862 }, { "epoch": 0.55, "learning_rate": 8.78085998836441e-05, "loss": 0.6243, "step": 4863 }, { "epoch": 0.55, "learning_rate": 8.777206264552055e-05, "loss": 0.7203, "step": 4864 }, { "epoch": 0.55, "learning_rate": 8.773552706449304e-05, "loss": 0.664, "step": 4865 }, { "epoch": 0.55, "learning_rate": 8.769899314551269e-05, "loss": 0.6465, "step": 4866 }, { "epoch": 0.55, "learning_rate": 8.766246089353051e-05, "loss": 0.6782, "step": 4867 }, { "epoch": 0.55, "learning_rate": 8.762593031349726e-05, "loss": 0.6664, "step": 4868 }, { "epoch": 0.55, "learning_rate": 8.758940141036345e-05, "loss": 0.6207, "step": 4869 }, { "epoch": 0.55, "learning_rate": 8.755287418907942e-05, "loss": 0.7111, "step": 4870 }, { "epoch": 0.55, "learning_rate": 8.751634865459516e-05, "loss": 0.7168, "step": 4871 }, { "epoch": 0.55, "learning_rate": 8.747982481186056e-05, "loss": 0.6323, "step": 4872 }, { "epoch": 0.55, "learning_rate": 8.744330266582519e-05, "loss": 0.7558, "step": 4873 }, { "epoch": 0.55, "learning_rate": 8.740678222143847e-05, "loss": 0.6455, "step": 4874 }, { "epoch": 0.55, "learning_rate": 8.737026348364953e-05, "loss": 0.6594, "step": 4875 }, { "epoch": 0.55, "learning_rate": 8.733374645740733e-05, "loss": 0.6824, "step": 4876 }, { "epoch": 0.55, "learning_rate": 8.729723114766049e-05, "loss": 0.6553, "step": 4877 }, { "epoch": 0.55, "learning_rate": 8.726071755935747e-05, "loss": 0.618, "step": 4878 }, { "epoch": 0.55, "learning_rate": 8.722420569744652e-05, "loss": 0.571, "step": 4879 }, { "epoch": 0.55, "learning_rate": 8.71876955668756e-05, "loss": 0.7451, "step": 4880 }, { "epoch": 0.55, "learning_rate": 8.71511871725925e-05, "loss": 0.6249, "step": 4881 }, { "epoch": 0.55, "learning_rate": 8.711468051954472e-05, "loss": 0.6314, "step": 4882 }, { "epoch": 0.56, "learning_rate": 8.707817561267952e-05, "loss": 0.6972, "step": 4883 }, { "epoch": 0.56, "learning_rate": 8.704167245694397e-05, "loss": 0.7292, "step": 4884 }, { "epoch": 0.56, "learning_rate": 8.700517105728483e-05, "loss": 0.6454, "step": 4885 }, { "epoch": 0.56, "learning_rate": 8.69686714186487e-05, "loss": 0.699, "step": 4886 }, { "epoch": 0.56, "learning_rate": 8.693217354598193e-05, "loss": 0.6256, "step": 4887 }, { "epoch": 0.56, "learning_rate": 8.68956774442306e-05, "loss": 0.6374, "step": 4888 }, { "epoch": 0.56, "learning_rate": 8.685918311834052e-05, "loss": 0.6899, "step": 4889 }, { "epoch": 0.56, "learning_rate": 8.682269057325734e-05, "loss": 0.7404, "step": 4890 }, { "epoch": 0.56, "learning_rate": 8.678619981392641e-05, "loss": 0.6396, "step": 4891 }, { "epoch": 0.56, "learning_rate": 8.674971084529286e-05, "loss": 0.7311, "step": 4892 }, { "epoch": 0.56, "learning_rate": 8.671322367230162e-05, "loss": 0.649, "step": 4893 }, { "epoch": 0.56, "learning_rate": 8.667673829989725e-05, "loss": 0.702, "step": 4894 }, { "epoch": 0.56, "learning_rate": 8.664025473302417e-05, "loss": 0.7402, "step": 4895 }, { "epoch": 0.56, "learning_rate": 8.660377297662655e-05, "loss": 0.6387, "step": 4896 }, { "epoch": 0.56, "learning_rate": 8.656729303564829e-05, "loss": 0.7122, "step": 4897 }, { "epoch": 0.56, "learning_rate": 8.653081491503304e-05, "loss": 0.7436, "step": 4898 }, { "epoch": 0.56, "learning_rate": 8.649433861972426e-05, "loss": 0.6558, "step": 4899 }, { "epoch": 0.56, "learning_rate": 8.645786415466506e-05, "loss": 0.7107, "step": 4900 }, { "epoch": 0.56, "learning_rate": 8.642139152479836e-05, "loss": 0.6695, "step": 4901 }, { "epoch": 0.56, "learning_rate": 8.638492073506685e-05, "loss": 0.7148, "step": 4902 }, { "epoch": 0.56, "learning_rate": 8.634845179041295e-05, "loss": 0.6511, "step": 4903 }, { "epoch": 0.56, "learning_rate": 8.631198469577881e-05, "loss": 0.6859, "step": 4904 }, { "epoch": 0.56, "learning_rate": 8.627551945610641e-05, "loss": 0.6961, "step": 4905 }, { "epoch": 0.56, "learning_rate": 8.623905607633734e-05, "loss": 0.6307, "step": 4906 }, { "epoch": 0.56, "learning_rate": 8.620259456141303e-05, "loss": 0.6608, "step": 4907 }, { "epoch": 0.56, "learning_rate": 8.616613491627467e-05, "loss": 0.7191, "step": 4908 }, { "epoch": 0.56, "learning_rate": 8.612967714586315e-05, "loss": 0.6666, "step": 4909 }, { "epoch": 0.56, "learning_rate": 8.609322125511917e-05, "loss": 0.678, "step": 4910 }, { "epoch": 0.56, "learning_rate": 8.605676724898307e-05, "loss": 0.6251, "step": 4911 }, { "epoch": 0.56, "learning_rate": 8.602031513239503e-05, "loss": 0.6665, "step": 4912 }, { "epoch": 0.56, "learning_rate": 8.598386491029491e-05, "loss": 0.6177, "step": 4913 }, { "epoch": 0.56, "learning_rate": 8.594741658762237e-05, "loss": 0.7341, "step": 4914 }, { "epoch": 0.56, "learning_rate": 8.591097016931679e-05, "loss": 0.7139, "step": 4915 }, { "epoch": 0.56, "learning_rate": 8.58745256603173e-05, "loss": 0.6656, "step": 4916 }, { "epoch": 0.56, "learning_rate": 8.58380830655627e-05, "loss": 0.6503, "step": 4917 }, { "epoch": 0.56, "learning_rate": 8.580164238999162e-05, "loss": 0.7193, "step": 4918 }, { "epoch": 0.56, "learning_rate": 8.57652036385424e-05, "loss": 0.6819, "step": 4919 }, { "epoch": 0.56, "learning_rate": 8.572876681615311e-05, "loss": 0.6615, "step": 4920 }, { "epoch": 0.56, "learning_rate": 8.569233192776161e-05, "loss": 0.7004, "step": 4921 }, { "epoch": 0.56, "learning_rate": 8.565589897830543e-05, "loss": 0.6885, "step": 4922 }, { "epoch": 0.56, "learning_rate": 8.561946797272181e-05, "loss": 0.6812, "step": 4923 }, { "epoch": 0.56, "learning_rate": 8.558303891594783e-05, "loss": 0.6688, "step": 4924 }, { "epoch": 0.56, "learning_rate": 8.554661181292026e-05, "loss": 0.6414, "step": 4925 }, { "epoch": 0.56, "learning_rate": 8.551018666857555e-05, "loss": 0.6232, "step": 4926 }, { "epoch": 0.56, "learning_rate": 8.547376348785004e-05, "loss": 0.7189, "step": 4927 }, { "epoch": 0.56, "learning_rate": 8.543734227567956e-05, "loss": 0.7067, "step": 4928 }, { "epoch": 0.56, "learning_rate": 8.540092303699989e-05, "loss": 0.6749, "step": 4929 }, { "epoch": 0.56, "learning_rate": 8.536450577674644e-05, "loss": 0.6931, "step": 4930 }, { "epoch": 0.56, "learning_rate": 8.53280904998544e-05, "loss": 0.6984, "step": 4931 }, { "epoch": 0.56, "learning_rate": 8.529167721125866e-05, "loss": 0.6738, "step": 4932 }, { "epoch": 0.56, "learning_rate": 8.525526591589386e-05, "loss": 0.6472, "step": 4933 }, { "epoch": 0.56, "learning_rate": 8.521885661869431e-05, "loss": 0.7037, "step": 4934 }, { "epoch": 0.56, "learning_rate": 8.518244932459412e-05, "loss": 0.631, "step": 4935 }, { "epoch": 0.56, "learning_rate": 8.514604403852711e-05, "loss": 0.6097, "step": 4936 }, { "epoch": 0.56, "learning_rate": 8.510964076542682e-05, "loss": 0.6878, "step": 4937 }, { "epoch": 0.56, "learning_rate": 8.507323951022654e-05, "loss": 0.6827, "step": 4938 }, { "epoch": 0.56, "learning_rate": 8.503684027785929e-05, "loss": 0.7355, "step": 4939 }, { "epoch": 0.56, "learning_rate": 8.50004430732577e-05, "loss": 0.6686, "step": 4940 }, { "epoch": 0.56, "learning_rate": 8.496404790135426e-05, "loss": 0.723, "step": 4941 }, { "epoch": 0.56, "learning_rate": 8.492765476708117e-05, "loss": 0.6249, "step": 4942 }, { "epoch": 0.56, "learning_rate": 8.48912636753703e-05, "loss": 0.6644, "step": 4943 }, { "epoch": 0.56, "learning_rate": 8.485487463115328e-05, "loss": 0.6865, "step": 4944 }, { "epoch": 0.56, "learning_rate": 8.48184876393615e-05, "loss": 0.6646, "step": 4945 }, { "epoch": 0.56, "learning_rate": 8.478210270492592e-05, "loss": 0.7313, "step": 4946 }, { "epoch": 0.56, "learning_rate": 8.474571983277737e-05, "loss": 0.7089, "step": 4947 }, { "epoch": 0.56, "learning_rate": 8.470933902784638e-05, "loss": 0.6765, "step": 4948 }, { "epoch": 0.56, "learning_rate": 8.467296029506316e-05, "loss": 0.6192, "step": 4949 }, { "epoch": 0.56, "learning_rate": 8.463658363935769e-05, "loss": 0.7058, "step": 4950 }, { "epoch": 0.56, "learning_rate": 8.460020906565956e-05, "loss": 0.6756, "step": 4951 }, { "epoch": 0.56, "learning_rate": 8.456383657889817e-05, "loss": 0.6616, "step": 4952 }, { "epoch": 0.56, "learning_rate": 8.452746618400264e-05, "loss": 0.7121, "step": 4953 }, { "epoch": 0.56, "learning_rate": 8.449109788590179e-05, "loss": 0.6172, "step": 4954 }, { "epoch": 0.56, "learning_rate": 8.445473168952413e-05, "loss": 0.6721, "step": 4955 }, { "epoch": 0.56, "learning_rate": 8.441836759979795e-05, "loss": 0.6833, "step": 4956 }, { "epoch": 0.56, "learning_rate": 8.438200562165115e-05, "loss": 0.6902, "step": 4957 }, { "epoch": 0.56, "learning_rate": 8.434564576001143e-05, "loss": 0.6513, "step": 4958 }, { "epoch": 0.56, "learning_rate": 8.43092880198062e-05, "loss": 0.7075, "step": 4959 }, { "epoch": 0.56, "learning_rate": 8.427293240596251e-05, "loss": 0.7162, "step": 4960 }, { "epoch": 0.56, "learning_rate": 8.42365789234072e-05, "loss": 0.6044, "step": 4961 }, { "epoch": 0.56, "learning_rate": 8.420022757706681e-05, "loss": 0.6486, "step": 4962 }, { "epoch": 0.56, "learning_rate": 8.416387837186754e-05, "loss": 0.672, "step": 4963 }, { "epoch": 0.56, "learning_rate": 8.412753131273535e-05, "loss": 0.7104, "step": 4964 }, { "epoch": 0.56, "learning_rate": 8.409118640459588e-05, "loss": 0.6722, "step": 4965 }, { "epoch": 0.56, "learning_rate": 8.40548436523745e-05, "loss": 0.7074, "step": 4966 }, { "epoch": 0.56, "learning_rate": 8.401850306099632e-05, "loss": 0.6806, "step": 4967 }, { "epoch": 0.56, "learning_rate": 8.398216463538604e-05, "loss": 0.6623, "step": 4968 }, { "epoch": 0.56, "learning_rate": 8.394582838046817e-05, "loss": 0.6483, "step": 4969 }, { "epoch": 0.56, "learning_rate": 8.390949430116692e-05, "loss": 0.6627, "step": 4970 }, { "epoch": 0.57, "learning_rate": 8.387316240240614e-05, "loss": 0.6144, "step": 4971 }, { "epoch": 0.57, "learning_rate": 8.383683268910948e-05, "loss": 0.7024, "step": 4972 }, { "epoch": 0.57, "learning_rate": 8.380050516620024e-05, "loss": 0.6571, "step": 4973 }, { "epoch": 0.57, "learning_rate": 8.376417983860137e-05, "loss": 0.6936, "step": 4974 }, { "epoch": 0.57, "learning_rate": 8.372785671123562e-05, "loss": 0.6881, "step": 4975 }, { "epoch": 0.57, "learning_rate": 8.369153578902537e-05, "loss": 0.6218, "step": 4976 }, { "epoch": 0.57, "learning_rate": 8.365521707689274e-05, "loss": 0.7028, "step": 4977 }, { "epoch": 0.57, "learning_rate": 8.361890057975957e-05, "loss": 0.6804, "step": 4978 }, { "epoch": 0.57, "learning_rate": 8.358258630254737e-05, "loss": 0.65, "step": 4979 }, { "epoch": 0.57, "learning_rate": 8.354627425017731e-05, "loss": 0.6606, "step": 4980 }, { "epoch": 0.57, "learning_rate": 8.35099644275703e-05, "loss": 0.7216, "step": 4981 }, { "epoch": 0.57, "learning_rate": 8.347365683964698e-05, "loss": 0.6448, "step": 4982 }, { "epoch": 0.57, "learning_rate": 8.343735149132761e-05, "loss": 0.6441, "step": 4983 }, { "epoch": 0.57, "learning_rate": 8.340104838753227e-05, "loss": 0.6802, "step": 4984 }, { "epoch": 0.57, "learning_rate": 8.336474753318055e-05, "loss": 0.6932, "step": 4985 }, { "epoch": 0.57, "learning_rate": 8.332844893319192e-05, "loss": 0.6491, "step": 4986 }, { "epoch": 0.57, "learning_rate": 8.329215259248542e-05, "loss": 0.6954, "step": 4987 }, { "epoch": 0.57, "learning_rate": 8.325585851597984e-05, "loss": 0.6534, "step": 4988 }, { "epoch": 0.57, "learning_rate": 8.321956670859366e-05, "loss": 0.6478, "step": 4989 }, { "epoch": 0.57, "learning_rate": 8.318327717524508e-05, "loss": 0.741, "step": 4990 }, { "epoch": 0.57, "learning_rate": 8.314698992085191e-05, "loss": 0.6373, "step": 4991 }, { "epoch": 0.57, "learning_rate": 8.311070495033167e-05, "loss": 0.6898, "step": 4992 }, { "epoch": 0.57, "learning_rate": 8.307442226860165e-05, "loss": 0.6719, "step": 4993 }, { "epoch": 0.57, "learning_rate": 8.303814188057875e-05, "loss": 0.6887, "step": 4994 }, { "epoch": 0.57, "learning_rate": 8.300186379117962e-05, "loss": 0.6535, "step": 4995 }, { "epoch": 0.57, "learning_rate": 8.296558800532057e-05, "loss": 0.7107, "step": 4996 }, { "epoch": 0.57, "learning_rate": 8.292931452791754e-05, "loss": 0.6825, "step": 4997 }, { "epoch": 0.57, "learning_rate": 8.289304336388623e-05, "loss": 0.6351, "step": 4998 }, { "epoch": 0.57, "learning_rate": 8.285677451814203e-05, "loss": 0.7244, "step": 4999 }, { "epoch": 0.57, "learning_rate": 8.282050799559995e-05, "loss": 0.6996, "step": 5000 }, { "epoch": 0.57, "learning_rate": 8.278424380117482e-05, "loss": 0.7213, "step": 5001 }, { "epoch": 0.57, "learning_rate": 8.274798193978096e-05, "loss": 0.7164, "step": 5002 }, { "epoch": 0.57, "learning_rate": 8.271172241633251e-05, "loss": 0.7562, "step": 5003 }, { "epoch": 0.57, "learning_rate": 8.267546523574327e-05, "loss": 0.7072, "step": 5004 }, { "epoch": 0.57, "learning_rate": 8.263921040292671e-05, "loss": 0.6909, "step": 5005 }, { "epoch": 0.57, "learning_rate": 8.260295792279597e-05, "loss": 0.6596, "step": 5006 }, { "epoch": 0.57, "learning_rate": 8.256670780026394e-05, "loss": 0.6112, "step": 5007 }, { "epoch": 0.57, "learning_rate": 8.253046004024305e-05, "loss": 0.6807, "step": 5008 }, { "epoch": 0.57, "learning_rate": 8.249421464764555e-05, "loss": 0.7033, "step": 5009 }, { "epoch": 0.57, "learning_rate": 8.24579716273833e-05, "loss": 0.6105, "step": 5010 }, { "epoch": 0.57, "learning_rate": 8.242173098436785e-05, "loss": 0.59, "step": 5011 }, { "epoch": 0.57, "learning_rate": 8.238549272351045e-05, "loss": 0.6477, "step": 5012 }, { "epoch": 0.57, "learning_rate": 8.234925684972203e-05, "loss": 0.6994, "step": 5013 }, { "epoch": 0.57, "learning_rate": 8.231302336791308e-05, "loss": 0.6478, "step": 5014 }, { "epoch": 0.57, "learning_rate": 8.227679228299395e-05, "loss": 0.694, "step": 5015 }, { "epoch": 0.57, "learning_rate": 8.224056359987453e-05, "loss": 0.6993, "step": 5016 }, { "epoch": 0.57, "learning_rate": 8.220433732346445e-05, "loss": 0.6903, "step": 5017 }, { "epoch": 0.57, "learning_rate": 8.216811345867299e-05, "loss": 0.7384, "step": 5018 }, { "epoch": 0.57, "learning_rate": 8.213189201040914e-05, "loss": 0.7199, "step": 5019 }, { "epoch": 0.57, "learning_rate": 8.209567298358148e-05, "loss": 0.7056, "step": 5020 }, { "epoch": 0.57, "learning_rate": 8.20594563830983e-05, "loss": 0.6988, "step": 5021 }, { "epoch": 0.57, "learning_rate": 8.202324221386761e-05, "loss": 0.6923, "step": 5022 }, { "epoch": 0.57, "learning_rate": 8.198703048079706e-05, "loss": 0.6921, "step": 5023 }, { "epoch": 0.57, "learning_rate": 8.195082118879397e-05, "loss": 0.7023, "step": 5024 }, { "epoch": 0.57, "learning_rate": 8.191461434276526e-05, "loss": 0.6617, "step": 5025 }, { "epoch": 0.57, "learning_rate": 8.187840994761763e-05, "loss": 0.7104, "step": 5026 }, { "epoch": 0.57, "learning_rate": 8.18422080082574e-05, "loss": 0.6795, "step": 5027 }, { "epoch": 0.57, "learning_rate": 8.180600852959052e-05, "loss": 0.6628, "step": 5028 }, { "epoch": 0.57, "learning_rate": 8.176981151652268e-05, "loss": 0.6679, "step": 5029 }, { "epoch": 0.57, "learning_rate": 8.17336169739592e-05, "loss": 0.7047, "step": 5030 }, { "epoch": 0.57, "learning_rate": 8.169742490680504e-05, "loss": 0.6968, "step": 5031 }, { "epoch": 0.57, "learning_rate": 8.166123531996485e-05, "loss": 0.6115, "step": 5032 }, { "epoch": 0.57, "learning_rate": 8.162504821834295e-05, "loss": 0.6545, "step": 5033 }, { "epoch": 0.57, "learning_rate": 8.158886360684334e-05, "loss": 0.635, "step": 5034 }, { "epoch": 0.57, "learning_rate": 8.155268149036964e-05, "loss": 0.6646, "step": 5035 }, { "epoch": 0.57, "learning_rate": 8.151650187382513e-05, "loss": 0.7075, "step": 5036 }, { "epoch": 0.57, "learning_rate": 8.148032476211276e-05, "loss": 0.703, "step": 5037 }, { "epoch": 0.57, "learning_rate": 8.14441501601352e-05, "loss": 0.685, "step": 5038 }, { "epoch": 0.57, "learning_rate": 8.140797807279467e-05, "loss": 0.6593, "step": 5039 }, { "epoch": 0.57, "learning_rate": 8.137180850499318e-05, "loss": 0.7301, "step": 5040 }, { "epoch": 0.57, "learning_rate": 8.133564146163233e-05, "loss": 0.5642, "step": 5041 }, { "epoch": 0.57, "learning_rate": 8.129947694761329e-05, "loss": 0.6872, "step": 5042 }, { "epoch": 0.57, "learning_rate": 8.126331496783703e-05, "loss": 0.6719, "step": 5043 }, { "epoch": 0.57, "learning_rate": 8.122715552720413e-05, "loss": 0.6914, "step": 5044 }, { "epoch": 0.57, "learning_rate": 8.119099863061479e-05, "loss": 0.7052, "step": 5045 }, { "epoch": 0.57, "learning_rate": 8.115484428296891e-05, "loss": 0.6881, "step": 5046 }, { "epoch": 0.57, "learning_rate": 8.111869248916607e-05, "loss": 0.703, "step": 5047 }, { "epoch": 0.57, "learning_rate": 8.108254325410536e-05, "loss": 0.6897, "step": 5048 }, { "epoch": 0.57, "learning_rate": 8.104639658268569e-05, "loss": 0.6083, "step": 5049 }, { "epoch": 0.57, "learning_rate": 8.101025247980553e-05, "loss": 0.6674, "step": 5050 }, { "epoch": 0.57, "learning_rate": 8.097411095036305e-05, "loss": 0.6938, "step": 5051 }, { "epoch": 0.57, "learning_rate": 8.093797199925604e-05, "loss": 0.7099, "step": 5052 }, { "epoch": 0.57, "learning_rate": 8.090183563138198e-05, "loss": 0.6469, "step": 5053 }, { "epoch": 0.57, "learning_rate": 8.08657018516379e-05, "loss": 0.6431, "step": 5054 }, { "epoch": 0.57, "learning_rate": 8.082957066492061e-05, "loss": 0.707, "step": 5055 }, { "epoch": 0.57, "learning_rate": 8.079344207612648e-05, "loss": 0.6421, "step": 5056 }, { "epoch": 0.57, "learning_rate": 8.075731609015156e-05, "loss": 0.6692, "step": 5057 }, { "epoch": 0.57, "learning_rate": 8.072119271189156e-05, "loss": 0.6602, "step": 5058 }, { "epoch": 0.58, "learning_rate": 8.068507194624177e-05, "loss": 0.6385, "step": 5059 }, { "epoch": 0.58, "learning_rate": 8.064895379809724e-05, "loss": 0.6723, "step": 5060 }, { "epoch": 0.58, "learning_rate": 8.061283827235255e-05, "loss": 0.6829, "step": 5061 }, { "epoch": 0.58, "learning_rate": 8.057672537390201e-05, "loss": 0.6435, "step": 5062 }, { "epoch": 0.58, "learning_rate": 8.054061510763953e-05, "loss": 0.7152, "step": 5063 }, { "epoch": 0.58, "learning_rate": 8.05045074784587e-05, "loss": 0.6409, "step": 5064 }, { "epoch": 0.58, "learning_rate": 8.046840249125265e-05, "loss": 0.6597, "step": 5065 }, { "epoch": 0.58, "learning_rate": 8.043230015091427e-05, "loss": 0.6831, "step": 5066 }, { "epoch": 0.58, "learning_rate": 8.039620046233607e-05, "loss": 0.6328, "step": 5067 }, { "epoch": 0.58, "learning_rate": 8.036010343041013e-05, "loss": 0.6868, "step": 5068 }, { "epoch": 0.58, "learning_rate": 8.032400906002827e-05, "loss": 0.7085, "step": 5069 }, { "epoch": 0.58, "learning_rate": 8.028791735608192e-05, "loss": 0.6757, "step": 5070 }, { "epoch": 0.58, "learning_rate": 8.025182832346203e-05, "loss": 0.6413, "step": 5071 }, { "epoch": 0.58, "learning_rate": 8.021574196705934e-05, "loss": 0.6539, "step": 5072 }, { "epoch": 0.58, "learning_rate": 8.017965829176418e-05, "loss": 0.6608, "step": 5073 }, { "epoch": 0.58, "learning_rate": 8.01435773024665e-05, "loss": 0.6796, "step": 5074 }, { "epoch": 0.58, "learning_rate": 8.010749900405589e-05, "loss": 0.7061, "step": 5075 }, { "epoch": 0.58, "learning_rate": 8.007142340142163e-05, "loss": 0.67, "step": 5076 }, { "epoch": 0.58, "learning_rate": 8.00353504994525e-05, "loss": 0.6914, "step": 5077 }, { "epoch": 0.58, "learning_rate": 7.999928030303704e-05, "loss": 0.6586, "step": 5078 }, { "epoch": 0.58, "learning_rate": 7.996321281706338e-05, "loss": 0.6764, "step": 5079 }, { "epoch": 0.58, "learning_rate": 7.99271480464193e-05, "loss": 0.6778, "step": 5080 }, { "epoch": 0.58, "learning_rate": 7.98910859959922e-05, "loss": 0.5989, "step": 5081 }, { "epoch": 0.58, "learning_rate": 7.985502667066906e-05, "loss": 0.6586, "step": 5082 }, { "epoch": 0.58, "learning_rate": 7.98189700753366e-05, "loss": 0.6689, "step": 5083 }, { "epoch": 0.58, "learning_rate": 7.978291621488107e-05, "loss": 0.6741, "step": 5084 }, { "epoch": 0.58, "learning_rate": 7.974686509418839e-05, "loss": 0.7202, "step": 5085 }, { "epoch": 0.58, "learning_rate": 7.971081671814413e-05, "loss": 0.6831, "step": 5086 }, { "epoch": 0.58, "learning_rate": 7.967477109163351e-05, "loss": 0.6851, "step": 5087 }, { "epoch": 0.58, "learning_rate": 7.963872821954121e-05, "loss": 0.6624, "step": 5088 }, { "epoch": 0.58, "learning_rate": 7.960268810675174e-05, "loss": 0.7031, "step": 5089 }, { "epoch": 0.58, "learning_rate": 7.956665075814914e-05, "loss": 0.7017, "step": 5090 }, { "epoch": 0.58, "learning_rate": 7.95306161786171e-05, "loss": 0.6466, "step": 5091 }, { "epoch": 0.58, "learning_rate": 7.949458437303891e-05, "loss": 0.6012, "step": 5092 }, { "epoch": 0.58, "learning_rate": 7.945855534629756e-05, "loss": 0.7131, "step": 5093 }, { "epoch": 0.58, "learning_rate": 7.94225291032755e-05, "loss": 0.6709, "step": 5094 }, { "epoch": 0.58, "learning_rate": 7.938650564885497e-05, "loss": 0.5594, "step": 5095 }, { "epoch": 0.58, "learning_rate": 7.935048498791775e-05, "loss": 0.7041, "step": 5096 }, { "epoch": 0.58, "learning_rate": 7.931446712534527e-05, "loss": 0.6997, "step": 5097 }, { "epoch": 0.58, "learning_rate": 7.927845206601861e-05, "loss": 0.655, "step": 5098 }, { "epoch": 0.58, "learning_rate": 7.924243981481834e-05, "loss": 0.597, "step": 5099 }, { "epoch": 0.58, "learning_rate": 7.92064303766248e-05, "loss": 0.6624, "step": 5100 }, { "epoch": 0.58, "learning_rate": 7.917042375631785e-05, "loss": 0.6749, "step": 5101 }, { "epoch": 0.58, "learning_rate": 7.913441995877707e-05, "loss": 0.6183, "step": 5102 }, { "epoch": 0.58, "learning_rate": 7.909841898888153e-05, "loss": 0.6496, "step": 5103 }, { "epoch": 0.58, "learning_rate": 7.906242085151004e-05, "loss": 0.5784, "step": 5104 }, { "epoch": 0.58, "learning_rate": 7.902642555154089e-05, "loss": 0.6717, "step": 5105 }, { "epoch": 0.58, "learning_rate": 7.899043309385215e-05, "loss": 0.6678, "step": 5106 }, { "epoch": 0.58, "learning_rate": 7.895444348332135e-05, "loss": 0.6669, "step": 5107 }, { "epoch": 0.58, "learning_rate": 7.891845672482573e-05, "loss": 0.6147, "step": 5108 }, { "epoch": 0.58, "learning_rate": 7.888247282324212e-05, "loss": 0.6813, "step": 5109 }, { "epoch": 0.58, "learning_rate": 7.884649178344698e-05, "loss": 0.6738, "step": 5110 }, { "epoch": 0.58, "learning_rate": 7.88105136103163e-05, "loss": 0.662, "step": 5111 }, { "epoch": 0.58, "learning_rate": 7.877453830872576e-05, "loss": 0.646, "step": 5112 }, { "epoch": 0.58, "learning_rate": 7.873856588355066e-05, "loss": 0.6575, "step": 5113 }, { "epoch": 0.58, "learning_rate": 7.870259633966587e-05, "loss": 0.704, "step": 5114 }, { "epoch": 0.58, "learning_rate": 7.866662968194592e-05, "loss": 0.6652, "step": 5115 }, { "epoch": 0.58, "learning_rate": 7.863066591526482e-05, "loss": 0.6832, "step": 5116 }, { "epoch": 0.58, "learning_rate": 7.859470504449635e-05, "loss": 0.6206, "step": 5117 }, { "epoch": 0.58, "learning_rate": 7.85587470745138e-05, "loss": 0.6677, "step": 5118 }, { "epoch": 0.58, "learning_rate": 7.852279201019009e-05, "loss": 0.7112, "step": 5119 }, { "epoch": 0.58, "learning_rate": 7.848683985639777e-05, "loss": 0.6398, "step": 5120 }, { "epoch": 0.58, "learning_rate": 7.845089061800903e-05, "loss": 0.6523, "step": 5121 }, { "epoch": 0.58, "learning_rate": 7.841494429989549e-05, "loss": 0.6675, "step": 5122 }, { "epoch": 0.58, "learning_rate": 7.837900090692855e-05, "loss": 0.668, "step": 5123 }, { "epoch": 0.58, "learning_rate": 7.834306044397916e-05, "loss": 0.6683, "step": 5124 }, { "epoch": 0.58, "learning_rate": 7.830712291591789e-05, "loss": 0.6738, "step": 5125 }, { "epoch": 0.58, "learning_rate": 7.827118832761487e-05, "loss": 0.6522, "step": 5126 }, { "epoch": 0.58, "learning_rate": 7.823525668393988e-05, "loss": 0.6409, "step": 5127 }, { "epoch": 0.58, "learning_rate": 7.819932798976222e-05, "loss": 0.6643, "step": 5128 }, { "epoch": 0.58, "learning_rate": 7.816340224995091e-05, "loss": 0.6824, "step": 5129 }, { "epoch": 0.58, "learning_rate": 7.812747946937447e-05, "loss": 0.6763, "step": 5130 }, { "epoch": 0.58, "learning_rate": 7.80915596529011e-05, "loss": 0.6635, "step": 5131 }, { "epoch": 0.58, "learning_rate": 7.805564280539849e-05, "loss": 0.7232, "step": 5132 }, { "epoch": 0.58, "learning_rate": 7.801972893173405e-05, "loss": 0.7322, "step": 5133 }, { "epoch": 0.58, "learning_rate": 7.798381803677467e-05, "loss": 0.6522, "step": 5134 }, { "epoch": 0.58, "learning_rate": 7.794791012538692e-05, "loss": 0.6983, "step": 5135 }, { "epoch": 0.58, "learning_rate": 7.791200520243696e-05, "loss": 0.7233, "step": 5136 }, { "epoch": 0.58, "learning_rate": 7.787610327279049e-05, "loss": 0.6766, "step": 5137 }, { "epoch": 0.58, "learning_rate": 7.784020434131291e-05, "loss": 0.6531, "step": 5138 }, { "epoch": 0.58, "learning_rate": 7.780430841286906e-05, "loss": 0.6556, "step": 5139 }, { "epoch": 0.58, "learning_rate": 7.776841549232348e-05, "loss": 0.7314, "step": 5140 }, { "epoch": 0.58, "learning_rate": 7.773252558454027e-05, "loss": 0.6546, "step": 5141 }, { "epoch": 0.58, "learning_rate": 7.769663869438316e-05, "loss": 0.7435, "step": 5142 }, { "epoch": 0.58, "learning_rate": 7.766075482671543e-05, "loss": 0.7061, "step": 5143 }, { "epoch": 0.58, "learning_rate": 7.76248739864e-05, "loss": 0.6521, "step": 5144 }, { "epoch": 0.58, "learning_rate": 7.758899617829925e-05, "loss": 0.7491, "step": 5145 }, { "epoch": 0.58, "learning_rate": 7.755312140727531e-05, "loss": 0.6643, "step": 5146 }, { "epoch": 0.59, "learning_rate": 7.751724967818981e-05, "loss": 0.657, "step": 5147 }, { "epoch": 0.59, "learning_rate": 7.748138099590396e-05, "loss": 0.6578, "step": 5148 }, { "epoch": 0.59, "learning_rate": 7.744551536527864e-05, "loss": 0.6651, "step": 5149 }, { "epoch": 0.59, "learning_rate": 7.740965279117424e-05, "loss": 0.5622, "step": 5150 }, { "epoch": 0.59, "learning_rate": 7.737379327845073e-05, "loss": 0.6734, "step": 5151 }, { "epoch": 0.59, "learning_rate": 7.733793683196772e-05, "loss": 0.6426, "step": 5152 }, { "epoch": 0.59, "learning_rate": 7.730208345658436e-05, "loss": 0.6307, "step": 5153 }, { "epoch": 0.59, "learning_rate": 7.72662331571594e-05, "loss": 0.6644, "step": 5154 }, { "epoch": 0.59, "learning_rate": 7.72303859385512e-05, "loss": 0.6286, "step": 5155 }, { "epoch": 0.59, "learning_rate": 7.719454180561763e-05, "loss": 0.6946, "step": 5156 }, { "epoch": 0.59, "learning_rate": 7.715870076321621e-05, "loss": 0.6664, "step": 5157 }, { "epoch": 0.59, "learning_rate": 7.7122862816204e-05, "loss": 0.6616, "step": 5158 }, { "epoch": 0.59, "learning_rate": 7.70870279694377e-05, "loss": 0.6864, "step": 5159 }, { "epoch": 0.59, "learning_rate": 7.705119622777351e-05, "loss": 0.6359, "step": 5160 }, { "epoch": 0.59, "learning_rate": 7.701536759606731e-05, "loss": 0.5855, "step": 5161 }, { "epoch": 0.59, "learning_rate": 7.69795420791744e-05, "loss": 0.5971, "step": 5162 }, { "epoch": 0.59, "learning_rate": 7.694371968194982e-05, "loss": 0.7166, "step": 5163 }, { "epoch": 0.59, "learning_rate": 7.690790040924808e-05, "loss": 0.6486, "step": 5164 }, { "epoch": 0.59, "learning_rate": 7.687208426592336e-05, "loss": 0.7319, "step": 5165 }, { "epoch": 0.59, "learning_rate": 7.683627125682932e-05, "loss": 0.7078, "step": 5166 }, { "epoch": 0.59, "learning_rate": 7.68004613868193e-05, "loss": 0.6854, "step": 5167 }, { "epoch": 0.59, "learning_rate": 7.676465466074608e-05, "loss": 0.7538, "step": 5168 }, { "epoch": 0.59, "learning_rate": 7.672885108346209e-05, "loss": 0.6381, "step": 5169 }, { "epoch": 0.59, "learning_rate": 7.669305065981938e-05, "loss": 0.5946, "step": 5170 }, { "epoch": 0.59, "learning_rate": 7.665725339466949e-05, "loss": 0.6012, "step": 5171 }, { "epoch": 0.59, "learning_rate": 7.662145929286364e-05, "loss": 0.6881, "step": 5172 }, { "epoch": 0.59, "learning_rate": 7.658566835925242e-05, "loss": 0.5973, "step": 5173 }, { "epoch": 0.59, "learning_rate": 7.65498805986862e-05, "loss": 0.6664, "step": 5174 }, { "epoch": 0.59, "learning_rate": 7.65140960160148e-05, "loss": 0.6959, "step": 5175 }, { "epoch": 0.59, "learning_rate": 7.647831461608768e-05, "loss": 0.5727, "step": 5176 }, { "epoch": 0.59, "learning_rate": 7.644253640375382e-05, "loss": 0.6785, "step": 5177 }, { "epoch": 0.59, "learning_rate": 7.64067613838618e-05, "loss": 0.5587, "step": 5178 }, { "epoch": 0.59, "learning_rate": 7.637098956125973e-05, "loss": 0.6317, "step": 5179 }, { "epoch": 0.59, "learning_rate": 7.63352209407953e-05, "loss": 0.6825, "step": 5180 }, { "epoch": 0.59, "learning_rate": 7.62994555273158e-05, "loss": 0.7137, "step": 5181 }, { "epoch": 0.59, "learning_rate": 7.626369332566803e-05, "loss": 0.6608, "step": 5182 }, { "epoch": 0.59, "learning_rate": 7.622793434069843e-05, "loss": 0.6445, "step": 5183 }, { "epoch": 0.59, "learning_rate": 7.619217857725297e-05, "loss": 0.697, "step": 5184 }, { "epoch": 0.59, "learning_rate": 7.615642604017705e-05, "loss": 0.7342, "step": 5185 }, { "epoch": 0.59, "learning_rate": 7.612067673431587e-05, "loss": 0.7166, "step": 5186 }, { "epoch": 0.59, "learning_rate": 7.608493066451403e-05, "loss": 0.6615, "step": 5187 }, { "epoch": 0.59, "learning_rate": 7.604918783561576e-05, "loss": 0.6827, "step": 5188 }, { "epoch": 0.59, "learning_rate": 7.601344825246484e-05, "loss": 0.6284, "step": 5189 }, { "epoch": 0.59, "learning_rate": 7.597771191990455e-05, "loss": 0.6547, "step": 5190 }, { "epoch": 0.59, "learning_rate": 7.594197884277781e-05, "loss": 0.6415, "step": 5191 }, { "epoch": 0.59, "learning_rate": 7.590624902592705e-05, "loss": 0.5751, "step": 5192 }, { "epoch": 0.59, "learning_rate": 7.587052247419428e-05, "loss": 0.7171, "step": 5193 }, { "epoch": 0.59, "learning_rate": 7.583479919242108e-05, "loss": 0.6876, "step": 5194 }, { "epoch": 0.59, "learning_rate": 7.57990791854486e-05, "loss": 0.7025, "step": 5195 }, { "epoch": 0.59, "learning_rate": 7.576336245811743e-05, "loss": 0.6229, "step": 5196 }, { "epoch": 0.59, "learning_rate": 7.572764901526785e-05, "loss": 0.6357, "step": 5197 }, { "epoch": 0.59, "learning_rate": 7.569193886173964e-05, "loss": 0.6294, "step": 5198 }, { "epoch": 0.59, "learning_rate": 7.565623200237216e-05, "loss": 0.6778, "step": 5199 }, { "epoch": 0.59, "learning_rate": 7.562052844200426e-05, "loss": 0.6468, "step": 5200 }, { "epoch": 0.59, "learning_rate": 7.558482818547445e-05, "loss": 0.6719, "step": 5201 }, { "epoch": 0.59, "learning_rate": 7.554913123762068e-05, "loss": 0.6907, "step": 5202 }, { "epoch": 0.59, "learning_rate": 7.551343760328051e-05, "loss": 0.6767, "step": 5203 }, { "epoch": 0.59, "learning_rate": 7.547774728729104e-05, "loss": 0.6612, "step": 5204 }, { "epoch": 0.59, "learning_rate": 7.544206029448893e-05, "loss": 0.6405, "step": 5205 }, { "epoch": 0.59, "learning_rate": 7.540637662971041e-05, "loss": 0.6522, "step": 5206 }, { "epoch": 0.59, "learning_rate": 7.537069629779119e-05, "loss": 0.64, "step": 5207 }, { "epoch": 0.59, "learning_rate": 7.533501930356657e-05, "loss": 0.5824, "step": 5208 }, { "epoch": 0.59, "learning_rate": 7.52993456518714e-05, "loss": 0.6203, "step": 5209 }, { "epoch": 0.59, "learning_rate": 7.526367534754009e-05, "loss": 0.6162, "step": 5210 }, { "epoch": 0.59, "learning_rate": 7.522800839540655e-05, "loss": 0.6788, "step": 5211 }, { "epoch": 0.59, "learning_rate": 7.519234480030435e-05, "loss": 0.6161, "step": 5212 }, { "epoch": 0.59, "learning_rate": 7.515668456706641e-05, "loss": 0.72, "step": 5213 }, { "epoch": 0.59, "learning_rate": 7.512102770052536e-05, "loss": 0.6684, "step": 5214 }, { "epoch": 0.59, "learning_rate": 7.50853742055133e-05, "loss": 0.6922, "step": 5215 }, { "epoch": 0.59, "learning_rate": 7.504972408686191e-05, "loss": 0.663, "step": 5216 }, { "epoch": 0.59, "learning_rate": 7.50140773494024e-05, "loss": 0.5426, "step": 5217 }, { "epoch": 0.59, "learning_rate": 7.497843399796554e-05, "loss": 0.6923, "step": 5218 }, { "epoch": 0.59, "learning_rate": 7.494279403738154e-05, "loss": 0.6276, "step": 5219 }, { "epoch": 0.59, "learning_rate": 7.490715747248028e-05, "loss": 0.63, "step": 5220 }, { "epoch": 0.59, "learning_rate": 7.487152430809112e-05, "loss": 0.6956, "step": 5221 }, { "epoch": 0.59, "learning_rate": 7.483589454904296e-05, "loss": 0.6751, "step": 5222 }, { "epoch": 0.59, "learning_rate": 7.480026820016426e-05, "loss": 0.5972, "step": 5223 }, { "epoch": 0.59, "learning_rate": 7.476464526628302e-05, "loss": 0.7197, "step": 5224 }, { "epoch": 0.59, "learning_rate": 7.472902575222671e-05, "loss": 0.6443, "step": 5225 }, { "epoch": 0.59, "learning_rate": 7.469340966282242e-05, "loss": 0.6874, "step": 5226 }, { "epoch": 0.59, "learning_rate": 7.465779700289676e-05, "loss": 0.6505, "step": 5227 }, { "epoch": 0.59, "learning_rate": 7.46221877772758e-05, "loss": 0.6935, "step": 5228 }, { "epoch": 0.59, "learning_rate": 7.458658199078528e-05, "loss": 0.6522, "step": 5229 }, { "epoch": 0.59, "learning_rate": 7.455097964825033e-05, "loss": 0.6831, "step": 5230 }, { "epoch": 0.59, "learning_rate": 7.451538075449571e-05, "loss": 0.619, "step": 5231 }, { "epoch": 0.59, "learning_rate": 7.447978531434567e-05, "loss": 0.7495, "step": 5232 }, { "epoch": 0.59, "learning_rate": 7.444419333262402e-05, "loss": 0.657, "step": 5233 }, { "epoch": 0.59, "learning_rate": 7.440860481415408e-05, "loss": 0.7284, "step": 5234 }, { "epoch": 0.6, "learning_rate": 7.437301976375876e-05, "loss": 0.6809, "step": 5235 }, { "epoch": 0.6, "learning_rate": 7.433743818626034e-05, "loss": 0.6911, "step": 5236 }, { "epoch": 0.6, "learning_rate": 7.430186008648079e-05, "loss": 0.6324, "step": 5237 }, { "epoch": 0.6, "learning_rate": 7.426628546924156e-05, "loss": 0.6647, "step": 5238 }, { "epoch": 0.6, "learning_rate": 7.423071433936362e-05, "loss": 0.6801, "step": 5239 }, { "epoch": 0.6, "learning_rate": 7.419514670166746e-05, "loss": 0.6536, "step": 5240 }, { "epoch": 0.6, "learning_rate": 7.415958256097317e-05, "loss": 0.7421, "step": 5241 }, { "epoch": 0.6, "learning_rate": 7.41240219221002e-05, "loss": 0.6209, "step": 5242 }, { "epoch": 0.6, "learning_rate": 7.408846478986769e-05, "loss": 0.67, "step": 5243 }, { "epoch": 0.6, "learning_rate": 7.405291116909421e-05, "loss": 0.6634, "step": 5244 }, { "epoch": 0.6, "learning_rate": 7.401736106459792e-05, "loss": 0.6369, "step": 5245 }, { "epoch": 0.6, "learning_rate": 7.398181448119649e-05, "loss": 0.6683, "step": 5246 }, { "epoch": 0.6, "learning_rate": 7.394627142370704e-05, "loss": 0.6904, "step": 5247 }, { "epoch": 0.6, "learning_rate": 7.39107318969463e-05, "loss": 0.7172, "step": 5248 }, { "epoch": 0.6, "learning_rate": 7.387519590573046e-05, "loss": 0.6646, "step": 5249 }, { "epoch": 0.6, "learning_rate": 7.383966345487529e-05, "loss": 0.634, "step": 5250 }, { "epoch": 0.6, "learning_rate": 7.380413454919603e-05, "loss": 0.6654, "step": 5251 }, { "epoch": 0.6, "learning_rate": 7.376860919350748e-05, "loss": 0.6999, "step": 5252 }, { "epoch": 0.6, "learning_rate": 7.37330873926239e-05, "loss": 0.6481, "step": 5253 }, { "epoch": 0.6, "learning_rate": 7.369756915135912e-05, "loss": 0.6435, "step": 5254 }, { "epoch": 0.6, "learning_rate": 7.36620544745265e-05, "loss": 0.6392, "step": 5255 }, { "epoch": 0.6, "learning_rate": 7.362654336693883e-05, "loss": 0.6867, "step": 5256 }, { "epoch": 0.6, "learning_rate": 7.359103583340857e-05, "loss": 0.6917, "step": 5257 }, { "epoch": 0.6, "learning_rate": 7.355553187874756e-05, "loss": 0.68, "step": 5258 }, { "epoch": 0.6, "learning_rate": 7.352003150776714e-05, "loss": 0.6794, "step": 5259 }, { "epoch": 0.6, "learning_rate": 7.348453472527826e-05, "loss": 0.654, "step": 5260 }, { "epoch": 0.6, "learning_rate": 7.344904153609137e-05, "loss": 0.6212, "step": 5261 }, { "epoch": 0.6, "learning_rate": 7.341355194501638e-05, "loss": 0.7191, "step": 5262 }, { "epoch": 0.6, "learning_rate": 7.337806595686275e-05, "loss": 0.618, "step": 5263 }, { "epoch": 0.6, "learning_rate": 7.334258357643948e-05, "loss": 0.6748, "step": 5264 }, { "epoch": 0.6, "learning_rate": 7.330710480855498e-05, "loss": 0.6711, "step": 5265 }, { "epoch": 0.6, "learning_rate": 7.327162965801724e-05, "loss": 0.5635, "step": 5266 }, { "epoch": 0.6, "learning_rate": 7.323615812963378e-05, "loss": 0.7071, "step": 5267 }, { "epoch": 0.6, "learning_rate": 7.32006902282116e-05, "loss": 0.7617, "step": 5268 }, { "epoch": 0.6, "learning_rate": 7.316522595855724e-05, "loss": 0.683, "step": 5269 }, { "epoch": 0.6, "learning_rate": 7.312976532547666e-05, "loss": 0.656, "step": 5270 }, { "epoch": 0.6, "learning_rate": 7.30943083337754e-05, "loss": 0.6991, "step": 5271 }, { "epoch": 0.6, "learning_rate": 7.30588549882585e-05, "loss": 0.6897, "step": 5272 }, { "epoch": 0.6, "learning_rate": 7.302340529373051e-05, "loss": 0.7494, "step": 5273 }, { "epoch": 0.6, "learning_rate": 7.298795925499545e-05, "loss": 0.712, "step": 5274 }, { "epoch": 0.6, "learning_rate": 7.295251687685692e-05, "loss": 0.7172, "step": 5275 }, { "epoch": 0.6, "learning_rate": 7.291707816411793e-05, "loss": 0.6684, "step": 5276 }, { "epoch": 0.6, "learning_rate": 7.288164312158102e-05, "loss": 0.67, "step": 5277 }, { "epoch": 0.6, "learning_rate": 7.284621175404828e-05, "loss": 0.7195, "step": 5278 }, { "epoch": 0.6, "learning_rate": 7.281078406632127e-05, "loss": 0.6885, "step": 5279 }, { "epoch": 0.6, "learning_rate": 7.277536006320102e-05, "loss": 0.6819, "step": 5280 }, { "epoch": 0.6, "learning_rate": 7.273993974948818e-05, "loss": 0.7507, "step": 5281 }, { "epoch": 0.6, "learning_rate": 7.27045231299827e-05, "loss": 0.6144, "step": 5282 }, { "epoch": 0.6, "learning_rate": 7.266911020948419e-05, "loss": 0.6315, "step": 5283 }, { "epoch": 0.6, "learning_rate": 7.263370099279172e-05, "loss": 0.6506, "step": 5284 }, { "epoch": 0.6, "learning_rate": 7.259829548470383e-05, "loss": 0.672, "step": 5285 }, { "epoch": 0.6, "learning_rate": 7.256289369001861e-05, "loss": 0.6444, "step": 5286 }, { "epoch": 0.6, "learning_rate": 7.252749561353356e-05, "loss": 0.6572, "step": 5287 }, { "epoch": 0.6, "learning_rate": 7.249210126004575e-05, "loss": 0.6244, "step": 5288 }, { "epoch": 0.6, "learning_rate": 7.245671063435174e-05, "loss": 0.6792, "step": 5289 }, { "epoch": 0.6, "learning_rate": 7.242132374124753e-05, "loss": 0.7196, "step": 5290 }, { "epoch": 0.6, "learning_rate": 7.23859405855287e-05, "loss": 0.7164, "step": 5291 }, { "epoch": 0.6, "learning_rate": 7.23505611719903e-05, "loss": 0.5791, "step": 5292 }, { "epoch": 0.6, "learning_rate": 7.231518550542678e-05, "loss": 0.6775, "step": 5293 }, { "epoch": 0.6, "learning_rate": 7.227981359063217e-05, "loss": 0.6436, "step": 5294 }, { "epoch": 0.6, "learning_rate": 7.224444543239997e-05, "loss": 0.6188, "step": 5295 }, { "epoch": 0.6, "learning_rate": 7.220908103552318e-05, "loss": 0.6856, "step": 5296 }, { "epoch": 0.6, "learning_rate": 7.21737204047943e-05, "loss": 0.6698, "step": 5297 }, { "epoch": 0.6, "learning_rate": 7.213836354500533e-05, "loss": 0.6519, "step": 5298 }, { "epoch": 0.6, "learning_rate": 7.210301046094767e-05, "loss": 0.7018, "step": 5299 }, { "epoch": 0.6, "learning_rate": 7.20676611574123e-05, "loss": 0.6871, "step": 5300 }, { "epoch": 0.6, "learning_rate": 7.203231563918965e-05, "loss": 0.643, "step": 5301 }, { "epoch": 0.6, "learning_rate": 7.199697391106969e-05, "loss": 0.7135, "step": 5302 }, { "epoch": 0.6, "learning_rate": 7.196163597784178e-05, "loss": 0.6832, "step": 5303 }, { "epoch": 0.6, "learning_rate": 7.192630184429483e-05, "loss": 0.6122, "step": 5304 }, { "epoch": 0.6, "learning_rate": 7.189097151521724e-05, "loss": 0.6858, "step": 5305 }, { "epoch": 0.6, "learning_rate": 7.185564499539685e-05, "loss": 0.6896, "step": 5306 }, { "epoch": 0.6, "learning_rate": 7.182032228962103e-05, "loss": 0.6932, "step": 5307 }, { "epoch": 0.6, "learning_rate": 7.178500340267662e-05, "loss": 0.6513, "step": 5308 }, { "epoch": 0.6, "learning_rate": 7.174968833934996e-05, "loss": 0.6194, "step": 5309 }, { "epoch": 0.6, "learning_rate": 7.171437710442678e-05, "loss": 0.6837, "step": 5310 }, { "epoch": 0.6, "learning_rate": 7.167906970269242e-05, "loss": 0.7152, "step": 5311 }, { "epoch": 0.6, "learning_rate": 7.16437661389316e-05, "loss": 0.6756, "step": 5312 }, { "epoch": 0.6, "learning_rate": 7.160846641792858e-05, "loss": 0.6772, "step": 5313 }, { "epoch": 0.6, "learning_rate": 7.157317054446709e-05, "loss": 0.6312, "step": 5314 }, { "epoch": 0.6, "learning_rate": 7.153787852333035e-05, "loss": 0.6085, "step": 5315 }, { "epoch": 0.6, "learning_rate": 7.150259035930098e-05, "loss": 0.7116, "step": 5316 }, { "epoch": 0.6, "learning_rate": 7.146730605716115e-05, "loss": 0.6488, "step": 5317 }, { "epoch": 0.6, "learning_rate": 7.14320256216925e-05, "loss": 0.7015, "step": 5318 }, { "epoch": 0.6, "learning_rate": 7.139674905767613e-05, "loss": 0.6375, "step": 5319 }, { "epoch": 0.6, "learning_rate": 7.136147636989264e-05, "loss": 0.7094, "step": 5320 }, { "epoch": 0.6, "learning_rate": 7.13262075631221e-05, "loss": 0.7309, "step": 5321 }, { "epoch": 0.6, "learning_rate": 7.129094264214398e-05, "loss": 0.6931, "step": 5322 }, { "epoch": 0.61, "learning_rate": 7.125568161173733e-05, "loss": 0.6842, "step": 5323 }, { "epoch": 0.61, "learning_rate": 7.12204244766806e-05, "loss": 0.6684, "step": 5324 }, { "epoch": 0.61, "learning_rate": 7.118517124175177e-05, "loss": 0.6218, "step": 5325 }, { "epoch": 0.61, "learning_rate": 7.114992191172825e-05, "loss": 0.7271, "step": 5326 }, { "epoch": 0.61, "learning_rate": 7.11146764913869e-05, "loss": 0.6514, "step": 5327 }, { "epoch": 0.61, "learning_rate": 7.10794349855041e-05, "loss": 0.622, "step": 5328 }, { "epoch": 0.61, "learning_rate": 7.104419739885572e-05, "loss": 0.6509, "step": 5329 }, { "epoch": 0.61, "learning_rate": 7.100896373621699e-05, "loss": 0.7011, "step": 5330 }, { "epoch": 0.61, "learning_rate": 7.097373400236274e-05, "loss": 0.6702, "step": 5331 }, { "epoch": 0.61, "learning_rate": 7.09385082020672e-05, "loss": 0.7047, "step": 5332 }, { "epoch": 0.61, "learning_rate": 7.090328634010402e-05, "loss": 0.5629, "step": 5333 }, { "epoch": 0.61, "learning_rate": 7.08680684212464e-05, "loss": 0.7193, "step": 5334 }, { "epoch": 0.61, "learning_rate": 7.083285445026697e-05, "loss": 0.6388, "step": 5335 }, { "epoch": 0.61, "learning_rate": 7.079764443193783e-05, "loss": 0.6505, "step": 5336 }, { "epoch": 0.61, "learning_rate": 7.076243837103055e-05, "loss": 0.6002, "step": 5337 }, { "epoch": 0.61, "learning_rate": 7.072723627231621e-05, "loss": 0.5661, "step": 5338 }, { "epoch": 0.61, "learning_rate": 7.06920381405652e-05, "loss": 0.716, "step": 5339 }, { "epoch": 0.61, "learning_rate": 7.06568439805475e-05, "loss": 0.6358, "step": 5340 }, { "epoch": 0.61, "learning_rate": 7.062165379703256e-05, "loss": 0.6527, "step": 5341 }, { "epoch": 0.61, "learning_rate": 7.058646759478921e-05, "loss": 0.7324, "step": 5342 }, { "epoch": 0.61, "learning_rate": 7.055128537858586e-05, "loss": 0.6962, "step": 5343 }, { "epoch": 0.61, "learning_rate": 7.051610715319025e-05, "loss": 0.6902, "step": 5344 }, { "epoch": 0.61, "learning_rate": 7.048093292336964e-05, "loss": 0.6493, "step": 5345 }, { "epoch": 0.61, "learning_rate": 7.044576269389073e-05, "loss": 0.6921, "step": 5346 }, { "epoch": 0.61, "learning_rate": 7.04105964695197e-05, "loss": 0.6851, "step": 5347 }, { "epoch": 0.61, "learning_rate": 7.037543425502222e-05, "loss": 0.6393, "step": 5348 }, { "epoch": 0.61, "learning_rate": 7.034027605516333e-05, "loss": 0.6548, "step": 5349 }, { "epoch": 0.61, "learning_rate": 7.030512187470759e-05, "loss": 0.586, "step": 5350 }, { "epoch": 0.61, "learning_rate": 7.026997171841899e-05, "loss": 0.6562, "step": 5351 }, { "epoch": 0.61, "learning_rate": 7.023482559106098e-05, "loss": 0.6569, "step": 5352 }, { "epoch": 0.61, "learning_rate": 7.019968349739645e-05, "loss": 0.6848, "step": 5353 }, { "epoch": 0.61, "learning_rate": 7.01645454421878e-05, "loss": 0.6761, "step": 5354 }, { "epoch": 0.61, "learning_rate": 7.012941143019684e-05, "loss": 0.6872, "step": 5355 }, { "epoch": 0.61, "learning_rate": 7.009428146618477e-05, "loss": 0.6921, "step": 5356 }, { "epoch": 0.61, "learning_rate": 7.005915555491238e-05, "loss": 0.6372, "step": 5357 }, { "epoch": 0.61, "learning_rate": 7.002403370113977e-05, "loss": 0.7244, "step": 5358 }, { "epoch": 0.61, "learning_rate": 6.998891590962659e-05, "loss": 0.7166, "step": 5359 }, { "epoch": 0.61, "learning_rate": 6.995380218513195e-05, "loss": 0.6806, "step": 5360 }, { "epoch": 0.61, "learning_rate": 6.991869253241427e-05, "loss": 0.6387, "step": 5361 }, { "epoch": 0.61, "learning_rate": 6.988358695623158e-05, "loss": 0.6231, "step": 5362 }, { "epoch": 0.61, "learning_rate": 6.984848546134124e-05, "loss": 0.6148, "step": 5363 }, { "epoch": 0.61, "learning_rate": 6.981338805250014e-05, "loss": 0.6178, "step": 5364 }, { "epoch": 0.61, "learning_rate": 6.97782947344646e-05, "loss": 0.6584, "step": 5365 }, { "epoch": 0.61, "learning_rate": 6.974320551199039e-05, "loss": 0.7133, "step": 5366 }, { "epoch": 0.61, "learning_rate": 6.97081203898326e-05, "loss": 0.6655, "step": 5367 }, { "epoch": 0.61, "learning_rate": 6.967303937274594e-05, "loss": 0.656, "step": 5368 }, { "epoch": 0.61, "learning_rate": 6.963796246548448e-05, "loss": 0.7215, "step": 5369 }, { "epoch": 0.61, "learning_rate": 6.960288967280174e-05, "loss": 0.6466, "step": 5370 }, { "epoch": 0.61, "learning_rate": 6.95678209994507e-05, "loss": 0.6181, "step": 5371 }, { "epoch": 0.61, "learning_rate": 6.953275645018378e-05, "loss": 0.668, "step": 5372 }, { "epoch": 0.61, "learning_rate": 6.949769602975278e-05, "loss": 0.6843, "step": 5373 }, { "epoch": 0.61, "learning_rate": 6.946263974290905e-05, "loss": 0.6386, "step": 5374 }, { "epoch": 0.61, "learning_rate": 6.942758759440327e-05, "loss": 0.7292, "step": 5375 }, { "epoch": 0.61, "learning_rate": 6.939253958898564e-05, "loss": 0.7502, "step": 5376 }, { "epoch": 0.61, "learning_rate": 6.93574957314058e-05, "loss": 0.6803, "step": 5377 }, { "epoch": 0.61, "learning_rate": 6.93224560264127e-05, "loss": 0.6816, "step": 5378 }, { "epoch": 0.61, "learning_rate": 6.92874204787549e-05, "loss": 0.5842, "step": 5379 }, { "epoch": 0.61, "learning_rate": 6.925238909318029e-05, "loss": 0.7137, "step": 5380 }, { "epoch": 0.61, "learning_rate": 6.921736187443623e-05, "loss": 0.6105, "step": 5381 }, { "epoch": 0.61, "learning_rate": 6.918233882726953e-05, "loss": 0.6824, "step": 5382 }, { "epoch": 0.61, "learning_rate": 6.914731995642643e-05, "loss": 0.6576, "step": 5383 }, { "epoch": 0.61, "learning_rate": 6.911230526665253e-05, "loss": 0.696, "step": 5384 }, { "epoch": 0.61, "learning_rate": 6.907729476269296e-05, "loss": 0.6444, "step": 5385 }, { "epoch": 0.61, "learning_rate": 6.904228844929222e-05, "loss": 0.663, "step": 5386 }, { "epoch": 0.61, "learning_rate": 6.900728633119431e-05, "loss": 0.6521, "step": 5387 }, { "epoch": 0.61, "learning_rate": 6.897228841314259e-05, "loss": 0.6544, "step": 5388 }, { "epoch": 0.61, "learning_rate": 6.893729469987993e-05, "loss": 0.6959, "step": 5389 }, { "epoch": 0.61, "learning_rate": 6.890230519614849e-05, "loss": 0.6234, "step": 5390 }, { "epoch": 0.61, "learning_rate": 6.886731990669e-05, "loss": 0.7004, "step": 5391 }, { "epoch": 0.61, "learning_rate": 6.883233883624558e-05, "loss": 0.7004, "step": 5392 }, { "epoch": 0.61, "learning_rate": 6.879736198955575e-05, "loss": 0.6628, "step": 5393 }, { "epoch": 0.61, "learning_rate": 6.876238937136047e-05, "loss": 0.6675, "step": 5394 }, { "epoch": 0.61, "learning_rate": 6.872742098639918e-05, "loss": 0.7244, "step": 5395 }, { "epoch": 0.61, "learning_rate": 6.869245683941062e-05, "loss": 0.6888, "step": 5396 }, { "epoch": 0.61, "learning_rate": 6.865749693513307e-05, "loss": 0.7114, "step": 5397 }, { "epoch": 0.61, "learning_rate": 6.862254127830425e-05, "loss": 0.6358, "step": 5398 }, { "epoch": 0.61, "learning_rate": 6.858758987366116e-05, "loss": 0.6215, "step": 5399 }, { "epoch": 0.61, "learning_rate": 6.85526427259404e-05, "loss": 0.6615, "step": 5400 }, { "epoch": 0.61, "learning_rate": 6.851769983987784e-05, "loss": 0.6766, "step": 5401 }, { "epoch": 0.61, "learning_rate": 6.84827612202089e-05, "loss": 0.6644, "step": 5402 }, { "epoch": 0.61, "learning_rate": 6.844782687166831e-05, "loss": 0.6599, "step": 5403 }, { "epoch": 0.61, "learning_rate": 6.841289679899033e-05, "loss": 0.6728, "step": 5404 }, { "epoch": 0.61, "learning_rate": 6.837797100690853e-05, "loss": 0.6487, "step": 5405 }, { "epoch": 0.61, "learning_rate": 6.834304950015606e-05, "loss": 0.6483, "step": 5406 }, { "epoch": 0.61, "learning_rate": 6.830813228346525e-05, "loss": 0.6661, "step": 5407 }, { "epoch": 0.61, "learning_rate": 6.827321936156806e-05, "loss": 0.6913, "step": 5408 }, { "epoch": 0.61, "learning_rate": 6.823831073919577e-05, "loss": 0.6711, "step": 5409 }, { "epoch": 0.61, "learning_rate": 6.820340642107911e-05, "loss": 0.6677, "step": 5410 }, { "epoch": 0.62, "learning_rate": 6.816850641194821e-05, "loss": 0.5959, "step": 5411 }, { "epoch": 0.62, "learning_rate": 6.813361071653268e-05, "loss": 0.6863, "step": 5412 }, { "epoch": 0.62, "learning_rate": 6.809871933956138e-05, "loss": 0.6487, "step": 5413 }, { "epoch": 0.62, "learning_rate": 6.806383228576274e-05, "loss": 0.6941, "step": 5414 }, { "epoch": 0.62, "learning_rate": 6.802894955986458e-05, "loss": 0.6619, "step": 5415 }, { "epoch": 0.62, "learning_rate": 6.799407116659409e-05, "loss": 0.6885, "step": 5416 }, { "epoch": 0.62, "learning_rate": 6.79591971106779e-05, "loss": 0.6357, "step": 5417 }, { "epoch": 0.62, "learning_rate": 6.792432739684203e-05, "loss": 0.6812, "step": 5418 }, { "epoch": 0.62, "learning_rate": 6.788946202981195e-05, "loss": 0.6683, "step": 5419 }, { "epoch": 0.62, "learning_rate": 6.785460101431247e-05, "loss": 0.7062, "step": 5420 }, { "epoch": 0.62, "learning_rate": 6.781974435506791e-05, "loss": 0.6462, "step": 5421 }, { "epoch": 0.62, "learning_rate": 6.778489205680192e-05, "loss": 0.6774, "step": 5422 }, { "epoch": 0.62, "learning_rate": 6.775004412423761e-05, "loss": 0.6998, "step": 5423 }, { "epoch": 0.62, "learning_rate": 6.771520056209745e-05, "loss": 0.7103, "step": 5424 }, { "epoch": 0.62, "learning_rate": 6.768036137510335e-05, "loss": 0.6732, "step": 5425 }, { "epoch": 0.62, "learning_rate": 6.764552656797661e-05, "loss": 0.6345, "step": 5426 }, { "epoch": 0.62, "learning_rate": 6.761069614543795e-05, "loss": 0.6899, "step": 5427 }, { "epoch": 0.62, "learning_rate": 6.757587011220752e-05, "loss": 0.6566, "step": 5428 }, { "epoch": 0.62, "learning_rate": 6.754104847300486e-05, "loss": 0.7134, "step": 5429 }, { "epoch": 0.62, "learning_rate": 6.750623123254883e-05, "loss": 0.7089, "step": 5430 }, { "epoch": 0.62, "learning_rate": 6.74714183955578e-05, "loss": 0.6765, "step": 5431 }, { "epoch": 0.62, "learning_rate": 6.74366099667495e-05, "loss": 0.633, "step": 5432 }, { "epoch": 0.62, "learning_rate": 6.740180595084109e-05, "loss": 0.7087, "step": 5433 }, { "epoch": 0.62, "learning_rate": 6.736700635254915e-05, "loss": 0.7413, "step": 5434 }, { "epoch": 0.62, "learning_rate": 6.733221117658953e-05, "loss": 0.6836, "step": 5435 }, { "epoch": 0.62, "learning_rate": 6.729742042767763e-05, "loss": 0.6666, "step": 5436 }, { "epoch": 0.62, "learning_rate": 6.72626341105282e-05, "loss": 0.5906, "step": 5437 }, { "epoch": 0.62, "learning_rate": 6.722785222985537e-05, "loss": 0.6918, "step": 5438 }, { "epoch": 0.62, "learning_rate": 6.719307479037269e-05, "loss": 0.6958, "step": 5439 }, { "epoch": 0.62, "learning_rate": 6.715830179679315e-05, "loss": 0.6868, "step": 5440 }, { "epoch": 0.62, "learning_rate": 6.712353325382898e-05, "loss": 0.6981, "step": 5441 }, { "epoch": 0.62, "learning_rate": 6.708876916619198e-05, "loss": 0.7243, "step": 5442 }, { "epoch": 0.62, "learning_rate": 6.705400953859329e-05, "loss": 0.6221, "step": 5443 }, { "epoch": 0.62, "learning_rate": 6.701925437574341e-05, "loss": 0.6248, "step": 5444 }, { "epoch": 0.62, "learning_rate": 6.698450368235229e-05, "loss": 0.65, "step": 5445 }, { "epoch": 0.62, "learning_rate": 6.694975746312927e-05, "loss": 0.7493, "step": 5446 }, { "epoch": 0.62, "learning_rate": 6.6915015722783e-05, "loss": 0.6471, "step": 5447 }, { "epoch": 0.62, "learning_rate": 6.68802784660216e-05, "loss": 0.747, "step": 5448 }, { "epoch": 0.62, "learning_rate": 6.684554569755258e-05, "loss": 0.6841, "step": 5449 }, { "epoch": 0.62, "learning_rate": 6.681081742208283e-05, "loss": 0.6829, "step": 5450 }, { "epoch": 0.62, "learning_rate": 6.677609364431863e-05, "loss": 0.7178, "step": 5451 }, { "epoch": 0.62, "learning_rate": 6.674137436896567e-05, "loss": 0.6487, "step": 5452 }, { "epoch": 0.62, "learning_rate": 6.670665960072894e-05, "loss": 0.6508, "step": 5453 }, { "epoch": 0.62, "learning_rate": 6.667194934431296e-05, "loss": 0.6207, "step": 5454 }, { "epoch": 0.62, "learning_rate": 6.663724360442151e-05, "loss": 0.656, "step": 5455 }, { "epoch": 0.62, "learning_rate": 6.660254238575786e-05, "loss": 0.6241, "step": 5456 }, { "epoch": 0.62, "learning_rate": 6.656784569302464e-05, "loss": 0.6415, "step": 5457 }, { "epoch": 0.62, "learning_rate": 6.653315353092378e-05, "loss": 0.5969, "step": 5458 }, { "epoch": 0.62, "learning_rate": 6.64984659041567e-05, "loss": 0.6323, "step": 5459 }, { "epoch": 0.62, "learning_rate": 6.646378281742418e-05, "loss": 0.669, "step": 5460 }, { "epoch": 0.62, "learning_rate": 6.642910427542636e-05, "loss": 0.7126, "step": 5461 }, { "epoch": 0.62, "learning_rate": 6.639443028286278e-05, "loss": 0.6823, "step": 5462 }, { "epoch": 0.62, "learning_rate": 6.635976084443243e-05, "loss": 0.7176, "step": 5463 }, { "epoch": 0.62, "learning_rate": 6.632509596483349e-05, "loss": 0.624, "step": 5464 }, { "epoch": 0.62, "learning_rate": 6.629043564876373e-05, "loss": 0.6319, "step": 5465 }, { "epoch": 0.62, "learning_rate": 6.62557799009202e-05, "loss": 0.6704, "step": 5466 }, { "epoch": 0.62, "learning_rate": 6.622112872599934e-05, "loss": 0.6994, "step": 5467 }, { "epoch": 0.62, "learning_rate": 6.6186482128697e-05, "loss": 0.6821, "step": 5468 }, { "epoch": 0.62, "learning_rate": 6.61518401137084e-05, "loss": 0.6353, "step": 5469 }, { "epoch": 0.62, "learning_rate": 6.611720268572811e-05, "loss": 0.7219, "step": 5470 }, { "epoch": 0.62, "learning_rate": 6.608256984945009e-05, "loss": 0.6705, "step": 5471 }, { "epoch": 0.62, "learning_rate": 6.604794160956769e-05, "loss": 0.7027, "step": 5472 }, { "epoch": 0.62, "learning_rate": 6.601331797077367e-05, "loss": 0.6393, "step": 5473 }, { "epoch": 0.62, "learning_rate": 6.59786989377601e-05, "loss": 0.7281, "step": 5474 }, { "epoch": 0.62, "learning_rate": 6.594408451521842e-05, "loss": 0.6583, "step": 5475 }, { "epoch": 0.62, "learning_rate": 6.590947470783952e-05, "loss": 0.6558, "step": 5476 }, { "epoch": 0.62, "learning_rate": 6.587486952031361e-05, "loss": 0.6264, "step": 5477 }, { "epoch": 0.62, "learning_rate": 6.58402689573303e-05, "loss": 0.7477, "step": 5478 }, { "epoch": 0.62, "learning_rate": 6.580567302357856e-05, "loss": 0.7116, "step": 5479 }, { "epoch": 0.62, "learning_rate": 6.577108172374678e-05, "loss": 0.6134, "step": 5480 }, { "epoch": 0.62, "learning_rate": 6.573649506252259e-05, "loss": 0.6906, "step": 5481 }, { "epoch": 0.62, "learning_rate": 6.57019130445931e-05, "loss": 0.6994, "step": 5482 }, { "epoch": 0.62, "learning_rate": 6.56673356746448e-05, "loss": 0.6513, "step": 5483 }, { "epoch": 0.62, "learning_rate": 6.56327629573635e-05, "loss": 0.6323, "step": 5484 }, { "epoch": 0.62, "learning_rate": 6.55981948974344e-05, "loss": 0.6585, "step": 5485 }, { "epoch": 0.62, "learning_rate": 6.556363149954212e-05, "loss": 0.6659, "step": 5486 }, { "epoch": 0.62, "learning_rate": 6.55290727683705e-05, "loss": 0.7021, "step": 5487 }, { "epoch": 0.62, "learning_rate": 6.549451870860288e-05, "loss": 0.6528, "step": 5488 }, { "epoch": 0.62, "learning_rate": 6.545996932492195e-05, "loss": 0.6793, "step": 5489 }, { "epoch": 0.62, "learning_rate": 6.542542462200973e-05, "loss": 0.6551, "step": 5490 }, { "epoch": 0.62, "learning_rate": 6.539088460454765e-05, "loss": 0.6883, "step": 5491 }, { "epoch": 0.62, "learning_rate": 6.535634927721643e-05, "loss": 0.651, "step": 5492 }, { "epoch": 0.62, "learning_rate": 6.532181864469622e-05, "loss": 0.7201, "step": 5493 }, { "epoch": 0.62, "learning_rate": 6.528729271166656e-05, "loss": 0.6973, "step": 5494 }, { "epoch": 0.62, "learning_rate": 6.525277148280622e-05, "loss": 0.6349, "step": 5495 }, { "epoch": 0.62, "learning_rate": 6.521825496279348e-05, "loss": 0.6605, "step": 5496 }, { "epoch": 0.62, "learning_rate": 6.518374315630595e-05, "loss": 0.6591, "step": 5497 }, { "epoch": 0.62, "learning_rate": 6.514923606802049e-05, "loss": 0.6164, "step": 5498 }, { "epoch": 0.63, "learning_rate": 6.511473370261345e-05, "loss": 0.6171, "step": 5499 }, { "epoch": 0.63, "learning_rate": 6.508023606476052e-05, "loss": 0.5884, "step": 5500 }, { "epoch": 0.63, "learning_rate": 6.504574315913667e-05, "loss": 0.6855, "step": 5501 }, { "epoch": 0.63, "learning_rate": 6.501125499041632e-05, "loss": 0.6482, "step": 5502 }, { "epoch": 0.63, "learning_rate": 6.497677156327324e-05, "loss": 0.6719, "step": 5503 }, { "epoch": 0.63, "learning_rate": 6.494229288238045e-05, "loss": 0.618, "step": 5504 }, { "epoch": 0.63, "learning_rate": 6.490781895241045e-05, "loss": 0.6732, "step": 5505 }, { "epoch": 0.63, "learning_rate": 6.487334977803503e-05, "loss": 0.6477, "step": 5506 }, { "epoch": 0.63, "learning_rate": 6.48388853639254e-05, "loss": 0.6446, "step": 5507 }, { "epoch": 0.63, "learning_rate": 6.480442571475202e-05, "loss": 0.7037, "step": 5508 }, { "epoch": 0.63, "learning_rate": 6.476997083518486e-05, "loss": 0.6735, "step": 5509 }, { "epoch": 0.63, "learning_rate": 6.473552072989303e-05, "loss": 0.692, "step": 5510 }, { "epoch": 0.63, "learning_rate": 6.470107540354517e-05, "loss": 0.6663, "step": 5511 }, { "epoch": 0.63, "learning_rate": 6.466663486080922e-05, "loss": 0.6166, "step": 5512 }, { "epoch": 0.63, "learning_rate": 6.463219910635247e-05, "loss": 0.6705, "step": 5513 }, { "epoch": 0.63, "learning_rate": 6.459776814484155e-05, "loss": 0.5525, "step": 5514 }, { "epoch": 0.63, "learning_rate": 6.456334198094248e-05, "loss": 0.7102, "step": 5515 }, { "epoch": 0.63, "learning_rate": 6.45289206193205e-05, "loss": 0.68, "step": 5516 }, { "epoch": 0.63, "learning_rate": 6.449450406464039e-05, "loss": 0.6753, "step": 5517 }, { "epoch": 0.63, "learning_rate": 6.446009232156614e-05, "loss": 0.6747, "step": 5518 }, { "epoch": 0.63, "learning_rate": 6.442568539476116e-05, "loss": 0.6375, "step": 5519 }, { "epoch": 0.63, "learning_rate": 6.43912832888882e-05, "loss": 0.6809, "step": 5520 }, { "epoch": 0.63, "learning_rate": 6.435688600860927e-05, "loss": 0.6707, "step": 5521 }, { "epoch": 0.63, "learning_rate": 6.432249355858585e-05, "loss": 0.6558, "step": 5522 }, { "epoch": 0.63, "learning_rate": 6.428810594347867e-05, "loss": 0.6196, "step": 5523 }, { "epoch": 0.63, "learning_rate": 6.425372316794787e-05, "loss": 0.6622, "step": 5524 }, { "epoch": 0.63, "learning_rate": 6.421934523665291e-05, "loss": 0.6277, "step": 5525 }, { "epoch": 0.63, "learning_rate": 6.418497215425261e-05, "loss": 0.6567, "step": 5526 }, { "epoch": 0.63, "learning_rate": 6.415060392540506e-05, "loss": 0.6641, "step": 5527 }, { "epoch": 0.63, "learning_rate": 6.411624055476778e-05, "loss": 0.6591, "step": 5528 }, { "epoch": 0.63, "learning_rate": 6.408188204699759e-05, "loss": 0.6238, "step": 5529 }, { "epoch": 0.63, "learning_rate": 6.404752840675065e-05, "loss": 0.69, "step": 5530 }, { "epoch": 0.63, "learning_rate": 6.401317963868254e-05, "loss": 0.741, "step": 5531 }, { "epoch": 0.63, "learning_rate": 6.3978835747448e-05, "loss": 0.6734, "step": 5532 }, { "epoch": 0.63, "learning_rate": 6.394449673770129e-05, "loss": 0.6551, "step": 5533 }, { "epoch": 0.63, "learning_rate": 6.39101626140959e-05, "loss": 0.6222, "step": 5534 }, { "epoch": 0.63, "learning_rate": 6.387583338128471e-05, "loss": 0.6248, "step": 5535 }, { "epoch": 0.63, "learning_rate": 6.384150904391992e-05, "loss": 0.7032, "step": 5536 }, { "epoch": 0.63, "learning_rate": 6.380718960665313e-05, "loss": 0.6117, "step": 5537 }, { "epoch": 0.63, "learning_rate": 6.37728750741351e-05, "loss": 0.7005, "step": 5538 }, { "epoch": 0.63, "learning_rate": 6.373856545101611e-05, "loss": 0.6839, "step": 5539 }, { "epoch": 0.63, "learning_rate": 6.370426074194568e-05, "loss": 0.6338, "step": 5540 }, { "epoch": 0.63, "learning_rate": 6.36699609515727e-05, "loss": 0.5897, "step": 5541 }, { "epoch": 0.63, "learning_rate": 6.363566608454539e-05, "loss": 0.677, "step": 5542 }, { "epoch": 0.63, "learning_rate": 6.36013761455113e-05, "loss": 0.6598, "step": 5543 }, { "epoch": 0.63, "learning_rate": 6.356709113911727e-05, "loss": 0.6742, "step": 5544 }, { "epoch": 0.63, "learning_rate": 6.353281107000954e-05, "loss": 0.5514, "step": 5545 }, { "epoch": 0.63, "learning_rate": 6.349853594283363e-05, "loss": 0.6872, "step": 5546 }, { "epoch": 0.63, "learning_rate": 6.346426576223443e-05, "loss": 0.6806, "step": 5547 }, { "epoch": 0.63, "learning_rate": 6.343000053285617e-05, "loss": 0.6508, "step": 5548 }, { "epoch": 0.63, "learning_rate": 6.33957402593423e-05, "loss": 0.6227, "step": 5549 }, { "epoch": 0.63, "learning_rate": 6.336148494633571e-05, "loss": 0.6879, "step": 5550 }, { "epoch": 0.63, "learning_rate": 6.332723459847861e-05, "loss": 0.7128, "step": 5551 }, { "epoch": 0.63, "learning_rate": 6.329298922041247e-05, "loss": 0.6536, "step": 5552 }, { "epoch": 0.63, "learning_rate": 6.325874881677815e-05, "loss": 0.6851, "step": 5553 }, { "epoch": 0.63, "learning_rate": 6.322451339221587e-05, "loss": 0.6354, "step": 5554 }, { "epoch": 0.63, "learning_rate": 6.319028295136501e-05, "loss": 0.7276, "step": 5555 }, { "epoch": 0.63, "learning_rate": 6.315605749886444e-05, "loss": 0.6546, "step": 5556 }, { "epoch": 0.63, "learning_rate": 6.312183703935231e-05, "loss": 0.6877, "step": 5557 }, { "epoch": 0.63, "learning_rate": 6.308762157746604e-05, "loss": 0.6945, "step": 5558 }, { "epoch": 0.63, "learning_rate": 6.305341111784247e-05, "loss": 0.666, "step": 5559 }, { "epoch": 0.63, "learning_rate": 6.30192056651177e-05, "loss": 0.652, "step": 5560 }, { "epoch": 0.63, "learning_rate": 6.298500522392709e-05, "loss": 0.6566, "step": 5561 }, { "epoch": 0.63, "learning_rate": 6.295080979890543e-05, "loss": 0.7133, "step": 5562 }, { "epoch": 0.63, "learning_rate": 6.291661939468683e-05, "loss": 0.6496, "step": 5563 }, { "epoch": 0.63, "learning_rate": 6.288243401590461e-05, "loss": 0.6969, "step": 5564 }, { "epoch": 0.63, "learning_rate": 6.284825366719152e-05, "loss": 0.6894, "step": 5565 }, { "epoch": 0.63, "learning_rate": 6.281407835317957e-05, "loss": 0.6707, "step": 5566 }, { "epoch": 0.63, "learning_rate": 6.277990807850011e-05, "loss": 0.655, "step": 5567 }, { "epoch": 0.63, "learning_rate": 6.274574284778378e-05, "loss": 0.7079, "step": 5568 }, { "epoch": 0.63, "learning_rate": 6.27115826656606e-05, "loss": 0.7201, "step": 5569 }, { "epoch": 0.63, "learning_rate": 6.267742753675983e-05, "loss": 0.6234, "step": 5570 }, { "epoch": 0.63, "learning_rate": 6.264327746571008e-05, "loss": 0.6429, "step": 5571 }, { "epoch": 0.63, "learning_rate": 6.260913245713927e-05, "loss": 0.7289, "step": 5572 }, { "epoch": 0.63, "learning_rate": 6.257499251567464e-05, "loss": 0.6049, "step": 5573 }, { "epoch": 0.63, "learning_rate": 6.254085764594276e-05, "loss": 0.6326, "step": 5574 }, { "epoch": 0.63, "learning_rate": 6.250672785256946e-05, "loss": 0.6329, "step": 5575 }, { "epoch": 0.63, "learning_rate": 6.247260314017992e-05, "loss": 0.5928, "step": 5576 }, { "epoch": 0.63, "learning_rate": 6.24384835133987e-05, "loss": 0.654, "step": 5577 }, { "epoch": 0.63, "learning_rate": 6.240436897684948e-05, "loss": 0.7168, "step": 5578 }, { "epoch": 0.63, "learning_rate": 6.237025953515541e-05, "loss": 0.7002, "step": 5579 }, { "epoch": 0.63, "learning_rate": 6.233615519293894e-05, "loss": 0.6337, "step": 5580 }, { "epoch": 0.63, "learning_rate": 6.230205595482175e-05, "loss": 0.6545, "step": 5581 }, { "epoch": 0.63, "learning_rate": 6.226796182542491e-05, "loss": 0.6441, "step": 5582 }, { "epoch": 0.63, "learning_rate": 6.223387280936878e-05, "loss": 0.6337, "step": 5583 }, { "epoch": 0.63, "learning_rate": 6.219978891127294e-05, "loss": 0.7095, "step": 5584 }, { "epoch": 0.63, "learning_rate": 6.216571013575636e-05, "loss": 0.645, "step": 5585 }, { "epoch": 0.63, "learning_rate": 6.213163648743735e-05, "loss": 0.7211, "step": 5586 }, { "epoch": 0.64, "learning_rate": 6.209756797093343e-05, "loss": 0.6009, "step": 5587 }, { "epoch": 0.64, "learning_rate": 6.20635045908615e-05, "loss": 0.6709, "step": 5588 }, { "epoch": 0.64, "learning_rate": 6.202944635183772e-05, "loss": 0.6636, "step": 5589 }, { "epoch": 0.64, "learning_rate": 6.199539325847757e-05, "loss": 0.6453, "step": 5590 }, { "epoch": 0.64, "learning_rate": 6.196134531539582e-05, "loss": 0.7292, "step": 5591 }, { "epoch": 0.64, "learning_rate": 6.192730252720657e-05, "loss": 0.7133, "step": 5592 }, { "epoch": 0.64, "learning_rate": 6.189326489852319e-05, "loss": 0.6658, "step": 5593 }, { "epoch": 0.64, "learning_rate": 6.185923243395838e-05, "loss": 0.6167, "step": 5594 }, { "epoch": 0.64, "learning_rate": 6.182520513812411e-05, "loss": 0.6822, "step": 5595 }, { "epoch": 0.64, "learning_rate": 6.179118301563165e-05, "loss": 0.6415, "step": 5596 }, { "epoch": 0.64, "learning_rate": 6.175716607109161e-05, "loss": 0.7097, "step": 5597 }, { "epoch": 0.64, "learning_rate": 6.172315430911387e-05, "loss": 0.6173, "step": 5598 }, { "epoch": 0.64, "learning_rate": 6.16891477343076e-05, "loss": 0.7011, "step": 5599 }, { "epoch": 0.64, "learning_rate": 6.165514635128132e-05, "loss": 0.6616, "step": 5600 }, { "epoch": 0.64, "learning_rate": 6.162115016464272e-05, "loss": 0.6729, "step": 5601 }, { "epoch": 0.64, "learning_rate": 6.158715917899893e-05, "loss": 0.6202, "step": 5602 }, { "epoch": 0.64, "learning_rate": 6.155317339895627e-05, "loss": 0.7413, "step": 5603 }, { "epoch": 0.64, "learning_rate": 6.151919282912043e-05, "loss": 0.6767, "step": 5604 }, { "epoch": 0.64, "learning_rate": 6.148521747409639e-05, "loss": 0.5904, "step": 5605 }, { "epoch": 0.64, "learning_rate": 6.145124733848833e-05, "loss": 0.6028, "step": 5606 }, { "epoch": 0.64, "learning_rate": 6.141728242689982e-05, "loss": 0.6927, "step": 5607 }, { "epoch": 0.64, "learning_rate": 6.138332274393367e-05, "loss": 0.7036, "step": 5608 }, { "epoch": 0.64, "learning_rate": 6.134936829419204e-05, "loss": 0.5837, "step": 5609 }, { "epoch": 0.64, "learning_rate": 6.131541908227632e-05, "loss": 0.7018, "step": 5610 }, { "epoch": 0.64, "learning_rate": 6.128147511278723e-05, "loss": 0.7169, "step": 5611 }, { "epoch": 0.64, "learning_rate": 6.124753639032474e-05, "loss": 0.6721, "step": 5612 }, { "epoch": 0.64, "learning_rate": 6.121360291948812e-05, "loss": 0.6953, "step": 5613 }, { "epoch": 0.64, "learning_rate": 6.117967470487597e-05, "loss": 0.6742, "step": 5614 }, { "epoch": 0.64, "learning_rate": 6.114575175108612e-05, "loss": 0.6801, "step": 5615 }, { "epoch": 0.64, "learning_rate": 6.111183406271575e-05, "loss": 0.6823, "step": 5616 }, { "epoch": 0.64, "learning_rate": 6.107792164436126e-05, "loss": 0.6478, "step": 5617 }, { "epoch": 0.64, "learning_rate": 6.104401450061839e-05, "loss": 0.6885, "step": 5618 }, { "epoch": 0.64, "learning_rate": 6.1010112636082095e-05, "loss": 0.6754, "step": 5619 }, { "epoch": 0.64, "learning_rate": 6.0976216055346716e-05, "loss": 0.6559, "step": 5620 }, { "epoch": 0.64, "learning_rate": 6.094232476300579e-05, "loss": 0.6723, "step": 5621 }, { "epoch": 0.64, "learning_rate": 6.090843876365223e-05, "loss": 0.7119, "step": 5622 }, { "epoch": 0.64, "learning_rate": 6.0874558061878074e-05, "loss": 0.7171, "step": 5623 }, { "epoch": 0.64, "learning_rate": 6.0840682662274806e-05, "loss": 0.6913, "step": 5624 }, { "epoch": 0.64, "learning_rate": 6.080681256943309e-05, "loss": 0.6115, "step": 5625 }, { "epoch": 0.64, "learning_rate": 6.077294778794294e-05, "loss": 0.6418, "step": 5626 }, { "epoch": 0.64, "learning_rate": 6.07390883223936e-05, "loss": 0.7393, "step": 5627 }, { "epoch": 0.64, "learning_rate": 6.070523417737366e-05, "loss": 0.6472, "step": 5628 }, { "epoch": 0.64, "learning_rate": 6.067138535747084e-05, "loss": 0.693, "step": 5629 }, { "epoch": 0.64, "learning_rate": 6.0637541867272294e-05, "loss": 0.7173, "step": 5630 }, { "epoch": 0.64, "learning_rate": 6.0603703711364404e-05, "loss": 0.6673, "step": 5631 }, { "epoch": 0.64, "learning_rate": 6.05698708943328e-05, "loss": 0.6949, "step": 5632 }, { "epoch": 0.64, "learning_rate": 6.053604342076243e-05, "loss": 0.6645, "step": 5633 }, { "epoch": 0.64, "learning_rate": 6.050222129523755e-05, "loss": 0.6242, "step": 5634 }, { "epoch": 0.64, "learning_rate": 6.0468404522341525e-05, "loss": 0.7074, "step": 5635 }, { "epoch": 0.64, "learning_rate": 6.0434593106657155e-05, "loss": 0.6388, "step": 5636 }, { "epoch": 0.64, "learning_rate": 6.0400787052766504e-05, "loss": 0.5751, "step": 5637 }, { "epoch": 0.64, "learning_rate": 6.036698636525084e-05, "loss": 0.7194, "step": 5638 }, { "epoch": 0.64, "learning_rate": 6.033319104869076e-05, "loss": 0.6236, "step": 5639 }, { "epoch": 0.64, "learning_rate": 6.029940110766612e-05, "loss": 0.6807, "step": 5640 }, { "epoch": 0.64, "learning_rate": 6.0265616546756e-05, "loss": 0.6922, "step": 5641 }, { "epoch": 0.64, "learning_rate": 6.0231837370538814e-05, "loss": 0.6313, "step": 5642 }, { "epoch": 0.64, "learning_rate": 6.01980635835922e-05, "loss": 0.642, "step": 5643 }, { "epoch": 0.64, "learning_rate": 6.016429519049314e-05, "loss": 0.6398, "step": 5644 }, { "epoch": 0.64, "learning_rate": 6.013053219581779e-05, "loss": 0.6937, "step": 5645 }, { "epoch": 0.64, "learning_rate": 6.00967746041416e-05, "loss": 0.6624, "step": 5646 }, { "epoch": 0.64, "learning_rate": 6.006302242003934e-05, "loss": 0.6287, "step": 5647 }, { "epoch": 0.64, "learning_rate": 6.0029275648085e-05, "loss": 0.6907, "step": 5648 }, { "epoch": 0.64, "learning_rate": 5.9995534292851855e-05, "loss": 0.6936, "step": 5649 }, { "epoch": 0.64, "learning_rate": 5.996179835891241e-05, "loss": 0.6707, "step": 5650 }, { "epoch": 0.64, "learning_rate": 5.9928067850838554e-05, "loss": 0.7287, "step": 5651 }, { "epoch": 0.64, "learning_rate": 5.989434277320123e-05, "loss": 0.7217, "step": 5652 }, { "epoch": 0.64, "learning_rate": 5.986062313057084e-05, "loss": 0.6641, "step": 5653 }, { "epoch": 0.64, "learning_rate": 5.9826908927516944e-05, "loss": 0.6703, "step": 5654 }, { "epoch": 0.64, "learning_rate": 5.979320016860841e-05, "loss": 0.7701, "step": 5655 }, { "epoch": 0.64, "learning_rate": 5.9759496858413355e-05, "loss": 0.6808, "step": 5656 }, { "epoch": 0.64, "learning_rate": 5.9725799001499215e-05, "loss": 0.603, "step": 5657 }, { "epoch": 0.64, "learning_rate": 5.9692106602432526e-05, "loss": 0.6002, "step": 5658 }, { "epoch": 0.64, "learning_rate": 5.965841966577923e-05, "loss": 0.6337, "step": 5659 }, { "epoch": 0.64, "learning_rate": 5.96247381961045e-05, "loss": 0.7425, "step": 5660 }, { "epoch": 0.64, "learning_rate": 5.9591062197972744e-05, "loss": 0.5934, "step": 5661 }, { "epoch": 0.64, "learning_rate": 5.955739167594767e-05, "loss": 0.6562, "step": 5662 }, { "epoch": 0.64, "learning_rate": 5.952372663459217e-05, "loss": 0.6557, "step": 5663 }, { "epoch": 0.64, "learning_rate": 5.9490067078468446e-05, "loss": 0.6213, "step": 5664 }, { "epoch": 0.64, "learning_rate": 5.945641301213798e-05, "loss": 0.6992, "step": 5665 }, { "epoch": 0.64, "learning_rate": 5.9422764440161414e-05, "loss": 0.6734, "step": 5666 }, { "epoch": 0.64, "learning_rate": 5.938912136709877e-05, "loss": 0.646, "step": 5667 }, { "epoch": 0.64, "learning_rate": 5.935548379750924e-05, "loss": 0.624, "step": 5668 }, { "epoch": 0.64, "learning_rate": 5.932185173595128e-05, "loss": 0.6229, "step": 5669 }, { "epoch": 0.64, "learning_rate": 5.9288225186982626e-05, "loss": 0.6711, "step": 5670 }, { "epoch": 0.64, "learning_rate": 5.9254604155160265e-05, "loss": 0.6984, "step": 5671 }, { "epoch": 0.64, "learning_rate": 5.922098864504041e-05, "loss": 0.6662, "step": 5672 }, { "epoch": 0.64, "learning_rate": 5.918737866117854e-05, "loss": 0.6844, "step": 5673 }, { "epoch": 0.64, "learning_rate": 5.9153774208129444e-05, "loss": 0.7223, "step": 5674 }, { "epoch": 0.65, "learning_rate": 5.912017529044701e-05, "loss": 0.7176, "step": 5675 }, { "epoch": 0.65, "learning_rate": 5.908658191268451e-05, "loss": 0.7315, "step": 5676 }, { "epoch": 0.65, "learning_rate": 5.905299407939443e-05, "loss": 0.6954, "step": 5677 }, { "epoch": 0.65, "learning_rate": 5.90194117951285e-05, "loss": 0.64, "step": 5678 }, { "epoch": 0.65, "learning_rate": 5.8985835064437736e-05, "loss": 0.6604, "step": 5679 }, { "epoch": 0.65, "learning_rate": 5.895226389187227e-05, "loss": 0.6905, "step": 5680 }, { "epoch": 0.65, "learning_rate": 5.891869828198164e-05, "loss": 0.6801, "step": 5681 }, { "epoch": 0.65, "learning_rate": 5.888513823931454e-05, "loss": 0.6473, "step": 5682 }, { "epoch": 0.65, "learning_rate": 5.885158376841895e-05, "loss": 0.6688, "step": 5683 }, { "epoch": 0.65, "learning_rate": 5.8818034873842067e-05, "loss": 0.6719, "step": 5684 }, { "epoch": 0.65, "learning_rate": 5.8784491560130374e-05, "loss": 0.6817, "step": 5685 }, { "epoch": 0.65, "learning_rate": 5.875095383182954e-05, "loss": 0.6496, "step": 5686 }, { "epoch": 0.65, "learning_rate": 5.8717421693484473e-05, "loss": 0.651, "step": 5687 }, { "epoch": 0.65, "learning_rate": 5.8683895149639404e-05, "loss": 0.6856, "step": 5688 }, { "epoch": 0.65, "learning_rate": 5.865037420483773e-05, "loss": 0.6902, "step": 5689 }, { "epoch": 0.65, "learning_rate": 5.861685886362214e-05, "loss": 0.6395, "step": 5690 }, { "epoch": 0.65, "learning_rate": 5.858334913053454e-05, "loss": 0.6617, "step": 5691 }, { "epoch": 0.65, "learning_rate": 5.854984501011604e-05, "loss": 0.6678, "step": 5692 }, { "epoch": 0.65, "learning_rate": 5.851634650690705e-05, "loss": 0.7192, "step": 5693 }, { "epoch": 0.65, "learning_rate": 5.848285362544719e-05, "loss": 0.7385, "step": 5694 }, { "epoch": 0.65, "learning_rate": 5.844936637027531e-05, "loss": 0.6824, "step": 5695 }, { "epoch": 0.65, "learning_rate": 5.8415884745929537e-05, "loss": 0.6644, "step": 5696 }, { "epoch": 0.65, "learning_rate": 5.838240875694724e-05, "loss": 0.6448, "step": 5697 }, { "epoch": 0.65, "learning_rate": 5.8348938407864914e-05, "loss": 0.6328, "step": 5698 }, { "epoch": 0.65, "learning_rate": 5.831547370321837e-05, "loss": 0.6566, "step": 5699 }, { "epoch": 0.65, "learning_rate": 5.82820146475427e-05, "loss": 0.7, "step": 5700 }, { "epoch": 0.65, "learning_rate": 5.824856124537213e-05, "loss": 0.6814, "step": 5701 }, { "epoch": 0.65, "learning_rate": 5.821511350124025e-05, "loss": 0.6134, "step": 5702 }, { "epoch": 0.65, "learning_rate": 5.818167141967976e-05, "loss": 0.6175, "step": 5703 }, { "epoch": 0.65, "learning_rate": 5.81482350052226e-05, "loss": 0.6683, "step": 5704 }, { "epoch": 0.65, "learning_rate": 5.811480426240004e-05, "loss": 0.697, "step": 5705 }, { "epoch": 0.65, "learning_rate": 5.8081379195742455e-05, "loss": 0.7385, "step": 5706 }, { "epoch": 0.65, "learning_rate": 5.804795980977962e-05, "loss": 0.621, "step": 5707 }, { "epoch": 0.65, "learning_rate": 5.801454610904036e-05, "loss": 0.6645, "step": 5708 }, { "epoch": 0.65, "learning_rate": 5.7981138098052836e-05, "loss": 0.7241, "step": 5709 }, { "epoch": 0.65, "learning_rate": 5.794773578134434e-05, "loss": 0.657, "step": 5710 }, { "epoch": 0.65, "learning_rate": 5.7914339163441555e-05, "loss": 0.6952, "step": 5711 }, { "epoch": 0.65, "learning_rate": 5.788094824887023e-05, "loss": 0.6316, "step": 5712 }, { "epoch": 0.65, "learning_rate": 5.7847563042155485e-05, "loss": 0.6545, "step": 5713 }, { "epoch": 0.65, "learning_rate": 5.781418354782153e-05, "loss": 0.7008, "step": 5714 }, { "epoch": 0.65, "learning_rate": 5.7780809770391873e-05, "loss": 0.6684, "step": 5715 }, { "epoch": 0.65, "learning_rate": 5.7747441714389195e-05, "loss": 0.6931, "step": 5716 }, { "epoch": 0.65, "learning_rate": 5.771407938433553e-05, "loss": 0.629, "step": 5717 }, { "epoch": 0.65, "learning_rate": 5.768072278475196e-05, "loss": 0.6532, "step": 5718 }, { "epoch": 0.65, "learning_rate": 5.7647371920158996e-05, "loss": 0.6807, "step": 5719 }, { "epoch": 0.65, "learning_rate": 5.76140267950761e-05, "loss": 0.6474, "step": 5720 }, { "epoch": 0.65, "learning_rate": 5.758068741402223e-05, "loss": 0.6703, "step": 5721 }, { "epoch": 0.65, "learning_rate": 5.7547353781515364e-05, "loss": 0.6839, "step": 5722 }, { "epoch": 0.65, "learning_rate": 5.7514025902072864e-05, "loss": 0.6647, "step": 5723 }, { "epoch": 0.65, "learning_rate": 5.748070378021116e-05, "loss": 0.6553, "step": 5724 }, { "epoch": 0.65, "learning_rate": 5.744738742044602e-05, "loss": 0.6284, "step": 5725 }, { "epoch": 0.65, "learning_rate": 5.741407682729239e-05, "loss": 0.704, "step": 5726 }, { "epoch": 0.65, "learning_rate": 5.738077200526435e-05, "loss": 0.6486, "step": 5727 }, { "epoch": 0.65, "learning_rate": 5.7347472958875384e-05, "loss": 0.6423, "step": 5728 }, { "epoch": 0.65, "learning_rate": 5.7314179692637994e-05, "loss": 0.6829, "step": 5729 }, { "epoch": 0.65, "learning_rate": 5.728089221106408e-05, "loss": 0.6036, "step": 5730 }, { "epoch": 0.65, "learning_rate": 5.72476105186646e-05, "loss": 0.6742, "step": 5731 }, { "epoch": 0.65, "learning_rate": 5.721433461994983e-05, "loss": 0.7237, "step": 5732 }, { "epoch": 0.65, "learning_rate": 5.7181064519429174e-05, "loss": 0.5821, "step": 5733 }, { "epoch": 0.65, "learning_rate": 5.7147800221611366e-05, "loss": 0.6295, "step": 5734 }, { "epoch": 0.65, "learning_rate": 5.7114541731004255e-05, "loss": 0.6132, "step": 5735 }, { "epoch": 0.65, "learning_rate": 5.7081289052115025e-05, "loss": 0.6949, "step": 5736 }, { "epoch": 0.65, "learning_rate": 5.704804218944984e-05, "loss": 0.6679, "step": 5737 }, { "epoch": 0.65, "learning_rate": 5.7014801147514316e-05, "loss": 0.6562, "step": 5738 }, { "epoch": 0.65, "learning_rate": 5.698156593081314e-05, "loss": 0.7074, "step": 5739 }, { "epoch": 0.65, "learning_rate": 5.694833654385032e-05, "loss": 0.6636, "step": 5740 }, { "epoch": 0.65, "learning_rate": 5.6915112991128925e-05, "loss": 0.6709, "step": 5741 }, { "epoch": 0.65, "learning_rate": 5.688189527715145e-05, "loss": 0.6783, "step": 5742 }, { "epoch": 0.65, "learning_rate": 5.6848683406419314e-05, "loss": 0.6499, "step": 5743 }, { "epoch": 0.65, "learning_rate": 5.681547738343339e-05, "loss": 0.6741, "step": 5744 }, { "epoch": 0.65, "learning_rate": 5.67822772126936e-05, "loss": 0.6798, "step": 5745 }, { "epoch": 0.65, "learning_rate": 5.674908289869923e-05, "loss": 0.6525, "step": 5746 }, { "epoch": 0.65, "learning_rate": 5.671589444594859e-05, "loss": 0.7066, "step": 5747 }, { "epoch": 0.65, "learning_rate": 5.6682711858939366e-05, "loss": 0.7165, "step": 5748 }, { "epoch": 0.65, "learning_rate": 5.664953514216833e-05, "loss": 0.6383, "step": 5749 }, { "epoch": 0.65, "learning_rate": 5.6616364300131465e-05, "loss": 0.6913, "step": 5750 }, { "epoch": 0.65, "learning_rate": 5.6583199337324056e-05, "loss": 0.7294, "step": 5751 }, { "epoch": 0.65, "learning_rate": 5.655004025824051e-05, "loss": 0.7319, "step": 5752 }, { "epoch": 0.65, "learning_rate": 5.6516887067374436e-05, "loss": 0.7204, "step": 5753 }, { "epoch": 0.65, "learning_rate": 5.6483739769218615e-05, "loss": 0.5826, "step": 5754 }, { "epoch": 0.65, "learning_rate": 5.645059836826517e-05, "loss": 0.6644, "step": 5755 }, { "epoch": 0.65, "learning_rate": 5.641746286900524e-05, "loss": 0.6347, "step": 5756 }, { "epoch": 0.65, "learning_rate": 5.6384333275929356e-05, "loss": 0.6721, "step": 5757 }, { "epoch": 0.65, "learning_rate": 5.635120959352707e-05, "loss": 0.685, "step": 5758 }, { "epoch": 0.65, "learning_rate": 5.631809182628729e-05, "loss": 0.6193, "step": 5759 }, { "epoch": 0.65, "learning_rate": 5.628497997869793e-05, "loss": 0.6945, "step": 5760 }, { "epoch": 0.65, "learning_rate": 5.62518740552463e-05, "loss": 0.6771, "step": 5761 }, { "epoch": 0.65, "learning_rate": 5.621877406041876e-05, "loss": 0.6652, "step": 5762 }, { "epoch": 0.66, "learning_rate": 5.6185679998701016e-05, "loss": 0.7151, "step": 5763 }, { "epoch": 0.66, "learning_rate": 5.615259187457778e-05, "loss": 0.6821, "step": 5764 }, { "epoch": 0.66, "learning_rate": 5.611950969253321e-05, "loss": 0.6776, "step": 5765 }, { "epoch": 0.66, "learning_rate": 5.6086433457050334e-05, "loss": 0.7034, "step": 5766 }, { "epoch": 0.66, "learning_rate": 5.6053363172611674e-05, "loss": 0.6819, "step": 5767 }, { "epoch": 0.66, "learning_rate": 5.602029884369874e-05, "loss": 0.6691, "step": 5768 }, { "epoch": 0.66, "learning_rate": 5.59872404747924e-05, "loss": 0.6447, "step": 5769 }, { "epoch": 0.66, "learning_rate": 5.595418807037256e-05, "loss": 0.6796, "step": 5770 }, { "epoch": 0.66, "learning_rate": 5.592114163491846e-05, "loss": 0.6501, "step": 5771 }, { "epoch": 0.66, "learning_rate": 5.588810117290843e-05, "loss": 0.6302, "step": 5772 }, { "epoch": 0.66, "learning_rate": 5.5855066688820014e-05, "loss": 0.7463, "step": 5773 }, { "epoch": 0.66, "learning_rate": 5.58220381871299e-05, "loss": 0.6851, "step": 5774 }, { "epoch": 0.66, "learning_rate": 5.578901567231414e-05, "loss": 0.655, "step": 5775 }, { "epoch": 0.66, "learning_rate": 5.575599914884777e-05, "loss": 0.6381, "step": 5776 }, { "epoch": 0.66, "learning_rate": 5.572298862120506e-05, "loss": 0.7203, "step": 5777 }, { "epoch": 0.66, "learning_rate": 5.568998409385961e-05, "loss": 0.5893, "step": 5778 }, { "epoch": 0.66, "learning_rate": 5.5656985571284026e-05, "loss": 0.6727, "step": 5779 }, { "epoch": 0.66, "learning_rate": 5.562399305795023e-05, "loss": 0.7325, "step": 5780 }, { "epoch": 0.66, "learning_rate": 5.559100655832921e-05, "loss": 0.6581, "step": 5781 }, { "epoch": 0.66, "learning_rate": 5.55580260768913e-05, "loss": 0.6284, "step": 5782 }, { "epoch": 0.66, "learning_rate": 5.5525051618105794e-05, "loss": 0.623, "step": 5783 }, { "epoch": 0.66, "learning_rate": 5.5492083186441415e-05, "loss": 0.6668, "step": 5784 }, { "epoch": 0.66, "learning_rate": 5.545912078636586e-05, "loss": 0.6274, "step": 5785 }, { "epoch": 0.66, "learning_rate": 5.542616442234618e-05, "loss": 0.692, "step": 5786 }, { "epoch": 0.66, "learning_rate": 5.5393214098848455e-05, "loss": 0.7076, "step": 5787 }, { "epoch": 0.66, "learning_rate": 5.536026982033815e-05, "loss": 0.704, "step": 5788 }, { "epoch": 0.66, "learning_rate": 5.532733159127963e-05, "loss": 0.6401, "step": 5789 }, { "epoch": 0.66, "learning_rate": 5.5294399416136676e-05, "loss": 0.7181, "step": 5790 }, { "epoch": 0.66, "learning_rate": 5.526147329937211e-05, "loss": 0.6949, "step": 5791 }, { "epoch": 0.66, "learning_rate": 5.5228553245448064e-05, "loss": 0.652, "step": 5792 }, { "epoch": 0.66, "learning_rate": 5.519563925882574e-05, "loss": 0.7241, "step": 5793 }, { "epoch": 0.66, "learning_rate": 5.516273134396552e-05, "loss": 0.6057, "step": 5794 }, { "epoch": 0.66, "learning_rate": 5.512982950532699e-05, "loss": 0.6904, "step": 5795 }, { "epoch": 0.66, "learning_rate": 5.509693374736897e-05, "loss": 0.7135, "step": 5796 }, { "epoch": 0.66, "learning_rate": 5.5064044074549335e-05, "loss": 0.6759, "step": 5797 }, { "epoch": 0.66, "learning_rate": 5.503116049132528e-05, "loss": 0.7157, "step": 5798 }, { "epoch": 0.66, "learning_rate": 5.499828300215305e-05, "loss": 0.6643, "step": 5799 }, { "epoch": 0.66, "learning_rate": 5.496541161148807e-05, "loss": 0.658, "step": 5800 }, { "epoch": 0.66, "learning_rate": 5.4932546323785075e-05, "loss": 0.6388, "step": 5801 }, { "epoch": 0.66, "learning_rate": 5.489968714349778e-05, "loss": 0.6887, "step": 5802 }, { "epoch": 0.66, "learning_rate": 5.486683407507925e-05, "loss": 0.67, "step": 5803 }, { "epoch": 0.66, "learning_rate": 5.4833987122981576e-05, "loss": 0.6386, "step": 5804 }, { "epoch": 0.66, "learning_rate": 5.480114629165619e-05, "loss": 0.6062, "step": 5805 }, { "epoch": 0.66, "learning_rate": 5.476831158555344e-05, "loss": 0.6375, "step": 5806 }, { "epoch": 0.66, "learning_rate": 5.473548300912311e-05, "loss": 0.7333, "step": 5807 }, { "epoch": 0.66, "learning_rate": 5.4702660566813955e-05, "loss": 0.6242, "step": 5808 }, { "epoch": 0.66, "learning_rate": 5.4669844263074064e-05, "loss": 0.6269, "step": 5809 }, { "epoch": 0.66, "learning_rate": 5.463703410235057e-05, "loss": 0.6977, "step": 5810 }, { "epoch": 0.66, "learning_rate": 5.460423008908981e-05, "loss": 0.6998, "step": 5811 }, { "epoch": 0.66, "learning_rate": 5.4571432227737274e-05, "loss": 0.651, "step": 5812 }, { "epoch": 0.66, "learning_rate": 5.453864052273769e-05, "loss": 0.6578, "step": 5813 }, { "epoch": 0.66, "learning_rate": 5.450585497853482e-05, "loss": 0.6276, "step": 5814 }, { "epoch": 0.66, "learning_rate": 5.4473075599571774e-05, "loss": 0.6957, "step": 5815 }, { "epoch": 0.66, "learning_rate": 5.444030239029065e-05, "loss": 0.7109, "step": 5816 }, { "epoch": 0.66, "learning_rate": 5.440753535513281e-05, "loss": 0.6259, "step": 5817 }, { "epoch": 0.66, "learning_rate": 5.437477449853869e-05, "loss": 0.6263, "step": 5818 }, { "epoch": 0.66, "learning_rate": 5.434201982494806e-05, "loss": 0.7053, "step": 5819 }, { "epoch": 0.66, "learning_rate": 5.4309271338799626e-05, "loss": 0.6654, "step": 5820 }, { "epoch": 0.66, "learning_rate": 5.4276529044531463e-05, "loss": 0.6836, "step": 5821 }, { "epoch": 0.66, "learning_rate": 5.4243792946580686e-05, "loss": 0.6098, "step": 5822 }, { "epoch": 0.66, "learning_rate": 5.421106304938356e-05, "loss": 0.6712, "step": 5823 }, { "epoch": 0.66, "learning_rate": 5.417833935737562e-05, "loss": 0.6117, "step": 5824 }, { "epoch": 0.66, "learning_rate": 5.41456218749914e-05, "loss": 0.6483, "step": 5825 }, { "epoch": 0.66, "learning_rate": 5.411291060666479e-05, "loss": 0.6397, "step": 5826 }, { "epoch": 0.66, "learning_rate": 5.408020555682867e-05, "loss": 0.6701, "step": 5827 }, { "epoch": 0.66, "learning_rate": 5.404750672991514e-05, "loss": 0.658, "step": 5828 }, { "epoch": 0.66, "learning_rate": 5.4014814130355404e-05, "loss": 0.6166, "step": 5829 }, { "epoch": 0.66, "learning_rate": 5.398212776257998e-05, "loss": 0.7043, "step": 5830 }, { "epoch": 0.66, "learning_rate": 5.394944763101835e-05, "loss": 0.6331, "step": 5831 }, { "epoch": 0.66, "learning_rate": 5.391677374009927e-05, "loss": 0.7012, "step": 5832 }, { "epoch": 0.66, "learning_rate": 5.388410609425063e-05, "loss": 0.6374, "step": 5833 }, { "epoch": 0.66, "learning_rate": 5.3851444697899425e-05, "loss": 0.6992, "step": 5834 }, { "epoch": 0.66, "learning_rate": 5.3818789555471796e-05, "loss": 0.6399, "step": 5835 }, { "epoch": 0.66, "learning_rate": 5.3786140671393184e-05, "loss": 0.6385, "step": 5836 }, { "epoch": 0.66, "learning_rate": 5.3753498050087966e-05, "loss": 0.6747, "step": 5837 }, { "epoch": 0.66, "learning_rate": 5.372086169597988e-05, "loss": 0.7177, "step": 5838 }, { "epoch": 0.66, "learning_rate": 5.3688231613491656e-05, "loss": 0.6506, "step": 5839 }, { "epoch": 0.66, "learning_rate": 5.365560780704524e-05, "loss": 0.6868, "step": 5840 }, { "epoch": 0.66, "learning_rate": 5.362299028106169e-05, "loss": 0.6776, "step": 5841 }, { "epoch": 0.66, "learning_rate": 5.359037903996131e-05, "loss": 0.6168, "step": 5842 }, { "epoch": 0.66, "learning_rate": 5.3557774088163404e-05, "loss": 0.6634, "step": 5843 }, { "epoch": 0.66, "learning_rate": 5.352517543008658e-05, "loss": 0.6714, "step": 5844 }, { "epoch": 0.66, "learning_rate": 5.349258307014848e-05, "loss": 0.6967, "step": 5845 }, { "epoch": 0.66, "learning_rate": 5.3459997012765916e-05, "loss": 0.665, "step": 5846 }, { "epoch": 0.66, "learning_rate": 5.3427417262354906e-05, "loss": 0.6934, "step": 5847 }, { "epoch": 0.66, "learning_rate": 5.339484382333053e-05, "loss": 0.7139, "step": 5848 }, { "epoch": 0.66, "learning_rate": 5.336227670010703e-05, "loss": 0.684, "step": 5849 }, { "epoch": 0.66, "learning_rate": 5.332971589709787e-05, "loss": 0.6772, "step": 5850 }, { "epoch": 0.67, "learning_rate": 5.329716141871559e-05, "loss": 0.7127, "step": 5851 }, { "epoch": 0.67, "learning_rate": 5.32646132693718e-05, "loss": 0.6653, "step": 5852 }, { "epoch": 0.67, "learning_rate": 5.323207145347744e-05, "loss": 0.6767, "step": 5853 }, { "epoch": 0.67, "learning_rate": 5.3199535975442404e-05, "loss": 0.6766, "step": 5854 }, { "epoch": 0.67, "learning_rate": 5.3167006839675894e-05, "loss": 0.7216, "step": 5855 }, { "epoch": 0.67, "learning_rate": 5.313448405058612e-05, "loss": 0.6534, "step": 5856 }, { "epoch": 0.67, "learning_rate": 5.310196761258047e-05, "loss": 0.7571, "step": 5857 }, { "epoch": 0.67, "learning_rate": 5.306945753006547e-05, "loss": 0.6803, "step": 5858 }, { "epoch": 0.67, "learning_rate": 5.303695380744684e-05, "loss": 0.6279, "step": 5859 }, { "epoch": 0.67, "learning_rate": 5.3004456449129344e-05, "loss": 0.6708, "step": 5860 }, { "epoch": 0.67, "learning_rate": 5.297196545951699e-05, "loss": 0.6774, "step": 5861 }, { "epoch": 0.67, "learning_rate": 5.293948084301284e-05, "loss": 0.6756, "step": 5862 }, { "epoch": 0.67, "learning_rate": 5.2907002604019126e-05, "loss": 0.7132, "step": 5863 }, { "epoch": 0.67, "learning_rate": 5.287453074693716e-05, "loss": 0.683, "step": 5864 }, { "epoch": 0.67, "learning_rate": 5.284206527616751e-05, "loss": 0.6381, "step": 5865 }, { "epoch": 0.67, "learning_rate": 5.280960619610973e-05, "loss": 0.6035, "step": 5866 }, { "epoch": 0.67, "learning_rate": 5.277715351116268e-05, "loss": 0.7136, "step": 5867 }, { "epoch": 0.67, "learning_rate": 5.2744707225724186e-05, "loss": 0.6863, "step": 5868 }, { "epoch": 0.67, "learning_rate": 5.27122673441913e-05, "loss": 0.6959, "step": 5869 }, { "epoch": 0.67, "learning_rate": 5.267983387096015e-05, "loss": 0.7563, "step": 5870 }, { "epoch": 0.67, "learning_rate": 5.2647406810426104e-05, "loss": 0.6389, "step": 5871 }, { "epoch": 0.67, "learning_rate": 5.2614986166983484e-05, "loss": 0.5961, "step": 5872 }, { "epoch": 0.67, "learning_rate": 5.258257194502596e-05, "loss": 0.595, "step": 5873 }, { "epoch": 0.67, "learning_rate": 5.2550164148946155e-05, "loss": 0.6568, "step": 5874 }, { "epoch": 0.67, "learning_rate": 5.251776278313586e-05, "loss": 0.6545, "step": 5875 }, { "epoch": 0.67, "learning_rate": 5.248536785198608e-05, "loss": 0.7091, "step": 5876 }, { "epoch": 0.67, "learning_rate": 5.245297935988682e-05, "loss": 0.6697, "step": 5877 }, { "epoch": 0.67, "learning_rate": 5.242059731122735e-05, "loss": 0.7151, "step": 5878 }, { "epoch": 0.67, "learning_rate": 5.238822171039595e-05, "loss": 0.677, "step": 5879 }, { "epoch": 0.67, "learning_rate": 5.235585256178008e-05, "loss": 0.6966, "step": 5880 }, { "epoch": 0.67, "learning_rate": 5.232348986976627e-05, "loss": 0.7007, "step": 5881 }, { "epoch": 0.67, "learning_rate": 5.229113363874032e-05, "loss": 0.6871, "step": 5882 }, { "epoch": 0.67, "learning_rate": 5.225878387308696e-05, "loss": 0.6306, "step": 5883 }, { "epoch": 0.67, "learning_rate": 5.2226440577190213e-05, "loss": 0.6471, "step": 5884 }, { "epoch": 0.67, "learning_rate": 5.219410375543314e-05, "loss": 0.7084, "step": 5885 }, { "epoch": 0.67, "learning_rate": 5.21617734121979e-05, "loss": 0.7188, "step": 5886 }, { "epoch": 0.67, "learning_rate": 5.212944955186581e-05, "loss": 0.6203, "step": 5887 }, { "epoch": 0.67, "learning_rate": 5.2097132178817356e-05, "loss": 0.5972, "step": 5888 }, { "epoch": 0.67, "learning_rate": 5.206482129743204e-05, "loss": 0.6875, "step": 5889 }, { "epoch": 0.67, "learning_rate": 5.2032516912088646e-05, "loss": 0.6814, "step": 5890 }, { "epoch": 0.67, "learning_rate": 5.200021902716483e-05, "loss": 0.7092, "step": 5891 }, { "epoch": 0.67, "learning_rate": 5.1967927647037614e-05, "loss": 0.6535, "step": 5892 }, { "epoch": 0.67, "learning_rate": 5.193564277608298e-05, "loss": 0.7258, "step": 5893 }, { "epoch": 0.67, "learning_rate": 5.190336441867616e-05, "loss": 0.7124, "step": 5894 }, { "epoch": 0.67, "learning_rate": 5.1871092579191314e-05, "loss": 0.6989, "step": 5895 }, { "epoch": 0.67, "learning_rate": 5.1838827262001944e-05, "loss": 0.654, "step": 5896 }, { "epoch": 0.67, "learning_rate": 5.180656847148051e-05, "loss": 0.7123, "step": 5897 }, { "epoch": 0.67, "learning_rate": 5.1774316211998585e-05, "loss": 0.6239, "step": 5898 }, { "epoch": 0.67, "learning_rate": 5.1742070487927e-05, "loss": 0.6126, "step": 5899 }, { "epoch": 0.67, "learning_rate": 5.17098313036355e-05, "loss": 0.7283, "step": 5900 }, { "epoch": 0.67, "learning_rate": 5.1677598663493155e-05, "loss": 0.7288, "step": 5901 }, { "epoch": 0.67, "learning_rate": 5.1645372571868e-05, "loss": 0.716, "step": 5902 }, { "epoch": 0.67, "learning_rate": 5.1613153033127215e-05, "loss": 0.6403, "step": 5903 }, { "epoch": 0.67, "learning_rate": 5.158094005163706e-05, "loss": 0.6328, "step": 5904 }, { "epoch": 0.67, "learning_rate": 5.1548733631763034e-05, "loss": 0.7136, "step": 5905 }, { "epoch": 0.67, "learning_rate": 5.151653377786958e-05, "loss": 0.6437, "step": 5906 }, { "epoch": 0.67, "learning_rate": 5.148434049432047e-05, "loss": 0.6918, "step": 5907 }, { "epoch": 0.67, "learning_rate": 5.145215378547825e-05, "loss": 0.6312, "step": 5908 }, { "epoch": 0.67, "learning_rate": 5.141997365570492e-05, "loss": 0.7531, "step": 5909 }, { "epoch": 0.67, "learning_rate": 5.1387800109361375e-05, "loss": 0.6401, "step": 5910 }, { "epoch": 0.67, "learning_rate": 5.1355633150807735e-05, "loss": 0.7211, "step": 5911 }, { "epoch": 0.67, "learning_rate": 5.13234727844031e-05, "loss": 0.6948, "step": 5912 }, { "epoch": 0.67, "learning_rate": 5.129131901450588e-05, "loss": 0.6527, "step": 5913 }, { "epoch": 0.67, "learning_rate": 5.125917184547332e-05, "loss": 0.7, "step": 5914 }, { "epoch": 0.67, "learning_rate": 5.122703128166201e-05, "loss": 0.6348, "step": 5915 }, { "epoch": 0.67, "learning_rate": 5.119489732742748e-05, "loss": 0.7559, "step": 5916 }, { "epoch": 0.67, "learning_rate": 5.116276998712451e-05, "loss": 0.6916, "step": 5917 }, { "epoch": 0.67, "learning_rate": 5.113064926510685e-05, "loss": 0.6939, "step": 5918 }, { "epoch": 0.67, "learning_rate": 5.1098535165727445e-05, "loss": 0.7077, "step": 5919 }, { "epoch": 0.67, "learning_rate": 5.1066427693338314e-05, "loss": 0.664, "step": 5920 }, { "epoch": 0.67, "learning_rate": 5.1034326852290506e-05, "loss": 0.7019, "step": 5921 }, { "epoch": 0.67, "learning_rate": 5.1002232646934314e-05, "loss": 0.6705, "step": 5922 }, { "epoch": 0.67, "learning_rate": 5.0970145081619036e-05, "loss": 0.6622, "step": 5923 }, { "epoch": 0.67, "learning_rate": 5.093806416069309e-05, "loss": 0.6689, "step": 5924 }, { "epoch": 0.67, "learning_rate": 5.0905989888503924e-05, "loss": 0.665, "step": 5925 }, { "epoch": 0.67, "learning_rate": 5.087392226939827e-05, "loss": 0.7086, "step": 5926 }, { "epoch": 0.67, "learning_rate": 5.084186130772173e-05, "loss": 0.6757, "step": 5927 }, { "epoch": 0.67, "learning_rate": 5.080980700781922e-05, "loss": 0.6742, "step": 5928 }, { "epoch": 0.67, "learning_rate": 5.077775937403456e-05, "loss": 0.6388, "step": 5929 }, { "epoch": 0.67, "learning_rate": 5.0745718410710874e-05, "loss": 0.6815, "step": 5930 }, { "epoch": 0.67, "learning_rate": 5.071368412219011e-05, "loss": 0.684, "step": 5931 }, { "epoch": 0.67, "learning_rate": 5.068165651281358e-05, "loss": 0.6473, "step": 5932 }, { "epoch": 0.67, "learning_rate": 5.0649635586921495e-05, "loss": 0.727, "step": 5933 }, { "epoch": 0.67, "learning_rate": 5.061762134885333e-05, "loss": 0.6531, "step": 5934 }, { "epoch": 0.67, "learning_rate": 5.0585613802947486e-05, "loss": 0.649, "step": 5935 }, { "epoch": 0.67, "learning_rate": 5.055361295354164e-05, "loss": 0.6537, "step": 5936 }, { "epoch": 0.67, "learning_rate": 5.05216188049723e-05, "loss": 0.6388, "step": 5937 }, { "epoch": 0.67, "learning_rate": 5.048963136157538e-05, "loss": 0.6345, "step": 5938 }, { "epoch": 0.68, "learning_rate": 5.045765062768559e-05, "loss": 0.5872, "step": 5939 }, { "epoch": 0.68, "learning_rate": 5.042567660763701e-05, "loss": 0.6815, "step": 5940 }, { "epoch": 0.68, "learning_rate": 5.039370930576259e-05, "loss": 0.6814, "step": 5941 }, { "epoch": 0.68, "learning_rate": 5.036174872639443e-05, "loss": 0.734, "step": 5942 }, { "epoch": 0.68, "learning_rate": 5.03297948738638e-05, "loss": 0.6539, "step": 5943 }, { "epoch": 0.68, "learning_rate": 5.0297847752500974e-05, "loss": 0.6001, "step": 5944 }, { "epoch": 0.68, "learning_rate": 5.026590736663528e-05, "loss": 0.6472, "step": 5945 }, { "epoch": 0.68, "learning_rate": 5.023397372059528e-05, "loss": 0.666, "step": 5946 }, { "epoch": 0.68, "learning_rate": 5.02020468187085e-05, "loss": 0.6045, "step": 5947 }, { "epoch": 0.68, "learning_rate": 5.017012666530154e-05, "loss": 0.6997, "step": 5948 }, { "epoch": 0.68, "learning_rate": 5.0138213264700204e-05, "loss": 0.6745, "step": 5949 }, { "epoch": 0.68, "learning_rate": 5.010630662122924e-05, "loss": 0.7049, "step": 5950 }, { "epoch": 0.68, "learning_rate": 5.007440673921262e-05, "loss": 0.6492, "step": 5951 }, { "epoch": 0.68, "learning_rate": 5.0042513622973234e-05, "loss": 0.6958, "step": 5952 }, { "epoch": 0.68, "learning_rate": 5.001062727683328e-05, "loss": 0.7121, "step": 5953 }, { "epoch": 0.68, "learning_rate": 4.997874770511376e-05, "loss": 0.623, "step": 5954 }, { "epoch": 0.68, "learning_rate": 4.9946874912135e-05, "loss": 0.6565, "step": 5955 }, { "epoch": 0.68, "learning_rate": 4.9915008902216243e-05, "loss": 0.6775, "step": 5956 }, { "epoch": 0.68, "learning_rate": 4.9883149679675965e-05, "loss": 0.6388, "step": 5957 }, { "epoch": 0.68, "learning_rate": 4.985129724883156e-05, "loss": 0.6551, "step": 5958 }, { "epoch": 0.68, "learning_rate": 4.981945161399969e-05, "loss": 0.7192, "step": 5959 }, { "epoch": 0.68, "learning_rate": 4.978761277949584e-05, "loss": 0.6206, "step": 5960 }, { "epoch": 0.68, "learning_rate": 4.975578074963484e-05, "loss": 0.6612, "step": 5961 }, { "epoch": 0.68, "learning_rate": 4.9723955528730384e-05, "loss": 0.652, "step": 5962 }, { "epoch": 0.68, "learning_rate": 4.969213712109543e-05, "loss": 0.6882, "step": 5963 }, { "epoch": 0.68, "learning_rate": 4.966032553104186e-05, "loss": 0.5714, "step": 5964 }, { "epoch": 0.68, "learning_rate": 4.962852076288073e-05, "loss": 0.6001, "step": 5965 }, { "epoch": 0.68, "learning_rate": 4.959672282092206e-05, "loss": 0.664, "step": 5966 }, { "epoch": 0.68, "learning_rate": 4.9564931709475103e-05, "loss": 0.6889, "step": 5967 }, { "epoch": 0.68, "learning_rate": 4.9533147432848036e-05, "loss": 0.6394, "step": 5968 }, { "epoch": 0.68, "learning_rate": 4.950136999534825e-05, "loss": 0.6352, "step": 5969 }, { "epoch": 0.68, "learning_rate": 4.9469599401282084e-05, "loss": 0.6528, "step": 5970 }, { "epoch": 0.68, "learning_rate": 4.943783565495498e-05, "loss": 0.7264, "step": 5971 }, { "epoch": 0.68, "learning_rate": 4.940607876067153e-05, "loss": 0.5906, "step": 5972 }, { "epoch": 0.68, "learning_rate": 4.9374328722735276e-05, "loss": 0.6992, "step": 5973 }, { "epoch": 0.68, "learning_rate": 4.934258554544897e-05, "loss": 0.7135, "step": 5974 }, { "epoch": 0.68, "learning_rate": 4.931084923311428e-05, "loss": 0.6862, "step": 5975 }, { "epoch": 0.68, "learning_rate": 4.9279119790032135e-05, "loss": 0.6514, "step": 5976 }, { "epoch": 0.68, "learning_rate": 4.924739722050228e-05, "loss": 0.6796, "step": 5977 }, { "epoch": 0.68, "learning_rate": 4.921568152882376e-05, "loss": 0.6159, "step": 5978 }, { "epoch": 0.68, "learning_rate": 4.918397271929454e-05, "loss": 0.6597, "step": 5979 }, { "epoch": 0.68, "learning_rate": 4.9152270796211795e-05, "loss": 0.6213, "step": 5980 }, { "epoch": 0.68, "learning_rate": 4.912057576387162e-05, "loss": 0.6746, "step": 5981 }, { "epoch": 0.68, "learning_rate": 4.9088887626569246e-05, "loss": 0.6759, "step": 5982 }, { "epoch": 0.68, "learning_rate": 4.905720638859892e-05, "loss": 0.7021, "step": 5983 }, { "epoch": 0.68, "learning_rate": 4.902553205425409e-05, "loss": 0.7076, "step": 5984 }, { "epoch": 0.68, "learning_rate": 4.899386462782707e-05, "loss": 0.6752, "step": 5985 }, { "epoch": 0.68, "learning_rate": 4.8962204113609434e-05, "loss": 0.6543, "step": 5986 }, { "epoch": 0.68, "learning_rate": 4.893055051589167e-05, "loss": 0.6863, "step": 5987 }, { "epoch": 0.68, "learning_rate": 4.8898903838963415e-05, "loss": 0.7025, "step": 5988 }, { "epoch": 0.68, "learning_rate": 4.886726408711329e-05, "loss": 0.6697, "step": 5989 }, { "epoch": 0.68, "learning_rate": 4.883563126462909e-05, "loss": 0.6605, "step": 5990 }, { "epoch": 0.68, "learning_rate": 4.8804005375797534e-05, "loss": 0.5945, "step": 5991 }, { "epoch": 0.68, "learning_rate": 4.877238642490456e-05, "loss": 0.687, "step": 5992 }, { "epoch": 0.68, "learning_rate": 4.8740774416235034e-05, "loss": 0.5983, "step": 5993 }, { "epoch": 0.68, "learning_rate": 4.870916935407289e-05, "loss": 0.7228, "step": 5994 }, { "epoch": 0.68, "learning_rate": 4.867757124270125e-05, "loss": 0.6865, "step": 5995 }, { "epoch": 0.68, "learning_rate": 4.86459800864021e-05, "loss": 0.6702, "step": 5996 }, { "epoch": 0.68, "learning_rate": 4.861439588945667e-05, "loss": 0.6609, "step": 5997 }, { "epoch": 0.68, "learning_rate": 4.8582818656145136e-05, "loss": 0.6598, "step": 5998 }, { "epoch": 0.68, "learning_rate": 4.855124839074675e-05, "loss": 0.6154, "step": 5999 }, { "epoch": 0.68, "learning_rate": 4.851968509753978e-05, "loss": 0.6271, "step": 6000 }, { "epoch": 0.68, "learning_rate": 4.848812878080169e-05, "loss": 0.6466, "step": 6001 }, { "epoch": 0.68, "learning_rate": 4.8456579444808804e-05, "loss": 0.6776, "step": 6002 }, { "epoch": 0.68, "learning_rate": 4.842503709383669e-05, "loss": 0.6739, "step": 6003 }, { "epoch": 0.68, "learning_rate": 4.839350173215985e-05, "loss": 0.6791, "step": 6004 }, { "epoch": 0.68, "learning_rate": 4.836197336405185e-05, "loss": 0.6623, "step": 6005 }, { "epoch": 0.68, "learning_rate": 4.8330451993785295e-05, "loss": 0.7201, "step": 6006 }, { "epoch": 0.68, "learning_rate": 4.8298937625631966e-05, "loss": 0.7056, "step": 6007 }, { "epoch": 0.68, "learning_rate": 4.82674302638625e-05, "loss": 0.6937, "step": 6008 }, { "epoch": 0.68, "learning_rate": 4.823592991274678e-05, "loss": 0.656, "step": 6009 }, { "epoch": 0.68, "learning_rate": 4.82044365765536e-05, "loss": 0.6786, "step": 6010 }, { "epoch": 0.68, "learning_rate": 4.8172950259550855e-05, "loss": 0.6374, "step": 6011 }, { "epoch": 0.68, "learning_rate": 4.814147096600543e-05, "loss": 0.687, "step": 6012 }, { "epoch": 0.68, "learning_rate": 4.8109998700183414e-05, "loss": 0.6109, "step": 6013 }, { "epoch": 0.68, "learning_rate": 4.807853346634974e-05, "loss": 0.581, "step": 6014 }, { "epoch": 0.68, "learning_rate": 4.804707526876857e-05, "loss": 0.5962, "step": 6015 }, { "epoch": 0.68, "learning_rate": 4.8015624111703006e-05, "loss": 0.6455, "step": 6016 }, { "epoch": 0.68, "learning_rate": 4.798417999941518e-05, "loss": 0.6749, "step": 6017 }, { "epoch": 0.68, "learning_rate": 4.7952742936166374e-05, "loss": 0.6569, "step": 6018 }, { "epoch": 0.68, "learning_rate": 4.7921312926216824e-05, "loss": 0.6452, "step": 6019 }, { "epoch": 0.68, "learning_rate": 4.78898899738258e-05, "loss": 0.6936, "step": 6020 }, { "epoch": 0.68, "learning_rate": 4.7858474083251716e-05, "loss": 0.6133, "step": 6021 }, { "epoch": 0.68, "learning_rate": 4.7827065258751936e-05, "loss": 0.6735, "step": 6022 }, { "epoch": 0.68, "learning_rate": 4.7795663504582866e-05, "loss": 0.6348, "step": 6023 }, { "epoch": 0.68, "learning_rate": 4.776426882500005e-05, "loss": 0.6377, "step": 6024 }, { "epoch": 0.68, "learning_rate": 4.773288122425793e-05, "loss": 0.5984, "step": 6025 }, { "epoch": 0.68, "learning_rate": 4.770150070661015e-05, "loss": 0.6493, "step": 6026 }, { "epoch": 0.69, "learning_rate": 4.767012727630927e-05, "loss": 0.7291, "step": 6027 }, { "epoch": 0.69, "learning_rate": 4.763876093760693e-05, "loss": 0.6745, "step": 6028 }, { "epoch": 0.69, "learning_rate": 4.7607401694753774e-05, "loss": 0.6619, "step": 6029 }, { "epoch": 0.69, "learning_rate": 4.757604955199959e-05, "loss": 0.7417, "step": 6030 }, { "epoch": 0.69, "learning_rate": 4.7544704513593064e-05, "loss": 0.6408, "step": 6031 }, { "epoch": 0.69, "learning_rate": 4.751336658378205e-05, "loss": 0.7278, "step": 6032 }, { "epoch": 0.69, "learning_rate": 4.748203576681335e-05, "loss": 0.6322, "step": 6033 }, { "epoch": 0.69, "learning_rate": 4.7450712066932824e-05, "loss": 0.5828, "step": 6034 }, { "epoch": 0.69, "learning_rate": 4.7419395488385335e-05, "loss": 0.6347, "step": 6035 }, { "epoch": 0.69, "learning_rate": 4.7388086035414904e-05, "loss": 0.6529, "step": 6036 }, { "epoch": 0.69, "learning_rate": 4.735678371226441e-05, "loss": 0.6029, "step": 6037 }, { "epoch": 0.69, "learning_rate": 4.7325488523175944e-05, "loss": 0.6619, "step": 6038 }, { "epoch": 0.69, "learning_rate": 4.7294200472390504e-05, "loss": 0.6766, "step": 6039 }, { "epoch": 0.69, "learning_rate": 4.726291956414816e-05, "loss": 0.6776, "step": 6040 }, { "epoch": 0.69, "learning_rate": 4.7231645802687954e-05, "loss": 0.6262, "step": 6041 }, { "epoch": 0.69, "learning_rate": 4.7200379192248126e-05, "loss": 0.6985, "step": 6042 }, { "epoch": 0.69, "learning_rate": 4.716911973706575e-05, "loss": 0.6244, "step": 6043 }, { "epoch": 0.69, "learning_rate": 4.713786744137709e-05, "loss": 0.6875, "step": 6044 }, { "epoch": 0.69, "learning_rate": 4.710662230941735e-05, "loss": 0.6307, "step": 6045 }, { "epoch": 0.69, "learning_rate": 4.707538434542072e-05, "loss": 0.6055, "step": 6046 }, { "epoch": 0.69, "learning_rate": 4.704415355362058e-05, "loss": 0.6896, "step": 6047 }, { "epoch": 0.69, "learning_rate": 4.7012929938249164e-05, "loss": 0.6962, "step": 6048 }, { "epoch": 0.69, "learning_rate": 4.698171350353787e-05, "loss": 0.6633, "step": 6049 }, { "epoch": 0.69, "learning_rate": 4.695050425371703e-05, "loss": 0.6904, "step": 6050 }, { "epoch": 0.69, "learning_rate": 4.691930219301605e-05, "loss": 0.6714, "step": 6051 }, { "epoch": 0.69, "learning_rate": 4.688810732566328e-05, "loss": 0.7267, "step": 6052 }, { "epoch": 0.69, "learning_rate": 4.685691965588624e-05, "loss": 0.698, "step": 6053 }, { "epoch": 0.69, "learning_rate": 4.6825739187911354e-05, "loss": 0.6959, "step": 6054 }, { "epoch": 0.69, "learning_rate": 4.67945659259642e-05, "loss": 0.5629, "step": 6055 }, { "epoch": 0.69, "learning_rate": 4.676339987426914e-05, "loss": 0.6603, "step": 6056 }, { "epoch": 0.69, "learning_rate": 4.673224103704983e-05, "loss": 0.6558, "step": 6057 }, { "epoch": 0.69, "learning_rate": 4.670108941852875e-05, "loss": 0.679, "step": 6058 }, { "epoch": 0.69, "learning_rate": 4.666994502292755e-05, "loss": 0.6979, "step": 6059 }, { "epoch": 0.69, "learning_rate": 4.6638807854466783e-05, "loss": 0.6322, "step": 6060 }, { "epoch": 0.69, "learning_rate": 4.660767791736615e-05, "loss": 0.6222, "step": 6061 }, { "epoch": 0.69, "learning_rate": 4.657655521584416e-05, "loss": 0.6663, "step": 6062 }, { "epoch": 0.69, "learning_rate": 4.654543975411859e-05, "loss": 0.622, "step": 6063 }, { "epoch": 0.69, "learning_rate": 4.6514331536406044e-05, "loss": 0.7485, "step": 6064 }, { "epoch": 0.69, "learning_rate": 4.648323056692227e-05, "loss": 0.7586, "step": 6065 }, { "epoch": 0.69, "learning_rate": 4.645213684988195e-05, "loss": 0.7306, "step": 6066 }, { "epoch": 0.69, "learning_rate": 4.642105038949889e-05, "loss": 0.6984, "step": 6067 }, { "epoch": 0.69, "learning_rate": 4.638997118998577e-05, "loss": 0.6814, "step": 6068 }, { "epoch": 0.69, "learning_rate": 4.635889925555433e-05, "loss": 0.7018, "step": 6069 }, { "epoch": 0.69, "learning_rate": 4.632783459041545e-05, "loss": 0.6398, "step": 6070 }, { "epoch": 0.69, "learning_rate": 4.629677719877884e-05, "loss": 0.6359, "step": 6071 }, { "epoch": 0.69, "learning_rate": 4.626572708485337e-05, "loss": 0.6601, "step": 6072 }, { "epoch": 0.69, "learning_rate": 4.623468425284685e-05, "loss": 0.6574, "step": 6073 }, { "epoch": 0.69, "learning_rate": 4.62036487069661e-05, "loss": 0.6073, "step": 6074 }, { "epoch": 0.69, "learning_rate": 4.6172620451416947e-05, "loss": 0.6557, "step": 6075 }, { "epoch": 0.69, "learning_rate": 4.614159949040432e-05, "loss": 0.6162, "step": 6076 }, { "epoch": 0.69, "learning_rate": 4.611058582813203e-05, "loss": 0.6694, "step": 6077 }, { "epoch": 0.69, "learning_rate": 4.6079579468803044e-05, "loss": 0.6833, "step": 6078 }, { "epoch": 0.69, "learning_rate": 4.604858041661915e-05, "loss": 0.6686, "step": 6079 }, { "epoch": 0.69, "learning_rate": 4.601758867578133e-05, "loss": 0.6997, "step": 6080 }, { "epoch": 0.69, "learning_rate": 4.598660425048945e-05, "loss": 0.6764, "step": 6081 }, { "epoch": 0.69, "learning_rate": 4.5955627144942494e-05, "loss": 0.6285, "step": 6082 }, { "epoch": 0.69, "learning_rate": 4.592465736333832e-05, "loss": 0.6675, "step": 6083 }, { "epoch": 0.69, "learning_rate": 4.589369490987398e-05, "loss": 0.6377, "step": 6084 }, { "epoch": 0.69, "learning_rate": 4.5862739788745267e-05, "loss": 0.6708, "step": 6085 }, { "epoch": 0.69, "learning_rate": 4.5831792004147245e-05, "loss": 0.6592, "step": 6086 }, { "epoch": 0.69, "learning_rate": 4.5800851560273795e-05, "loss": 0.6846, "step": 6087 }, { "epoch": 0.69, "learning_rate": 4.576991846131796e-05, "loss": 0.6311, "step": 6088 }, { "epoch": 0.69, "learning_rate": 4.573899271147164e-05, "loss": 0.6373, "step": 6089 }, { "epoch": 0.69, "learning_rate": 4.5708074314925866e-05, "loss": 0.6634, "step": 6090 }, { "epoch": 0.69, "learning_rate": 4.567716327587058e-05, "loss": 0.7223, "step": 6091 }, { "epoch": 0.69, "learning_rate": 4.5646259598494736e-05, "loss": 0.7656, "step": 6092 }, { "epoch": 0.69, "learning_rate": 4.561536328698636e-05, "loss": 0.5862, "step": 6093 }, { "epoch": 0.69, "learning_rate": 4.5584474345532426e-05, "loss": 0.6274, "step": 6094 }, { "epoch": 0.69, "learning_rate": 4.55535927783189e-05, "loss": 0.6485, "step": 6095 }, { "epoch": 0.69, "learning_rate": 4.552271858953073e-05, "loss": 0.6106, "step": 6096 }, { "epoch": 0.69, "learning_rate": 4.549185178335198e-05, "loss": 0.6679, "step": 6097 }, { "epoch": 0.69, "learning_rate": 4.546099236396556e-05, "loss": 0.6687, "step": 6098 }, { "epoch": 0.69, "learning_rate": 4.5430140335553525e-05, "loss": 0.67, "step": 6099 }, { "epoch": 0.69, "learning_rate": 4.5399295702296786e-05, "loss": 0.7388, "step": 6100 }, { "epoch": 0.69, "learning_rate": 4.5368458468375416e-05, "loss": 0.6757, "step": 6101 }, { "epoch": 0.69, "learning_rate": 4.533762863796826e-05, "loss": 0.6047, "step": 6102 }, { "epoch": 0.69, "learning_rate": 4.5306806215253394e-05, "loss": 0.6875, "step": 6103 }, { "epoch": 0.69, "learning_rate": 4.527599120440772e-05, "loss": 0.6297, "step": 6104 }, { "epoch": 0.69, "learning_rate": 4.5245183609607266e-05, "loss": 0.6591, "step": 6105 }, { "epoch": 0.69, "learning_rate": 4.521438343502693e-05, "loss": 0.6648, "step": 6106 }, { "epoch": 0.69, "learning_rate": 4.518359068484077e-05, "loss": 0.6912, "step": 6107 }, { "epoch": 0.69, "learning_rate": 4.5152805363221585e-05, "loss": 0.6996, "step": 6108 }, { "epoch": 0.69, "learning_rate": 4.5122027474341425e-05, "loss": 0.7025, "step": 6109 }, { "epoch": 0.69, "learning_rate": 4.5091257022371145e-05, "loss": 0.6391, "step": 6110 }, { "epoch": 0.69, "learning_rate": 4.506049401148077e-05, "loss": 0.5867, "step": 6111 }, { "epoch": 0.69, "learning_rate": 4.5029738445839143e-05, "loss": 0.6654, "step": 6112 }, { "epoch": 0.69, "learning_rate": 4.4998990329614164e-05, "loss": 0.5917, "step": 6113 }, { "epoch": 0.69, "learning_rate": 4.4968249666972806e-05, "loss": 0.6721, "step": 6114 }, { "epoch": 0.7, "learning_rate": 4.4937516462080906e-05, "loss": 0.6884, "step": 6115 }, { "epoch": 0.7, "learning_rate": 4.4906790719103306e-05, "loss": 0.6749, "step": 6116 }, { "epoch": 0.7, "learning_rate": 4.4876072442203964e-05, "loss": 0.7152, "step": 6117 }, { "epoch": 0.7, "learning_rate": 4.484536163554568e-05, "loss": 0.6469, "step": 6118 }, { "epoch": 0.7, "learning_rate": 4.481465830329027e-05, "loss": 0.6029, "step": 6119 }, { "epoch": 0.7, "learning_rate": 4.478396244959862e-05, "loss": 0.6821, "step": 6120 }, { "epoch": 0.7, "learning_rate": 4.4753274078630515e-05, "loss": 0.6911, "step": 6121 }, { "epoch": 0.7, "learning_rate": 4.4722593194544784e-05, "loss": 0.651, "step": 6122 }, { "epoch": 0.7, "learning_rate": 4.469191980149917e-05, "loss": 0.5917, "step": 6123 }, { "epoch": 0.7, "learning_rate": 4.4661253903650544e-05, "loss": 0.6359, "step": 6124 }, { "epoch": 0.7, "learning_rate": 4.463059550515452e-05, "loss": 0.6375, "step": 6125 }, { "epoch": 0.7, "learning_rate": 4.4599944610165943e-05, "loss": 0.7071, "step": 6126 }, { "epoch": 0.7, "learning_rate": 4.4569301222838474e-05, "loss": 0.6646, "step": 6127 }, { "epoch": 0.7, "learning_rate": 4.453866534732489e-05, "loss": 0.6338, "step": 6128 }, { "epoch": 0.7, "learning_rate": 4.4508036987776836e-05, "loss": 0.6805, "step": 6129 }, { "epoch": 0.7, "learning_rate": 4.4477416148344986e-05, "loss": 0.6958, "step": 6130 }, { "epoch": 0.7, "learning_rate": 4.444680283317896e-05, "loss": 0.6645, "step": 6131 }, { "epoch": 0.7, "learning_rate": 4.4416197046427457e-05, "loss": 0.6576, "step": 6132 }, { "epoch": 0.7, "learning_rate": 4.4385598792238005e-05, "loss": 0.655, "step": 6133 }, { "epoch": 0.7, "learning_rate": 4.4355008074757285e-05, "loss": 0.6463, "step": 6134 }, { "epoch": 0.7, "learning_rate": 4.4324424898130824e-05, "loss": 0.6986, "step": 6135 }, { "epoch": 0.7, "learning_rate": 4.429384926650316e-05, "loss": 0.668, "step": 6136 }, { "epoch": 0.7, "learning_rate": 4.426328118401779e-05, "loss": 0.6931, "step": 6137 }, { "epoch": 0.7, "learning_rate": 4.423272065481728e-05, "loss": 0.6247, "step": 6138 }, { "epoch": 0.7, "learning_rate": 4.420216768304305e-05, "loss": 0.6702, "step": 6139 }, { "epoch": 0.7, "learning_rate": 4.417162227283561e-05, "loss": 0.7296, "step": 6140 }, { "epoch": 0.7, "learning_rate": 4.4141084428334356e-05, "loss": 0.6597, "step": 6141 }, { "epoch": 0.7, "learning_rate": 4.411055415367766e-05, "loss": 0.6729, "step": 6142 }, { "epoch": 0.7, "learning_rate": 4.408003145300298e-05, "loss": 0.6992, "step": 6143 }, { "epoch": 0.7, "learning_rate": 4.404951633044657e-05, "loss": 0.6784, "step": 6144 }, { "epoch": 0.7, "learning_rate": 4.401900879014386e-05, "loss": 0.6973, "step": 6145 }, { "epoch": 0.7, "learning_rate": 4.3988508836229045e-05, "loss": 0.649, "step": 6146 }, { "epoch": 0.7, "learning_rate": 4.3958016472835515e-05, "loss": 0.6384, "step": 6147 }, { "epoch": 0.7, "learning_rate": 4.392753170409537e-05, "loss": 0.666, "step": 6148 }, { "epoch": 0.7, "learning_rate": 4.389705453413992e-05, "loss": 0.6258, "step": 6149 }, { "epoch": 0.7, "learning_rate": 4.386658496709928e-05, "loss": 0.6831, "step": 6150 }, { "epoch": 0.7, "learning_rate": 4.383612300710267e-05, "loss": 0.6313, "step": 6151 }, { "epoch": 0.7, "learning_rate": 4.380566865827818e-05, "loss": 0.605, "step": 6152 }, { "epoch": 0.7, "learning_rate": 4.377522192475289e-05, "loss": 0.6173, "step": 6153 }, { "epoch": 0.7, "learning_rate": 4.374478281065282e-05, "loss": 0.6625, "step": 6154 }, { "epoch": 0.7, "learning_rate": 4.3714351320103063e-05, "loss": 0.5955, "step": 6155 }, { "epoch": 0.7, "learning_rate": 4.3683927457227556e-05, "loss": 0.6469, "step": 6156 }, { "epoch": 0.7, "learning_rate": 4.3653511226149315e-05, "loss": 0.6234, "step": 6157 }, { "epoch": 0.7, "learning_rate": 4.362310263099023e-05, "loss": 0.6527, "step": 6158 }, { "epoch": 0.7, "learning_rate": 4.3592701675871187e-05, "loss": 0.6807, "step": 6159 }, { "epoch": 0.7, "learning_rate": 4.3562308364911995e-05, "loss": 0.6246, "step": 6160 }, { "epoch": 0.7, "learning_rate": 4.353192270223156e-05, "loss": 0.6451, "step": 6161 }, { "epoch": 0.7, "learning_rate": 4.350154469194758e-05, "loss": 0.5998, "step": 6162 }, { "epoch": 0.7, "learning_rate": 4.347117433817687e-05, "loss": 0.6905, "step": 6163 }, { "epoch": 0.7, "learning_rate": 4.344081164503511e-05, "loss": 0.6622, "step": 6164 }, { "epoch": 0.7, "learning_rate": 4.341045661663691e-05, "loss": 0.7388, "step": 6165 }, { "epoch": 0.7, "learning_rate": 4.338010925709599e-05, "loss": 0.6362, "step": 6166 }, { "epoch": 0.7, "learning_rate": 4.3349769570524854e-05, "loss": 0.6587, "step": 6167 }, { "epoch": 0.7, "learning_rate": 4.331943756103514e-05, "loss": 0.7081, "step": 6168 }, { "epoch": 0.7, "learning_rate": 4.328911323273731e-05, "loss": 0.58, "step": 6169 }, { "epoch": 0.7, "learning_rate": 4.325879658974084e-05, "loss": 0.6317, "step": 6170 }, { "epoch": 0.7, "learning_rate": 4.322848763615411e-05, "loss": 0.6857, "step": 6171 }, { "epoch": 0.7, "learning_rate": 4.3198186376084584e-05, "loss": 0.6975, "step": 6172 }, { "epoch": 0.7, "learning_rate": 4.316789281363853e-05, "loss": 0.6504, "step": 6173 }, { "epoch": 0.7, "learning_rate": 4.313760695292133e-05, "loss": 0.6966, "step": 6174 }, { "epoch": 0.7, "learning_rate": 4.310732879803718e-05, "loss": 0.6763, "step": 6175 }, { "epoch": 0.7, "learning_rate": 4.3077058353089316e-05, "loss": 0.6285, "step": 6176 }, { "epoch": 0.7, "learning_rate": 4.304679562217986e-05, "loss": 0.552, "step": 6177 }, { "epoch": 0.7, "learning_rate": 4.301654060941e-05, "loss": 0.7033, "step": 6178 }, { "epoch": 0.7, "learning_rate": 4.2986293318879735e-05, "loss": 0.6929, "step": 6179 }, { "epoch": 0.7, "learning_rate": 4.2956053754688174e-05, "loss": 0.6398, "step": 6180 }, { "epoch": 0.7, "learning_rate": 4.2925821920933264e-05, "loss": 0.6104, "step": 6181 }, { "epoch": 0.7, "learning_rate": 4.289559782171193e-05, "loss": 0.6587, "step": 6182 }, { "epoch": 0.7, "learning_rate": 4.286538146112003e-05, "loss": 0.6768, "step": 6183 }, { "epoch": 0.7, "learning_rate": 4.283517284325248e-05, "loss": 0.6547, "step": 6184 }, { "epoch": 0.7, "learning_rate": 4.280497197220298e-05, "loss": 0.6558, "step": 6185 }, { "epoch": 0.7, "learning_rate": 4.277477885206433e-05, "loss": 0.7224, "step": 6186 }, { "epoch": 0.7, "learning_rate": 4.274459348692822e-05, "loss": 0.6761, "step": 6187 }, { "epoch": 0.7, "learning_rate": 4.2714415880885215e-05, "loss": 0.6919, "step": 6188 }, { "epoch": 0.7, "learning_rate": 4.268424603802499e-05, "loss": 0.6325, "step": 6189 }, { "epoch": 0.7, "learning_rate": 4.2654083962436045e-05, "loss": 0.6205, "step": 6190 }, { "epoch": 0.7, "learning_rate": 4.26239296582058e-05, "loss": 0.6833, "step": 6191 }, { "epoch": 0.7, "learning_rate": 4.2593783129420785e-05, "loss": 0.6852, "step": 6192 }, { "epoch": 0.7, "learning_rate": 4.256364438016631e-05, "loss": 0.6739, "step": 6193 }, { "epoch": 0.7, "learning_rate": 4.253351341452668e-05, "loss": 0.663, "step": 6194 }, { "epoch": 0.7, "learning_rate": 4.2503390236585216e-05, "loss": 0.6929, "step": 6195 }, { "epoch": 0.7, "learning_rate": 4.2473274850424075e-05, "loss": 0.6316, "step": 6196 }, { "epoch": 0.7, "learning_rate": 4.244316726012446e-05, "loss": 0.6541, "step": 6197 }, { "epoch": 0.7, "learning_rate": 4.241306746976644e-05, "loss": 0.6359, "step": 6198 }, { "epoch": 0.7, "learning_rate": 4.238297548342907e-05, "loss": 0.6563, "step": 6199 }, { "epoch": 0.7, "learning_rate": 4.235289130519027e-05, "loss": 0.644, "step": 6200 }, { "epoch": 0.7, "learning_rate": 4.2322814939127044e-05, "loss": 0.6472, "step": 6201 }, { "epoch": 0.7, "learning_rate": 4.2292746389315196e-05, "loss": 0.629, "step": 6202 }, { "epoch": 0.71, "learning_rate": 4.2262685659829596e-05, "loss": 0.672, "step": 6203 }, { "epoch": 0.71, "learning_rate": 4.2232632754743965e-05, "loss": 0.6954, "step": 6204 }, { "epoch": 0.71, "learning_rate": 4.2202587678130965e-05, "loss": 0.7136, "step": 6205 }, { "epoch": 0.71, "learning_rate": 4.217255043406221e-05, "loss": 0.6456, "step": 6206 }, { "epoch": 0.71, "learning_rate": 4.2142521026608316e-05, "loss": 0.6337, "step": 6207 }, { "epoch": 0.71, "learning_rate": 4.211249945983873e-05, "loss": 0.6482, "step": 6208 }, { "epoch": 0.71, "learning_rate": 4.2082485737821955e-05, "loss": 0.6652, "step": 6209 }, { "epoch": 0.71, "learning_rate": 4.205247986462533e-05, "loss": 0.6986, "step": 6210 }, { "epoch": 0.71, "learning_rate": 4.2022481844315165e-05, "loss": 0.6409, "step": 6211 }, { "epoch": 0.71, "learning_rate": 4.199249168095668e-05, "loss": 0.733, "step": 6212 }, { "epoch": 0.71, "learning_rate": 4.196250937861412e-05, "loss": 0.6626, "step": 6213 }, { "epoch": 0.71, "learning_rate": 4.1932534941350545e-05, "loss": 0.5879, "step": 6214 }, { "epoch": 0.71, "learning_rate": 4.190256837322807e-05, "loss": 0.726, "step": 6215 }, { "epoch": 0.71, "learning_rate": 4.187260967830764e-05, "loss": 0.6819, "step": 6216 }, { "epoch": 0.71, "learning_rate": 4.1842658860649155e-05, "loss": 0.6924, "step": 6217 }, { "epoch": 0.71, "learning_rate": 4.181271592431152e-05, "loss": 0.7203, "step": 6218 }, { "epoch": 0.71, "learning_rate": 4.1782780873352444e-05, "loss": 0.673, "step": 6219 }, { "epoch": 0.71, "learning_rate": 4.1752853711828745e-05, "loss": 0.6254, "step": 6220 }, { "epoch": 0.71, "learning_rate": 4.1722934443795994e-05, "loss": 0.6712, "step": 6221 }, { "epoch": 0.71, "learning_rate": 4.169302307330879e-05, "loss": 0.6431, "step": 6222 }, { "epoch": 0.71, "learning_rate": 4.1663119604420596e-05, "loss": 0.6889, "step": 6223 }, { "epoch": 0.71, "learning_rate": 4.163322404118391e-05, "loss": 0.7308, "step": 6224 }, { "epoch": 0.71, "learning_rate": 4.160333638765005e-05, "loss": 0.691, "step": 6225 }, { "epoch": 0.71, "learning_rate": 4.157345664786938e-05, "loss": 0.7012, "step": 6226 }, { "epoch": 0.71, "learning_rate": 4.1543584825891e-05, "loss": 0.6276, "step": 6227 }, { "epoch": 0.71, "learning_rate": 4.1513720925763166e-05, "loss": 0.6041, "step": 6228 }, { "epoch": 0.71, "learning_rate": 4.148386495153286e-05, "loss": 0.6943, "step": 6229 }, { "epoch": 0.71, "learning_rate": 4.1454016907246165e-05, "loss": 0.7281, "step": 6230 }, { "epoch": 0.71, "learning_rate": 4.142417679694793e-05, "loss": 0.6257, "step": 6231 }, { "epoch": 0.71, "learning_rate": 4.1394344624682114e-05, "loss": 0.6857, "step": 6232 }, { "epoch": 0.71, "learning_rate": 4.1364520394491346e-05, "loss": 0.7038, "step": 6233 }, { "epoch": 0.71, "learning_rate": 4.133470411041742e-05, "loss": 0.6751, "step": 6234 }, { "epoch": 0.71, "learning_rate": 4.13048957765009e-05, "loss": 0.7119, "step": 6235 }, { "epoch": 0.71, "learning_rate": 4.127509539678138e-05, "loss": 0.6454, "step": 6236 }, { "epoch": 0.71, "learning_rate": 4.124530297529727e-05, "loss": 0.669, "step": 6237 }, { "epoch": 0.71, "learning_rate": 4.121551851608603e-05, "loss": 0.6752, "step": 6238 }, { "epoch": 0.71, "learning_rate": 4.118574202318392e-05, "loss": 0.7675, "step": 6239 }, { "epoch": 0.71, "learning_rate": 4.115597350062612e-05, "loss": 0.6218, "step": 6240 }, { "epoch": 0.71, "learning_rate": 4.1126212952446874e-05, "loss": 0.7131, "step": 6241 }, { "epoch": 0.71, "learning_rate": 4.109646038267917e-05, "loss": 0.6301, "step": 6242 }, { "epoch": 0.71, "learning_rate": 4.106671579535509e-05, "loss": 0.7722, "step": 6243 }, { "epoch": 0.71, "learning_rate": 4.103697919450542e-05, "loss": 0.637, "step": 6244 }, { "epoch": 0.71, "learning_rate": 4.100725058416005e-05, "loss": 0.6354, "step": 6245 }, { "epoch": 0.71, "learning_rate": 4.097752996834768e-05, "loss": 0.7078, "step": 6246 }, { "epoch": 0.71, "learning_rate": 4.094781735109602e-05, "loss": 0.7064, "step": 6247 }, { "epoch": 0.71, "learning_rate": 4.091811273643157e-05, "loss": 0.6926, "step": 6248 }, { "epoch": 0.71, "learning_rate": 4.0888416128379936e-05, "loss": 0.6544, "step": 6249 }, { "epoch": 0.71, "learning_rate": 4.085872753096536e-05, "loss": 0.6683, "step": 6250 }, { "epoch": 0.71, "learning_rate": 4.082904694821127e-05, "loss": 0.6491, "step": 6251 }, { "epoch": 0.71, "learning_rate": 4.079937438413983e-05, "loss": 0.7116, "step": 6252 }, { "epoch": 0.71, "learning_rate": 4.0769709842772265e-05, "loss": 0.7049, "step": 6253 }, { "epoch": 0.71, "learning_rate": 4.0740053328128534e-05, "loss": 0.7107, "step": 6254 }, { "epoch": 0.71, "learning_rate": 4.071040484422772e-05, "loss": 0.6652, "step": 6255 }, { "epoch": 0.71, "learning_rate": 4.068076439508758e-05, "loss": 0.7212, "step": 6256 }, { "epoch": 0.71, "learning_rate": 4.065113198472499e-05, "loss": 0.6957, "step": 6257 }, { "epoch": 0.71, "learning_rate": 4.0621507617155595e-05, "loss": 0.5956, "step": 6258 }, { "epoch": 0.71, "learning_rate": 4.0591891296394056e-05, "loss": 0.6319, "step": 6259 }, { "epoch": 0.71, "learning_rate": 4.056228302645385e-05, "loss": 0.6758, "step": 6260 }, { "epoch": 0.71, "learning_rate": 4.0532682811347466e-05, "loss": 0.6976, "step": 6261 }, { "epoch": 0.71, "learning_rate": 4.050309065508621e-05, "loss": 0.617, "step": 6262 }, { "epoch": 0.71, "learning_rate": 4.047350656168029e-05, "loss": 0.6072, "step": 6263 }, { "epoch": 0.71, "learning_rate": 4.044393053513892e-05, "loss": 0.6104, "step": 6264 }, { "epoch": 0.71, "learning_rate": 4.041436257947015e-05, "loss": 0.7453, "step": 6265 }, { "epoch": 0.71, "learning_rate": 4.038480269868091e-05, "loss": 0.6585, "step": 6266 }, { "epoch": 0.71, "learning_rate": 4.0355250896777084e-05, "loss": 0.6522, "step": 6267 }, { "epoch": 0.71, "learning_rate": 4.0325707177763496e-05, "loss": 0.6501, "step": 6268 }, { "epoch": 0.71, "learning_rate": 4.029617154564375e-05, "loss": 0.6948, "step": 6269 }, { "epoch": 0.71, "learning_rate": 4.0266644004420515e-05, "loss": 0.6546, "step": 6270 }, { "epoch": 0.71, "learning_rate": 4.023712455809521e-05, "loss": 0.6364, "step": 6271 }, { "epoch": 0.71, "learning_rate": 4.020761321066833e-05, "loss": 0.6845, "step": 6272 }, { "epoch": 0.71, "learning_rate": 4.017810996613903e-05, "loss": 0.683, "step": 6273 }, { "epoch": 0.71, "learning_rate": 4.014861482850563e-05, "loss": 0.6644, "step": 6274 }, { "epoch": 0.71, "learning_rate": 4.011912780176512e-05, "loss": 0.6469, "step": 6275 }, { "epoch": 0.71, "learning_rate": 4.00896488899136e-05, "loss": 0.6842, "step": 6276 }, { "epoch": 0.71, "learning_rate": 4.00601780969459e-05, "loss": 0.6823, "step": 6277 }, { "epoch": 0.71, "learning_rate": 4.0030715426855915e-05, "loss": 0.6156, "step": 6278 }, { "epoch": 0.71, "learning_rate": 4.0001260883636205e-05, "loss": 0.6235, "step": 6279 }, { "epoch": 0.71, "learning_rate": 3.997181447127848e-05, "loss": 0.6876, "step": 6280 }, { "epoch": 0.71, "learning_rate": 3.9942376193773146e-05, "loss": 0.7068, "step": 6281 }, { "epoch": 0.71, "learning_rate": 3.991294605510969e-05, "loss": 0.6302, "step": 6282 }, { "epoch": 0.71, "learning_rate": 3.9883524059276366e-05, "loss": 0.6416, "step": 6283 }, { "epoch": 0.71, "learning_rate": 3.985411021026031e-05, "loss": 0.633, "step": 6284 }, { "epoch": 0.71, "learning_rate": 3.9824704512047676e-05, "loss": 0.681, "step": 6285 }, { "epoch": 0.71, "learning_rate": 3.979530696862343e-05, "loss": 0.7183, "step": 6286 }, { "epoch": 0.71, "learning_rate": 3.9765917583971366e-05, "loss": 0.644, "step": 6287 }, { "epoch": 0.71, "learning_rate": 3.973653636207437e-05, "loss": 0.6626, "step": 6288 }, { "epoch": 0.71, "learning_rate": 3.970716330691405e-05, "loss": 0.664, "step": 6289 }, { "epoch": 0.71, "learning_rate": 3.967779842247091e-05, "loss": 0.6998, "step": 6290 }, { "epoch": 0.72, "learning_rate": 3.964844171272449e-05, "loss": 0.715, "step": 6291 }, { "epoch": 0.72, "learning_rate": 3.9619093181653055e-05, "loss": 0.6478, "step": 6292 }, { "epoch": 0.72, "learning_rate": 3.958975283323389e-05, "loss": 0.5991, "step": 6293 }, { "epoch": 0.72, "learning_rate": 3.956042067144307e-05, "loss": 0.6568, "step": 6294 }, { "epoch": 0.72, "learning_rate": 3.95310967002557e-05, "loss": 0.6756, "step": 6295 }, { "epoch": 0.72, "learning_rate": 3.950178092364554e-05, "loss": 0.6328, "step": 6296 }, { "epoch": 0.72, "learning_rate": 3.947247334558548e-05, "loss": 0.7203, "step": 6297 }, { "epoch": 0.72, "learning_rate": 3.9443173970047164e-05, "loss": 0.691, "step": 6298 }, { "epoch": 0.72, "learning_rate": 3.94138828010012e-05, "loss": 0.6803, "step": 6299 }, { "epoch": 0.72, "learning_rate": 3.9384599842417024e-05, "loss": 0.5977, "step": 6300 }, { "epoch": 0.72, "learning_rate": 3.935532509826297e-05, "loss": 0.7569, "step": 6301 }, { "epoch": 0.72, "learning_rate": 3.932605857250625e-05, "loss": 0.7314, "step": 6302 }, { "epoch": 0.72, "learning_rate": 3.929680026911305e-05, "loss": 0.716, "step": 6303 }, { "epoch": 0.72, "learning_rate": 3.9267550192048295e-05, "loss": 0.6945, "step": 6304 }, { "epoch": 0.72, "learning_rate": 3.923830834527594e-05, "loss": 0.7262, "step": 6305 }, { "epoch": 0.72, "learning_rate": 3.920907473275874e-05, "loss": 0.6674, "step": 6306 }, { "epoch": 0.72, "learning_rate": 3.917984935845834e-05, "loss": 0.6894, "step": 6307 }, { "epoch": 0.72, "learning_rate": 3.915063222633526e-05, "loss": 0.6326, "step": 6308 }, { "epoch": 0.72, "learning_rate": 3.9121423340348976e-05, "loss": 0.7489, "step": 6309 }, { "epoch": 0.72, "learning_rate": 3.909222270445774e-05, "loss": 0.6913, "step": 6310 }, { "epoch": 0.72, "learning_rate": 3.90630303226188e-05, "loss": 0.5864, "step": 6311 }, { "epoch": 0.72, "learning_rate": 3.9033846198788195e-05, "loss": 0.6774, "step": 6312 }, { "epoch": 0.72, "learning_rate": 3.9004670336920833e-05, "loss": 0.6635, "step": 6313 }, { "epoch": 0.72, "learning_rate": 3.897550274097064e-05, "loss": 0.7004, "step": 6314 }, { "epoch": 0.72, "learning_rate": 3.894634341489023e-05, "loss": 0.6594, "step": 6315 }, { "epoch": 0.72, "learning_rate": 3.891719236263128e-05, "loss": 0.6068, "step": 6316 }, { "epoch": 0.72, "learning_rate": 3.8888049588144224e-05, "loss": 0.684, "step": 6317 }, { "epoch": 0.72, "learning_rate": 3.88589150953784e-05, "loss": 0.7038, "step": 6318 }, { "epoch": 0.72, "learning_rate": 3.8829788888282e-05, "loss": 0.6704, "step": 6319 }, { "epoch": 0.72, "learning_rate": 3.880067097080221e-05, "loss": 0.5903, "step": 6320 }, { "epoch": 0.72, "learning_rate": 3.877156134688492e-05, "loss": 0.7266, "step": 6321 }, { "epoch": 0.72, "learning_rate": 3.874246002047507e-05, "loss": 0.647, "step": 6322 }, { "epoch": 0.72, "learning_rate": 3.871336699551634e-05, "loss": 0.6393, "step": 6323 }, { "epoch": 0.72, "learning_rate": 3.8684282275951356e-05, "loss": 0.6292, "step": 6324 }, { "epoch": 0.72, "learning_rate": 3.865520586572155e-05, "loss": 0.6686, "step": 6325 }, { "epoch": 0.72, "learning_rate": 3.862613776876735e-05, "loss": 0.6879, "step": 6326 }, { "epoch": 0.72, "learning_rate": 3.8597077989027904e-05, "loss": 0.6519, "step": 6327 }, { "epoch": 0.72, "learning_rate": 3.8568026530441405e-05, "loss": 0.7062, "step": 6328 }, { "epoch": 0.72, "learning_rate": 3.8538983396944764e-05, "loss": 0.6767, "step": 6329 }, { "epoch": 0.72, "learning_rate": 3.8509948592473844e-05, "loss": 0.6891, "step": 6330 }, { "epoch": 0.72, "learning_rate": 3.848092212096331e-05, "loss": 0.659, "step": 6331 }, { "epoch": 0.72, "learning_rate": 3.845190398634684e-05, "loss": 0.698, "step": 6332 }, { "epoch": 0.72, "learning_rate": 3.8422894192556804e-05, "loss": 0.7046, "step": 6333 }, { "epoch": 0.72, "learning_rate": 3.839389274352461e-05, "loss": 0.6699, "step": 6334 }, { "epoch": 0.72, "learning_rate": 3.8364899643180394e-05, "loss": 0.6676, "step": 6335 }, { "epoch": 0.72, "learning_rate": 3.833591489545322e-05, "loss": 0.6433, "step": 6336 }, { "epoch": 0.72, "learning_rate": 3.8306938504271065e-05, "loss": 0.6232, "step": 6337 }, { "epoch": 0.72, "learning_rate": 3.827797047356068e-05, "loss": 0.69, "step": 6338 }, { "epoch": 0.72, "learning_rate": 3.824901080724776e-05, "loss": 0.7041, "step": 6339 }, { "epoch": 0.72, "learning_rate": 3.822005950925685e-05, "loss": 0.6581, "step": 6340 }, { "epoch": 0.72, "learning_rate": 3.8191116583511346e-05, "loss": 0.7256, "step": 6341 }, { "epoch": 0.72, "learning_rate": 3.8162182033933444e-05, "loss": 0.6848, "step": 6342 }, { "epoch": 0.72, "learning_rate": 3.8133255864444373e-05, "loss": 0.6796, "step": 6343 }, { "epoch": 0.72, "learning_rate": 3.810433807896404e-05, "loss": 0.7082, "step": 6344 }, { "epoch": 0.72, "learning_rate": 3.807542868141138e-05, "loss": 0.6453, "step": 6345 }, { "epoch": 0.72, "learning_rate": 3.804652767570408e-05, "loss": 0.654, "step": 6346 }, { "epoch": 0.72, "learning_rate": 3.8017635065758714e-05, "loss": 0.6577, "step": 6347 }, { "epoch": 0.72, "learning_rate": 3.798875085549071e-05, "loss": 0.666, "step": 6348 }, { "epoch": 0.72, "learning_rate": 3.795987504881443e-05, "loss": 0.6755, "step": 6349 }, { "epoch": 0.72, "learning_rate": 3.793100764964299e-05, "loss": 0.6607, "step": 6350 }, { "epoch": 0.72, "learning_rate": 3.790214866188847e-05, "loss": 0.665, "step": 6351 }, { "epoch": 0.72, "learning_rate": 3.787329808946174e-05, "loss": 0.6417, "step": 6352 }, { "epoch": 0.72, "learning_rate": 3.784445593627254e-05, "loss": 0.6267, "step": 6353 }, { "epoch": 0.72, "learning_rate": 3.781562220622944e-05, "loss": 0.7063, "step": 6354 }, { "epoch": 0.72, "learning_rate": 3.7786796903239985e-05, "loss": 0.6774, "step": 6355 }, { "epoch": 0.72, "learning_rate": 3.775798003121044e-05, "loss": 0.6695, "step": 6356 }, { "epoch": 0.72, "learning_rate": 3.772917159404603e-05, "loss": 0.648, "step": 6357 }, { "epoch": 0.72, "learning_rate": 3.7700371595650777e-05, "loss": 0.6913, "step": 6358 }, { "epoch": 0.72, "learning_rate": 3.7671580039927546e-05, "loss": 0.6446, "step": 6359 }, { "epoch": 0.72, "learning_rate": 3.764279693077815e-05, "loss": 0.6307, "step": 6360 }, { "epoch": 0.72, "learning_rate": 3.7614022272103144e-05, "loss": 0.6723, "step": 6361 }, { "epoch": 0.72, "learning_rate": 3.7585256067801986e-05, "loss": 0.617, "step": 6362 }, { "epoch": 0.72, "learning_rate": 3.755649832177305e-05, "loss": 0.6933, "step": 6363 }, { "epoch": 0.72, "learning_rate": 3.752774903791346e-05, "loss": 0.5971, "step": 6364 }, { "epoch": 0.72, "learning_rate": 3.749900822011923e-05, "loss": 0.6053, "step": 6365 }, { "epoch": 0.72, "learning_rate": 3.747027587228527e-05, "loss": 0.742, "step": 6366 }, { "epoch": 0.72, "learning_rate": 3.7441551998305256e-05, "loss": 0.6076, "step": 6367 }, { "epoch": 0.72, "learning_rate": 3.7412836602071846e-05, "loss": 0.6799, "step": 6368 }, { "epoch": 0.72, "learning_rate": 3.738412968747642e-05, "loss": 0.653, "step": 6369 }, { "epoch": 0.72, "learning_rate": 3.735543125840927e-05, "loss": 0.6225, "step": 6370 }, { "epoch": 0.72, "learning_rate": 3.7326741318759486e-05, "loss": 0.6371, "step": 6371 }, { "epoch": 0.72, "learning_rate": 3.7298059872415125e-05, "loss": 0.6725, "step": 6372 }, { "epoch": 0.72, "learning_rate": 3.726938692326294e-05, "loss": 0.5805, "step": 6373 }, { "epoch": 0.72, "learning_rate": 3.7240722475188706e-05, "loss": 0.6522, "step": 6374 }, { "epoch": 0.72, "learning_rate": 3.721206653207683e-05, "loss": 0.6361, "step": 6375 }, { "epoch": 0.72, "learning_rate": 3.7183419097810776e-05, "loss": 0.6101, "step": 6376 }, { "epoch": 0.72, "learning_rate": 3.715478017627271e-05, "loss": 0.6505, "step": 6377 }, { "epoch": 0.72, "learning_rate": 3.712614977134374e-05, "loss": 0.6889, "step": 6378 }, { "epoch": 0.73, "learning_rate": 3.709752788690374e-05, "loss": 0.657, "step": 6379 }, { "epoch": 0.73, "learning_rate": 3.706891452683151e-05, "loss": 0.6697, "step": 6380 }, { "epoch": 0.73, "learning_rate": 3.704030969500464e-05, "loss": 0.5967, "step": 6381 }, { "epoch": 0.73, "learning_rate": 3.701171339529956e-05, "loss": 0.6701, "step": 6382 }, { "epoch": 0.73, "learning_rate": 3.698312563159155e-05, "loss": 0.6485, "step": 6383 }, { "epoch": 0.73, "learning_rate": 3.6954546407754796e-05, "loss": 0.6286, "step": 6384 }, { "epoch": 0.73, "learning_rate": 3.69259757276622e-05, "loss": 0.6814, "step": 6385 }, { "epoch": 0.73, "learning_rate": 3.6897413595185657e-05, "loss": 0.6722, "step": 6386 }, { "epoch": 0.73, "learning_rate": 3.6868860014195804e-05, "loss": 0.6294, "step": 6387 }, { "epoch": 0.73, "learning_rate": 3.6840314988562095e-05, "loss": 0.6696, "step": 6388 }, { "epoch": 0.73, "learning_rate": 3.681177852215294e-05, "loss": 0.6753, "step": 6389 }, { "epoch": 0.73, "learning_rate": 3.678325061883546e-05, "loss": 0.6639, "step": 6390 }, { "epoch": 0.73, "learning_rate": 3.675473128247575e-05, "loss": 0.6582, "step": 6391 }, { "epoch": 0.73, "learning_rate": 3.6726220516938626e-05, "loss": 0.6467, "step": 6392 }, { "epoch": 0.73, "learning_rate": 3.6697718326087785e-05, "loss": 0.7021, "step": 6393 }, { "epoch": 0.73, "learning_rate": 3.6669224713785744e-05, "loss": 0.7141, "step": 6394 }, { "epoch": 0.73, "learning_rate": 3.664073968389393e-05, "loss": 0.6275, "step": 6395 }, { "epoch": 0.73, "learning_rate": 3.6612263240272504e-05, "loss": 0.6853, "step": 6396 }, { "epoch": 0.73, "learning_rate": 3.658379538678061e-05, "loss": 0.589, "step": 6397 }, { "epoch": 0.73, "learning_rate": 3.655533612727599e-05, "loss": 0.6, "step": 6398 }, { "epoch": 0.73, "learning_rate": 3.652688546561546e-05, "loss": 0.6541, "step": 6399 }, { "epoch": 0.73, "learning_rate": 3.649844340565453e-05, "loss": 0.6813, "step": 6400 }, { "epoch": 0.73, "learning_rate": 3.647000995124763e-05, "loss": 0.6134, "step": 6401 }, { "epoch": 0.73, "learning_rate": 3.6441585106247936e-05, "loss": 0.6381, "step": 6402 }, { "epoch": 0.73, "learning_rate": 3.64131688745076e-05, "loss": 0.5949, "step": 6403 }, { "epoch": 0.73, "learning_rate": 3.638476125987736e-05, "loss": 0.7045, "step": 6404 }, { "epoch": 0.73, "learning_rate": 3.635636226620706e-05, "loss": 0.679, "step": 6405 }, { "epoch": 0.73, "learning_rate": 3.632797189734517e-05, "loss": 0.6105, "step": 6406 }, { "epoch": 0.73, "learning_rate": 3.629959015713914e-05, "loss": 0.6786, "step": 6407 }, { "epoch": 0.73, "learning_rate": 3.627121704943513e-05, "loss": 0.6532, "step": 6408 }, { "epoch": 0.73, "learning_rate": 3.624285257807825e-05, "loss": 0.5905, "step": 6409 }, { "epoch": 0.73, "learning_rate": 3.621449674691233e-05, "loss": 0.6739, "step": 6410 }, { "epoch": 0.73, "learning_rate": 3.618614955978005e-05, "loss": 0.6545, "step": 6411 }, { "epoch": 0.73, "learning_rate": 3.6157811020523e-05, "loss": 0.6838, "step": 6412 }, { "epoch": 0.73, "learning_rate": 3.612948113298148e-05, "loss": 0.7281, "step": 6413 }, { "epoch": 0.73, "learning_rate": 3.610115990099476e-05, "loss": 0.7023, "step": 6414 }, { "epoch": 0.73, "learning_rate": 3.607284732840075e-05, "loss": 0.6724, "step": 6415 }, { "epoch": 0.73, "learning_rate": 3.604454341903638e-05, "loss": 0.6316, "step": 6416 }, { "epoch": 0.73, "learning_rate": 3.601624817673723e-05, "loss": 0.7359, "step": 6417 }, { "epoch": 0.73, "learning_rate": 3.598796160533789e-05, "loss": 0.6751, "step": 6418 }, { "epoch": 0.73, "learning_rate": 3.59596837086716e-05, "loss": 0.6625, "step": 6419 }, { "epoch": 0.73, "learning_rate": 3.5931414490570595e-05, "loss": 0.6587, "step": 6420 }, { "epoch": 0.73, "learning_rate": 3.59031539548657e-05, "loss": 0.6714, "step": 6421 }, { "epoch": 0.73, "learning_rate": 3.587490210538682e-05, "loss": 0.6942, "step": 6422 }, { "epoch": 0.73, "learning_rate": 3.5846658945962494e-05, "loss": 0.7186, "step": 6423 }, { "epoch": 0.73, "learning_rate": 3.581842448042022e-05, "loss": 0.6381, "step": 6424 }, { "epoch": 0.73, "learning_rate": 3.5790198712586195e-05, "loss": 0.7617, "step": 6425 }, { "epoch": 0.73, "learning_rate": 3.5761981646285606e-05, "loss": 0.6647, "step": 6426 }, { "epoch": 0.73, "learning_rate": 3.5733773285342184e-05, "loss": 0.6634, "step": 6427 }, { "epoch": 0.73, "learning_rate": 3.570557363357878e-05, "loss": 0.6932, "step": 6428 }, { "epoch": 0.73, "learning_rate": 3.567738269481685e-05, "loss": 0.6747, "step": 6429 }, { "epoch": 0.73, "learning_rate": 3.564920047287682e-05, "loss": 0.6585, "step": 6430 }, { "epoch": 0.73, "learning_rate": 3.562102697157784e-05, "loss": 0.6355, "step": 6431 }, { "epoch": 0.73, "learning_rate": 3.559286219473786e-05, "loss": 0.7241, "step": 6432 }, { "epoch": 0.73, "learning_rate": 3.5564706146173775e-05, "loss": 0.6571, "step": 6433 }, { "epoch": 0.73, "learning_rate": 3.553655882970113e-05, "loss": 0.6757, "step": 6434 }, { "epoch": 0.73, "learning_rate": 3.5508420249134435e-05, "loss": 0.6918, "step": 6435 }, { "epoch": 0.73, "learning_rate": 3.548029040828694e-05, "loss": 0.6059, "step": 6436 }, { "epoch": 0.73, "learning_rate": 3.5452169310970706e-05, "loss": 0.7075, "step": 6437 }, { "epoch": 0.73, "learning_rate": 3.54240569609966e-05, "loss": 0.7188, "step": 6438 }, { "epoch": 0.73, "learning_rate": 3.53959533621744e-05, "loss": 0.6469, "step": 6439 }, { "epoch": 0.73, "learning_rate": 3.5367858518312534e-05, "loss": 0.6648, "step": 6440 }, { "epoch": 0.73, "learning_rate": 3.533977243321844e-05, "loss": 0.6837, "step": 6441 }, { "epoch": 0.73, "learning_rate": 3.5311695110698176e-05, "loss": 0.66, "step": 6442 }, { "epoch": 0.73, "learning_rate": 3.5283626554556814e-05, "loss": 0.6159, "step": 6443 }, { "epoch": 0.73, "learning_rate": 3.525556676859799e-05, "loss": 0.7172, "step": 6444 }, { "epoch": 0.73, "learning_rate": 3.5227515756624386e-05, "loss": 0.6924, "step": 6445 }, { "epoch": 0.73, "learning_rate": 3.519947352243732e-05, "loss": 0.6497, "step": 6446 }, { "epoch": 0.73, "learning_rate": 3.517144006983708e-05, "loss": 0.6187, "step": 6447 }, { "epoch": 0.73, "learning_rate": 3.514341540262262e-05, "loss": 0.6988, "step": 6448 }, { "epoch": 0.73, "learning_rate": 3.5115399524591855e-05, "loss": 0.6674, "step": 6449 }, { "epoch": 0.73, "learning_rate": 3.508739243954127e-05, "loss": 0.6417, "step": 6450 }, { "epoch": 0.73, "learning_rate": 3.505939415126643e-05, "loss": 0.6493, "step": 6451 }, { "epoch": 0.73, "learning_rate": 3.503140466356151e-05, "loss": 0.6572, "step": 6452 }, { "epoch": 0.73, "learning_rate": 3.500342398021964e-05, "loss": 0.6651, "step": 6453 }, { "epoch": 0.73, "learning_rate": 3.4975452105032634e-05, "loss": 0.6345, "step": 6454 }, { "epoch": 0.73, "learning_rate": 3.494748904179115e-05, "loss": 0.623, "step": 6455 }, { "epoch": 0.73, "learning_rate": 3.491953479428471e-05, "loss": 0.6633, "step": 6456 }, { "epoch": 0.73, "learning_rate": 3.489158936630159e-05, "loss": 0.6101, "step": 6457 }, { "epoch": 0.73, "learning_rate": 3.4863652761628816e-05, "loss": 0.6538, "step": 6458 }, { "epoch": 0.73, "learning_rate": 3.4835724984052366e-05, "loss": 0.7071, "step": 6459 }, { "epoch": 0.73, "learning_rate": 3.4807806037356896e-05, "loss": 0.6233, "step": 6460 }, { "epoch": 0.73, "learning_rate": 3.477989592532586e-05, "loss": 0.6547, "step": 6461 }, { "epoch": 0.73, "learning_rate": 3.4751994651741626e-05, "loss": 0.6903, "step": 6462 }, { "epoch": 0.73, "learning_rate": 3.4724102220385234e-05, "loss": 0.732, "step": 6463 }, { "epoch": 0.73, "learning_rate": 3.469621863503667e-05, "loss": 0.6268, "step": 6464 }, { "epoch": 0.73, "learning_rate": 3.466834389947455e-05, "loss": 0.6016, "step": 6465 }, { "epoch": 0.73, "learning_rate": 3.464047801747649e-05, "loss": 0.6541, "step": 6466 }, { "epoch": 0.74, "learning_rate": 3.461262099281868e-05, "loss": 0.7046, "step": 6467 }, { "epoch": 0.74, "learning_rate": 3.458477282927629e-05, "loss": 0.6519, "step": 6468 }, { "epoch": 0.74, "learning_rate": 3.455693353062319e-05, "loss": 0.6868, "step": 6469 }, { "epoch": 0.74, "learning_rate": 3.4529103100632145e-05, "loss": 0.6141, "step": 6470 }, { "epoch": 0.74, "learning_rate": 3.4501281543074614e-05, "loss": 0.6342, "step": 6471 }, { "epoch": 0.74, "learning_rate": 3.4473468861720905e-05, "loss": 0.6722, "step": 6472 }, { "epoch": 0.74, "learning_rate": 3.444566506034007e-05, "loss": 0.6303, "step": 6473 }, { "epoch": 0.74, "learning_rate": 3.4417870142700094e-05, "loss": 0.667, "step": 6474 }, { "epoch": 0.74, "learning_rate": 3.4390084112567566e-05, "loss": 0.6951, "step": 6475 }, { "epoch": 0.74, "learning_rate": 3.436230697370807e-05, "loss": 0.6852, "step": 6476 }, { "epoch": 0.74, "learning_rate": 3.4334538729885836e-05, "loss": 0.6748, "step": 6477 }, { "epoch": 0.74, "learning_rate": 3.430677938486395e-05, "loss": 0.6987, "step": 6478 }, { "epoch": 0.74, "learning_rate": 3.4279028942404234e-05, "loss": 0.6653, "step": 6479 }, { "epoch": 0.74, "learning_rate": 3.425128740626742e-05, "loss": 0.6606, "step": 6480 }, { "epoch": 0.74, "learning_rate": 3.4223554780212906e-05, "loss": 0.6749, "step": 6481 }, { "epoch": 0.74, "learning_rate": 3.4195831067999e-05, "loss": 0.646, "step": 6482 }, { "epoch": 0.74, "learning_rate": 3.416811627338271e-05, "loss": 0.6986, "step": 6483 }, { "epoch": 0.74, "learning_rate": 3.4140410400119835e-05, "loss": 0.6546, "step": 6484 }, { "epoch": 0.74, "learning_rate": 3.411271345196506e-05, "loss": 0.6751, "step": 6485 }, { "epoch": 0.74, "learning_rate": 3.4085025432671746e-05, "loss": 0.6669, "step": 6486 }, { "epoch": 0.74, "learning_rate": 3.4057346345992145e-05, "loss": 0.6405, "step": 6487 }, { "epoch": 0.74, "learning_rate": 3.4029676195677226e-05, "loss": 0.6964, "step": 6488 }, { "epoch": 0.74, "learning_rate": 3.400201498547677e-05, "loss": 0.6289, "step": 6489 }, { "epoch": 0.74, "learning_rate": 3.397436271913932e-05, "loss": 0.6721, "step": 6490 }, { "epoch": 0.74, "learning_rate": 3.3946719400412285e-05, "loss": 0.6509, "step": 6491 }, { "epoch": 0.74, "learning_rate": 3.391908503304175e-05, "loss": 0.6042, "step": 6492 }, { "epoch": 0.74, "learning_rate": 3.389145962077273e-05, "loss": 0.6632, "step": 6493 }, { "epoch": 0.74, "learning_rate": 3.3863843167348886e-05, "loss": 0.6771, "step": 6494 }, { "epoch": 0.74, "learning_rate": 3.383623567651273e-05, "loss": 0.681, "step": 6495 }, { "epoch": 0.74, "learning_rate": 3.380863715200553e-05, "loss": 0.6196, "step": 6496 }, { "epoch": 0.74, "learning_rate": 3.3781047597567415e-05, "loss": 0.6201, "step": 6497 }, { "epoch": 0.74, "learning_rate": 3.375346701693719e-05, "loss": 0.694, "step": 6498 }, { "epoch": 0.74, "learning_rate": 3.372589541385256e-05, "loss": 0.6757, "step": 6499 }, { "epoch": 0.74, "learning_rate": 3.3698332792049914e-05, "loss": 0.6109, "step": 6500 }, { "epoch": 0.74, "learning_rate": 3.3670779155264465e-05, "loss": 0.611, "step": 6501 }, { "epoch": 0.74, "learning_rate": 3.364323450723017e-05, "loss": 0.6862, "step": 6502 }, { "epoch": 0.74, "learning_rate": 3.3615698851679863e-05, "loss": 0.6646, "step": 6503 }, { "epoch": 0.74, "learning_rate": 3.3588172192345056e-05, "loss": 0.6046, "step": 6504 }, { "epoch": 0.74, "learning_rate": 3.3560654532956125e-05, "loss": 0.6473, "step": 6505 }, { "epoch": 0.74, "learning_rate": 3.353314587724217e-05, "loss": 0.6116, "step": 6506 }, { "epoch": 0.74, "learning_rate": 3.3505646228931056e-05, "loss": 0.7111, "step": 6507 }, { "epoch": 0.74, "learning_rate": 3.347815559174951e-05, "loss": 0.6854, "step": 6508 }, { "epoch": 0.74, "learning_rate": 3.345067396942292e-05, "loss": 0.7108, "step": 6509 }, { "epoch": 0.74, "learning_rate": 3.342320136567561e-05, "loss": 0.6445, "step": 6510 }, { "epoch": 0.74, "learning_rate": 3.339573778423053e-05, "loss": 0.664, "step": 6511 }, { "epoch": 0.74, "learning_rate": 3.336828322880948e-05, "loss": 0.635, "step": 6512 }, { "epoch": 0.74, "learning_rate": 3.3340837703133e-05, "loss": 0.6548, "step": 6513 }, { "epoch": 0.74, "learning_rate": 3.331340121092048e-05, "loss": 0.7124, "step": 6514 }, { "epoch": 0.74, "learning_rate": 3.328597375588998e-05, "loss": 0.5983, "step": 6515 }, { "epoch": 0.74, "learning_rate": 3.325855534175846e-05, "loss": 0.7236, "step": 6516 }, { "epoch": 0.74, "learning_rate": 3.323114597224154e-05, "loss": 0.6474, "step": 6517 }, { "epoch": 0.74, "learning_rate": 3.3203745651053686e-05, "loss": 0.6849, "step": 6518 }, { "epoch": 0.74, "learning_rate": 3.317635438190806e-05, "loss": 0.6873, "step": 6519 }, { "epoch": 0.74, "learning_rate": 3.314897216851673e-05, "loss": 0.6288, "step": 6520 }, { "epoch": 0.74, "learning_rate": 3.3121599014590375e-05, "loss": 0.6182, "step": 6521 }, { "epoch": 0.74, "learning_rate": 3.309423492383862e-05, "loss": 0.6574, "step": 6522 }, { "epoch": 0.74, "learning_rate": 3.3066879899969704e-05, "loss": 0.6998, "step": 6523 }, { "epoch": 0.74, "learning_rate": 3.3039533946690735e-05, "loss": 0.6743, "step": 6524 }, { "epoch": 0.74, "learning_rate": 3.3012197067707505e-05, "loss": 0.6848, "step": 6525 }, { "epoch": 0.74, "learning_rate": 3.2984869266724704e-05, "loss": 0.651, "step": 6526 }, { "epoch": 0.74, "learning_rate": 3.295755054744567e-05, "loss": 0.6696, "step": 6527 }, { "epoch": 0.74, "learning_rate": 3.29302409135726e-05, "loss": 0.6229, "step": 6528 }, { "epoch": 0.74, "learning_rate": 3.29029403688064e-05, "loss": 0.6803, "step": 6529 }, { "epoch": 0.74, "learning_rate": 3.287564891684672e-05, "loss": 0.6078, "step": 6530 }, { "epoch": 0.74, "learning_rate": 3.284836656139211e-05, "loss": 0.6334, "step": 6531 }, { "epoch": 0.74, "learning_rate": 3.282109330613975e-05, "loss": 0.5847, "step": 6532 }, { "epoch": 0.74, "learning_rate": 3.2793829154785605e-05, "loss": 0.6516, "step": 6533 }, { "epoch": 0.74, "learning_rate": 3.276657411102449e-05, "loss": 0.7093, "step": 6534 }, { "epoch": 0.74, "learning_rate": 3.273932817854992e-05, "loss": 0.6089, "step": 6535 }, { "epoch": 0.74, "learning_rate": 3.2712091361054153e-05, "loss": 0.6816, "step": 6536 }, { "epoch": 0.74, "learning_rate": 3.26848636622283e-05, "loss": 0.6675, "step": 6537 }, { "epoch": 0.74, "learning_rate": 3.265764508576212e-05, "loss": 0.6438, "step": 6538 }, { "epoch": 0.74, "learning_rate": 3.263043563534428e-05, "loss": 0.6461, "step": 6539 }, { "epoch": 0.74, "learning_rate": 3.260323531466207e-05, "loss": 0.7124, "step": 6540 }, { "epoch": 0.74, "learning_rate": 3.257604412740163e-05, "loss": 0.6466, "step": 6541 }, { "epoch": 0.74, "learning_rate": 3.254886207724778e-05, "loss": 0.5833, "step": 6542 }, { "epoch": 0.74, "learning_rate": 3.2521689167884214e-05, "loss": 0.713, "step": 6543 }, { "epoch": 0.74, "learning_rate": 3.249452540299329e-05, "loss": 0.624, "step": 6544 }, { "epoch": 0.74, "learning_rate": 3.246737078625626e-05, "loss": 0.7089, "step": 6545 }, { "epoch": 0.74, "learning_rate": 3.244022532135289e-05, "loss": 0.6951, "step": 6546 }, { "epoch": 0.74, "learning_rate": 3.2413089011961975e-05, "loss": 0.7116, "step": 6547 }, { "epoch": 0.74, "learning_rate": 3.238596186176087e-05, "loss": 0.7113, "step": 6548 }, { "epoch": 0.74, "learning_rate": 3.235884387442586e-05, "loss": 0.6575, "step": 6549 }, { "epoch": 0.74, "learning_rate": 3.2331735053631805e-05, "loss": 0.6808, "step": 6550 }, { "epoch": 0.74, "learning_rate": 3.230463540305251e-05, "loss": 0.6708, "step": 6551 }, { "epoch": 0.74, "learning_rate": 3.227754492636039e-05, "loss": 0.6799, "step": 6552 }, { "epoch": 0.74, "learning_rate": 3.225046362722668e-05, "loss": 0.6476, "step": 6553 }, { "epoch": 0.74, "learning_rate": 3.2223391509321334e-05, "loss": 0.6506, "step": 6554 }, { "epoch": 0.75, "learning_rate": 3.219632857631315e-05, "loss": 0.6544, "step": 6555 }, { "epoch": 0.75, "learning_rate": 3.2169274831869546e-05, "loss": 0.6157, "step": 6556 }, { "epoch": 0.75, "learning_rate": 3.214223027965686e-05, "loss": 0.5679, "step": 6557 }, { "epoch": 0.75, "learning_rate": 3.211519492334004e-05, "loss": 0.6378, "step": 6558 }, { "epoch": 0.75, "learning_rate": 3.2088168766582816e-05, "loss": 0.6413, "step": 6559 }, { "epoch": 0.75, "learning_rate": 3.2061151813047766e-05, "loss": 0.6059, "step": 6560 }, { "epoch": 0.75, "learning_rate": 3.203414406639608e-05, "loss": 0.7102, "step": 6561 }, { "epoch": 0.75, "learning_rate": 3.2007145530287874e-05, "loss": 0.6769, "step": 6562 }, { "epoch": 0.75, "learning_rate": 3.1980156208381796e-05, "loss": 0.6977, "step": 6563 }, { "epoch": 0.75, "learning_rate": 3.195317610433545e-05, "loss": 0.6218, "step": 6564 }, { "epoch": 0.75, "learning_rate": 3.192620522180503e-05, "loss": 0.6281, "step": 6565 }, { "epoch": 0.75, "learning_rate": 3.189924356444564e-05, "loss": 0.6686, "step": 6566 }, { "epoch": 0.75, "learning_rate": 3.187229113591096e-05, "loss": 0.6647, "step": 6567 }, { "epoch": 0.75, "learning_rate": 3.184534793985362e-05, "loss": 0.691, "step": 6568 }, { "epoch": 0.75, "learning_rate": 3.181841397992477e-05, "loss": 0.6956, "step": 6569 }, { "epoch": 0.75, "learning_rate": 3.17914892597745e-05, "loss": 0.6639, "step": 6570 }, { "epoch": 0.75, "learning_rate": 3.176457378305151e-05, "loss": 0.629, "step": 6571 }, { "epoch": 0.75, "learning_rate": 3.1737667553403395e-05, "loss": 0.6954, "step": 6572 }, { "epoch": 0.75, "learning_rate": 3.1710770574476325e-05, "loss": 0.609, "step": 6573 }, { "epoch": 0.75, "learning_rate": 3.1683882849915415e-05, "loss": 0.657, "step": 6574 }, { "epoch": 0.75, "learning_rate": 3.1657004383364276e-05, "loss": 0.6614, "step": 6575 }, { "epoch": 0.75, "learning_rate": 3.16301351784655e-05, "loss": 0.7054, "step": 6576 }, { "epoch": 0.75, "learning_rate": 3.160327523886028e-05, "loss": 0.5986, "step": 6577 }, { "epoch": 0.75, "learning_rate": 3.1576424568188634e-05, "loss": 0.6492, "step": 6578 }, { "epoch": 0.75, "learning_rate": 3.154958317008926e-05, "loss": 0.7353, "step": 6579 }, { "epoch": 0.75, "learning_rate": 3.152275104819966e-05, "loss": 0.6467, "step": 6580 }, { "epoch": 0.75, "learning_rate": 3.149592820615604e-05, "loss": 0.6388, "step": 6581 }, { "epoch": 0.75, "learning_rate": 3.1469114647593326e-05, "loss": 0.6761, "step": 6582 }, { "epoch": 0.75, "learning_rate": 3.144231037614526e-05, "loss": 0.7091, "step": 6583 }, { "epoch": 0.75, "learning_rate": 3.141551539544424e-05, "loss": 0.6313, "step": 6584 }, { "epoch": 0.75, "learning_rate": 3.138872970912152e-05, "loss": 0.6629, "step": 6585 }, { "epoch": 0.75, "learning_rate": 3.136195332080691e-05, "loss": 0.6628, "step": 6586 }, { "epoch": 0.75, "learning_rate": 3.1335186234129176e-05, "loss": 0.6622, "step": 6587 }, { "epoch": 0.75, "learning_rate": 3.130842845271564e-05, "loss": 0.6949, "step": 6588 }, { "epoch": 0.75, "learning_rate": 3.12816799801925e-05, "loss": 0.6547, "step": 6589 }, { "epoch": 0.75, "learning_rate": 3.12549408201846e-05, "loss": 0.6275, "step": 6590 }, { "epoch": 0.75, "learning_rate": 3.122821097631562e-05, "loss": 0.6589, "step": 6591 }, { "epoch": 0.75, "learning_rate": 3.120149045220779e-05, "loss": 0.6286, "step": 6592 }, { "epoch": 0.75, "learning_rate": 3.1174779251482314e-05, "loss": 0.6092, "step": 6593 }, { "epoch": 0.75, "learning_rate": 3.1148077377758945e-05, "loss": 0.6571, "step": 6594 }, { "epoch": 0.75, "learning_rate": 3.112138483465632e-05, "loss": 0.6969, "step": 6595 }, { "epoch": 0.75, "learning_rate": 3.1094701625791657e-05, "loss": 0.6839, "step": 6596 }, { "epoch": 0.75, "learning_rate": 3.106802775478111e-05, "loss": 0.6661, "step": 6597 }, { "epoch": 0.75, "learning_rate": 3.1041363225239284e-05, "loss": 0.7052, "step": 6598 }, { "epoch": 0.75, "learning_rate": 3.1014708040779807e-05, "loss": 0.6559, "step": 6599 }, { "epoch": 0.75, "learning_rate": 3.098806220501484e-05, "loss": 0.6776, "step": 6600 }, { "epoch": 0.75, "learning_rate": 3.096142572155544e-05, "loss": 0.6979, "step": 6601 }, { "epoch": 0.75, "learning_rate": 3.093479859401124e-05, "loss": 0.6935, "step": 6602 }, { "epoch": 0.75, "learning_rate": 3.090818082599065e-05, "loss": 0.6492, "step": 6603 }, { "epoch": 0.75, "learning_rate": 3.088157242110092e-05, "loss": 0.7006, "step": 6604 }, { "epoch": 0.75, "learning_rate": 3.085497338294788e-05, "loss": 0.6757, "step": 6605 }, { "epoch": 0.75, "learning_rate": 3.08283837151362e-05, "loss": 0.6869, "step": 6606 }, { "epoch": 0.75, "learning_rate": 3.080180342126923e-05, "loss": 0.7023, "step": 6607 }, { "epoch": 0.75, "learning_rate": 3.077523250494904e-05, "loss": 0.6499, "step": 6608 }, { "epoch": 0.75, "learning_rate": 3.0748670969776414e-05, "loss": 0.6247, "step": 6609 }, { "epoch": 0.75, "learning_rate": 3.072211881935097e-05, "loss": 0.6526, "step": 6610 }, { "epoch": 0.75, "learning_rate": 3.0695576057270926e-05, "loss": 0.6757, "step": 6611 }, { "epoch": 0.75, "learning_rate": 3.066904268713333e-05, "loss": 0.6863, "step": 6612 }, { "epoch": 0.75, "learning_rate": 3.064251871253385e-05, "loss": 0.6426, "step": 6613 }, { "epoch": 0.75, "learning_rate": 3.0616004137067045e-05, "loss": 0.6437, "step": 6614 }, { "epoch": 0.75, "learning_rate": 3.058949896432597e-05, "loss": 0.6363, "step": 6615 }, { "epoch": 0.75, "learning_rate": 3.056300319790261e-05, "loss": 0.6851, "step": 6616 }, { "epoch": 0.75, "learning_rate": 3.053651684138755e-05, "loss": 0.6444, "step": 6617 }, { "epoch": 0.75, "learning_rate": 3.0510039898370202e-05, "loss": 0.6554, "step": 6618 }, { "epoch": 0.75, "learning_rate": 3.048357237243863e-05, "loss": 0.6475, "step": 6619 }, { "epoch": 0.75, "learning_rate": 3.045711426717962e-05, "loss": 0.6939, "step": 6620 }, { "epoch": 0.75, "learning_rate": 3.0430665586178676e-05, "loss": 0.6918, "step": 6621 }, { "epoch": 0.75, "learning_rate": 3.0404226333020114e-05, "loss": 0.7068, "step": 6622 }, { "epoch": 0.75, "learning_rate": 3.037779651128686e-05, "loss": 0.6608, "step": 6623 }, { "epoch": 0.75, "learning_rate": 3.035137612456065e-05, "loss": 0.6512, "step": 6624 }, { "epoch": 0.75, "learning_rate": 3.032496517642187e-05, "loss": 0.6915, "step": 6625 }, { "epoch": 0.75, "learning_rate": 3.029856367044964e-05, "loss": 0.7042, "step": 6626 }, { "epoch": 0.75, "learning_rate": 3.027217161022189e-05, "loss": 0.6342, "step": 6627 }, { "epoch": 0.75, "learning_rate": 3.0245788999315138e-05, "loss": 0.6699, "step": 6628 }, { "epoch": 0.75, "learning_rate": 3.0219415841304675e-05, "loss": 0.7365, "step": 6629 }, { "epoch": 0.75, "learning_rate": 3.0193052139764566e-05, "loss": 0.632, "step": 6630 }, { "epoch": 0.75, "learning_rate": 3.0166697898267516e-05, "loss": 0.6521, "step": 6631 }, { "epoch": 0.75, "learning_rate": 3.0140353120384956e-05, "loss": 0.6727, "step": 6632 }, { "epoch": 0.75, "learning_rate": 3.0114017809687122e-05, "loss": 0.6932, "step": 6633 }, { "epoch": 0.75, "learning_rate": 3.0087691969742826e-05, "loss": 0.659, "step": 6634 }, { "epoch": 0.75, "learning_rate": 3.0061375604119746e-05, "loss": 0.614, "step": 6635 }, { "epoch": 0.75, "learning_rate": 3.0035068716384128e-05, "loss": 0.6403, "step": 6636 }, { "epoch": 0.75, "learning_rate": 3.0008771310101114e-05, "loss": 0.6235, "step": 6637 }, { "epoch": 0.75, "learning_rate": 2.9982483388834327e-05, "loss": 0.638, "step": 6638 }, { "epoch": 0.75, "learning_rate": 2.9956204956146326e-05, "loss": 0.7011, "step": 6639 }, { "epoch": 0.75, "learning_rate": 2.9929936015598225e-05, "loss": 0.6744, "step": 6640 }, { "epoch": 0.75, "learning_rate": 2.9903676570749984e-05, "loss": 0.6634, "step": 6641 }, { "epoch": 0.75, "learning_rate": 2.9877426625160176e-05, "loss": 0.6991, "step": 6642 }, { "epoch": 0.76, "learning_rate": 2.9851186182386127e-05, "loss": 0.6671, "step": 6643 }, { "epoch": 0.76, "learning_rate": 2.9824955245983833e-05, "loss": 0.7186, "step": 6644 }, { "epoch": 0.76, "learning_rate": 2.9798733819508083e-05, "loss": 0.6569, "step": 6645 }, { "epoch": 0.76, "learning_rate": 2.9772521906512306e-05, "loss": 0.6754, "step": 6646 }, { "epoch": 0.76, "learning_rate": 2.974631951054869e-05, "loss": 0.6745, "step": 6647 }, { "epoch": 0.76, "learning_rate": 2.972012663516811e-05, "loss": 0.6535, "step": 6648 }, { "epoch": 0.76, "learning_rate": 2.9693943283920146e-05, "loss": 0.6852, "step": 6649 }, { "epoch": 0.76, "learning_rate": 2.9667769460353045e-05, "loss": 0.6346, "step": 6650 }, { "epoch": 0.76, "learning_rate": 2.9641605168013886e-05, "loss": 0.6265, "step": 6651 }, { "epoch": 0.76, "learning_rate": 2.961545041044832e-05, "loss": 0.5836, "step": 6652 }, { "epoch": 0.76, "learning_rate": 2.9589305191200824e-05, "loss": 0.7005, "step": 6653 }, { "epoch": 0.76, "learning_rate": 2.9563169513814503e-05, "loss": 0.6803, "step": 6654 }, { "epoch": 0.76, "learning_rate": 2.9537043381831143e-05, "loss": 0.6627, "step": 6655 }, { "epoch": 0.76, "learning_rate": 2.951092679879136e-05, "loss": 0.7065, "step": 6656 }, { "epoch": 0.76, "learning_rate": 2.9484819768234327e-05, "loss": 0.7054, "step": 6657 }, { "epoch": 0.76, "learning_rate": 2.9458722293698083e-05, "loss": 0.6559, "step": 6658 }, { "epoch": 0.76, "learning_rate": 2.9432634378719225e-05, "loss": 0.6173, "step": 6659 }, { "epoch": 0.76, "learning_rate": 2.9406556026833133e-05, "loss": 0.7063, "step": 6660 }, { "epoch": 0.76, "learning_rate": 2.938048724157383e-05, "loss": 0.6731, "step": 6661 }, { "epoch": 0.76, "learning_rate": 2.9354428026474155e-05, "loss": 0.6255, "step": 6662 }, { "epoch": 0.76, "learning_rate": 2.9328378385065513e-05, "loss": 0.6563, "step": 6663 }, { "epoch": 0.76, "learning_rate": 2.9302338320878154e-05, "loss": 0.6875, "step": 6664 }, { "epoch": 0.76, "learning_rate": 2.9276307837440898e-05, "loss": 0.6562, "step": 6665 }, { "epoch": 0.76, "learning_rate": 2.9250286938281345e-05, "loss": 0.6383, "step": 6666 }, { "epoch": 0.76, "learning_rate": 2.9224275626925746e-05, "loss": 0.6388, "step": 6667 }, { "epoch": 0.76, "learning_rate": 2.919827390689912e-05, "loss": 0.7007, "step": 6668 }, { "epoch": 0.76, "learning_rate": 2.9172281781725118e-05, "loss": 0.7165, "step": 6669 }, { "epoch": 0.76, "learning_rate": 2.9146299254926156e-05, "loss": 0.6057, "step": 6670 }, { "epoch": 0.76, "learning_rate": 2.9120326330023295e-05, "loss": 0.6783, "step": 6671 }, { "epoch": 0.76, "learning_rate": 2.9094363010536306e-05, "loss": 0.7051, "step": 6672 }, { "epoch": 0.76, "learning_rate": 2.9068409299983636e-05, "loss": 0.6886, "step": 6673 }, { "epoch": 0.76, "learning_rate": 2.904246520188253e-05, "loss": 0.6654, "step": 6674 }, { "epoch": 0.76, "learning_rate": 2.9016530719748792e-05, "loss": 0.6821, "step": 6675 }, { "epoch": 0.76, "learning_rate": 2.8990605857097054e-05, "loss": 0.5899, "step": 6676 }, { "epoch": 0.76, "learning_rate": 2.8964690617440547e-05, "loss": 0.6264, "step": 6677 }, { "epoch": 0.76, "learning_rate": 2.89387850042912e-05, "loss": 0.6429, "step": 6678 }, { "epoch": 0.76, "learning_rate": 2.891288902115975e-05, "loss": 0.6552, "step": 6679 }, { "epoch": 0.76, "learning_rate": 2.8887002671555465e-05, "loss": 0.6387, "step": 6680 }, { "epoch": 0.76, "learning_rate": 2.8861125958986446e-05, "loss": 0.6726, "step": 6681 }, { "epoch": 0.76, "learning_rate": 2.8835258886959427e-05, "loss": 0.6897, "step": 6682 }, { "epoch": 0.76, "learning_rate": 2.8809401458979834e-05, "loss": 0.6901, "step": 6683 }, { "epoch": 0.76, "learning_rate": 2.8783553678551746e-05, "loss": 0.6471, "step": 6684 }, { "epoch": 0.76, "learning_rate": 2.8757715549178065e-05, "loss": 0.5847, "step": 6685 }, { "epoch": 0.76, "learning_rate": 2.873188707436023e-05, "loss": 0.6532, "step": 6686 }, { "epoch": 0.76, "learning_rate": 2.8706068257598507e-05, "loss": 0.6827, "step": 6687 }, { "epoch": 0.76, "learning_rate": 2.868025910239176e-05, "loss": 0.6214, "step": 6688 }, { "epoch": 0.76, "learning_rate": 2.8654459612237572e-05, "loss": 0.7018, "step": 6689 }, { "epoch": 0.76, "learning_rate": 2.862866979063219e-05, "loss": 0.685, "step": 6690 }, { "epoch": 0.76, "learning_rate": 2.8602889641070652e-05, "loss": 0.662, "step": 6691 }, { "epoch": 0.76, "learning_rate": 2.857711916704652e-05, "loss": 0.6524, "step": 6692 }, { "epoch": 0.76, "learning_rate": 2.855135837205225e-05, "loss": 0.6714, "step": 6693 }, { "epoch": 0.76, "learning_rate": 2.852560725957876e-05, "loss": 0.6948, "step": 6694 }, { "epoch": 0.76, "learning_rate": 2.8499865833115836e-05, "loss": 0.6706, "step": 6695 }, { "epoch": 0.76, "learning_rate": 2.8474134096151838e-05, "loss": 0.6741, "step": 6696 }, { "epoch": 0.76, "learning_rate": 2.8448412052173922e-05, "loss": 0.6489, "step": 6697 }, { "epoch": 0.76, "learning_rate": 2.84226997046678e-05, "loss": 0.6448, "step": 6698 }, { "epoch": 0.76, "learning_rate": 2.839699705711799e-05, "loss": 0.6607, "step": 6699 }, { "epoch": 0.76, "learning_rate": 2.8371304113007634e-05, "loss": 0.6406, "step": 6700 }, { "epoch": 0.76, "learning_rate": 2.8345620875818535e-05, "loss": 0.6611, "step": 6701 }, { "epoch": 0.76, "learning_rate": 2.831994734903126e-05, "loss": 0.6853, "step": 6702 }, { "epoch": 0.76, "learning_rate": 2.829428353612499e-05, "loss": 0.6537, "step": 6703 }, { "epoch": 0.76, "learning_rate": 2.826862944057759e-05, "loss": 0.7014, "step": 6704 }, { "epoch": 0.76, "learning_rate": 2.8242985065865668e-05, "loss": 0.6369, "step": 6705 }, { "epoch": 0.76, "learning_rate": 2.8217350415464482e-05, "loss": 0.7313, "step": 6706 }, { "epoch": 0.76, "learning_rate": 2.819172549284792e-05, "loss": 0.6131, "step": 6707 }, { "epoch": 0.76, "learning_rate": 2.8166110301488657e-05, "loss": 0.6291, "step": 6708 }, { "epoch": 0.76, "learning_rate": 2.814050484485794e-05, "loss": 0.7056, "step": 6709 }, { "epoch": 0.76, "learning_rate": 2.8114909126425816e-05, "loss": 0.7089, "step": 6710 }, { "epoch": 0.76, "learning_rate": 2.8089323149660895e-05, "loss": 0.6952, "step": 6711 }, { "epoch": 0.76, "learning_rate": 2.806374691803053e-05, "loss": 0.6804, "step": 6712 }, { "epoch": 0.76, "learning_rate": 2.8038180435000716e-05, "loss": 0.6571, "step": 6713 }, { "epoch": 0.76, "learning_rate": 2.801262370403619e-05, "loss": 0.6738, "step": 6714 }, { "epoch": 0.76, "learning_rate": 2.7987076728600292e-05, "loss": 0.646, "step": 6715 }, { "epoch": 0.76, "learning_rate": 2.7961539512155165e-05, "loss": 0.6495, "step": 6716 }, { "epoch": 0.76, "learning_rate": 2.793601205816141e-05, "loss": 0.6734, "step": 6717 }, { "epoch": 0.76, "learning_rate": 2.7910494370078534e-05, "loss": 0.6405, "step": 6718 }, { "epoch": 0.76, "learning_rate": 2.788498645136456e-05, "loss": 0.7166, "step": 6719 }, { "epoch": 0.76, "learning_rate": 2.78594883054763e-05, "loss": 0.5831, "step": 6720 }, { "epoch": 0.76, "learning_rate": 2.7833999935869148e-05, "loss": 0.6476, "step": 6721 }, { "epoch": 0.76, "learning_rate": 2.7808521345997272e-05, "loss": 0.6635, "step": 6722 }, { "epoch": 0.76, "learning_rate": 2.7783052539313437e-05, "loss": 0.6011, "step": 6723 }, { "epoch": 0.76, "learning_rate": 2.7757593519269087e-05, "loss": 0.6645, "step": 6724 }, { "epoch": 0.76, "learning_rate": 2.7732144289314344e-05, "loss": 0.6654, "step": 6725 }, { "epoch": 0.76, "learning_rate": 2.770670485289806e-05, "loss": 0.691, "step": 6726 }, { "epoch": 0.76, "learning_rate": 2.768127521346767e-05, "loss": 0.6335, "step": 6727 }, { "epoch": 0.76, "learning_rate": 2.7655855374469387e-05, "loss": 0.6731, "step": 6728 }, { "epoch": 0.76, "learning_rate": 2.7630445339347998e-05, "loss": 0.6106, "step": 6729 }, { "epoch": 0.76, "learning_rate": 2.760504511154698e-05, "loss": 0.6728, "step": 6730 }, { "epoch": 0.77, "learning_rate": 2.7579654694508562e-05, "loss": 0.6273, "step": 6731 }, { "epoch": 0.77, "learning_rate": 2.7554274091673505e-05, "loss": 0.6349, "step": 6732 }, { "epoch": 0.77, "learning_rate": 2.7528903306481425e-05, "loss": 0.6391, "step": 6733 }, { "epoch": 0.77, "learning_rate": 2.7503542342370382e-05, "loss": 0.6324, "step": 6734 }, { "epoch": 0.77, "learning_rate": 2.747819120277729e-05, "loss": 0.6674, "step": 6735 }, { "epoch": 0.77, "learning_rate": 2.7452849891137634e-05, "loss": 0.7063, "step": 6736 }, { "epoch": 0.77, "learning_rate": 2.7427518410885644e-05, "loss": 0.6138, "step": 6737 }, { "epoch": 0.77, "learning_rate": 2.7402196765454112e-05, "loss": 0.6629, "step": 6738 }, { "epoch": 0.77, "learning_rate": 2.737688495827465e-05, "loss": 0.7076, "step": 6739 }, { "epoch": 0.77, "learning_rate": 2.7351582992777314e-05, "loss": 0.7412, "step": 6740 }, { "epoch": 0.77, "learning_rate": 2.732629087239106e-05, "loss": 0.6412, "step": 6741 }, { "epoch": 0.77, "learning_rate": 2.730100860054333e-05, "loss": 0.6621, "step": 6742 }, { "epoch": 0.77, "learning_rate": 2.7275736180660383e-05, "loss": 0.6715, "step": 6743 }, { "epoch": 0.77, "learning_rate": 2.7250473616166994e-05, "loss": 0.7273, "step": 6744 }, { "epoch": 0.77, "learning_rate": 2.722522091048678e-05, "loss": 0.6421, "step": 6745 }, { "epoch": 0.77, "learning_rate": 2.7199978067041777e-05, "loss": 0.6229, "step": 6746 }, { "epoch": 0.77, "learning_rate": 2.7174745089252928e-05, "loss": 0.7063, "step": 6747 }, { "epoch": 0.77, "learning_rate": 2.7149521980539684e-05, "loss": 0.6803, "step": 6748 }, { "epoch": 0.77, "learning_rate": 2.7124308744320247e-05, "loss": 0.6665, "step": 6749 }, { "epoch": 0.77, "learning_rate": 2.7099105384011436e-05, "loss": 0.7064, "step": 6750 }, { "epoch": 0.77, "learning_rate": 2.7073911903028705e-05, "loss": 0.726, "step": 6751 }, { "epoch": 0.77, "learning_rate": 2.7048728304786253e-05, "loss": 0.6211, "step": 6752 }, { "epoch": 0.77, "learning_rate": 2.702355459269684e-05, "loss": 0.6807, "step": 6753 }, { "epoch": 0.77, "learning_rate": 2.699839077017201e-05, "loss": 0.6182, "step": 6754 }, { "epoch": 0.77, "learning_rate": 2.697323684062181e-05, "loss": 0.6488, "step": 6755 }, { "epoch": 0.77, "learning_rate": 2.6948092807455128e-05, "loss": 0.5436, "step": 6756 }, { "epoch": 0.77, "learning_rate": 2.69229586740793e-05, "loss": 0.6462, "step": 6757 }, { "epoch": 0.77, "learning_rate": 2.6897834443900526e-05, "loss": 0.6201, "step": 6758 }, { "epoch": 0.77, "learning_rate": 2.6872720120323503e-05, "loss": 0.6624, "step": 6759 }, { "epoch": 0.77, "learning_rate": 2.6847615706751716e-05, "loss": 0.6674, "step": 6760 }, { "epoch": 0.77, "learning_rate": 2.6822521206587182e-05, "loss": 0.6008, "step": 6761 }, { "epoch": 0.77, "learning_rate": 2.6797436623230732e-05, "loss": 0.6794, "step": 6762 }, { "epoch": 0.77, "learning_rate": 2.677236196008165e-05, "loss": 0.6754, "step": 6763 }, { "epoch": 0.77, "learning_rate": 2.6747297220538047e-05, "loss": 0.6822, "step": 6764 }, { "epoch": 0.77, "learning_rate": 2.672224240799659e-05, "loss": 0.7402, "step": 6765 }, { "epoch": 0.77, "learning_rate": 2.669719752585269e-05, "loss": 0.7142, "step": 6766 }, { "epoch": 0.77, "learning_rate": 2.6672162577500302e-05, "loss": 0.5869, "step": 6767 }, { "epoch": 0.77, "learning_rate": 2.664713756633219e-05, "loss": 0.6774, "step": 6768 }, { "epoch": 0.77, "learning_rate": 2.662212249573953e-05, "loss": 0.6151, "step": 6769 }, { "epoch": 0.77, "learning_rate": 2.65971173691124e-05, "loss": 0.7297, "step": 6770 }, { "epoch": 0.77, "learning_rate": 2.657212218983938e-05, "loss": 0.6442, "step": 6771 }, { "epoch": 0.77, "learning_rate": 2.6547136961307772e-05, "loss": 0.668, "step": 6772 }, { "epoch": 0.77, "learning_rate": 2.65221616869035e-05, "loss": 0.6419, "step": 6773 }, { "epoch": 0.77, "learning_rate": 2.6497196370011113e-05, "loss": 0.6347, "step": 6774 }, { "epoch": 0.77, "learning_rate": 2.6472241014013888e-05, "loss": 0.7158, "step": 6775 }, { "epoch": 0.77, "learning_rate": 2.6447295622293656e-05, "loss": 0.6646, "step": 6776 }, { "epoch": 0.77, "learning_rate": 2.6422360198231e-05, "loss": 0.6849, "step": 6777 }, { "epoch": 0.77, "learning_rate": 2.6397434745205074e-05, "loss": 0.6485, "step": 6778 }, { "epoch": 0.77, "learning_rate": 2.637251926659371e-05, "loss": 0.6529, "step": 6779 }, { "epoch": 0.77, "learning_rate": 2.6347613765773337e-05, "loss": 0.6211, "step": 6780 }, { "epoch": 0.77, "learning_rate": 2.632271824611916e-05, "loss": 0.6643, "step": 6781 }, { "epoch": 0.77, "learning_rate": 2.629783271100488e-05, "loss": 0.6515, "step": 6782 }, { "epoch": 0.77, "learning_rate": 2.6272957163802982e-05, "loss": 0.6809, "step": 6783 }, { "epoch": 0.77, "learning_rate": 2.6248091607884463e-05, "loss": 0.6836, "step": 6784 }, { "epoch": 0.77, "learning_rate": 2.6223236046619126e-05, "loss": 0.6538, "step": 6785 }, { "epoch": 0.77, "learning_rate": 2.61983904833752e-05, "loss": 0.6107, "step": 6786 }, { "epoch": 0.77, "learning_rate": 2.6173554921519795e-05, "loss": 0.6945, "step": 6787 }, { "epoch": 0.77, "learning_rate": 2.614872936441848e-05, "loss": 0.6568, "step": 6788 }, { "epoch": 0.77, "learning_rate": 2.6123913815435618e-05, "loss": 0.6098, "step": 6789 }, { "epoch": 0.77, "learning_rate": 2.6099108277934103e-05, "loss": 0.6592, "step": 6790 }, { "epoch": 0.77, "learning_rate": 2.607431275527552e-05, "loss": 0.6539, "step": 6791 }, { "epoch": 0.77, "learning_rate": 2.6049527250820048e-05, "loss": 0.7052, "step": 6792 }, { "epoch": 0.77, "learning_rate": 2.6024751767926624e-05, "loss": 0.6835, "step": 6793 }, { "epoch": 0.77, "learning_rate": 2.5999986309952683e-05, "loss": 0.628, "step": 6794 }, { "epoch": 0.77, "learning_rate": 2.597523088025444e-05, "loss": 0.6431, "step": 6795 }, { "epoch": 0.77, "learning_rate": 2.5950485482186638e-05, "loss": 0.6535, "step": 6796 }, { "epoch": 0.77, "learning_rate": 2.5925750119102687e-05, "loss": 0.6872, "step": 6797 }, { "epoch": 0.77, "learning_rate": 2.59010247943547e-05, "loss": 0.669, "step": 6798 }, { "epoch": 0.77, "learning_rate": 2.5876309511293373e-05, "loss": 0.6826, "step": 6799 }, { "epoch": 0.77, "learning_rate": 2.5851604273268003e-05, "loss": 0.6628, "step": 6800 }, { "epoch": 0.77, "learning_rate": 2.5826909083626648e-05, "loss": 0.6236, "step": 6801 }, { "epoch": 0.77, "learning_rate": 2.58022239457159e-05, "loss": 0.5913, "step": 6802 }, { "epoch": 0.77, "learning_rate": 2.5777548862880984e-05, "loss": 0.7295, "step": 6803 }, { "epoch": 0.77, "learning_rate": 2.575288383846587e-05, "loss": 0.7345, "step": 6804 }, { "epoch": 0.77, "learning_rate": 2.572822887581302e-05, "loss": 0.6464, "step": 6805 }, { "epoch": 0.77, "learning_rate": 2.570358397826367e-05, "loss": 0.628, "step": 6806 }, { "epoch": 0.77, "learning_rate": 2.5678949149157606e-05, "loss": 0.6709, "step": 6807 }, { "epoch": 0.77, "learning_rate": 2.5654324391833262e-05, "loss": 0.5683, "step": 6808 }, { "epoch": 0.77, "learning_rate": 2.562970970962768e-05, "loss": 0.686, "step": 6809 }, { "epoch": 0.77, "learning_rate": 2.560510510587666e-05, "loss": 0.6929, "step": 6810 }, { "epoch": 0.77, "learning_rate": 2.5580510583914452e-05, "loss": 0.7122, "step": 6811 }, { "epoch": 0.77, "learning_rate": 2.5555926147074127e-05, "loss": 0.6527, "step": 6812 }, { "epoch": 0.77, "learning_rate": 2.5531351798687265e-05, "loss": 0.6338, "step": 6813 }, { "epoch": 0.77, "learning_rate": 2.5506787542084097e-05, "loss": 0.5503, "step": 6814 }, { "epoch": 0.77, "learning_rate": 2.548223338059349e-05, "loss": 0.6222, "step": 6815 }, { "epoch": 0.77, "learning_rate": 2.545768931754301e-05, "loss": 0.6508, "step": 6816 }, { "epoch": 0.77, "learning_rate": 2.543315535625873e-05, "loss": 0.7241, "step": 6817 }, { "epoch": 0.77, "learning_rate": 2.5408631500065495e-05, "loss": 0.644, "step": 6818 }, { "epoch": 0.78, "learning_rate": 2.5384117752286684e-05, "loss": 0.639, "step": 6819 }, { "epoch": 0.78, "learning_rate": 2.5359614116244323e-05, "loss": 0.6417, "step": 6820 }, { "epoch": 0.78, "learning_rate": 2.5335120595259043e-05, "loss": 0.6716, "step": 6821 }, { "epoch": 0.78, "learning_rate": 2.531063719265021e-05, "loss": 0.6443, "step": 6822 }, { "epoch": 0.78, "learning_rate": 2.528616391173567e-05, "loss": 0.659, "step": 6823 }, { "epoch": 0.78, "learning_rate": 2.526170075583205e-05, "loss": 0.6526, "step": 6824 }, { "epoch": 0.78, "learning_rate": 2.5237247728254498e-05, "loss": 0.7226, "step": 6825 }, { "epoch": 0.78, "learning_rate": 2.5212804832316784e-05, "loss": 0.6729, "step": 6826 }, { "epoch": 0.78, "learning_rate": 2.518837207133139e-05, "loss": 0.7186, "step": 6827 }, { "epoch": 0.78, "learning_rate": 2.5163949448609336e-05, "loss": 0.6951, "step": 6828 }, { "epoch": 0.78, "learning_rate": 2.5139536967460365e-05, "loss": 0.6931, "step": 6829 }, { "epoch": 0.78, "learning_rate": 2.511513463119274e-05, "loss": 0.6152, "step": 6830 }, { "epoch": 0.78, "learning_rate": 2.5090742443113423e-05, "loss": 0.5951, "step": 6831 }, { "epoch": 0.78, "learning_rate": 2.5066360406527922e-05, "loss": 0.6887, "step": 6832 }, { "epoch": 0.78, "learning_rate": 2.50419885247405e-05, "loss": 0.5902, "step": 6833 }, { "epoch": 0.78, "learning_rate": 2.5017626801053895e-05, "loss": 0.6585, "step": 6834 }, { "epoch": 0.78, "learning_rate": 2.4993275238769608e-05, "loss": 0.587, "step": 6835 }, { "epoch": 0.78, "learning_rate": 2.496893384118766e-05, "loss": 0.7274, "step": 6836 }, { "epoch": 0.78, "learning_rate": 2.4944602611606727e-05, "loss": 0.6263, "step": 6837 }, { "epoch": 0.78, "learning_rate": 2.4920281553324087e-05, "loss": 0.7148, "step": 6838 }, { "epoch": 0.78, "learning_rate": 2.4895970669635715e-05, "loss": 0.6521, "step": 6839 }, { "epoch": 0.78, "learning_rate": 2.4871669963836107e-05, "loss": 0.6702, "step": 6840 }, { "epoch": 0.78, "learning_rate": 2.4847379439218477e-05, "loss": 0.7387, "step": 6841 }, { "epoch": 0.78, "learning_rate": 2.4823099099074564e-05, "loss": 0.7168, "step": 6842 }, { "epoch": 0.78, "learning_rate": 2.4798828946694807e-05, "loss": 0.6512, "step": 6843 }, { "epoch": 0.78, "learning_rate": 2.4774568985368173e-05, "loss": 0.687, "step": 6844 }, { "epoch": 0.78, "learning_rate": 2.4750319218382368e-05, "loss": 0.6664, "step": 6845 }, { "epoch": 0.78, "learning_rate": 2.4726079649023603e-05, "loss": 0.6232, "step": 6846 }, { "epoch": 0.78, "learning_rate": 2.47018502805768e-05, "loss": 0.6533, "step": 6847 }, { "epoch": 0.78, "learning_rate": 2.467763111632544e-05, "loss": 0.6939, "step": 6848 }, { "epoch": 0.78, "learning_rate": 2.465342215955161e-05, "loss": 0.6019, "step": 6849 }, { "epoch": 0.78, "learning_rate": 2.4629223413536085e-05, "loss": 0.5956, "step": 6850 }, { "epoch": 0.78, "learning_rate": 2.4605034881558165e-05, "loss": 0.7002, "step": 6851 }, { "epoch": 0.78, "learning_rate": 2.458085656689586e-05, "loss": 0.6184, "step": 6852 }, { "epoch": 0.78, "learning_rate": 2.455668847282573e-05, "loss": 0.6203, "step": 6853 }, { "epoch": 0.78, "learning_rate": 2.453253060262296e-05, "loss": 0.6929, "step": 6854 }, { "epoch": 0.78, "learning_rate": 2.4508382959561337e-05, "loss": 0.7057, "step": 6855 }, { "epoch": 0.78, "learning_rate": 2.4484245546913333e-05, "loss": 0.6529, "step": 6856 }, { "epoch": 0.78, "learning_rate": 2.4460118367949912e-05, "loss": 0.6514, "step": 6857 }, { "epoch": 0.78, "learning_rate": 2.4436001425940815e-05, "loss": 0.628, "step": 6858 }, { "epoch": 0.78, "learning_rate": 2.441189472415424e-05, "loss": 0.6821, "step": 6859 }, { "epoch": 0.78, "learning_rate": 2.4387798265857074e-05, "loss": 0.6616, "step": 6860 }, { "epoch": 0.78, "learning_rate": 2.436371205431477e-05, "loss": 0.6527, "step": 6861 }, { "epoch": 0.78, "learning_rate": 2.4339636092791485e-05, "loss": 0.7233, "step": 6862 }, { "epoch": 0.78, "learning_rate": 2.4315570384549867e-05, "loss": 0.7172, "step": 6863 }, { "epoch": 0.78, "learning_rate": 2.4291514932851335e-05, "loss": 0.7046, "step": 6864 }, { "epoch": 0.78, "learning_rate": 2.4267469740955673e-05, "loss": 0.6764, "step": 6865 }, { "epoch": 0.78, "learning_rate": 2.4243434812121514e-05, "loss": 0.5702, "step": 6866 }, { "epoch": 0.78, "learning_rate": 2.421941014960596e-05, "loss": 0.6947, "step": 6867 }, { "epoch": 0.78, "learning_rate": 2.4195395756664817e-05, "loss": 0.713, "step": 6868 }, { "epoch": 0.78, "learning_rate": 2.4171391636552388e-05, "loss": 0.6556, "step": 6869 }, { "epoch": 0.78, "learning_rate": 2.414739779252171e-05, "loss": 0.7064, "step": 6870 }, { "epoch": 0.78, "learning_rate": 2.4123414227824316e-05, "loss": 0.6721, "step": 6871 }, { "epoch": 0.78, "learning_rate": 2.4099440945710383e-05, "loss": 0.6649, "step": 6872 }, { "epoch": 0.78, "learning_rate": 2.4075477949428748e-05, "loss": 0.6641, "step": 6873 }, { "epoch": 0.78, "learning_rate": 2.405152524222678e-05, "loss": 0.6584, "step": 6874 }, { "epoch": 0.78, "learning_rate": 2.402758282735047e-05, "loss": 0.6329, "step": 6875 }, { "epoch": 0.78, "learning_rate": 2.4003650708044468e-05, "loss": 0.6059, "step": 6876 }, { "epoch": 0.78, "learning_rate": 2.3979728887551968e-05, "loss": 0.6522, "step": 6877 }, { "epoch": 0.78, "learning_rate": 2.395581736911475e-05, "loss": 0.6461, "step": 6878 }, { "epoch": 0.78, "learning_rate": 2.3931916155973312e-05, "loss": 0.6773, "step": 6879 }, { "epoch": 0.78, "learning_rate": 2.3908025251366606e-05, "loss": 0.6877, "step": 6880 }, { "epoch": 0.78, "learning_rate": 2.388414465853235e-05, "loss": 0.6897, "step": 6881 }, { "epoch": 0.78, "learning_rate": 2.386027438070667e-05, "loss": 0.6802, "step": 6882 }, { "epoch": 0.78, "learning_rate": 2.3836414421124476e-05, "loss": 0.6376, "step": 6883 }, { "epoch": 0.78, "learning_rate": 2.381256478301914e-05, "loss": 0.7394, "step": 6884 }, { "epoch": 0.78, "learning_rate": 2.3788725469622774e-05, "loss": 0.6769, "step": 6885 }, { "epoch": 0.78, "learning_rate": 2.3764896484165943e-05, "loss": 0.6694, "step": 6886 }, { "epoch": 0.78, "learning_rate": 2.3741077829877978e-05, "loss": 0.7082, "step": 6887 }, { "epoch": 0.78, "learning_rate": 2.3717269509986607e-05, "loss": 0.6772, "step": 6888 }, { "epoch": 0.78, "learning_rate": 2.3693471527718335e-05, "loss": 0.6126, "step": 6889 }, { "epoch": 0.78, "learning_rate": 2.3669683886298154e-05, "loss": 0.6163, "step": 6890 }, { "epoch": 0.78, "learning_rate": 2.3645906588949763e-05, "loss": 0.6478, "step": 6891 }, { "epoch": 0.78, "learning_rate": 2.3622139638895314e-05, "loss": 0.6648, "step": 6892 }, { "epoch": 0.78, "learning_rate": 2.359838303935572e-05, "loss": 0.6586, "step": 6893 }, { "epoch": 0.78, "learning_rate": 2.3574636793550377e-05, "loss": 0.7021, "step": 6894 }, { "epoch": 0.78, "learning_rate": 2.3550900904697292e-05, "loss": 0.6866, "step": 6895 }, { "epoch": 0.78, "learning_rate": 2.3527175376013066e-05, "loss": 0.6806, "step": 6896 }, { "epoch": 0.78, "learning_rate": 2.350346021071299e-05, "loss": 0.6229, "step": 6897 }, { "epoch": 0.78, "learning_rate": 2.3479755412010807e-05, "loss": 0.6948, "step": 6898 }, { "epoch": 0.78, "learning_rate": 2.3456060983118976e-05, "loss": 0.6544, "step": 6899 }, { "epoch": 0.78, "learning_rate": 2.343237692724848e-05, "loss": 0.6674, "step": 6900 }, { "epoch": 0.78, "learning_rate": 2.3408703247608886e-05, "loss": 0.691, "step": 6901 }, { "epoch": 0.78, "learning_rate": 2.338503994740844e-05, "loss": 0.6362, "step": 6902 }, { "epoch": 0.78, "learning_rate": 2.3361387029853877e-05, "loss": 0.6282, "step": 6903 }, { "epoch": 0.78, "learning_rate": 2.333774449815065e-05, "loss": 0.633, "step": 6904 }, { "epoch": 0.78, "learning_rate": 2.3314112355502615e-05, "loss": 0.6829, "step": 6905 }, { "epoch": 0.78, "learning_rate": 2.3290490605112436e-05, "loss": 0.6892, "step": 6906 }, { "epoch": 0.79, "learning_rate": 2.3266879250181195e-05, "loss": 0.6192, "step": 6907 }, { "epoch": 0.79, "learning_rate": 2.3243278293908687e-05, "loss": 0.6313, "step": 6908 }, { "epoch": 0.79, "learning_rate": 2.3219687739493212e-05, "loss": 0.6301, "step": 6909 }, { "epoch": 0.79, "learning_rate": 2.3196107590131766e-05, "loss": 0.636, "step": 6910 }, { "epoch": 0.79, "learning_rate": 2.317253784901976e-05, "loss": 0.7291, "step": 6911 }, { "epoch": 0.79, "learning_rate": 2.314897851935137e-05, "loss": 0.6593, "step": 6912 }, { "epoch": 0.79, "learning_rate": 2.3125429604319248e-05, "loss": 0.71, "step": 6913 }, { "epoch": 0.79, "learning_rate": 2.3101891107114738e-05, "loss": 0.6947, "step": 6914 }, { "epoch": 0.79, "learning_rate": 2.307836303092764e-05, "loss": 0.6738, "step": 6915 }, { "epoch": 0.79, "learning_rate": 2.305484537894651e-05, "loss": 0.6824, "step": 6916 }, { "epoch": 0.79, "learning_rate": 2.3031338154358285e-05, "loss": 0.6547, "step": 6917 }, { "epoch": 0.79, "learning_rate": 2.300784136034867e-05, "loss": 0.6383, "step": 6918 }, { "epoch": 0.79, "learning_rate": 2.298435500010183e-05, "loss": 0.6491, "step": 6919 }, { "epoch": 0.79, "learning_rate": 2.2960879076800635e-05, "loss": 0.6969, "step": 6920 }, { "epoch": 0.79, "learning_rate": 2.2937413593626443e-05, "loss": 0.6237, "step": 6921 }, { "epoch": 0.79, "learning_rate": 2.2913958553759207e-05, "loss": 0.6475, "step": 6922 }, { "epoch": 0.79, "learning_rate": 2.2890513960377536e-05, "loss": 0.6691, "step": 6923 }, { "epoch": 0.79, "learning_rate": 2.286707981665853e-05, "loss": 0.6688, "step": 6924 }, { "epoch": 0.79, "learning_rate": 2.2843656125777978e-05, "loss": 0.6122, "step": 6925 }, { "epoch": 0.79, "learning_rate": 2.282024289091014e-05, "loss": 0.6123, "step": 6926 }, { "epoch": 0.79, "learning_rate": 2.2796840115227968e-05, "loss": 0.7528, "step": 6927 }, { "epoch": 0.79, "learning_rate": 2.277344780190286e-05, "loss": 0.6721, "step": 6928 }, { "epoch": 0.79, "learning_rate": 2.2750065954104937e-05, "loss": 0.6858, "step": 6929 }, { "epoch": 0.79, "learning_rate": 2.2726694575002815e-05, "loss": 0.6865, "step": 6930 }, { "epoch": 0.79, "learning_rate": 2.270333366776375e-05, "loss": 0.6742, "step": 6931 }, { "epoch": 0.79, "learning_rate": 2.2679983235553493e-05, "loss": 0.6452, "step": 6932 }, { "epoch": 0.79, "learning_rate": 2.2656643281536527e-05, "loss": 0.7014, "step": 6933 }, { "epoch": 0.79, "learning_rate": 2.263331380887569e-05, "loss": 0.6459, "step": 6934 }, { "epoch": 0.79, "learning_rate": 2.2609994820732627e-05, "loss": 0.6951, "step": 6935 }, { "epoch": 0.79, "learning_rate": 2.2586686320267393e-05, "loss": 0.5664, "step": 6936 }, { "epoch": 0.79, "learning_rate": 2.2563388310638754e-05, "loss": 0.6782, "step": 6937 }, { "epoch": 0.79, "learning_rate": 2.254010079500396e-05, "loss": 0.6268, "step": 6938 }, { "epoch": 0.79, "learning_rate": 2.2516823776518868e-05, "loss": 0.615, "step": 6939 }, { "epoch": 0.79, "learning_rate": 2.2493557258337893e-05, "loss": 0.6737, "step": 6940 }, { "epoch": 0.79, "learning_rate": 2.2470301243614113e-05, "loss": 0.6822, "step": 6941 }, { "epoch": 0.79, "learning_rate": 2.2447055735499034e-05, "loss": 0.6295, "step": 6942 }, { "epoch": 0.79, "learning_rate": 2.242382073714291e-05, "loss": 0.5635, "step": 6943 }, { "epoch": 0.79, "learning_rate": 2.2400596251694427e-05, "loss": 0.66, "step": 6944 }, { "epoch": 0.79, "learning_rate": 2.2377382282300907e-05, "loss": 0.621, "step": 6945 }, { "epoch": 0.79, "learning_rate": 2.2354178832108264e-05, "loss": 0.6888, "step": 6946 }, { "epoch": 0.79, "learning_rate": 2.233098590426094e-05, "loss": 0.6589, "step": 6947 }, { "epoch": 0.79, "learning_rate": 2.2307803501902002e-05, "loss": 0.6827, "step": 6948 }, { "epoch": 0.79, "learning_rate": 2.228463162817306e-05, "loss": 0.6601, "step": 6949 }, { "epoch": 0.79, "learning_rate": 2.226147028621428e-05, "loss": 0.6178, "step": 6950 }, { "epoch": 0.79, "learning_rate": 2.2238319479164426e-05, "loss": 0.6792, "step": 6951 }, { "epoch": 0.79, "learning_rate": 2.2215179210160864e-05, "loss": 0.6662, "step": 6952 }, { "epoch": 0.79, "learning_rate": 2.219204948233944e-05, "loss": 0.6371, "step": 6953 }, { "epoch": 0.79, "learning_rate": 2.21689302988347e-05, "loss": 0.6653, "step": 6954 }, { "epoch": 0.79, "learning_rate": 2.214582166277963e-05, "loss": 0.6767, "step": 6955 }, { "epoch": 0.79, "learning_rate": 2.2122723577305927e-05, "loss": 0.6788, "step": 6956 }, { "epoch": 0.79, "learning_rate": 2.209963604554367e-05, "loss": 0.5838, "step": 6957 }, { "epoch": 0.79, "learning_rate": 2.2076559070621707e-05, "loss": 0.5882, "step": 6958 }, { "epoch": 0.79, "learning_rate": 2.2053492655667296e-05, "loss": 0.7162, "step": 6959 }, { "epoch": 0.79, "learning_rate": 2.203043680380641e-05, "loss": 0.7363, "step": 6960 }, { "epoch": 0.79, "learning_rate": 2.200739151816347e-05, "loss": 0.6533, "step": 6961 }, { "epoch": 0.79, "learning_rate": 2.1984356801861506e-05, "loss": 0.6822, "step": 6962 }, { "epoch": 0.79, "learning_rate": 2.1961332658022106e-05, "loss": 0.6613, "step": 6963 }, { "epoch": 0.79, "learning_rate": 2.193831908976548e-05, "loss": 0.6711, "step": 6964 }, { "epoch": 0.79, "learning_rate": 2.1915316100210303e-05, "loss": 0.6096, "step": 6965 }, { "epoch": 0.79, "learning_rate": 2.1892323692473948e-05, "loss": 0.5679, "step": 6966 }, { "epoch": 0.79, "learning_rate": 2.1869341869672254e-05, "loss": 0.6515, "step": 6967 }, { "epoch": 0.79, "learning_rate": 2.184637063491961e-05, "loss": 0.6455, "step": 6968 }, { "epoch": 0.79, "learning_rate": 2.182340999132908e-05, "loss": 0.6107, "step": 6969 }, { "epoch": 0.79, "learning_rate": 2.1800459942012195e-05, "loss": 0.6843, "step": 6970 }, { "epoch": 0.79, "learning_rate": 2.177752049007906e-05, "loss": 0.629, "step": 6971 }, { "epoch": 0.79, "learning_rate": 2.175459163863841e-05, "loss": 0.669, "step": 6972 }, { "epoch": 0.79, "learning_rate": 2.173167339079748e-05, "loss": 0.5645, "step": 6973 }, { "epoch": 0.79, "learning_rate": 2.1708765749662064e-05, "loss": 0.5993, "step": 6974 }, { "epoch": 0.79, "learning_rate": 2.1685868718336578e-05, "loss": 0.6676, "step": 6975 }, { "epoch": 0.79, "learning_rate": 2.1662982299923928e-05, "loss": 0.6661, "step": 6976 }, { "epoch": 0.79, "learning_rate": 2.164010649752567e-05, "loss": 0.6248, "step": 6977 }, { "epoch": 0.79, "learning_rate": 2.1617241314241833e-05, "loss": 0.6365, "step": 6978 }, { "epoch": 0.79, "learning_rate": 2.1594386753171037e-05, "loss": 0.5849, "step": 6979 }, { "epoch": 0.79, "learning_rate": 2.157154281741046e-05, "loss": 0.6462, "step": 6980 }, { "epoch": 0.79, "learning_rate": 2.15487095100559e-05, "loss": 0.6725, "step": 6981 }, { "epoch": 0.79, "learning_rate": 2.1525886834201592e-05, "loss": 0.6666, "step": 6982 }, { "epoch": 0.79, "learning_rate": 2.150307479294048e-05, "loss": 0.5815, "step": 6983 }, { "epoch": 0.79, "learning_rate": 2.1480273389363937e-05, "loss": 0.6586, "step": 6984 }, { "epoch": 0.79, "learning_rate": 2.1457482626561953e-05, "loss": 0.6517, "step": 6985 }, { "epoch": 0.79, "learning_rate": 2.1434702507623063e-05, "loss": 0.6704, "step": 6986 }, { "epoch": 0.79, "learning_rate": 2.141193303563438e-05, "loss": 0.6472, "step": 6987 }, { "epoch": 0.79, "learning_rate": 2.138917421368154e-05, "loss": 0.6153, "step": 6988 }, { "epoch": 0.79, "learning_rate": 2.1366426044848796e-05, "loss": 0.6724, "step": 6989 }, { "epoch": 0.79, "learning_rate": 2.1343688532218886e-05, "loss": 0.7625, "step": 6990 }, { "epoch": 0.79, "learning_rate": 2.132096167887314e-05, "loss": 0.7365, "step": 6991 }, { "epoch": 0.79, "learning_rate": 2.12982454878914e-05, "loss": 0.6685, "step": 6992 }, { "epoch": 0.79, "learning_rate": 2.1275539962352177e-05, "loss": 0.6394, "step": 6993 }, { "epoch": 0.79, "learning_rate": 2.1252845105332386e-05, "loss": 0.6919, "step": 6994 }, { "epoch": 0.8, "learning_rate": 2.1230160919907626e-05, "loss": 0.6039, "step": 6995 }, { "epoch": 0.8, "learning_rate": 2.120748740915198e-05, "loss": 0.6391, "step": 6996 }, { "epoch": 0.8, "learning_rate": 2.118482457613806e-05, "loss": 0.7365, "step": 6997 }, { "epoch": 0.8, "learning_rate": 2.1162172423937143e-05, "loss": 0.6331, "step": 6998 }, { "epoch": 0.8, "learning_rate": 2.1139530955618914e-05, "loss": 0.6811, "step": 6999 }, { "epoch": 0.8, "learning_rate": 2.111690017425173e-05, "loss": 0.7252, "step": 7000 }, { "epoch": 0.8, "learning_rate": 2.109428008290244e-05, "loss": 0.7086, "step": 7001 }, { "epoch": 0.8, "learning_rate": 2.1071670684636448e-05, "loss": 0.7492, "step": 7002 }, { "epoch": 0.8, "learning_rate": 2.10490719825177e-05, "loss": 0.6896, "step": 7003 }, { "epoch": 0.8, "learning_rate": 2.1026483979608748e-05, "loss": 0.66, "step": 7004 }, { "epoch": 0.8, "learning_rate": 2.100390667897061e-05, "loss": 0.6792, "step": 7005 }, { "epoch": 0.8, "learning_rate": 2.0981340083662946e-05, "loss": 0.6706, "step": 7006 }, { "epoch": 0.8, "learning_rate": 2.0958784196743896e-05, "loss": 0.6467, "step": 7007 }, { "epoch": 0.8, "learning_rate": 2.0936239021270178e-05, "loss": 0.6687, "step": 7008 }, { "epoch": 0.8, "learning_rate": 2.091370456029701e-05, "loss": 0.6925, "step": 7009 }, { "epoch": 0.8, "learning_rate": 2.0891180816878265e-05, "loss": 0.7352, "step": 7010 }, { "epoch": 0.8, "learning_rate": 2.086866779406623e-05, "loss": 0.6174, "step": 7011 }, { "epoch": 0.8, "learning_rate": 2.0846165494911886e-05, "loss": 0.6517, "step": 7012 }, { "epoch": 0.8, "learning_rate": 2.0823673922464627e-05, "loss": 0.6566, "step": 7013 }, { "epoch": 0.8, "learning_rate": 2.0801193079772463e-05, "loss": 0.6373, "step": 7014 }, { "epoch": 0.8, "learning_rate": 2.0778722969881915e-05, "loss": 0.6811, "step": 7015 }, { "epoch": 0.8, "learning_rate": 2.075626359583811e-05, "loss": 0.7029, "step": 7016 }, { "epoch": 0.8, "learning_rate": 2.073381496068463e-05, "loss": 0.6309, "step": 7017 }, { "epoch": 0.8, "learning_rate": 2.07113770674637e-05, "loss": 0.708, "step": 7018 }, { "epoch": 0.8, "learning_rate": 2.0688949919216026e-05, "loss": 0.5725, "step": 7019 }, { "epoch": 0.8, "learning_rate": 2.0666533518980834e-05, "loss": 0.6574, "step": 7020 }, { "epoch": 0.8, "learning_rate": 2.0644127869795994e-05, "loss": 0.7222, "step": 7021 }, { "epoch": 0.8, "learning_rate": 2.0621732974697804e-05, "loss": 0.6471, "step": 7022 }, { "epoch": 0.8, "learning_rate": 2.05993488367212e-05, "loss": 0.6926, "step": 7023 }, { "epoch": 0.8, "learning_rate": 2.0576975458899606e-05, "loss": 0.6434, "step": 7024 }, { "epoch": 0.8, "learning_rate": 2.0554612844264997e-05, "loss": 0.7172, "step": 7025 }, { "epoch": 0.8, "learning_rate": 2.053226099584785e-05, "loss": 0.6371, "step": 7026 }, { "epoch": 0.8, "learning_rate": 2.05099199166773e-05, "loss": 0.6908, "step": 7027 }, { "epoch": 0.8, "learning_rate": 2.048758960978088e-05, "loss": 0.6143, "step": 7028 }, { "epoch": 0.8, "learning_rate": 2.0465270078184793e-05, "loss": 0.6889, "step": 7029 }, { "epoch": 0.8, "learning_rate": 2.044296132491369e-05, "loss": 0.6255, "step": 7030 }, { "epoch": 0.8, "learning_rate": 2.0420663352990787e-05, "loss": 0.6724, "step": 7031 }, { "epoch": 0.8, "learning_rate": 2.0398376165437815e-05, "loss": 0.6852, "step": 7032 }, { "epoch": 0.8, "learning_rate": 2.0376099765275135e-05, "loss": 0.64, "step": 7033 }, { "epoch": 0.8, "learning_rate": 2.0353834155521522e-05, "loss": 0.6026, "step": 7034 }, { "epoch": 0.8, "learning_rate": 2.0331579339194428e-05, "loss": 0.6102, "step": 7035 }, { "epoch": 0.8, "learning_rate": 2.0309335319309664e-05, "loss": 0.6444, "step": 7036 }, { "epoch": 0.8, "learning_rate": 2.0287102098881762e-05, "loss": 0.6247, "step": 7037 }, { "epoch": 0.8, "learning_rate": 2.0264879680923632e-05, "loss": 0.6505, "step": 7038 }, { "epoch": 0.8, "learning_rate": 2.024266806844687e-05, "loss": 0.6221, "step": 7039 }, { "epoch": 0.8, "learning_rate": 2.022046726446145e-05, "loss": 0.5988, "step": 7040 }, { "epoch": 0.8, "learning_rate": 2.0198277271976052e-05, "loss": 0.6567, "step": 7041 }, { "epoch": 0.8, "learning_rate": 2.0176098093997753e-05, "loss": 0.6236, "step": 7042 }, { "epoch": 0.8, "learning_rate": 2.0153929733532195e-05, "loss": 0.6655, "step": 7043 }, { "epoch": 0.8, "learning_rate": 2.013177219358362e-05, "loss": 0.7259, "step": 7044 }, { "epoch": 0.8, "learning_rate": 2.0109625477154737e-05, "loss": 0.5804, "step": 7045 }, { "epoch": 0.8, "learning_rate": 2.0087489587246767e-05, "loss": 0.6385, "step": 7046 }, { "epoch": 0.8, "learning_rate": 2.0065364526859576e-05, "loss": 0.618, "step": 7047 }, { "epoch": 0.8, "learning_rate": 2.0043250298991444e-05, "loss": 0.6464, "step": 7048 }, { "epoch": 0.8, "learning_rate": 2.002114690663922e-05, "loss": 0.6352, "step": 7049 }, { "epoch": 0.8, "learning_rate": 1.999905435279833e-05, "loss": 0.6712, "step": 7050 }, { "epoch": 0.8, "learning_rate": 1.9976972640462664e-05, "loss": 0.6175, "step": 7051 }, { "epoch": 0.8, "learning_rate": 1.9954901772624745e-05, "loss": 0.7001, "step": 7052 }, { "epoch": 0.8, "learning_rate": 1.9932841752275435e-05, "loss": 0.6389, "step": 7053 }, { "epoch": 0.8, "learning_rate": 1.9910792582404348e-05, "loss": 0.7061, "step": 7054 }, { "epoch": 0.8, "learning_rate": 1.9888754265999454e-05, "loss": 0.5906, "step": 7055 }, { "epoch": 0.8, "learning_rate": 1.9866726806047386e-05, "loss": 0.6726, "step": 7056 }, { "epoch": 0.8, "learning_rate": 1.9844710205533203e-05, "loss": 0.6997, "step": 7057 }, { "epoch": 0.8, "learning_rate": 1.982270446744059e-05, "loss": 0.6659, "step": 7058 }, { "epoch": 0.8, "learning_rate": 1.980070959475161e-05, "loss": 0.6403, "step": 7059 }, { "epoch": 0.8, "learning_rate": 1.9778725590447022e-05, "loss": 0.6498, "step": 7060 }, { "epoch": 0.8, "learning_rate": 1.9756752457506e-05, "loss": 0.6606, "step": 7061 }, { "epoch": 0.8, "learning_rate": 1.9734790198906306e-05, "loss": 0.7198, "step": 7062 }, { "epoch": 0.8, "learning_rate": 1.971283881762417e-05, "loss": 0.6808, "step": 7063 }, { "epoch": 0.8, "learning_rate": 1.969089831663443e-05, "loss": 0.6445, "step": 7064 }, { "epoch": 0.8, "learning_rate": 1.9668968698910385e-05, "loss": 0.6721, "step": 7065 }, { "epoch": 0.8, "learning_rate": 1.964704996742387e-05, "loss": 0.7005, "step": 7066 }, { "epoch": 0.8, "learning_rate": 1.9625142125145213e-05, "loss": 0.6215, "step": 7067 }, { "epoch": 0.8, "learning_rate": 1.9603245175043362e-05, "loss": 0.6625, "step": 7068 }, { "epoch": 0.8, "learning_rate": 1.9581359120085707e-05, "loss": 0.6733, "step": 7069 }, { "epoch": 0.8, "learning_rate": 1.9559483963238168e-05, "loss": 0.6137, "step": 7070 }, { "epoch": 0.8, "learning_rate": 1.9537619707465237e-05, "loss": 0.6475, "step": 7071 }, { "epoch": 0.8, "learning_rate": 1.9515766355729857e-05, "loss": 0.6413, "step": 7072 }, { "epoch": 0.8, "learning_rate": 1.9493923910993594e-05, "loss": 0.6901, "step": 7073 }, { "epoch": 0.8, "learning_rate": 1.947209237621641e-05, "loss": 0.5921, "step": 7074 }, { "epoch": 0.8, "learning_rate": 1.945027175435694e-05, "loss": 0.7098, "step": 7075 }, { "epoch": 0.8, "learning_rate": 1.9428462048372142e-05, "loss": 0.6486, "step": 7076 }, { "epoch": 0.8, "learning_rate": 1.9406663261217684e-05, "loss": 0.6495, "step": 7077 }, { "epoch": 0.8, "learning_rate": 1.9384875395847634e-05, "loss": 0.6598, "step": 7078 }, { "epoch": 0.8, "learning_rate": 1.9363098455214668e-05, "loss": 0.6791, "step": 7079 }, { "epoch": 0.8, "learning_rate": 1.934133244226989e-05, "loss": 0.7072, "step": 7080 }, { "epoch": 0.8, "learning_rate": 1.9319577359963037e-05, "loss": 0.6339, "step": 7081 }, { "epoch": 0.8, "learning_rate": 1.929783321124221e-05, "loss": 0.6299, "step": 7082 }, { "epoch": 0.81, "learning_rate": 1.9276099999054176e-05, "loss": 0.7515, "step": 7083 }, { "epoch": 0.81, "learning_rate": 1.925437772634412e-05, "loss": 0.6221, "step": 7084 }, { "epoch": 0.81, "learning_rate": 1.923266639605582e-05, "loss": 0.6701, "step": 7085 }, { "epoch": 0.81, "learning_rate": 1.9210966011131504e-05, "loss": 0.551, "step": 7086 }, { "epoch": 0.81, "learning_rate": 1.9189276574512006e-05, "loss": 0.6013, "step": 7087 }, { "epoch": 0.81, "learning_rate": 1.916759808913653e-05, "loss": 0.6727, "step": 7088 }, { "epoch": 0.81, "learning_rate": 1.9145930557942958e-05, "loss": 0.7446, "step": 7089 }, { "epoch": 0.81, "learning_rate": 1.9124273983867547e-05, "loss": 0.7544, "step": 7090 }, { "epoch": 0.81, "learning_rate": 1.910262836984521e-05, "loss": 0.7089, "step": 7091 }, { "epoch": 0.81, "learning_rate": 1.908099371880926e-05, "loss": 0.7191, "step": 7092 }, { "epoch": 0.81, "learning_rate": 1.905937003369155e-05, "loss": 0.6852, "step": 7093 }, { "epoch": 0.81, "learning_rate": 1.903775731742249e-05, "loss": 0.6259, "step": 7094 }, { "epoch": 0.81, "learning_rate": 1.901615557293095e-05, "loss": 0.7348, "step": 7095 }, { "epoch": 0.81, "learning_rate": 1.8994564803144376e-05, "loss": 0.5834, "step": 7096 }, { "epoch": 0.81, "learning_rate": 1.897298501098864e-05, "loss": 0.5647, "step": 7097 }, { "epoch": 0.81, "learning_rate": 1.895141619938825e-05, "loss": 0.6629, "step": 7098 }, { "epoch": 0.81, "learning_rate": 1.8929858371266052e-05, "loss": 0.6872, "step": 7099 }, { "epoch": 0.81, "learning_rate": 1.890831152954359e-05, "loss": 0.6838, "step": 7100 }, { "epoch": 0.81, "learning_rate": 1.8886775677140756e-05, "loss": 0.6549, "step": 7101 }, { "epoch": 0.81, "learning_rate": 1.88652508169761e-05, "loss": 0.6669, "step": 7102 }, { "epoch": 0.81, "learning_rate": 1.8843736951966552e-05, "loss": 0.6941, "step": 7103 }, { "epoch": 0.81, "learning_rate": 1.882223408502769e-05, "loss": 0.6302, "step": 7104 }, { "epoch": 0.81, "learning_rate": 1.880074221907342e-05, "loss": 0.6264, "step": 7105 }, { "epoch": 0.81, "learning_rate": 1.8779261357016332e-05, "loss": 0.6125, "step": 7106 }, { "epoch": 0.81, "learning_rate": 1.8757791501767407e-05, "loss": 0.6525, "step": 7107 }, { "epoch": 0.81, "learning_rate": 1.8736332656236234e-05, "loss": 0.5916, "step": 7108 }, { "epoch": 0.81, "learning_rate": 1.8714884823330813e-05, "loss": 0.6699, "step": 7109 }, { "epoch": 0.81, "learning_rate": 1.8693448005957726e-05, "loss": 0.6942, "step": 7110 }, { "epoch": 0.81, "learning_rate": 1.8672022207021978e-05, "loss": 0.6338, "step": 7111 }, { "epoch": 0.81, "learning_rate": 1.865060742942719e-05, "loss": 0.6441, "step": 7112 }, { "epoch": 0.81, "learning_rate": 1.8629203676075392e-05, "loss": 0.6563, "step": 7113 }, { "epoch": 0.81, "learning_rate": 1.8607810949867198e-05, "loss": 0.6935, "step": 7114 }, { "epoch": 0.81, "learning_rate": 1.8586429253701677e-05, "loss": 0.6693, "step": 7115 }, { "epoch": 0.81, "learning_rate": 1.856505859047638e-05, "loss": 0.6471, "step": 7116 }, { "epoch": 0.81, "learning_rate": 1.8543698963087464e-05, "loss": 0.6396, "step": 7117 }, { "epoch": 0.81, "learning_rate": 1.8522350374429475e-05, "loss": 0.6672, "step": 7118 }, { "epoch": 0.81, "learning_rate": 1.8501012827395546e-05, "loss": 0.7456, "step": 7119 }, { "epoch": 0.81, "learning_rate": 1.8479686324877278e-05, "loss": 0.6817, "step": 7120 }, { "epoch": 0.81, "learning_rate": 1.8458370869764774e-05, "loss": 0.6344, "step": 7121 }, { "epoch": 0.81, "learning_rate": 1.8437066464946607e-05, "loss": 0.6952, "step": 7122 }, { "epoch": 0.81, "learning_rate": 1.8415773113309952e-05, "loss": 0.5953, "step": 7123 }, { "epoch": 0.81, "learning_rate": 1.8394490817740384e-05, "loss": 0.6537, "step": 7124 }, { "epoch": 0.81, "learning_rate": 1.837321958112205e-05, "loss": 0.6102, "step": 7125 }, { "epoch": 0.81, "learning_rate": 1.835195940633755e-05, "loss": 0.663, "step": 7126 }, { "epoch": 0.81, "learning_rate": 1.8330710296268016e-05, "loss": 0.6498, "step": 7127 }, { "epoch": 0.81, "learning_rate": 1.8309472253793024e-05, "loss": 0.6503, "step": 7128 }, { "epoch": 0.81, "learning_rate": 1.828824528179076e-05, "loss": 0.737, "step": 7129 }, { "epoch": 0.81, "learning_rate": 1.826702938313779e-05, "loss": 0.6429, "step": 7130 }, { "epoch": 0.81, "learning_rate": 1.8245824560709278e-05, "loss": 0.7609, "step": 7131 }, { "epoch": 0.81, "learning_rate": 1.822463081737883e-05, "loss": 0.6105, "step": 7132 }, { "epoch": 0.81, "learning_rate": 1.8203448156018543e-05, "loss": 0.6429, "step": 7133 }, { "epoch": 0.81, "learning_rate": 1.8182276579499025e-05, "loss": 0.6807, "step": 7134 }, { "epoch": 0.81, "learning_rate": 1.8161116090689434e-05, "loss": 0.6329, "step": 7135 }, { "epoch": 0.81, "learning_rate": 1.813996669245732e-05, "loss": 0.5933, "step": 7136 }, { "epoch": 0.81, "learning_rate": 1.811882838766885e-05, "loss": 0.6429, "step": 7137 }, { "epoch": 0.81, "learning_rate": 1.809770117918862e-05, "loss": 0.6776, "step": 7138 }, { "epoch": 0.81, "learning_rate": 1.807658506987967e-05, "loss": 0.631, "step": 7139 }, { "epoch": 0.81, "learning_rate": 1.805548006260367e-05, "loss": 0.6418, "step": 7140 }, { "epoch": 0.81, "learning_rate": 1.8034386160220683e-05, "loss": 0.6948, "step": 7141 }, { "epoch": 0.81, "learning_rate": 1.8013303365589273e-05, "loss": 0.6729, "step": 7142 }, { "epoch": 0.81, "learning_rate": 1.7992231681566564e-05, "loss": 0.6355, "step": 7143 }, { "epoch": 0.81, "learning_rate": 1.7971171111008112e-05, "loss": 0.6867, "step": 7144 }, { "epoch": 0.81, "learning_rate": 1.7950121656767958e-05, "loss": 0.6656, "step": 7145 }, { "epoch": 0.81, "learning_rate": 1.7929083321698713e-05, "loss": 0.7023, "step": 7146 }, { "epoch": 0.81, "learning_rate": 1.7908056108651395e-05, "loss": 0.6442, "step": 7147 }, { "epoch": 0.81, "learning_rate": 1.7887040020475598e-05, "loss": 0.5933, "step": 7148 }, { "epoch": 0.81, "learning_rate": 1.7866035060019335e-05, "loss": 0.6334, "step": 7149 }, { "epoch": 0.81, "learning_rate": 1.7845041230129146e-05, "loss": 0.6552, "step": 7150 }, { "epoch": 0.81, "learning_rate": 1.7824058533650024e-05, "loss": 0.6337, "step": 7151 }, { "epoch": 0.81, "learning_rate": 1.780308697342554e-05, "loss": 0.654, "step": 7152 }, { "epoch": 0.81, "learning_rate": 1.778212655229765e-05, "loss": 0.6799, "step": 7153 }, { "epoch": 0.81, "learning_rate": 1.7761177273106898e-05, "loss": 0.6624, "step": 7154 }, { "epoch": 0.81, "learning_rate": 1.774023913869226e-05, "loss": 0.6715, "step": 7155 }, { "epoch": 0.81, "learning_rate": 1.77193121518912e-05, "loss": 0.6613, "step": 7156 }, { "epoch": 0.81, "learning_rate": 1.7698396315539667e-05, "loss": 0.6418, "step": 7157 }, { "epoch": 0.81, "learning_rate": 1.7677491632472167e-05, "loss": 0.6727, "step": 7158 }, { "epoch": 0.81, "learning_rate": 1.7656598105521583e-05, "loss": 0.7313, "step": 7159 }, { "epoch": 0.81, "learning_rate": 1.763571573751941e-05, "loss": 0.6367, "step": 7160 }, { "epoch": 0.81, "learning_rate": 1.7614844531295538e-05, "loss": 0.618, "step": 7161 }, { "epoch": 0.81, "learning_rate": 1.7593984489678384e-05, "loss": 0.7347, "step": 7162 }, { "epoch": 0.81, "learning_rate": 1.7573135615494806e-05, "loss": 0.6725, "step": 7163 }, { "epoch": 0.81, "learning_rate": 1.7552297911570247e-05, "loss": 0.6287, "step": 7164 }, { "epoch": 0.81, "learning_rate": 1.7531471380728503e-05, "loss": 0.6468, "step": 7165 }, { "epoch": 0.81, "learning_rate": 1.7510656025792005e-05, "loss": 0.6314, "step": 7166 }, { "epoch": 0.81, "learning_rate": 1.748985184958155e-05, "loss": 0.689, "step": 7167 }, { "epoch": 0.81, "learning_rate": 1.7469058854916442e-05, "loss": 0.6736, "step": 7168 }, { "epoch": 0.81, "learning_rate": 1.7448277044614537e-05, "loss": 0.5796, "step": 7169 }, { "epoch": 0.81, "learning_rate": 1.742750642149208e-05, "loss": 0.626, "step": 7170 }, { "epoch": 0.82, "learning_rate": 1.7406746988363887e-05, "loss": 0.5759, "step": 7171 }, { "epoch": 0.82, "learning_rate": 1.738599874804322e-05, "loss": 0.627, "step": 7172 }, { "epoch": 0.82, "learning_rate": 1.7365261703341795e-05, "loss": 0.6103, "step": 7173 }, { "epoch": 0.82, "learning_rate": 1.7344535857069832e-05, "loss": 0.7112, "step": 7174 }, { "epoch": 0.82, "learning_rate": 1.7323821212036083e-05, "loss": 0.6897, "step": 7175 }, { "epoch": 0.82, "learning_rate": 1.7303117771047682e-05, "loss": 0.633, "step": 7176 }, { "epoch": 0.82, "learning_rate": 1.7282425536910364e-05, "loss": 0.6834, "step": 7177 }, { "epoch": 0.82, "learning_rate": 1.7261744512428256e-05, "loss": 0.6975, "step": 7178 }, { "epoch": 0.82, "learning_rate": 1.724107470040398e-05, "loss": 0.5905, "step": 7179 }, { "epoch": 0.82, "learning_rate": 1.7220416103638648e-05, "loss": 0.6269, "step": 7180 }, { "epoch": 0.82, "learning_rate": 1.7199768724931888e-05, "loss": 0.6512, "step": 7181 }, { "epoch": 0.82, "learning_rate": 1.7179132567081725e-05, "loss": 0.6707, "step": 7182 }, { "epoch": 0.82, "learning_rate": 1.71585076328848e-05, "loss": 0.6539, "step": 7183 }, { "epoch": 0.82, "learning_rate": 1.713789392513604e-05, "loss": 0.6741, "step": 7184 }, { "epoch": 0.82, "learning_rate": 1.7117291446629026e-05, "loss": 0.667, "step": 7185 }, { "epoch": 0.82, "learning_rate": 1.7096700200155713e-05, "loss": 0.67, "step": 7186 }, { "epoch": 0.82, "learning_rate": 1.7076120188506605e-05, "loss": 0.674, "step": 7187 }, { "epoch": 0.82, "learning_rate": 1.7055551414470615e-05, "loss": 0.618, "step": 7188 }, { "epoch": 0.82, "learning_rate": 1.7034993880835203e-05, "loss": 0.6342, "step": 7189 }, { "epoch": 0.82, "learning_rate": 1.701444759038624e-05, "loss": 0.6949, "step": 7190 }, { "epoch": 0.82, "learning_rate": 1.6993912545908086e-05, "loss": 0.6927, "step": 7191 }, { "epoch": 0.82, "learning_rate": 1.697338875018364e-05, "loss": 0.6771, "step": 7192 }, { "epoch": 0.82, "learning_rate": 1.6952876205994184e-05, "loss": 0.6493, "step": 7193 }, { "epoch": 0.82, "learning_rate": 1.6932374916119563e-05, "loss": 0.6076, "step": 7194 }, { "epoch": 0.82, "learning_rate": 1.6911884883338036e-05, "loss": 0.6796, "step": 7195 }, { "epoch": 0.82, "learning_rate": 1.6891406110426346e-05, "loss": 0.6651, "step": 7196 }, { "epoch": 0.82, "learning_rate": 1.68709386001597e-05, "loss": 0.6286, "step": 7197 }, { "epoch": 0.82, "learning_rate": 1.6850482355311858e-05, "loss": 0.667, "step": 7198 }, { "epoch": 0.82, "learning_rate": 1.683003737865493e-05, "loss": 0.5814, "step": 7199 }, { "epoch": 0.82, "learning_rate": 1.6809603672959617e-05, "loss": 0.6997, "step": 7200 }, { "epoch": 0.82, "learning_rate": 1.6789181240995012e-05, "loss": 0.6704, "step": 7201 }, { "epoch": 0.82, "learning_rate": 1.6768770085528707e-05, "loss": 0.6231, "step": 7202 }, { "epoch": 0.82, "learning_rate": 1.6748370209326736e-05, "loss": 0.6824, "step": 7203 }, { "epoch": 0.82, "learning_rate": 1.6727981615153688e-05, "loss": 0.697, "step": 7204 }, { "epoch": 0.82, "learning_rate": 1.6707604305772518e-05, "loss": 0.6649, "step": 7205 }, { "epoch": 0.82, "learning_rate": 1.6687238283944772e-05, "loss": 0.6439, "step": 7206 }, { "epoch": 0.82, "learning_rate": 1.6666883552430302e-05, "loss": 0.6475, "step": 7207 }, { "epoch": 0.82, "learning_rate": 1.6646540113987595e-05, "loss": 0.7312, "step": 7208 }, { "epoch": 0.82, "learning_rate": 1.6626207971373497e-05, "loss": 0.6614, "step": 7209 }, { "epoch": 0.82, "learning_rate": 1.6605887127343412e-05, "loss": 0.6229, "step": 7210 }, { "epoch": 0.82, "learning_rate": 1.65855775846511e-05, "loss": 0.6976, "step": 7211 }, { "epoch": 0.82, "learning_rate": 1.6565279346048912e-05, "loss": 0.6388, "step": 7212 }, { "epoch": 0.82, "learning_rate": 1.6544992414287585e-05, "loss": 0.6063, "step": 7213 }, { "epoch": 0.82, "learning_rate": 1.6524716792116323e-05, "loss": 0.7135, "step": 7214 }, { "epoch": 0.82, "learning_rate": 1.6504452482282874e-05, "loss": 0.5613, "step": 7215 }, { "epoch": 0.82, "learning_rate": 1.6484199487533368e-05, "loss": 0.6994, "step": 7216 }, { "epoch": 0.82, "learning_rate": 1.6463957810612407e-05, "loss": 0.6659, "step": 7217 }, { "epoch": 0.82, "learning_rate": 1.6443727454263157e-05, "loss": 0.6843, "step": 7218 }, { "epoch": 0.82, "learning_rate": 1.6423508421227128e-05, "loss": 0.6881, "step": 7219 }, { "epoch": 0.82, "learning_rate": 1.640330071424434e-05, "loss": 0.618, "step": 7220 }, { "epoch": 0.82, "learning_rate": 1.6383104336053335e-05, "loss": 0.6396, "step": 7221 }, { "epoch": 0.82, "learning_rate": 1.636291928939101e-05, "loss": 0.6268, "step": 7222 }, { "epoch": 0.82, "learning_rate": 1.634274557699287e-05, "loss": 0.6591, "step": 7223 }, { "epoch": 0.82, "learning_rate": 1.6322583201592688e-05, "loss": 0.6333, "step": 7224 }, { "epoch": 0.82, "learning_rate": 1.6302432165922908e-05, "loss": 0.6286, "step": 7225 }, { "epoch": 0.82, "learning_rate": 1.6282292472714268e-05, "loss": 0.666, "step": 7226 }, { "epoch": 0.82, "learning_rate": 1.626216412469611e-05, "loss": 0.6985, "step": 7227 }, { "epoch": 0.82, "learning_rate": 1.6242047124596127e-05, "loss": 0.6529, "step": 7228 }, { "epoch": 0.82, "learning_rate": 1.6221941475140577e-05, "loss": 0.6694, "step": 7229 }, { "epoch": 0.82, "learning_rate": 1.620184717905403e-05, "loss": 0.6104, "step": 7230 }, { "epoch": 0.82, "learning_rate": 1.618176423905967e-05, "loss": 0.675, "step": 7231 }, { "epoch": 0.82, "learning_rate": 1.6161692657879058e-05, "loss": 0.6402, "step": 7232 }, { "epoch": 0.82, "learning_rate": 1.614163243823228e-05, "loss": 0.6836, "step": 7233 }, { "epoch": 0.82, "learning_rate": 1.6121583582837772e-05, "loss": 0.7055, "step": 7234 }, { "epoch": 0.82, "learning_rate": 1.6101546094412566e-05, "loss": 0.6252, "step": 7235 }, { "epoch": 0.82, "learning_rate": 1.6081519975672065e-05, "loss": 0.6637, "step": 7236 }, { "epoch": 0.82, "learning_rate": 1.6061505229330144e-05, "loss": 0.7181, "step": 7237 }, { "epoch": 0.82, "learning_rate": 1.6041501858099116e-05, "loss": 0.6938, "step": 7238 }, { "epoch": 0.82, "learning_rate": 1.6021509864689844e-05, "loss": 0.7086, "step": 7239 }, { "epoch": 0.82, "learning_rate": 1.6001529251811554e-05, "loss": 0.6833, "step": 7240 }, { "epoch": 0.82, "learning_rate": 1.5981560022171938e-05, "loss": 0.6515, "step": 7241 }, { "epoch": 0.82, "learning_rate": 1.596160217847723e-05, "loss": 0.7066, "step": 7242 }, { "epoch": 0.82, "learning_rate": 1.5941655723432003e-05, "loss": 0.6986, "step": 7243 }, { "epoch": 0.82, "learning_rate": 1.5921720659739402e-05, "loss": 0.7283, "step": 7244 }, { "epoch": 0.82, "learning_rate": 1.5901796990100905e-05, "loss": 0.6506, "step": 7245 }, { "epoch": 0.82, "learning_rate": 1.588188471721661e-05, "loss": 0.6395, "step": 7246 }, { "epoch": 0.82, "learning_rate": 1.5861983843784856e-05, "loss": 0.6709, "step": 7247 }, { "epoch": 0.82, "learning_rate": 1.5842094372502626e-05, "loss": 0.6067, "step": 7248 }, { "epoch": 0.82, "learning_rate": 1.582221630606525e-05, "loss": 0.7165, "step": 7249 }, { "epoch": 0.82, "learning_rate": 1.5802349647166592e-05, "loss": 0.6503, "step": 7250 }, { "epoch": 0.82, "learning_rate": 1.578249439849888e-05, "loss": 0.6394, "step": 7251 }, { "epoch": 0.82, "learning_rate": 1.5762650562752912e-05, "loss": 0.6614, "step": 7252 }, { "epoch": 0.82, "learning_rate": 1.5742818142617767e-05, "loss": 0.6162, "step": 7253 }, { "epoch": 0.82, "learning_rate": 1.572299714078116e-05, "loss": 0.6332, "step": 7254 }, { "epoch": 0.82, "learning_rate": 1.570318755992912e-05, "loss": 0.6376, "step": 7255 }, { "epoch": 0.82, "learning_rate": 1.5683389402746253e-05, "loss": 0.6303, "step": 7256 }, { "epoch": 0.82, "learning_rate": 1.56636026719155e-05, "loss": 0.6388, "step": 7257 }, { "epoch": 0.82, "learning_rate": 1.5643827370118336e-05, "loss": 0.6718, "step": 7258 }, { "epoch": 0.83, "learning_rate": 1.562406350003459e-05, "loss": 0.6361, "step": 7259 }, { "epoch": 0.83, "learning_rate": 1.5604311064342692e-05, "loss": 0.6978, "step": 7260 }, { "epoch": 0.83, "learning_rate": 1.5584570065719373e-05, "loss": 0.6463, "step": 7261 }, { "epoch": 0.83, "learning_rate": 1.5564840506839928e-05, "loss": 0.6823, "step": 7262 }, { "epoch": 0.83, "learning_rate": 1.554512239037802e-05, "loss": 0.672, "step": 7263 }, { "epoch": 0.83, "learning_rate": 1.5525415719005777e-05, "loss": 0.6917, "step": 7264 }, { "epoch": 0.83, "learning_rate": 1.5505720495393837e-05, "loss": 0.6522, "step": 7265 }, { "epoch": 0.83, "learning_rate": 1.5486036722211206e-05, "loss": 0.5936, "step": 7266 }, { "epoch": 0.83, "learning_rate": 1.5466364402125412e-05, "loss": 0.6208, "step": 7267 }, { "epoch": 0.83, "learning_rate": 1.5446703537802344e-05, "loss": 0.7246, "step": 7268 }, { "epoch": 0.83, "learning_rate": 1.542705413190645e-05, "loss": 0.6564, "step": 7269 }, { "epoch": 0.83, "learning_rate": 1.540741618710049e-05, "loss": 0.6389, "step": 7270 }, { "epoch": 0.83, "learning_rate": 1.5387789706045796e-05, "loss": 0.644, "step": 7271 }, { "epoch": 0.83, "learning_rate": 1.536817469140206e-05, "loss": 0.6749, "step": 7272 }, { "epoch": 0.83, "learning_rate": 1.5348571145827484e-05, "loss": 0.6706, "step": 7273 }, { "epoch": 0.83, "learning_rate": 1.5328979071978655e-05, "loss": 0.7234, "step": 7274 }, { "epoch": 0.83, "learning_rate": 1.5309398472510707e-05, "loss": 0.6952, "step": 7275 }, { "epoch": 0.83, "learning_rate": 1.5289829350077047e-05, "loss": 0.679, "step": 7276 }, { "epoch": 0.83, "learning_rate": 1.52702717073297e-05, "loss": 0.6726, "step": 7277 }, { "epoch": 0.83, "learning_rate": 1.525072554691901e-05, "loss": 0.6861, "step": 7278 }, { "epoch": 0.83, "learning_rate": 1.5231190871493871e-05, "loss": 0.6166, "step": 7279 }, { "epoch": 0.83, "learning_rate": 1.5211667683701558e-05, "loss": 0.6256, "step": 7280 }, { "epoch": 0.83, "learning_rate": 1.5192155986187772e-05, "loss": 0.6688, "step": 7281 }, { "epoch": 0.83, "learning_rate": 1.5172655781596679e-05, "loss": 0.7237, "step": 7282 }, { "epoch": 0.83, "learning_rate": 1.515316707257094e-05, "loss": 0.6423, "step": 7283 }, { "epoch": 0.83, "learning_rate": 1.5133689861751555e-05, "loss": 0.6196, "step": 7284 }, { "epoch": 0.83, "learning_rate": 1.5114224151778068e-05, "loss": 0.7375, "step": 7285 }, { "epoch": 0.83, "learning_rate": 1.50947699452884e-05, "loss": 0.6256, "step": 7286 }, { "epoch": 0.83, "learning_rate": 1.5075327244918902e-05, "loss": 0.6978, "step": 7287 }, { "epoch": 0.83, "learning_rate": 1.5055896053304453e-05, "loss": 0.6767, "step": 7288 }, { "epoch": 0.83, "learning_rate": 1.5036476373078257e-05, "loss": 0.7483, "step": 7289 }, { "epoch": 0.83, "learning_rate": 1.5017068206872054e-05, "loss": 0.6928, "step": 7290 }, { "epoch": 0.83, "learning_rate": 1.4997671557315984e-05, "loss": 0.6683, "step": 7291 }, { "epoch": 0.83, "learning_rate": 1.4978286427038601e-05, "loss": 0.6523, "step": 7292 }, { "epoch": 0.83, "learning_rate": 1.4958912818666915e-05, "loss": 0.6493, "step": 7293 }, { "epoch": 0.83, "learning_rate": 1.4939550734826435e-05, "loss": 0.6614, "step": 7294 }, { "epoch": 0.83, "learning_rate": 1.4920200178141008e-05, "loss": 0.626, "step": 7295 }, { "epoch": 0.83, "learning_rate": 1.4900861151232993e-05, "loss": 0.6845, "step": 7296 }, { "epoch": 0.83, "learning_rate": 1.4881533656723169e-05, "loss": 0.7382, "step": 7297 }, { "epoch": 0.83, "learning_rate": 1.4862217697230718e-05, "loss": 0.645, "step": 7298 }, { "epoch": 0.83, "learning_rate": 1.4842913275373283e-05, "loss": 0.708, "step": 7299 }, { "epoch": 0.83, "learning_rate": 1.4823620393766979e-05, "loss": 0.6272, "step": 7300 }, { "epoch": 0.83, "learning_rate": 1.4804339055026284e-05, "loss": 0.6938, "step": 7301 }, { "epoch": 0.83, "learning_rate": 1.4785069261764184e-05, "loss": 0.6562, "step": 7302 }, { "epoch": 0.83, "learning_rate": 1.4765811016592058e-05, "loss": 0.6145, "step": 7303 }, { "epoch": 0.83, "learning_rate": 1.4746564322119727e-05, "loss": 0.6448, "step": 7304 }, { "epoch": 0.83, "learning_rate": 1.472732918095543e-05, "loss": 0.6085, "step": 7305 }, { "epoch": 0.83, "learning_rate": 1.470810559570589e-05, "loss": 0.6271, "step": 7306 }, { "epoch": 0.83, "learning_rate": 1.4688893568976214e-05, "loss": 0.6695, "step": 7307 }, { "epoch": 0.83, "learning_rate": 1.4669693103369985e-05, "loss": 0.637, "step": 7308 }, { "epoch": 0.83, "learning_rate": 1.465050420148918e-05, "loss": 0.5962, "step": 7309 }, { "epoch": 0.83, "learning_rate": 1.4631326865934202e-05, "loss": 0.6323, "step": 7310 }, { "epoch": 0.83, "learning_rate": 1.4612161099303966e-05, "loss": 0.7582, "step": 7311 }, { "epoch": 0.83, "learning_rate": 1.4593006904195727e-05, "loss": 0.7185, "step": 7312 }, { "epoch": 0.83, "learning_rate": 1.4573864283205196e-05, "loss": 0.6813, "step": 7313 }, { "epoch": 0.83, "learning_rate": 1.4554733238926566e-05, "loss": 0.6106, "step": 7314 }, { "epoch": 0.83, "learning_rate": 1.4535613773952406e-05, "loss": 0.6208, "step": 7315 }, { "epoch": 0.83, "learning_rate": 1.45165058908737e-05, "loss": 0.5846, "step": 7316 }, { "epoch": 0.83, "learning_rate": 1.4497409592279954e-05, "loss": 0.701, "step": 7317 }, { "epoch": 0.83, "learning_rate": 1.4478324880758986e-05, "loss": 0.6146, "step": 7318 }, { "epoch": 0.83, "learning_rate": 1.4459251758897151e-05, "loss": 0.6231, "step": 7319 }, { "epoch": 0.83, "learning_rate": 1.4440190229279183e-05, "loss": 0.5456, "step": 7320 }, { "epoch": 0.83, "learning_rate": 1.4421140294488212e-05, "loss": 0.6404, "step": 7321 }, { "epoch": 0.83, "learning_rate": 1.4402101957105841e-05, "loss": 0.6282, "step": 7322 }, { "epoch": 0.83, "learning_rate": 1.4383075219712116e-05, "loss": 0.6074, "step": 7323 }, { "epoch": 0.83, "learning_rate": 1.4364060084885455e-05, "loss": 0.718, "step": 7324 }, { "epoch": 0.83, "learning_rate": 1.4345056555202784e-05, "loss": 0.6661, "step": 7325 }, { "epoch": 0.83, "learning_rate": 1.4326064633239378e-05, "loss": 0.6953, "step": 7326 }, { "epoch": 0.83, "learning_rate": 1.4307084321568964e-05, "loss": 0.658, "step": 7327 }, { "epoch": 0.83, "learning_rate": 1.4288115622763687e-05, "loss": 0.6746, "step": 7328 }, { "epoch": 0.83, "learning_rate": 1.4269158539394178e-05, "loss": 0.6236, "step": 7329 }, { "epoch": 0.83, "learning_rate": 1.4250213074029396e-05, "loss": 0.6995, "step": 7330 }, { "epoch": 0.83, "learning_rate": 1.4231279229236827e-05, "loss": 0.6863, "step": 7331 }, { "epoch": 0.83, "learning_rate": 1.421235700758231e-05, "loss": 0.5675, "step": 7332 }, { "epoch": 0.83, "learning_rate": 1.419344641163014e-05, "loss": 0.755, "step": 7333 }, { "epoch": 0.83, "learning_rate": 1.4174547443942998e-05, "loss": 0.7105, "step": 7334 }, { "epoch": 0.83, "learning_rate": 1.4155660107082059e-05, "loss": 0.6782, "step": 7335 }, { "epoch": 0.83, "learning_rate": 1.413678440360684e-05, "loss": 0.6691, "step": 7336 }, { "epoch": 0.83, "learning_rate": 1.4117920336075374e-05, "loss": 0.6319, "step": 7337 }, { "epoch": 0.83, "learning_rate": 1.409906790704405e-05, "loss": 0.5776, "step": 7338 }, { "epoch": 0.83, "learning_rate": 1.4080227119067657e-05, "loss": 0.6659, "step": 7339 }, { "epoch": 0.83, "learning_rate": 1.4061397974699497e-05, "loss": 0.6556, "step": 7340 }, { "epoch": 0.83, "learning_rate": 1.4042580476491207e-05, "loss": 0.5484, "step": 7341 }, { "epoch": 0.83, "learning_rate": 1.4023774626992925e-05, "loss": 0.6342, "step": 7342 }, { "epoch": 0.83, "learning_rate": 1.4004980428753134e-05, "loss": 0.6802, "step": 7343 }, { "epoch": 0.83, "learning_rate": 1.3986197884318785e-05, "loss": 0.6483, "step": 7344 }, { "epoch": 0.83, "learning_rate": 1.39674269962352e-05, "loss": 0.69, "step": 7345 }, { "epoch": 0.83, "learning_rate": 1.3948667767046209e-05, "loss": 0.6947, "step": 7346 }, { "epoch": 0.84, "learning_rate": 1.3929920199293966e-05, "loss": 0.6811, "step": 7347 }, { "epoch": 0.84, "learning_rate": 1.3911184295519142e-05, "loss": 0.6827, "step": 7348 }, { "epoch": 0.84, "learning_rate": 1.3892460058260737e-05, "loss": 0.6363, "step": 7349 }, { "epoch": 0.84, "learning_rate": 1.3873747490056222e-05, "loss": 0.6431, "step": 7350 }, { "epoch": 0.84, "learning_rate": 1.3855046593441435e-05, "loss": 0.6639, "step": 7351 }, { "epoch": 0.84, "learning_rate": 1.3836357370950726e-05, "loss": 0.6743, "step": 7352 }, { "epoch": 0.84, "learning_rate": 1.3817679825116746e-05, "loss": 0.6003, "step": 7353 }, { "epoch": 0.84, "learning_rate": 1.3799013958470708e-05, "loss": 0.664, "step": 7354 }, { "epoch": 0.84, "learning_rate": 1.3780359773542074e-05, "loss": 0.6672, "step": 7355 }, { "epoch": 0.84, "learning_rate": 1.3761717272858854e-05, "loss": 0.6196, "step": 7356 }, { "epoch": 0.84, "learning_rate": 1.3743086458947385e-05, "loss": 0.6837, "step": 7357 }, { "epoch": 0.84, "learning_rate": 1.3724467334332526e-05, "loss": 0.7065, "step": 7358 }, { "epoch": 0.84, "learning_rate": 1.3705859901537432e-05, "loss": 0.6913, "step": 7359 }, { "epoch": 0.84, "learning_rate": 1.3687264163083768e-05, "loss": 0.6148, "step": 7360 }, { "epoch": 0.84, "learning_rate": 1.3668680121491572e-05, "loss": 0.704, "step": 7361 }, { "epoch": 0.84, "learning_rate": 1.3650107779279264e-05, "loss": 0.7036, "step": 7362 }, { "epoch": 0.84, "learning_rate": 1.3631547138963763e-05, "loss": 0.6502, "step": 7363 }, { "epoch": 0.84, "learning_rate": 1.3612998203060323e-05, "loss": 0.6724, "step": 7364 }, { "epoch": 0.84, "learning_rate": 1.3594460974082667e-05, "loss": 0.5746, "step": 7365 }, { "epoch": 0.84, "learning_rate": 1.357593545454291e-05, "loss": 0.6037, "step": 7366 }, { "epoch": 0.84, "learning_rate": 1.3557421646951562e-05, "loss": 0.6094, "step": 7367 }, { "epoch": 0.84, "learning_rate": 1.3538919553817553e-05, "loss": 0.6573, "step": 7368 }, { "epoch": 0.84, "learning_rate": 1.3520429177648264e-05, "loss": 0.7291, "step": 7369 }, { "epoch": 0.84, "learning_rate": 1.3501950520949436e-05, "loss": 0.6422, "step": 7370 }, { "epoch": 0.84, "learning_rate": 1.3483483586225288e-05, "loss": 0.7033, "step": 7371 }, { "epoch": 0.84, "learning_rate": 1.3465028375978327e-05, "loss": 0.6818, "step": 7372 }, { "epoch": 0.84, "learning_rate": 1.3446584892709635e-05, "loss": 0.6329, "step": 7373 }, { "epoch": 0.84, "learning_rate": 1.3428153138918553e-05, "loss": 0.7197, "step": 7374 }, { "epoch": 0.84, "learning_rate": 1.3409733117102962e-05, "loss": 0.6626, "step": 7375 }, { "epoch": 0.84, "learning_rate": 1.3391324829759034e-05, "loss": 0.6535, "step": 7376 }, { "epoch": 0.84, "learning_rate": 1.3372928279381492e-05, "loss": 0.7124, "step": 7377 }, { "epoch": 0.84, "learning_rate": 1.3354543468463276e-05, "loss": 0.6737, "step": 7378 }, { "epoch": 0.84, "learning_rate": 1.3336170399495928e-05, "loss": 0.6718, "step": 7379 }, { "epoch": 0.84, "learning_rate": 1.3317809074969268e-05, "loss": 0.6486, "step": 7380 }, { "epoch": 0.84, "learning_rate": 1.3299459497371614e-05, "loss": 0.632, "step": 7381 }, { "epoch": 0.84, "learning_rate": 1.328112166918959e-05, "loss": 0.6158, "step": 7382 }, { "epoch": 0.84, "learning_rate": 1.3262795592908361e-05, "loss": 0.6039, "step": 7383 }, { "epoch": 0.84, "learning_rate": 1.3244481271011378e-05, "loss": 0.6865, "step": 7384 }, { "epoch": 0.84, "learning_rate": 1.322617870598054e-05, "loss": 0.6188, "step": 7385 }, { "epoch": 0.84, "learning_rate": 1.32078879002962e-05, "loss": 0.6015, "step": 7386 }, { "epoch": 0.84, "learning_rate": 1.3189608856437053e-05, "loss": 0.6437, "step": 7387 }, { "epoch": 0.84, "learning_rate": 1.3171341576880202e-05, "loss": 0.6908, "step": 7388 }, { "epoch": 0.84, "learning_rate": 1.3153086064101217e-05, "loss": 0.6457, "step": 7389 }, { "epoch": 0.84, "learning_rate": 1.3134842320574025e-05, "loss": 0.6841, "step": 7390 }, { "epoch": 0.84, "learning_rate": 1.3116610348770942e-05, "loss": 0.6083, "step": 7391 }, { "epoch": 0.84, "learning_rate": 1.3098390151162742e-05, "loss": 0.6599, "step": 7392 }, { "epoch": 0.84, "learning_rate": 1.3080181730218554e-05, "loss": 0.6522, "step": 7393 }, { "epoch": 0.84, "learning_rate": 1.3061985088405981e-05, "loss": 0.6827, "step": 7394 }, { "epoch": 0.84, "learning_rate": 1.3043800228190905e-05, "loss": 0.6359, "step": 7395 }, { "epoch": 0.84, "learning_rate": 1.3025627152037755e-05, "loss": 0.6383, "step": 7396 }, { "epoch": 0.84, "learning_rate": 1.3007465862409241e-05, "loss": 0.745, "step": 7397 }, { "epoch": 0.84, "learning_rate": 1.2989316361766569e-05, "loss": 0.6327, "step": 7398 }, { "epoch": 0.84, "learning_rate": 1.2971178652569282e-05, "loss": 0.6291, "step": 7399 }, { "epoch": 0.84, "learning_rate": 1.2953052737275418e-05, "loss": 0.674, "step": 7400 }, { "epoch": 0.84, "learning_rate": 1.293493861834124e-05, "loss": 0.7106, "step": 7401 }, { "epoch": 0.84, "learning_rate": 1.2916836298221613e-05, "loss": 0.6794, "step": 7402 }, { "epoch": 0.84, "learning_rate": 1.2898745779369659e-05, "loss": 0.6708, "step": 7403 }, { "epoch": 0.84, "learning_rate": 1.2880667064237007e-05, "loss": 0.6738, "step": 7404 }, { "epoch": 0.84, "learning_rate": 1.2862600155273575e-05, "loss": 0.7132, "step": 7405 }, { "epoch": 0.84, "learning_rate": 1.2844545054927781e-05, "loss": 0.637, "step": 7406 }, { "epoch": 0.84, "learning_rate": 1.2826501765646404e-05, "loss": 0.6641, "step": 7407 }, { "epoch": 0.84, "learning_rate": 1.2808470289874608e-05, "loss": 0.652, "step": 7408 }, { "epoch": 0.84, "learning_rate": 1.279045063005594e-05, "loss": 0.7036, "step": 7409 }, { "epoch": 0.84, "learning_rate": 1.2772442788632433e-05, "loss": 0.6935, "step": 7410 }, { "epoch": 0.84, "learning_rate": 1.2754446768044415e-05, "loss": 0.6664, "step": 7411 }, { "epoch": 0.84, "learning_rate": 1.2736462570730656e-05, "loss": 0.6489, "step": 7412 }, { "epoch": 0.84, "learning_rate": 1.2718490199128352e-05, "loss": 0.629, "step": 7413 }, { "epoch": 0.84, "learning_rate": 1.2700529655673043e-05, "loss": 0.63, "step": 7414 }, { "epoch": 0.84, "learning_rate": 1.2682580942798716e-05, "loss": 0.6454, "step": 7415 }, { "epoch": 0.84, "learning_rate": 1.2664644062937703e-05, "loss": 0.6796, "step": 7416 }, { "epoch": 0.84, "learning_rate": 1.2646719018520813e-05, "loss": 0.6573, "step": 7417 }, { "epoch": 0.84, "learning_rate": 1.2628805811977129e-05, "loss": 0.6288, "step": 7418 }, { "epoch": 0.84, "learning_rate": 1.261090444573424e-05, "loss": 0.6592, "step": 7419 }, { "epoch": 0.84, "learning_rate": 1.2593014922218061e-05, "loss": 0.6485, "step": 7420 }, { "epoch": 0.84, "learning_rate": 1.2575137243852963e-05, "loss": 0.6808, "step": 7421 }, { "epoch": 0.84, "learning_rate": 1.2557271413061656e-05, "loss": 0.6891, "step": 7422 }, { "epoch": 0.84, "learning_rate": 1.253941743226531e-05, "loss": 0.714, "step": 7423 }, { "epoch": 0.84, "learning_rate": 1.252157530388337e-05, "loss": 0.6413, "step": 7424 }, { "epoch": 0.84, "learning_rate": 1.2503745030333824e-05, "loss": 0.7021, "step": 7425 }, { "epoch": 0.84, "learning_rate": 1.2485926614032916e-05, "loss": 0.6225, "step": 7426 }, { "epoch": 0.84, "learning_rate": 1.2468120057395416e-05, "loss": 0.6243, "step": 7427 }, { "epoch": 0.84, "learning_rate": 1.2450325362834381e-05, "loss": 0.6213, "step": 7428 }, { "epoch": 0.84, "learning_rate": 1.2432542532761315e-05, "loss": 0.6483, "step": 7429 }, { "epoch": 0.84, "learning_rate": 1.241477156958606e-05, "loss": 0.7202, "step": 7430 }, { "epoch": 0.84, "learning_rate": 1.239701247571693e-05, "loss": 0.6212, "step": 7431 }, { "epoch": 0.84, "learning_rate": 1.2379265253560545e-05, "loss": 0.5783, "step": 7432 }, { "epoch": 0.84, "learning_rate": 1.2361529905522018e-05, "loss": 0.687, "step": 7433 }, { "epoch": 0.84, "learning_rate": 1.2343806434004768e-05, "loss": 0.6156, "step": 7434 }, { "epoch": 0.85, "learning_rate": 1.2326094841410586e-05, "loss": 0.6412, "step": 7435 }, { "epoch": 0.85, "learning_rate": 1.2308395130139772e-05, "loss": 0.6869, "step": 7436 }, { "epoch": 0.85, "learning_rate": 1.2290707302590875e-05, "loss": 0.7094, "step": 7437 }, { "epoch": 0.85, "learning_rate": 1.2273031361160958e-05, "loss": 0.5931, "step": 7438 }, { "epoch": 0.85, "learning_rate": 1.2255367308245358e-05, "loss": 0.6725, "step": 7439 }, { "epoch": 0.85, "learning_rate": 1.2237715146237939e-05, "loss": 0.7175, "step": 7440 }, { "epoch": 0.85, "learning_rate": 1.2220074877530784e-05, "loss": 0.7166, "step": 7441 }, { "epoch": 0.85, "learning_rate": 1.2202446504514509e-05, "loss": 0.7581, "step": 7442 }, { "epoch": 0.85, "learning_rate": 1.218483002957802e-05, "loss": 0.6725, "step": 7443 }, { "epoch": 0.85, "learning_rate": 1.21672254551087e-05, "loss": 0.6686, "step": 7444 }, { "epoch": 0.85, "learning_rate": 1.2149632783492238e-05, "loss": 0.7065, "step": 7445 }, { "epoch": 0.85, "learning_rate": 1.2132052017112772e-05, "loss": 0.6506, "step": 7446 }, { "epoch": 0.85, "learning_rate": 1.2114483158352751e-05, "loss": 0.6556, "step": 7447 }, { "epoch": 0.85, "learning_rate": 1.2096926209593108e-05, "loss": 0.6608, "step": 7448 }, { "epoch": 0.85, "learning_rate": 1.2079381173213067e-05, "loss": 0.6712, "step": 7449 }, { "epoch": 0.85, "learning_rate": 1.206184805159034e-05, "loss": 0.6685, "step": 7450 }, { "epoch": 0.85, "learning_rate": 1.2044326847100917e-05, "loss": 0.6555, "step": 7451 }, { "epoch": 0.85, "learning_rate": 1.2026817562119253e-05, "loss": 0.6927, "step": 7452 }, { "epoch": 0.85, "learning_rate": 1.2009320199018126e-05, "loss": 0.6404, "step": 7453 }, { "epoch": 0.85, "learning_rate": 1.1991834760168764e-05, "loss": 0.661, "step": 7454 }, { "epoch": 0.85, "learning_rate": 1.1974361247940703e-05, "loss": 0.7297, "step": 7455 }, { "epoch": 0.85, "learning_rate": 1.1956899664701948e-05, "loss": 0.6497, "step": 7456 }, { "epoch": 0.85, "learning_rate": 1.1939450012818842e-05, "loss": 0.6655, "step": 7457 }, { "epoch": 0.85, "learning_rate": 1.192201229465606e-05, "loss": 0.5656, "step": 7458 }, { "epoch": 0.85, "learning_rate": 1.1904586512576787e-05, "loss": 0.7004, "step": 7459 }, { "epoch": 0.85, "learning_rate": 1.1887172668942448e-05, "loss": 0.6557, "step": 7460 }, { "epoch": 0.85, "learning_rate": 1.1869770766112975e-05, "loss": 0.7113, "step": 7461 }, { "epoch": 0.85, "learning_rate": 1.1852380806446605e-05, "loss": 0.6819, "step": 7462 }, { "epoch": 0.85, "learning_rate": 1.1835002792299977e-05, "loss": 0.6912, "step": 7463 }, { "epoch": 0.85, "learning_rate": 1.181763672602808e-05, "loss": 0.6971, "step": 7464 }, { "epoch": 0.85, "learning_rate": 1.1800282609984358e-05, "loss": 0.5885, "step": 7465 }, { "epoch": 0.85, "learning_rate": 1.1782940446520563e-05, "loss": 0.6416, "step": 7466 }, { "epoch": 0.85, "learning_rate": 1.176561023798689e-05, "loss": 0.5761, "step": 7467 }, { "epoch": 0.85, "learning_rate": 1.1748291986731863e-05, "loss": 0.656, "step": 7468 }, { "epoch": 0.85, "learning_rate": 1.1730985695102403e-05, "loss": 0.658, "step": 7469 }, { "epoch": 0.85, "learning_rate": 1.171369136544378e-05, "loss": 0.7037, "step": 7470 }, { "epoch": 0.85, "learning_rate": 1.1696409000099728e-05, "loss": 0.6725, "step": 7471 }, { "epoch": 0.85, "learning_rate": 1.1679138601412255e-05, "loss": 0.6362, "step": 7472 }, { "epoch": 0.85, "learning_rate": 1.166188017172184e-05, "loss": 0.6982, "step": 7473 }, { "epoch": 0.85, "learning_rate": 1.1644633713367281e-05, "loss": 0.6441, "step": 7474 }, { "epoch": 0.85, "learning_rate": 1.1627399228685766e-05, "loss": 0.6595, "step": 7475 }, { "epoch": 0.85, "learning_rate": 1.1610176720012844e-05, "loss": 0.6405, "step": 7476 }, { "epoch": 0.85, "learning_rate": 1.1592966189682508e-05, "loss": 0.6825, "step": 7477 }, { "epoch": 0.85, "learning_rate": 1.1575767640027036e-05, "loss": 0.6347, "step": 7478 }, { "epoch": 0.85, "learning_rate": 1.1558581073377161e-05, "loss": 0.7006, "step": 7479 }, { "epoch": 0.85, "learning_rate": 1.1541406492061957e-05, "loss": 0.6233, "step": 7480 }, { "epoch": 0.85, "learning_rate": 1.1524243898408838e-05, "loss": 0.6553, "step": 7481 }, { "epoch": 0.85, "learning_rate": 1.1507093294743675e-05, "loss": 0.6246, "step": 7482 }, { "epoch": 0.85, "learning_rate": 1.1489954683390647e-05, "loss": 0.668, "step": 7483 }, { "epoch": 0.85, "learning_rate": 1.1472828066672326e-05, "loss": 0.6561, "step": 7484 }, { "epoch": 0.85, "learning_rate": 1.1455713446909689e-05, "loss": 0.5972, "step": 7485 }, { "epoch": 0.85, "learning_rate": 1.1438610826422035e-05, "loss": 0.6645, "step": 7486 }, { "epoch": 0.85, "learning_rate": 1.142152020752707e-05, "loss": 0.6166, "step": 7487 }, { "epoch": 0.85, "learning_rate": 1.1404441592540883e-05, "loss": 0.6621, "step": 7488 }, { "epoch": 0.85, "learning_rate": 1.1387374983777888e-05, "loss": 0.6171, "step": 7489 }, { "epoch": 0.85, "learning_rate": 1.1370320383550947e-05, "loss": 0.7198, "step": 7490 }, { "epoch": 0.85, "learning_rate": 1.1353277794171224e-05, "loss": 0.6164, "step": 7491 }, { "epoch": 0.85, "learning_rate": 1.1336247217948303e-05, "loss": 0.6457, "step": 7492 }, { "epoch": 0.85, "learning_rate": 1.1319228657190073e-05, "loss": 0.6075, "step": 7493 }, { "epoch": 0.85, "learning_rate": 1.1302222114202898e-05, "loss": 0.6368, "step": 7494 }, { "epoch": 0.85, "learning_rate": 1.1285227591291414e-05, "loss": 0.6037, "step": 7495 }, { "epoch": 0.85, "learning_rate": 1.1268245090758711e-05, "loss": 0.6124, "step": 7496 }, { "epoch": 0.85, "learning_rate": 1.1251274614906193e-05, "loss": 0.673, "step": 7497 }, { "epoch": 0.85, "learning_rate": 1.1234316166033642e-05, "loss": 0.6748, "step": 7498 }, { "epoch": 0.85, "learning_rate": 1.1217369746439222e-05, "loss": 0.7166, "step": 7499 }, { "epoch": 0.85, "learning_rate": 1.120043535841948e-05, "loss": 0.595, "step": 7500 }, { "epoch": 0.85, "learning_rate": 1.1183513004269286e-05, "loss": 0.7071, "step": 7501 }, { "epoch": 0.85, "learning_rate": 1.1166602686281947e-05, "loss": 0.668, "step": 7502 }, { "epoch": 0.85, "learning_rate": 1.1149704406749096e-05, "loss": 0.6789, "step": 7503 }, { "epoch": 0.85, "learning_rate": 1.1132818167960723e-05, "loss": 0.6018, "step": 7504 }, { "epoch": 0.85, "learning_rate": 1.11159439722052e-05, "loss": 0.6284, "step": 7505 }, { "epoch": 0.85, "learning_rate": 1.1099081821769297e-05, "loss": 0.6562, "step": 7506 }, { "epoch": 0.85, "learning_rate": 1.1082231718938096e-05, "loss": 0.6786, "step": 7507 }, { "epoch": 0.85, "learning_rate": 1.1065393665995105e-05, "loss": 0.6393, "step": 7508 }, { "epoch": 0.85, "learning_rate": 1.1048567665222164e-05, "loss": 0.6288, "step": 7509 }, { "epoch": 0.85, "learning_rate": 1.103175371889945e-05, "loss": 0.599, "step": 7510 }, { "epoch": 0.85, "learning_rate": 1.1014951829305598e-05, "loss": 0.7014, "step": 7511 }, { "epoch": 0.85, "learning_rate": 1.0998161998717504e-05, "loss": 0.6819, "step": 7512 }, { "epoch": 0.85, "learning_rate": 1.0981384229410518e-05, "loss": 0.6646, "step": 7513 }, { "epoch": 0.85, "learning_rate": 1.0964618523658298e-05, "loss": 0.6496, "step": 7514 }, { "epoch": 0.85, "learning_rate": 1.0947864883732895e-05, "loss": 0.7212, "step": 7515 }, { "epoch": 0.85, "learning_rate": 1.093112331190468e-05, "loss": 0.6817, "step": 7516 }, { "epoch": 0.85, "learning_rate": 1.091439381044247e-05, "loss": 0.645, "step": 7517 }, { "epoch": 0.85, "learning_rate": 1.0897676381613364e-05, "loss": 0.6449, "step": 7518 }, { "epoch": 0.85, "learning_rate": 1.0880971027682907e-05, "loss": 0.6974, "step": 7519 }, { "epoch": 0.85, "learning_rate": 1.086427775091493e-05, "loss": 0.5951, "step": 7520 }, { "epoch": 0.85, "learning_rate": 1.0847596553571659e-05, "loss": 0.6607, "step": 7521 }, { "epoch": 0.85, "learning_rate": 1.0830927437913674e-05, "loss": 0.6371, "step": 7522 }, { "epoch": 0.86, "learning_rate": 1.0814270406199966e-05, "loss": 0.7121, "step": 7523 }, { "epoch": 0.86, "learning_rate": 1.07976254606878e-05, "loss": 0.6827, "step": 7524 }, { "epoch": 0.86, "learning_rate": 1.0780992603632923e-05, "loss": 0.6912, "step": 7525 }, { "epoch": 0.86, "learning_rate": 1.0764371837289277e-05, "loss": 0.6178, "step": 7526 }, { "epoch": 0.86, "learning_rate": 1.0747763163909342e-05, "loss": 0.6229, "step": 7527 }, { "epoch": 0.86, "learning_rate": 1.0731166585743824e-05, "loss": 0.6849, "step": 7528 }, { "epoch": 0.86, "learning_rate": 1.0714582105041892e-05, "loss": 0.688, "step": 7529 }, { "epoch": 0.86, "learning_rate": 1.0698009724050995e-05, "loss": 0.7036, "step": 7530 }, { "epoch": 0.86, "learning_rate": 1.0681449445017e-05, "loss": 0.6607, "step": 7531 }, { "epoch": 0.86, "learning_rate": 1.0664901270184103e-05, "loss": 0.7003, "step": 7532 }, { "epoch": 0.86, "learning_rate": 1.0648365201794841e-05, "loss": 0.635, "step": 7533 }, { "epoch": 0.86, "learning_rate": 1.063184124209018e-05, "loss": 0.7033, "step": 7534 }, { "epoch": 0.86, "learning_rate": 1.0615329393309358e-05, "loss": 0.6409, "step": 7535 }, { "epoch": 0.86, "learning_rate": 1.0598829657690045e-05, "loss": 0.654, "step": 7536 }, { "epoch": 0.86, "learning_rate": 1.058234203746824e-05, "loss": 0.6933, "step": 7537 }, { "epoch": 0.86, "learning_rate": 1.0565866534878287e-05, "loss": 0.7147, "step": 7538 }, { "epoch": 0.86, "learning_rate": 1.0549403152152882e-05, "loss": 0.6705, "step": 7539 }, { "epoch": 0.86, "learning_rate": 1.0532951891523124e-05, "loss": 0.6231, "step": 7540 }, { "epoch": 0.86, "learning_rate": 1.0516512755218433e-05, "loss": 0.6136, "step": 7541 }, { "epoch": 0.86, "learning_rate": 1.0500085745466626e-05, "loss": 0.7246, "step": 7542 }, { "epoch": 0.86, "learning_rate": 1.0483670864493778e-05, "loss": 0.6724, "step": 7543 }, { "epoch": 0.86, "learning_rate": 1.0467268114524443e-05, "loss": 0.6411, "step": 7544 }, { "epoch": 0.86, "learning_rate": 1.0450877497781441e-05, "loss": 0.6408, "step": 7545 }, { "epoch": 0.86, "learning_rate": 1.0434499016486021e-05, "loss": 0.6698, "step": 7546 }, { "epoch": 0.86, "learning_rate": 1.0418132672857705e-05, "loss": 0.6865, "step": 7547 }, { "epoch": 0.86, "learning_rate": 1.0401778469114475e-05, "loss": 0.6692, "step": 7548 }, { "epoch": 0.86, "learning_rate": 1.0385436407472537e-05, "loss": 0.6525, "step": 7549 }, { "epoch": 0.86, "learning_rate": 1.0369106490146574e-05, "loss": 0.6245, "step": 7550 }, { "epoch": 0.86, "learning_rate": 1.0352788719349526e-05, "loss": 0.6086, "step": 7551 }, { "epoch": 0.86, "learning_rate": 1.0336483097292781e-05, "loss": 0.6523, "step": 7552 }, { "epoch": 0.86, "learning_rate": 1.0320189626185994e-05, "loss": 0.5808, "step": 7553 }, { "epoch": 0.86, "learning_rate": 1.0303908308237243e-05, "loss": 0.7033, "step": 7554 }, { "epoch": 0.86, "learning_rate": 1.0287639145652905e-05, "loss": 0.6299, "step": 7555 }, { "epoch": 0.86, "learning_rate": 1.0271382140637709e-05, "loss": 0.683, "step": 7556 }, { "epoch": 0.86, "learning_rate": 1.0255137295394813e-05, "loss": 0.6418, "step": 7557 }, { "epoch": 0.86, "learning_rate": 1.0238904612125644e-05, "loss": 0.6863, "step": 7558 }, { "epoch": 0.86, "learning_rate": 1.022268409303001e-05, "loss": 0.6322, "step": 7559 }, { "epoch": 0.86, "learning_rate": 1.0206475740306053e-05, "loss": 0.6808, "step": 7560 }, { "epoch": 0.86, "learning_rate": 1.0190279556150317e-05, "loss": 0.6289, "step": 7561 }, { "epoch": 0.86, "learning_rate": 1.0174095542757633e-05, "loss": 0.6507, "step": 7562 }, { "epoch": 0.86, "learning_rate": 1.0157923702321249e-05, "loss": 0.6771, "step": 7563 }, { "epoch": 0.86, "learning_rate": 1.0141764037032697e-05, "loss": 0.7059, "step": 7564 }, { "epoch": 0.86, "learning_rate": 1.0125616549081929e-05, "loss": 0.7065, "step": 7565 }, { "epoch": 0.86, "learning_rate": 1.0109481240657148e-05, "loss": 0.6787, "step": 7566 }, { "epoch": 0.86, "learning_rate": 1.0093358113945017e-05, "loss": 0.6328, "step": 7567 }, { "epoch": 0.86, "learning_rate": 1.0077247171130455e-05, "loss": 0.6579, "step": 7568 }, { "epoch": 0.86, "learning_rate": 1.0061148414396814e-05, "loss": 0.5921, "step": 7569 }, { "epoch": 0.86, "learning_rate": 1.0045061845925719e-05, "loss": 0.7136, "step": 7570 }, { "epoch": 0.86, "learning_rate": 1.0028987467897234e-05, "loss": 0.6618, "step": 7571 }, { "epoch": 0.86, "learning_rate": 1.0012925282489615e-05, "loss": 0.6819, "step": 7572 }, { "epoch": 0.86, "learning_rate": 9.99687529187966e-06, "loss": 0.5943, "step": 7573 }, { "epoch": 0.86, "learning_rate": 9.980837498242356e-06, "loss": 0.6159, "step": 7574 }, { "epoch": 0.86, "learning_rate": 9.964811903751137e-06, "loss": 0.6944, "step": 7575 }, { "epoch": 0.86, "learning_rate": 9.948798510577717e-06, "loss": 0.5786, "step": 7576 }, { "epoch": 0.86, "learning_rate": 9.93279732089223e-06, "loss": 0.7013, "step": 7577 }, { "epoch": 0.86, "learning_rate": 9.916808336863082e-06, "loss": 0.6614, "step": 7578 }, { "epoch": 0.86, "learning_rate": 9.900831560657064e-06, "loss": 0.7418, "step": 7579 }, { "epoch": 0.86, "learning_rate": 9.884866994439278e-06, "loss": 0.6978, "step": 7580 }, { "epoch": 0.86, "learning_rate": 9.868914640373239e-06, "loss": 0.5945, "step": 7581 }, { "epoch": 0.86, "learning_rate": 9.852974500620737e-06, "loss": 0.6038, "step": 7582 }, { "epoch": 0.86, "learning_rate": 9.837046577341934e-06, "loss": 0.644, "step": 7583 }, { "epoch": 0.86, "learning_rate": 9.821130872695373e-06, "loss": 0.6922, "step": 7584 }, { "epoch": 0.86, "learning_rate": 9.805227388837857e-06, "loss": 0.6087, "step": 7585 }, { "epoch": 0.86, "learning_rate": 9.78933612792462e-06, "loss": 0.6953, "step": 7586 }, { "epoch": 0.86, "learning_rate": 9.773457092109173e-06, "loss": 0.6131, "step": 7587 }, { "epoch": 0.86, "learning_rate": 9.75759028354345e-06, "loss": 0.697, "step": 7588 }, { "epoch": 0.86, "learning_rate": 9.741735704377607e-06, "loss": 0.6474, "step": 7589 }, { "epoch": 0.86, "learning_rate": 9.725893356760262e-06, "loss": 0.6632, "step": 7590 }, { "epoch": 0.86, "learning_rate": 9.710063242838285e-06, "loss": 0.6895, "step": 7591 }, { "epoch": 0.86, "learning_rate": 9.694245364756982e-06, "loss": 0.6879, "step": 7592 }, { "epoch": 0.86, "learning_rate": 9.678439724659894e-06, "loss": 0.7035, "step": 7593 }, { "epoch": 0.86, "learning_rate": 9.662646324689017e-06, "loss": 0.6172, "step": 7594 }, { "epoch": 0.86, "learning_rate": 9.646865166984553e-06, "loss": 0.5917, "step": 7595 }, { "epoch": 0.86, "learning_rate": 9.63109625368519e-06, "loss": 0.6606, "step": 7596 }, { "epoch": 0.86, "learning_rate": 9.615339586927841e-06, "loss": 0.6439, "step": 7597 }, { "epoch": 0.86, "learning_rate": 9.59959516884783e-06, "loss": 0.6648, "step": 7598 }, { "epoch": 0.86, "learning_rate": 9.583863001578797e-06, "loss": 0.6066, "step": 7599 }, { "epoch": 0.86, "learning_rate": 9.568143087252711e-06, "loss": 0.6482, "step": 7600 }, { "epoch": 0.86, "learning_rate": 9.552435427999873e-06, "loss": 0.6845, "step": 7601 }, { "epoch": 0.86, "learning_rate": 9.536740025948987e-06, "loss": 0.6227, "step": 7602 }, { "epoch": 0.86, "learning_rate": 9.521056883227008e-06, "loss": 0.659, "step": 7603 }, { "epoch": 0.86, "learning_rate": 9.505386001959305e-06, "loss": 0.6259, "step": 7604 }, { "epoch": 0.86, "learning_rate": 9.489727384269531e-06, "loss": 0.6567, "step": 7605 }, { "epoch": 0.86, "learning_rate": 9.474081032279691e-06, "loss": 0.7055, "step": 7606 }, { "epoch": 0.86, "learning_rate": 9.458446948110166e-06, "loss": 0.6985, "step": 7607 }, { "epoch": 0.86, "learning_rate": 9.442825133879607e-06, "loss": 0.6464, "step": 7608 }, { "epoch": 0.86, "learning_rate": 9.427215591705075e-06, "loss": 0.7141, "step": 7609 }, { "epoch": 0.86, "learning_rate": 9.411618323701898e-06, "loss": 0.686, "step": 7610 }, { "epoch": 0.87, "learning_rate": 9.396033331983823e-06, "loss": 0.6641, "step": 7611 }, { "epoch": 0.87, "learning_rate": 9.380460618662812e-06, "loss": 0.5936, "step": 7612 }, { "epoch": 0.87, "learning_rate": 9.3649001858493e-06, "loss": 0.6554, "step": 7613 }, { "epoch": 0.87, "learning_rate": 9.349352035651948e-06, "loss": 0.6947, "step": 7614 }, { "epoch": 0.87, "learning_rate": 9.333816170177834e-06, "loss": 0.6623, "step": 7615 }, { "epoch": 0.87, "learning_rate": 9.318292591532318e-06, "loss": 0.7007, "step": 7616 }, { "epoch": 0.87, "learning_rate": 9.30278130181912e-06, "loss": 0.633, "step": 7617 }, { "epoch": 0.87, "learning_rate": 9.287282303140265e-06, "loss": 0.658, "step": 7618 }, { "epoch": 0.87, "learning_rate": 9.271795597596167e-06, "loss": 0.6954, "step": 7619 }, { "epoch": 0.87, "learning_rate": 9.256321187285499e-06, "loss": 0.7486, "step": 7620 }, { "epoch": 0.87, "learning_rate": 9.240859074305353e-06, "loss": 0.6523, "step": 7621 }, { "epoch": 0.87, "learning_rate": 9.225409260751106e-06, "loss": 0.746, "step": 7622 }, { "epoch": 0.87, "learning_rate": 9.209971748716451e-06, "loss": 0.6817, "step": 7623 }, { "epoch": 0.87, "learning_rate": 9.194546540293425e-06, "loss": 0.6448, "step": 7624 }, { "epoch": 0.87, "learning_rate": 9.179133637572457e-06, "loss": 0.6331, "step": 7625 }, { "epoch": 0.87, "learning_rate": 9.163733042642219e-06, "loss": 0.6389, "step": 7626 }, { "epoch": 0.87, "learning_rate": 9.148344757589789e-06, "loss": 0.6778, "step": 7627 }, { "epoch": 0.87, "learning_rate": 9.132968784500518e-06, "loss": 0.6123, "step": 7628 }, { "epoch": 0.87, "learning_rate": 9.117605125458118e-06, "loss": 0.6424, "step": 7629 }, { "epoch": 0.87, "learning_rate": 9.102253782544645e-06, "loss": 0.6835, "step": 7630 }, { "epoch": 0.87, "learning_rate": 9.086914757840448e-06, "loss": 0.6799, "step": 7631 }, { "epoch": 0.87, "learning_rate": 9.071588053424262e-06, "loss": 0.644, "step": 7632 }, { "epoch": 0.87, "learning_rate": 9.056273671373106e-06, "loss": 0.6479, "step": 7633 }, { "epoch": 0.87, "learning_rate": 9.040971613762328e-06, "loss": 0.6201, "step": 7634 }, { "epoch": 0.87, "learning_rate": 9.025681882665615e-06, "loss": 0.7101, "step": 7635 }, { "epoch": 0.87, "learning_rate": 9.01040448015501e-06, "loss": 0.5978, "step": 7636 }, { "epoch": 0.87, "learning_rate": 8.995139408300846e-06, "loss": 0.6497, "step": 7637 }, { "epoch": 0.87, "learning_rate": 8.979886669171833e-06, "loss": 0.7245, "step": 7638 }, { "epoch": 0.87, "learning_rate": 8.964646264834952e-06, "loss": 0.6872, "step": 7639 }, { "epoch": 0.87, "learning_rate": 8.949418197355553e-06, "loss": 0.6643, "step": 7640 }, { "epoch": 0.87, "learning_rate": 8.934202468797282e-06, "loss": 0.6724, "step": 7641 }, { "epoch": 0.87, "learning_rate": 8.918999081222156e-06, "loss": 0.6037, "step": 7642 }, { "epoch": 0.87, "learning_rate": 8.903808036690475e-06, "loss": 0.5901, "step": 7643 }, { "epoch": 0.87, "learning_rate": 8.888629337260912e-06, "loss": 0.64, "step": 7644 }, { "epoch": 0.87, "learning_rate": 8.873462984990421e-06, "loss": 0.6786, "step": 7645 }, { "epoch": 0.87, "learning_rate": 8.858308981934326e-06, "loss": 0.6729, "step": 7646 }, { "epoch": 0.87, "learning_rate": 8.843167330146207e-06, "loss": 0.6722, "step": 7647 }, { "epoch": 0.87, "learning_rate": 8.828038031678077e-06, "loss": 0.6747, "step": 7648 }, { "epoch": 0.87, "learning_rate": 8.812921088580172e-06, "loss": 0.6666, "step": 7649 }, { "epoch": 0.87, "learning_rate": 8.797816502901146e-06, "loss": 0.693, "step": 7650 }, { "epoch": 0.87, "learning_rate": 8.782724276687892e-06, "loss": 0.6843, "step": 7651 }, { "epoch": 0.87, "learning_rate": 8.767644411985654e-06, "loss": 0.6634, "step": 7652 }, { "epoch": 0.87, "learning_rate": 8.752576910838051e-06, "loss": 0.6769, "step": 7653 }, { "epoch": 0.87, "learning_rate": 8.737521775286961e-06, "loss": 0.6421, "step": 7654 }, { "epoch": 0.87, "learning_rate": 8.722479007372652e-06, "loss": 0.7031, "step": 7655 }, { "epoch": 0.87, "learning_rate": 8.70744860913364e-06, "loss": 0.6919, "step": 7656 }, { "epoch": 0.87, "learning_rate": 8.692430582606814e-06, "loss": 0.6192, "step": 7657 }, { "epoch": 0.87, "learning_rate": 8.67742492982736e-06, "loss": 0.6315, "step": 7658 }, { "epoch": 0.87, "learning_rate": 8.66243165282884e-06, "loss": 0.7079, "step": 7659 }, { "epoch": 0.87, "learning_rate": 8.64745075364306e-06, "loss": 0.6974, "step": 7660 }, { "epoch": 0.87, "learning_rate": 8.632482234300221e-06, "loss": 0.6664, "step": 7661 }, { "epoch": 0.87, "learning_rate": 8.61752609682881e-06, "loss": 0.5878, "step": 7662 }, { "epoch": 0.87, "learning_rate": 8.602582343255628e-06, "loss": 0.625, "step": 7663 }, { "epoch": 0.87, "learning_rate": 8.587650975605798e-06, "loss": 0.71, "step": 7664 }, { "epoch": 0.87, "learning_rate": 8.572731995902816e-06, "loss": 0.646, "step": 7665 }, { "epoch": 0.87, "learning_rate": 8.557825406168429e-06, "loss": 0.6898, "step": 7666 }, { "epoch": 0.87, "learning_rate": 8.542931208422756e-06, "loss": 0.6756, "step": 7667 }, { "epoch": 0.87, "learning_rate": 8.528049404684213e-06, "loss": 0.6601, "step": 7668 }, { "epoch": 0.87, "learning_rate": 8.513179996969545e-06, "loss": 0.6731, "step": 7669 }, { "epoch": 0.87, "learning_rate": 8.498322987293771e-06, "loss": 0.6987, "step": 7670 }, { "epoch": 0.87, "learning_rate": 8.48347837767034e-06, "loss": 0.6937, "step": 7671 }, { "epoch": 0.87, "learning_rate": 8.468646170110883e-06, "loss": 0.6214, "step": 7672 }, { "epoch": 0.87, "learning_rate": 8.453826366625483e-06, "loss": 0.7165, "step": 7673 }, { "epoch": 0.87, "learning_rate": 8.439018969222445e-06, "loss": 0.64, "step": 7674 }, { "epoch": 0.87, "learning_rate": 8.42422397990843e-06, "loss": 0.6623, "step": 7675 }, { "epoch": 0.87, "learning_rate": 8.4094414006884e-06, "loss": 0.6701, "step": 7676 }, { "epoch": 0.87, "learning_rate": 8.394671233565676e-06, "loss": 0.6505, "step": 7677 }, { "epoch": 0.87, "learning_rate": 8.379913480541835e-06, "loss": 0.6633, "step": 7678 }, { "epoch": 0.87, "learning_rate": 8.365168143616854e-06, "loss": 0.7206, "step": 7679 }, { "epoch": 0.87, "learning_rate": 8.350435224788956e-06, "loss": 0.6364, "step": 7680 }, { "epoch": 0.87, "learning_rate": 8.335714726054678e-06, "loss": 0.6909, "step": 7681 }, { "epoch": 0.87, "learning_rate": 8.321006649408946e-06, "loss": 0.6905, "step": 7682 }, { "epoch": 0.87, "learning_rate": 8.306310996844923e-06, "loss": 0.6969, "step": 7683 }, { "epoch": 0.87, "learning_rate": 8.29162777035416e-06, "loss": 0.6268, "step": 7684 }, { "epoch": 0.87, "learning_rate": 8.276956971926465e-06, "loss": 0.6354, "step": 7685 }, { "epoch": 0.87, "learning_rate": 8.262298603549979e-06, "loss": 0.701, "step": 7686 }, { "epoch": 0.87, "learning_rate": 8.247652667211147e-06, "loss": 0.7, "step": 7687 }, { "epoch": 0.87, "learning_rate": 8.233019164894785e-06, "loss": 0.6286, "step": 7688 }, { "epoch": 0.87, "learning_rate": 8.218398098583958e-06, "loss": 0.6259, "step": 7689 }, { "epoch": 0.87, "learning_rate": 8.203789470260103e-06, "loss": 0.5899, "step": 7690 }, { "epoch": 0.87, "learning_rate": 8.189193281902885e-06, "loss": 0.7038, "step": 7691 }, { "epoch": 0.87, "learning_rate": 8.174609535490397e-06, "loss": 0.5637, "step": 7692 }, { "epoch": 0.87, "learning_rate": 8.160038232998935e-06, "loss": 0.642, "step": 7693 }, { "epoch": 0.87, "learning_rate": 8.14547937640321e-06, "loss": 0.6605, "step": 7694 }, { "epoch": 0.87, "learning_rate": 8.130932967676153e-06, "loss": 0.6754, "step": 7695 }, { "epoch": 0.87, "learning_rate": 8.116399008789122e-06, "loss": 0.6027, "step": 7696 }, { "epoch": 0.87, "learning_rate": 8.10187750171163e-06, "loss": 0.6543, "step": 7697 }, { "epoch": 0.87, "learning_rate": 8.087368448411647e-06, "loss": 0.7039, "step": 7698 }, { "epoch": 0.88, "learning_rate": 8.07287185085538e-06, "loss": 0.6825, "step": 7699 }, { "epoch": 0.88, "learning_rate": 8.058387711007388e-06, "loss": 0.6696, "step": 7700 }, { "epoch": 0.88, "learning_rate": 8.04391603083049e-06, "loss": 0.652, "step": 7701 }, { "epoch": 0.88, "learning_rate": 8.029456812285873e-06, "loss": 0.6737, "step": 7702 }, { "epoch": 0.88, "learning_rate": 8.015010057333005e-06, "loss": 0.6933, "step": 7703 }, { "epoch": 0.88, "learning_rate": 8.000575767929653e-06, "loss": 0.588, "step": 7704 }, { "epoch": 0.88, "learning_rate": 7.986153946031939e-06, "loss": 0.6376, "step": 7705 }, { "epoch": 0.88, "learning_rate": 7.971744593594244e-06, "loss": 0.6461, "step": 7706 }, { "epoch": 0.88, "learning_rate": 7.957347712569307e-06, "loss": 0.6541, "step": 7707 }, { "epoch": 0.88, "learning_rate": 7.942963304908136e-06, "loss": 0.7044, "step": 7708 }, { "epoch": 0.88, "learning_rate": 7.928591372560079e-06, "loss": 0.5782, "step": 7709 }, { "epoch": 0.88, "learning_rate": 7.914231917472747e-06, "loss": 0.6571, "step": 7710 }, { "epoch": 0.88, "learning_rate": 7.89988494159214e-06, "loss": 0.6388, "step": 7711 }, { "epoch": 0.88, "learning_rate": 7.885550446862466e-06, "loss": 0.7128, "step": 7712 }, { "epoch": 0.88, "learning_rate": 7.871228435226374e-06, "loss": 0.6853, "step": 7713 }, { "epoch": 0.88, "learning_rate": 7.856918908624667e-06, "loss": 0.6362, "step": 7714 }, { "epoch": 0.88, "learning_rate": 7.842621868996568e-06, "loss": 0.658, "step": 7715 }, { "epoch": 0.88, "learning_rate": 7.828337318279556e-06, "loss": 0.673, "step": 7716 }, { "epoch": 0.88, "learning_rate": 7.814065258409453e-06, "loss": 0.6216, "step": 7717 }, { "epoch": 0.88, "learning_rate": 7.79980569132034e-06, "loss": 0.7298, "step": 7718 }, { "epoch": 0.88, "learning_rate": 7.7855586189447e-06, "loss": 0.6349, "step": 7719 }, { "epoch": 0.88, "learning_rate": 7.771324043213158e-06, "loss": 0.6639, "step": 7720 }, { "epoch": 0.88, "learning_rate": 7.757101966054825e-06, "loss": 0.6955, "step": 7721 }, { "epoch": 0.88, "learning_rate": 7.742892389396983e-06, "loss": 0.5979, "step": 7722 }, { "epoch": 0.88, "learning_rate": 7.728695315165324e-06, "loss": 0.6832, "step": 7723 }, { "epoch": 0.88, "learning_rate": 7.714510745283742e-06, "loss": 0.6411, "step": 7724 }, { "epoch": 0.88, "learning_rate": 7.700338681674546e-06, "loss": 0.6371, "step": 7725 }, { "epoch": 0.88, "learning_rate": 7.686179126258264e-06, "loss": 0.6783, "step": 7726 }, { "epoch": 0.88, "learning_rate": 7.67203208095375e-06, "loss": 0.661, "step": 7727 }, { "epoch": 0.88, "learning_rate": 7.657897547678205e-06, "loss": 0.6075, "step": 7728 }, { "epoch": 0.88, "learning_rate": 7.643775528347053e-06, "loss": 0.6906, "step": 7729 }, { "epoch": 0.88, "learning_rate": 7.629666024874138e-06, "loss": 0.6601, "step": 7730 }, { "epoch": 0.88, "learning_rate": 7.615569039171477e-06, "loss": 0.6339, "step": 7731 }, { "epoch": 0.88, "learning_rate": 7.601484573149487e-06, "loss": 0.556, "step": 7732 }, { "epoch": 0.88, "learning_rate": 7.587412628716839e-06, "loss": 0.6551, "step": 7733 }, { "epoch": 0.88, "learning_rate": 7.573353207780542e-06, "loss": 0.6824, "step": 7734 }, { "epoch": 0.88, "learning_rate": 7.559306312245862e-06, "loss": 0.6434, "step": 7735 }, { "epoch": 0.88, "learning_rate": 7.545271944016452e-06, "loss": 0.7702, "step": 7736 }, { "epoch": 0.88, "learning_rate": 7.531250104994137e-06, "loss": 0.6907, "step": 7737 }, { "epoch": 0.88, "learning_rate": 7.5172407970791725e-06, "loss": 0.678, "step": 7738 }, { "epoch": 0.88, "learning_rate": 7.503244022170019e-06, "loss": 0.6936, "step": 7739 }, { "epoch": 0.88, "learning_rate": 7.489259782163516e-06, "loss": 0.6993, "step": 7740 }, { "epoch": 0.88, "learning_rate": 7.4752880789547454e-06, "loss": 0.6865, "step": 7741 }, { "epoch": 0.88, "learning_rate": 7.46132891443716e-06, "loss": 0.6638, "step": 7742 }, { "epoch": 0.88, "learning_rate": 7.44738229050238e-06, "loss": 0.6692, "step": 7743 }, { "epoch": 0.88, "learning_rate": 7.433448209040495e-06, "loss": 0.6382, "step": 7744 }, { "epoch": 0.88, "learning_rate": 7.419526671939758e-06, "loss": 0.6155, "step": 7745 }, { "epoch": 0.88, "learning_rate": 7.405617681086818e-06, "loss": 0.6436, "step": 7746 }, { "epoch": 0.88, "learning_rate": 7.391721238366567e-06, "loss": 0.7083, "step": 7747 }, { "epoch": 0.88, "learning_rate": 7.377837345662186e-06, "loss": 0.6799, "step": 7748 }, { "epoch": 0.88, "learning_rate": 7.363966004855227e-06, "loss": 0.6684, "step": 7749 }, { "epoch": 0.88, "learning_rate": 7.350107217825464e-06, "loss": 0.6348, "step": 7750 }, { "epoch": 0.88, "learning_rate": 7.3362609864510155e-06, "loss": 0.622, "step": 7751 }, { "epoch": 0.88, "learning_rate": 7.322427312608282e-06, "loss": 0.6787, "step": 7752 }, { "epoch": 0.88, "learning_rate": 7.308606198171963e-06, "loss": 0.6481, "step": 7753 }, { "epoch": 0.88, "learning_rate": 7.294797645015039e-06, "loss": 0.7524, "step": 7754 }, { "epoch": 0.88, "learning_rate": 7.2810016550088456e-06, "loss": 0.7009, "step": 7755 }, { "epoch": 0.88, "learning_rate": 7.267218230022932e-06, "loss": 0.6578, "step": 7756 }, { "epoch": 0.88, "learning_rate": 7.253447371925226e-06, "loss": 0.6236, "step": 7757 }, { "epoch": 0.88, "learning_rate": 7.239689082581902e-06, "loss": 0.6419, "step": 7758 }, { "epoch": 0.88, "learning_rate": 7.225943363857468e-06, "loss": 0.6429, "step": 7759 }, { "epoch": 0.88, "learning_rate": 7.2122102176146455e-06, "loss": 0.6414, "step": 7760 }, { "epoch": 0.88, "learning_rate": 7.198489645714579e-06, "loss": 0.7657, "step": 7761 }, { "epoch": 0.88, "learning_rate": 7.184781650016581e-06, "loss": 0.6173, "step": 7762 }, { "epoch": 0.88, "learning_rate": 7.171086232378388e-06, "loss": 0.6847, "step": 7763 }, { "epoch": 0.88, "learning_rate": 7.157403394655904e-06, "loss": 0.7111, "step": 7764 }, { "epoch": 0.88, "learning_rate": 7.143733138703445e-06, "loss": 0.6743, "step": 7765 }, { "epoch": 0.88, "learning_rate": 7.130075466373498e-06, "loss": 0.6609, "step": 7766 }, { "epoch": 0.88, "learning_rate": 7.116430379516981e-06, "loss": 0.6645, "step": 7767 }, { "epoch": 0.88, "learning_rate": 7.1027978799829805e-06, "loss": 0.6932, "step": 7768 }, { "epoch": 0.88, "learning_rate": 7.089177969618988e-06, "loss": 0.5805, "step": 7769 }, { "epoch": 0.88, "learning_rate": 7.075570650270702e-06, "loss": 0.7191, "step": 7770 }, { "epoch": 0.88, "learning_rate": 7.061975923782161e-06, "loss": 0.6886, "step": 7771 }, { "epoch": 0.88, "learning_rate": 7.048393791995666e-06, "loss": 0.589, "step": 7772 }, { "epoch": 0.88, "learning_rate": 7.034824256751848e-06, "loss": 0.6991, "step": 7773 }, { "epoch": 0.88, "learning_rate": 7.021267319889602e-06, "loss": 0.6926, "step": 7774 }, { "epoch": 0.88, "learning_rate": 7.007722983246145e-06, "loss": 0.6845, "step": 7775 }, { "epoch": 0.88, "learning_rate": 6.994191248656956e-06, "loss": 0.631, "step": 7776 }, { "epoch": 0.88, "learning_rate": 6.9806721179558e-06, "loss": 0.6631, "step": 7777 }, { "epoch": 0.88, "learning_rate": 6.967165592974789e-06, "loss": 0.7403, "step": 7778 }, { "epoch": 0.88, "learning_rate": 6.95367167554426e-06, "loss": 0.7422, "step": 7779 }, { "epoch": 0.88, "learning_rate": 6.940190367492883e-06, "loss": 0.6508, "step": 7780 }, { "epoch": 0.88, "learning_rate": 6.926721670647596e-06, "loss": 0.6667, "step": 7781 }, { "epoch": 0.88, "learning_rate": 6.9132655868336725e-06, "loss": 0.6652, "step": 7782 }, { "epoch": 0.88, "learning_rate": 6.899822117874599e-06, "loss": 0.5896, "step": 7783 }, { "epoch": 0.88, "learning_rate": 6.886391265592229e-06, "loss": 0.6372, "step": 7784 }, { "epoch": 0.88, "learning_rate": 6.87297303180664e-06, "loss": 0.6451, "step": 7785 }, { "epoch": 0.88, "learning_rate": 6.859567418336277e-06, "loss": 0.6755, "step": 7786 }, { "epoch": 0.89, "learning_rate": 6.84617442699782e-06, "loss": 0.6841, "step": 7787 }, { "epoch": 0.89, "learning_rate": 6.832794059606229e-06, "loss": 0.6176, "step": 7788 }, { "epoch": 0.89, "learning_rate": 6.819426317974776e-06, "loss": 0.6728, "step": 7789 }, { "epoch": 0.89, "learning_rate": 6.806071203915032e-06, "loss": 0.6066, "step": 7790 }, { "epoch": 0.89, "learning_rate": 6.7927287192368405e-06, "loss": 0.6828, "step": 7791 }, { "epoch": 0.89, "learning_rate": 6.779398865748354e-06, "loss": 0.6813, "step": 7792 }, { "epoch": 0.89, "learning_rate": 6.766081645255984e-06, "loss": 0.6988, "step": 7793 }, { "epoch": 0.89, "learning_rate": 6.75277705956443e-06, "loss": 0.7124, "step": 7794 }, { "epoch": 0.89, "learning_rate": 6.739485110476707e-06, "loss": 0.5882, "step": 7795 }, { "epoch": 0.89, "learning_rate": 6.726205799794105e-06, "loss": 0.6384, "step": 7796 }, { "epoch": 0.89, "learning_rate": 6.712939129316176e-06, "loss": 0.6425, "step": 7797 }, { "epoch": 0.89, "learning_rate": 6.699685100840824e-06, "loss": 0.7035, "step": 7798 }, { "epoch": 0.89, "learning_rate": 6.68644371616417e-06, "loss": 0.6747, "step": 7799 }, { "epoch": 0.89, "learning_rate": 6.673214977080633e-06, "loss": 0.6303, "step": 7800 }, { "epoch": 0.89, "learning_rate": 6.659998885382979e-06, "loss": 0.6931, "step": 7801 }, { "epoch": 0.89, "learning_rate": 6.646795442862175e-06, "loss": 0.6858, "step": 7802 }, { "epoch": 0.89, "learning_rate": 6.633604651307556e-06, "loss": 0.6094, "step": 7803 }, { "epoch": 0.89, "learning_rate": 6.620426512506672e-06, "loss": 0.6551, "step": 7804 }, { "epoch": 0.89, "learning_rate": 6.607261028245393e-06, "loss": 0.6179, "step": 7805 }, { "epoch": 0.89, "learning_rate": 6.594108200307858e-06, "loss": 0.7023, "step": 7806 }, { "epoch": 0.89, "learning_rate": 6.58096803047652e-06, "loss": 0.6762, "step": 7807 }, { "epoch": 0.89, "learning_rate": 6.567840520532087e-06, "loss": 0.6347, "step": 7808 }, { "epoch": 0.89, "learning_rate": 6.5547256722535695e-06, "loss": 0.6086, "step": 7809 }, { "epoch": 0.89, "learning_rate": 6.5416234874182695e-06, "loss": 0.6321, "step": 7810 }, { "epoch": 0.89, "learning_rate": 6.5285339678017306e-06, "loss": 0.7235, "step": 7811 }, { "epoch": 0.89, "learning_rate": 6.515457115177803e-06, "loss": 0.6443, "step": 7812 }, { "epoch": 0.89, "learning_rate": 6.502392931318657e-06, "loss": 0.6472, "step": 7813 }, { "epoch": 0.89, "learning_rate": 6.489341417994687e-06, "loss": 0.6644, "step": 7814 }, { "epoch": 0.89, "learning_rate": 6.476302576974624e-06, "loss": 0.6833, "step": 7815 }, { "epoch": 0.89, "learning_rate": 6.4632764100254425e-06, "loss": 0.6744, "step": 7816 }, { "epoch": 0.89, "learning_rate": 6.450262918912409e-06, "loss": 0.605, "step": 7817 }, { "epoch": 0.89, "learning_rate": 6.437262105399055e-06, "loss": 0.659, "step": 7818 }, { "epoch": 0.89, "learning_rate": 6.4242739712472635e-06, "loss": 0.5952, "step": 7819 }, { "epoch": 0.89, "learning_rate": 6.411298518217101e-06, "loss": 0.6628, "step": 7820 }, { "epoch": 0.89, "learning_rate": 6.398335748067008e-06, "loss": 0.662, "step": 7821 }, { "epoch": 0.89, "learning_rate": 6.385385662553633e-06, "loss": 0.6401, "step": 7822 }, { "epoch": 0.89, "learning_rate": 6.372448263431941e-06, "loss": 0.6128, "step": 7823 }, { "epoch": 0.89, "learning_rate": 6.3595235524551825e-06, "loss": 0.6869, "step": 7824 }, { "epoch": 0.89, "learning_rate": 6.346611531374858e-06, "loss": 0.686, "step": 7825 }, { "epoch": 0.89, "learning_rate": 6.3337122019408e-06, "loss": 0.5863, "step": 7826 }, { "epoch": 0.89, "learning_rate": 6.320825565901079e-06, "loss": 0.7383, "step": 7827 }, { "epoch": 0.89, "learning_rate": 6.30795162500204e-06, "loss": 0.7471, "step": 7828 }, { "epoch": 0.89, "learning_rate": 6.295090380988322e-06, "loss": 0.6256, "step": 7829 }, { "epoch": 0.89, "learning_rate": 6.282241835602865e-06, "loss": 0.6355, "step": 7830 }, { "epoch": 0.89, "learning_rate": 6.269405990586852e-06, "loss": 0.5905, "step": 7831 }, { "epoch": 0.89, "learning_rate": 6.256582847679782e-06, "loss": 0.6799, "step": 7832 }, { "epoch": 0.89, "learning_rate": 6.243772408619386e-06, "loss": 0.6836, "step": 7833 }, { "epoch": 0.89, "learning_rate": 6.230974675141721e-06, "loss": 0.6176, "step": 7834 }, { "epoch": 0.89, "learning_rate": 6.2181896489810765e-06, "loss": 0.6761, "step": 7835 }, { "epoch": 0.89, "learning_rate": 6.205417331870067e-06, "loss": 0.6438, "step": 7836 }, { "epoch": 0.89, "learning_rate": 6.19265772553953e-06, "loss": 0.6731, "step": 7837 }, { "epoch": 0.89, "learning_rate": 6.179910831718661e-06, "loss": 0.5749, "step": 7838 }, { "epoch": 0.89, "learning_rate": 6.167176652134843e-06, "loss": 0.6293, "step": 7839 }, { "epoch": 0.89, "learning_rate": 6.154455188513797e-06, "loss": 0.7033, "step": 7840 }, { "epoch": 0.89, "learning_rate": 6.141746442579477e-06, "loss": 0.7012, "step": 7841 }, { "epoch": 0.89, "learning_rate": 6.129050416054161e-06, "loss": 0.6533, "step": 7842 }, { "epoch": 0.89, "learning_rate": 6.1163671106583605e-06, "loss": 0.7082, "step": 7843 }, { "epoch": 0.89, "learning_rate": 6.103696528110903e-06, "loss": 0.6586, "step": 7844 }, { "epoch": 0.89, "learning_rate": 6.091038670128868e-06, "loss": 0.7076, "step": 7845 }, { "epoch": 0.89, "learning_rate": 6.078393538427574e-06, "loss": 0.622, "step": 7846 }, { "epoch": 0.89, "learning_rate": 6.065761134720715e-06, "loss": 0.6375, "step": 7847 }, { "epoch": 0.89, "learning_rate": 6.053141460720157e-06, "loss": 0.6529, "step": 7848 }, { "epoch": 0.89, "learning_rate": 6.040534518136076e-06, "loss": 0.6641, "step": 7849 }, { "epoch": 0.89, "learning_rate": 6.027940308676971e-06, "loss": 0.7038, "step": 7850 }, { "epoch": 0.89, "learning_rate": 6.015358834049556e-06, "loss": 0.6416, "step": 7851 }, { "epoch": 0.89, "learning_rate": 6.0027900959588105e-06, "loss": 0.6193, "step": 7852 }, { "epoch": 0.89, "learning_rate": 5.990234096108049e-06, "loss": 0.6812, "step": 7853 }, { "epoch": 0.89, "learning_rate": 5.977690836198802e-06, "loss": 0.6571, "step": 7854 }, { "epoch": 0.89, "learning_rate": 5.965160317930929e-06, "loss": 0.6771, "step": 7855 }, { "epoch": 0.89, "learning_rate": 5.952642543002507e-06, "loss": 0.6488, "step": 7856 }, { "epoch": 0.89, "learning_rate": 5.940137513109911e-06, "loss": 0.5914, "step": 7857 }, { "epoch": 0.89, "learning_rate": 5.927645229947776e-06, "loss": 0.6657, "step": 7858 }, { "epoch": 0.89, "learning_rate": 5.915165695209046e-06, "loss": 0.6315, "step": 7859 }, { "epoch": 0.89, "learning_rate": 5.902698910584891e-06, "loss": 0.6726, "step": 7860 }, { "epoch": 0.89, "learning_rate": 5.8902448777648276e-06, "loss": 0.646, "step": 7861 }, { "epoch": 0.89, "learning_rate": 5.8778035984365045e-06, "loss": 0.679, "step": 7862 }, { "epoch": 0.89, "learning_rate": 5.8653750742860055e-06, "loss": 0.6827, "step": 7863 }, { "epoch": 0.89, "learning_rate": 5.852959306997552e-06, "loss": 0.614, "step": 7864 }, { "epoch": 0.89, "learning_rate": 5.840556298253741e-06, "loss": 0.6674, "step": 7865 }, { "epoch": 0.89, "learning_rate": 5.828166049735362e-06, "loss": 0.6896, "step": 7866 }, { "epoch": 0.89, "learning_rate": 5.815788563121538e-06, "loss": 0.6633, "step": 7867 }, { "epoch": 0.89, "learning_rate": 5.803423840089594e-06, "loss": 0.5979, "step": 7868 }, { "epoch": 0.89, "learning_rate": 5.791071882315191e-06, "loss": 0.6829, "step": 7869 }, { "epoch": 0.89, "learning_rate": 5.77873269147221e-06, "loss": 0.6752, "step": 7870 }, { "epoch": 0.89, "learning_rate": 5.7664062692328495e-06, "loss": 0.6863, "step": 7871 }, { "epoch": 0.89, "learning_rate": 5.7540926172675255e-06, "loss": 0.6193, "step": 7872 }, { "epoch": 0.89, "learning_rate": 5.741791737244973e-06, "loss": 0.6241, "step": 7873 }, { "epoch": 0.89, "learning_rate": 5.729503630832167e-06, "loss": 0.5721, "step": 7874 }, { "epoch": 0.9, "learning_rate": 5.717228299694344e-06, "loss": 0.6021, "step": 7875 }, { "epoch": 0.9, "learning_rate": 5.704965745495039e-06, "loss": 0.6649, "step": 7876 }, { "epoch": 0.9, "learning_rate": 5.692715969896012e-06, "loss": 0.704, "step": 7877 }, { "epoch": 0.9, "learning_rate": 5.680478974557379e-06, "loss": 0.6368, "step": 7878 }, { "epoch": 0.9, "learning_rate": 5.668254761137392e-06, "loss": 0.7448, "step": 7879 }, { "epoch": 0.9, "learning_rate": 5.6560433312926815e-06, "loss": 0.6696, "step": 7880 }, { "epoch": 0.9, "learning_rate": 5.64384468667809e-06, "loss": 0.6543, "step": 7881 }, { "epoch": 0.9, "learning_rate": 5.631658828946762e-06, "loss": 0.6646, "step": 7882 }, { "epoch": 0.9, "learning_rate": 5.619485759750065e-06, "loss": 0.6726, "step": 7883 }, { "epoch": 0.9, "learning_rate": 5.607325480737713e-06, "loss": 0.7097, "step": 7884 }, { "epoch": 0.9, "learning_rate": 5.595177993557555e-06, "loss": 0.6516, "step": 7885 }, { "epoch": 0.9, "learning_rate": 5.58304329985585e-06, "loss": 0.6708, "step": 7886 }, { "epoch": 0.9, "learning_rate": 5.570921401277018e-06, "loss": 0.6786, "step": 7887 }, { "epoch": 0.9, "learning_rate": 5.558812299463811e-06, "loss": 0.6238, "step": 7888 }, { "epoch": 0.9, "learning_rate": 5.546715996057195e-06, "loss": 0.7462, "step": 7889 }, { "epoch": 0.9, "learning_rate": 5.534632492696468e-06, "loss": 0.6588, "step": 7890 }, { "epoch": 0.9, "learning_rate": 5.522561791019109e-06, "loss": 0.6728, "step": 7891 }, { "epoch": 0.9, "learning_rate": 5.510503892660934e-06, "loss": 0.6149, "step": 7892 }, { "epoch": 0.9, "learning_rate": 5.4984587992559675e-06, "loss": 0.7039, "step": 7893 }, { "epoch": 0.9, "learning_rate": 5.48642651243656e-06, "loss": 0.7328, "step": 7894 }, { "epoch": 0.9, "learning_rate": 5.474407033833262e-06, "loss": 0.6869, "step": 7895 }, { "epoch": 0.9, "learning_rate": 5.462400365074949e-06, "loss": 0.682, "step": 7896 }, { "epoch": 0.9, "learning_rate": 5.45040650778873e-06, "loss": 0.6859, "step": 7897 }, { "epoch": 0.9, "learning_rate": 5.438425463599939e-06, "loss": 0.6829, "step": 7898 }, { "epoch": 0.9, "learning_rate": 5.426457234132265e-06, "loss": 0.6507, "step": 7899 }, { "epoch": 0.9, "learning_rate": 5.414501821007567e-06, "loss": 0.6598, "step": 7900 }, { "epoch": 0.9, "learning_rate": 5.402559225846071e-06, "loss": 0.6521, "step": 7901 }, { "epoch": 0.9, "learning_rate": 5.390629450266116e-06, "loss": 0.6478, "step": 7902 }, { "epoch": 0.9, "learning_rate": 5.378712495884463e-06, "loss": 0.6156, "step": 7903 }, { "epoch": 0.9, "learning_rate": 5.366808364316022e-06, "loss": 0.6521, "step": 7904 }, { "epoch": 0.9, "learning_rate": 5.354917057174036e-06, "loss": 0.6286, "step": 7905 }, { "epoch": 0.9, "learning_rate": 5.343038576069959e-06, "loss": 0.6635, "step": 7906 }, { "epoch": 0.9, "learning_rate": 5.331172922613581e-06, "loss": 0.6121, "step": 7907 }, { "epoch": 0.9, "learning_rate": 5.319320098412817e-06, "loss": 0.6874, "step": 7908 }, { "epoch": 0.9, "learning_rate": 5.307480105074003e-06, "loss": 0.586, "step": 7909 }, { "epoch": 0.9, "learning_rate": 5.295652944201612e-06, "loss": 0.6589, "step": 7910 }, { "epoch": 0.9, "learning_rate": 5.283838617398462e-06, "loss": 0.6595, "step": 7911 }, { "epoch": 0.9, "learning_rate": 5.272037126265572e-06, "loss": 0.6902, "step": 7912 }, { "epoch": 0.9, "learning_rate": 5.260248472402285e-06, "loss": 0.7309, "step": 7913 }, { "epoch": 0.9, "learning_rate": 5.248472657406123e-06, "loss": 0.6334, "step": 7914 }, { "epoch": 0.9, "learning_rate": 5.236709682872942e-06, "loss": 0.7214, "step": 7915 }, { "epoch": 0.9, "learning_rate": 5.224959550396791e-06, "loss": 0.6267, "step": 7916 }, { "epoch": 0.9, "learning_rate": 5.213222261570072e-06, "loss": 0.6643, "step": 7917 }, { "epoch": 0.9, "learning_rate": 5.201497817983348e-06, "loss": 0.665, "step": 7918 }, { "epoch": 0.9, "learning_rate": 5.189786221225479e-06, "loss": 0.7015, "step": 7919 }, { "epoch": 0.9, "learning_rate": 5.1780874728836086e-06, "loss": 0.6583, "step": 7920 }, { "epoch": 0.9, "learning_rate": 5.166401574543112e-06, "loss": 0.6918, "step": 7921 }, { "epoch": 0.9, "learning_rate": 5.154728527787634e-06, "loss": 0.6666, "step": 7922 }, { "epoch": 0.9, "learning_rate": 5.143068334199063e-06, "loss": 0.6587, "step": 7923 }, { "epoch": 0.9, "learning_rate": 5.131420995357572e-06, "loss": 0.6422, "step": 7924 }, { "epoch": 0.9, "learning_rate": 5.119786512841551e-06, "loss": 0.6499, "step": 7925 }, { "epoch": 0.9, "learning_rate": 5.108164888227695e-06, "loss": 0.6969, "step": 7926 }, { "epoch": 0.9, "learning_rate": 5.096556123090923e-06, "loss": 0.6429, "step": 7927 }, { "epoch": 0.9, "learning_rate": 5.084960219004431e-06, "loss": 0.6011, "step": 7928 }, { "epoch": 0.9, "learning_rate": 5.073377177539651e-06, "loss": 0.5951, "step": 7929 }, { "epoch": 0.9, "learning_rate": 5.061807000266305e-06, "loss": 0.6827, "step": 7930 }, { "epoch": 0.9, "learning_rate": 5.050249688752329e-06, "loss": 0.6459, "step": 7931 }, { "epoch": 0.9, "learning_rate": 5.038705244563946e-06, "loss": 0.5982, "step": 7932 }, { "epoch": 0.9, "learning_rate": 5.027173669265628e-06, "loss": 0.6592, "step": 7933 }, { "epoch": 0.9, "learning_rate": 5.015654964420102e-06, "loss": 0.6128, "step": 7934 }, { "epoch": 0.9, "learning_rate": 5.004149131588354e-06, "loss": 0.6534, "step": 7935 }, { "epoch": 0.9, "learning_rate": 4.992656172329624e-06, "loss": 0.6914, "step": 7936 }, { "epoch": 0.9, "learning_rate": 4.981176088201378e-06, "loss": 0.5755, "step": 7937 }, { "epoch": 0.9, "learning_rate": 4.969708880759416e-06, "loss": 0.6525, "step": 7938 }, { "epoch": 0.9, "learning_rate": 4.9582545515576835e-06, "loss": 0.6254, "step": 7939 }, { "epoch": 0.9, "learning_rate": 4.946813102148495e-06, "loss": 0.6783, "step": 7940 }, { "epoch": 0.9, "learning_rate": 4.935384534082333e-06, "loss": 0.6502, "step": 7941 }, { "epoch": 0.9, "learning_rate": 4.923968848907956e-06, "loss": 0.667, "step": 7942 }, { "epoch": 0.9, "learning_rate": 4.912566048172418e-06, "loss": 0.6703, "step": 7943 }, { "epoch": 0.9, "learning_rate": 4.901176133420971e-06, "loss": 0.6544, "step": 7944 }, { "epoch": 0.9, "learning_rate": 4.889799106197146e-06, "loss": 0.6798, "step": 7945 }, { "epoch": 0.9, "learning_rate": 4.878434968042733e-06, "loss": 0.6919, "step": 7946 }, { "epoch": 0.9, "learning_rate": 4.867083720497778e-06, "loss": 0.6887, "step": 7947 }, { "epoch": 0.9, "learning_rate": 4.8557453651005395e-06, "loss": 0.6316, "step": 7948 }, { "epoch": 0.9, "learning_rate": 4.844419903387587e-06, "loss": 0.5757, "step": 7949 }, { "epoch": 0.9, "learning_rate": 4.833107336893694e-06, "loss": 0.7253, "step": 7950 }, { "epoch": 0.9, "learning_rate": 4.821807667151945e-06, "loss": 0.6989, "step": 7951 }, { "epoch": 0.9, "learning_rate": 4.810520895693593e-06, "loss": 0.6818, "step": 7952 }, { "epoch": 0.9, "learning_rate": 4.799247024048248e-06, "loss": 0.6531, "step": 7953 }, { "epoch": 0.9, "learning_rate": 4.787986053743643e-06, "loss": 0.6587, "step": 7954 }, { "epoch": 0.9, "learning_rate": 4.776737986305891e-06, "loss": 0.681, "step": 7955 }, { "epoch": 0.9, "learning_rate": 4.765502823259249e-06, "loss": 0.6902, "step": 7956 }, { "epoch": 0.9, "learning_rate": 4.7542805661263345e-06, "loss": 0.6879, "step": 7957 }, { "epoch": 0.9, "learning_rate": 4.743071216427908e-06, "loss": 0.6789, "step": 7958 }, { "epoch": 0.9, "learning_rate": 4.731874775683054e-06, "loss": 0.6496, "step": 7959 }, { "epoch": 0.9, "learning_rate": 4.720691245409059e-06, "loss": 0.7177, "step": 7960 }, { "epoch": 0.9, "learning_rate": 4.709520627121522e-06, "loss": 0.6328, "step": 7961 }, { "epoch": 0.9, "learning_rate": 4.698362922334209e-06, "loss": 0.6258, "step": 7962 }, { "epoch": 0.91, "learning_rate": 4.687218132559224e-06, "loss": 0.6576, "step": 7963 }, { "epoch": 0.91, "learning_rate": 4.676086259306845e-06, "loss": 0.6834, "step": 7964 }, { "epoch": 0.91, "learning_rate": 4.664967304085655e-06, "loss": 0.5728, "step": 7965 }, { "epoch": 0.91, "learning_rate": 4.653861268402437e-06, "loss": 0.6722, "step": 7966 }, { "epoch": 0.91, "learning_rate": 4.642768153762289e-06, "loss": 0.6354, "step": 7967 }, { "epoch": 0.91, "learning_rate": 4.631687961668474e-06, "loss": 0.6364, "step": 7968 }, { "epoch": 0.91, "learning_rate": 4.62062069362259e-06, "loss": 0.6124, "step": 7969 }, { "epoch": 0.91, "learning_rate": 4.609566351124417e-06, "loss": 0.6545, "step": 7970 }, { "epoch": 0.91, "learning_rate": 4.598524935672011e-06, "loss": 0.6447, "step": 7971 }, { "epoch": 0.91, "learning_rate": 4.5874964487616854e-06, "loss": 0.5649, "step": 7972 }, { "epoch": 0.91, "learning_rate": 4.576480891887969e-06, "loss": 0.6712, "step": 7973 }, { "epoch": 0.91, "learning_rate": 4.565478266543699e-06, "loss": 0.6751, "step": 7974 }, { "epoch": 0.91, "learning_rate": 4.554488574219884e-06, "loss": 0.6989, "step": 7975 }, { "epoch": 0.91, "learning_rate": 4.543511816405832e-06, "loss": 0.7533, "step": 7976 }, { "epoch": 0.91, "learning_rate": 4.5325479945890645e-06, "loss": 0.6784, "step": 7977 }, { "epoch": 0.91, "learning_rate": 4.521597110255393e-06, "loss": 0.695, "step": 7978 }, { "epoch": 0.91, "learning_rate": 4.510659164888831e-06, "loss": 0.5939, "step": 7979 }, { "epoch": 0.91, "learning_rate": 4.499734159971669e-06, "loss": 0.6414, "step": 7980 }, { "epoch": 0.91, "learning_rate": 4.488822096984446e-06, "loss": 0.6429, "step": 7981 }, { "epoch": 0.91, "learning_rate": 4.477922977405913e-06, "loss": 0.693, "step": 7982 }, { "epoch": 0.91, "learning_rate": 4.467036802713076e-06, "loss": 0.6773, "step": 7983 }, { "epoch": 0.91, "learning_rate": 4.4561635743812334e-06, "loss": 0.6206, "step": 7984 }, { "epoch": 0.91, "learning_rate": 4.445303293883873e-06, "loss": 0.6687, "step": 7985 }, { "epoch": 0.91, "learning_rate": 4.434455962692763e-06, "loss": 0.6766, "step": 7986 }, { "epoch": 0.91, "learning_rate": 4.423621582277904e-06, "loss": 0.6841, "step": 7987 }, { "epoch": 0.91, "learning_rate": 4.412800154107532e-06, "loss": 0.64, "step": 7988 }, { "epoch": 0.91, "learning_rate": 4.401991679648121e-06, "loss": 0.6304, "step": 7989 }, { "epoch": 0.91, "learning_rate": 4.391196160364441e-06, "loss": 0.677, "step": 7990 }, { "epoch": 0.91, "learning_rate": 4.380413597719435e-06, "loss": 0.612, "step": 7991 }, { "epoch": 0.91, "learning_rate": 4.369643993174355e-06, "loss": 0.652, "step": 7992 }, { "epoch": 0.91, "learning_rate": 4.358887348188656e-06, "loss": 0.6824, "step": 7993 }, { "epoch": 0.91, "learning_rate": 4.348143664220039e-06, "loss": 0.687, "step": 7994 }, { "epoch": 0.91, "learning_rate": 4.337412942724483e-06, "loss": 0.6985, "step": 7995 }, { "epoch": 0.91, "learning_rate": 4.326695185156149e-06, "loss": 0.6648, "step": 7996 }, { "epoch": 0.91, "learning_rate": 4.315990392967517e-06, "loss": 0.6881, "step": 7997 }, { "epoch": 0.91, "learning_rate": 4.305298567609262e-06, "loss": 0.6346, "step": 7998 }, { "epoch": 0.91, "learning_rate": 4.29461971053029e-06, "loss": 0.7203, "step": 7999 }, { "epoch": 0.91, "learning_rate": 4.283953823177767e-06, "loss": 0.6541, "step": 8000 }, { "epoch": 0.91, "learning_rate": 4.273300906997136e-06, "loss": 0.6886, "step": 8001 }, { "epoch": 0.91, "learning_rate": 4.262660963432019e-06, "loss": 0.6436, "step": 8002 }, { "epoch": 0.91, "learning_rate": 4.2520339939243316e-06, "loss": 0.5792, "step": 8003 }, { "epoch": 0.91, "learning_rate": 4.24141999991422e-06, "loss": 0.7138, "step": 8004 }, { "epoch": 0.91, "learning_rate": 4.230818982840035e-06, "loss": 0.6716, "step": 8005 }, { "epoch": 0.91, "learning_rate": 4.220230944138404e-06, "loss": 0.6444, "step": 8006 }, { "epoch": 0.91, "learning_rate": 4.209655885244202e-06, "loss": 0.6627, "step": 8007 }, { "epoch": 0.91, "learning_rate": 4.199093807590504e-06, "loss": 0.6808, "step": 8008 }, { "epoch": 0.91, "learning_rate": 4.188544712608711e-06, "loss": 0.6491, "step": 8009 }, { "epoch": 0.91, "learning_rate": 4.178008601728345e-06, "loss": 0.6481, "step": 8010 }, { "epoch": 0.91, "learning_rate": 4.167485476377253e-06, "loss": 0.5822, "step": 8011 }, { "epoch": 0.91, "learning_rate": 4.156975337981505e-06, "loss": 0.6723, "step": 8012 }, { "epoch": 0.91, "learning_rate": 4.146478187965408e-06, "loss": 0.642, "step": 8013 }, { "epoch": 0.91, "learning_rate": 4.135994027751478e-06, "loss": 0.6837, "step": 8014 }, { "epoch": 0.91, "learning_rate": 4.125522858760544e-06, "loss": 0.6754, "step": 8015 }, { "epoch": 0.91, "learning_rate": 4.1150646824116065e-06, "loss": 0.6574, "step": 8016 }, { "epoch": 0.91, "learning_rate": 4.10461950012192e-06, "loss": 0.6459, "step": 8017 }, { "epoch": 0.91, "learning_rate": 4.094187313306997e-06, "loss": 0.7087, "step": 8018 }, { "epoch": 0.91, "learning_rate": 4.083768123380582e-06, "loss": 0.7034, "step": 8019 }, { "epoch": 0.91, "learning_rate": 4.073361931754638e-06, "loss": 0.6376, "step": 8020 }, { "epoch": 0.91, "learning_rate": 4.062968739839412e-06, "loss": 0.6586, "step": 8021 }, { "epoch": 0.91, "learning_rate": 4.052588549043335e-06, "loss": 0.6499, "step": 8022 }, { "epoch": 0.91, "learning_rate": 4.042221360773102e-06, "loss": 0.7126, "step": 8023 }, { "epoch": 0.91, "learning_rate": 4.031867176433668e-06, "loss": 0.6513, "step": 8024 }, { "epoch": 0.91, "learning_rate": 4.021525997428166e-06, "loss": 0.6779, "step": 8025 }, { "epoch": 0.91, "learning_rate": 4.011197825158053e-06, "loss": 0.6534, "step": 8026 }, { "epoch": 0.91, "learning_rate": 4.0008826610229315e-06, "loss": 0.6824, "step": 8027 }, { "epoch": 0.91, "learning_rate": 3.990580506420705e-06, "loss": 0.6903, "step": 8028 }, { "epoch": 0.91, "learning_rate": 3.980291362747479e-06, "loss": 0.7159, "step": 8029 }, { "epoch": 0.91, "learning_rate": 3.970015231397628e-06, "loss": 0.7163, "step": 8030 }, { "epoch": 0.91, "learning_rate": 3.959752113763726e-06, "loss": 0.604, "step": 8031 }, { "epoch": 0.91, "learning_rate": 3.949502011236628e-06, "loss": 0.6083, "step": 8032 }, { "epoch": 0.91, "learning_rate": 3.939264925205355e-06, "loss": 0.6825, "step": 8033 }, { "epoch": 0.91, "learning_rate": 3.929040857057254e-06, "loss": 0.7033, "step": 8034 }, { "epoch": 0.91, "learning_rate": 3.918829808177826e-06, "loss": 0.6788, "step": 8035 }, { "epoch": 0.91, "learning_rate": 3.908631779950878e-06, "loss": 0.6573, "step": 8036 }, { "epoch": 0.91, "learning_rate": 3.898446773758391e-06, "loss": 0.686, "step": 8037 }, { "epoch": 0.91, "learning_rate": 3.888274790980629e-06, "loss": 0.7195, "step": 8038 }, { "epoch": 0.91, "learning_rate": 3.878115832996065e-06, "loss": 0.6279, "step": 8039 }, { "epoch": 0.91, "learning_rate": 3.867969901181401e-06, "loss": 0.6664, "step": 8040 }, { "epoch": 0.91, "learning_rate": 3.85783699691159e-06, "loss": 0.6231, "step": 8041 }, { "epoch": 0.91, "learning_rate": 3.847717121559824e-06, "loss": 0.6717, "step": 8042 }, { "epoch": 0.91, "learning_rate": 3.8376102764975056e-06, "loss": 0.5736, "step": 8043 }, { "epoch": 0.91, "learning_rate": 3.827516463094305e-06, "loss": 0.6681, "step": 8044 }, { "epoch": 0.91, "learning_rate": 3.817435682718096e-06, "loss": 0.6345, "step": 8045 }, { "epoch": 0.91, "learning_rate": 3.807367936734996e-06, "loss": 0.629, "step": 8046 }, { "epoch": 0.91, "learning_rate": 3.797313226509369e-06, "loss": 0.6374, "step": 8047 }, { "epoch": 0.91, "learning_rate": 3.7872715534037816e-06, "loss": 0.6892, "step": 8048 }, { "epoch": 0.91, "learning_rate": 3.777242918779089e-06, "loss": 0.6281, "step": 8049 }, { "epoch": 0.91, "learning_rate": 3.7672273239942932e-06, "loss": 0.6176, "step": 8050 }, { "epoch": 0.92, "learning_rate": 3.75722477040672e-06, "loss": 0.6916, "step": 8051 }, { "epoch": 0.92, "learning_rate": 3.747235259371873e-06, "loss": 0.6189, "step": 8052 }, { "epoch": 0.92, "learning_rate": 3.737258792243503e-06, "loss": 0.6196, "step": 8053 }, { "epoch": 0.92, "learning_rate": 3.7272953703735845e-06, "loss": 0.6466, "step": 8054 }, { "epoch": 0.92, "learning_rate": 3.7173449951123706e-06, "loss": 0.6578, "step": 8055 }, { "epoch": 0.92, "learning_rate": 3.7074076678082603e-06, "loss": 0.7213, "step": 8056 }, { "epoch": 0.92, "learning_rate": 3.697483389807965e-06, "loss": 0.5926, "step": 8057 }, { "epoch": 0.92, "learning_rate": 3.6875721624563654e-06, "loss": 0.6843, "step": 8058 }, { "epoch": 0.92, "learning_rate": 3.6776739870966305e-06, "loss": 0.6644, "step": 8059 }, { "epoch": 0.92, "learning_rate": 3.6677888650701208e-06, "loss": 0.6287, "step": 8060 }, { "epoch": 0.92, "learning_rate": 3.657916797716454e-06, "loss": 0.6771, "step": 8061 }, { "epoch": 0.92, "learning_rate": 3.648057786373449e-06, "loss": 0.6433, "step": 8062 }, { "epoch": 0.92, "learning_rate": 3.6382118323771807e-06, "loss": 0.672, "step": 8063 }, { "epoch": 0.92, "learning_rate": 3.628378937061927e-06, "loss": 0.7126, "step": 8064 }, { "epoch": 0.92, "learning_rate": 3.618559101760244e-06, "loss": 0.6687, "step": 8065 }, { "epoch": 0.92, "learning_rate": 3.6087523278028666e-06, "loss": 0.5847, "step": 8066 }, { "epoch": 0.92, "learning_rate": 3.598958616518788e-06, "loss": 0.664, "step": 8067 }, { "epoch": 0.92, "learning_rate": 3.5891779692352358e-06, "loss": 0.6409, "step": 8068 }, { "epoch": 0.92, "learning_rate": 3.579410387277626e-06, "loss": 0.6749, "step": 8069 }, { "epoch": 0.92, "learning_rate": 3.569655871969668e-06, "loss": 0.5936, "step": 8070 }, { "epoch": 0.92, "learning_rate": 3.5599144246332484e-06, "loss": 0.685, "step": 8071 }, { "epoch": 0.92, "learning_rate": 3.5501860465885218e-06, "loss": 0.6491, "step": 8072 }, { "epoch": 0.92, "learning_rate": 3.5404707391538115e-06, "loss": 0.6605, "step": 8073 }, { "epoch": 0.92, "learning_rate": 3.5307685036457427e-06, "loss": 0.6741, "step": 8074 }, { "epoch": 0.92, "learning_rate": 3.5210793413791078e-06, "loss": 0.6091, "step": 8075 }, { "epoch": 0.92, "learning_rate": 3.5114032536669895e-06, "loss": 0.6383, "step": 8076 }, { "epoch": 0.92, "learning_rate": 3.501740241820628e-06, "loss": 0.6856, "step": 8077 }, { "epoch": 0.92, "learning_rate": 3.492090307149576e-06, "loss": 0.6593, "step": 8078 }, { "epoch": 0.92, "learning_rate": 3.482453450961509e-06, "loss": 0.6692, "step": 8079 }, { "epoch": 0.92, "learning_rate": 3.4728296745624276e-06, "loss": 0.7502, "step": 8080 }, { "epoch": 0.92, "learning_rate": 3.4632189792564884e-06, "loss": 0.7163, "step": 8081 }, { "epoch": 0.92, "learning_rate": 3.453621366346138e-06, "loss": 0.7154, "step": 8082 }, { "epoch": 0.92, "learning_rate": 3.444036837131992e-06, "loss": 0.6309, "step": 8083 }, { "epoch": 0.92, "learning_rate": 3.4344653929129555e-06, "loss": 0.6765, "step": 8084 }, { "epoch": 0.92, "learning_rate": 3.424907034986069e-06, "loss": 0.6447, "step": 8085 }, { "epoch": 0.92, "learning_rate": 3.4153617646466963e-06, "loss": 0.6805, "step": 8086 }, { "epoch": 0.92, "learning_rate": 3.405829583188369e-06, "loss": 0.6654, "step": 8087 }, { "epoch": 0.92, "learning_rate": 3.3963104919028656e-06, "loss": 0.753, "step": 8088 }, { "epoch": 0.92, "learning_rate": 3.3868044920801976e-06, "loss": 0.627, "step": 8089 }, { "epoch": 0.92, "learning_rate": 3.377311585008569e-06, "loss": 0.6551, "step": 8090 }, { "epoch": 0.92, "learning_rate": 3.36783177197445e-06, "loss": 0.6359, "step": 8091 }, { "epoch": 0.92, "learning_rate": 3.3583650542625023e-06, "loss": 0.6887, "step": 8092 }, { "epoch": 0.92, "learning_rate": 3.3489114331556547e-06, "loss": 0.6092, "step": 8093 }, { "epoch": 0.92, "learning_rate": 3.339470909935016e-06, "loss": 0.6015, "step": 8094 }, { "epoch": 0.92, "learning_rate": 3.3300434858799524e-06, "loss": 0.6734, "step": 8095 }, { "epoch": 0.92, "learning_rate": 3.3206291622680187e-06, "loss": 0.6478, "step": 8096 }, { "epoch": 0.92, "learning_rate": 3.311227940375039e-06, "loss": 0.6706, "step": 8097 }, { "epoch": 0.92, "learning_rate": 3.3018398214750277e-06, "loss": 0.6508, "step": 8098 }, { "epoch": 0.92, "learning_rate": 3.2924648068402565e-06, "loss": 0.6068, "step": 8099 }, { "epoch": 0.92, "learning_rate": 3.2831028977411748e-06, "loss": 0.6315, "step": 8100 }, { "epoch": 0.92, "learning_rate": 3.273754095446524e-06, "loss": 0.6682, "step": 8101 }, { "epoch": 0.92, "learning_rate": 3.2644184012231684e-06, "loss": 0.6524, "step": 8102 }, { "epoch": 0.92, "learning_rate": 3.2550958163363064e-06, "loss": 0.7113, "step": 8103 }, { "epoch": 0.92, "learning_rate": 3.245786342049273e-06, "loss": 0.7404, "step": 8104 }, { "epoch": 0.92, "learning_rate": 3.2364899796236916e-06, "loss": 0.6618, "step": 8105 }, { "epoch": 0.92, "learning_rate": 3.2272067303193656e-06, "loss": 0.6805, "step": 8106 }, { "epoch": 0.92, "learning_rate": 3.217936595394333e-06, "loss": 0.6807, "step": 8107 }, { "epoch": 0.92, "learning_rate": 3.208679576104845e-06, "loss": 0.6642, "step": 8108 }, { "epoch": 0.92, "learning_rate": 3.19943567370542e-06, "loss": 0.7181, "step": 8109 }, { "epoch": 0.92, "learning_rate": 3.1902048894487223e-06, "loss": 0.5984, "step": 8110 }, { "epoch": 0.92, "learning_rate": 3.1809872245857296e-06, "loss": 0.6851, "step": 8111 }, { "epoch": 0.92, "learning_rate": 3.1717826803655757e-06, "loss": 0.6312, "step": 8112 }, { "epoch": 0.92, "learning_rate": 3.1625912580356074e-06, "loss": 0.6861, "step": 8113 }, { "epoch": 0.92, "learning_rate": 3.153412958841462e-06, "loss": 0.6976, "step": 8114 }, { "epoch": 0.92, "learning_rate": 3.1442477840269323e-06, "loss": 0.6188, "step": 8115 }, { "epoch": 0.92, "learning_rate": 3.135095734834059e-06, "loss": 0.6226, "step": 8116 }, { "epoch": 0.92, "learning_rate": 3.125956812503117e-06, "loss": 0.6317, "step": 8117 }, { "epoch": 0.92, "learning_rate": 3.116831018272581e-06, "loss": 0.7378, "step": 8118 }, { "epoch": 0.92, "learning_rate": 3.1077183533791297e-06, "loss": 0.6859, "step": 8119 }, { "epoch": 0.92, "learning_rate": 3.0986188190577194e-06, "loss": 0.6189, "step": 8120 }, { "epoch": 0.92, "learning_rate": 3.089532416541474e-06, "loss": 0.7004, "step": 8121 }, { "epoch": 0.92, "learning_rate": 3.080459147061776e-06, "loss": 0.681, "step": 8122 }, { "epoch": 0.92, "learning_rate": 3.071399011848186e-06, "loss": 0.6735, "step": 8123 }, { "epoch": 0.92, "learning_rate": 3.062352012128533e-06, "loss": 0.6531, "step": 8124 }, { "epoch": 0.92, "learning_rate": 3.0533181491288034e-06, "loss": 0.6425, "step": 8125 }, { "epoch": 0.92, "learning_rate": 3.0442974240732834e-06, "loss": 0.6777, "step": 8126 }, { "epoch": 0.92, "learning_rate": 3.0352898381844073e-06, "loss": 0.6365, "step": 8127 }, { "epoch": 0.92, "learning_rate": 3.0262953926828872e-06, "loss": 0.6201, "step": 8128 }, { "epoch": 0.92, "learning_rate": 3.017314088787604e-06, "loss": 0.6683, "step": 8129 }, { "epoch": 0.92, "learning_rate": 3.0083459277156724e-06, "loss": 0.7051, "step": 8130 }, { "epoch": 0.92, "learning_rate": 2.9993909106824425e-06, "loss": 0.6212, "step": 8131 }, { "epoch": 0.92, "learning_rate": 2.9904490389014773e-06, "loss": 0.6934, "step": 8132 }, { "epoch": 0.92, "learning_rate": 2.9815203135845515e-06, "loss": 0.6541, "step": 8133 }, { "epoch": 0.92, "learning_rate": 2.9726047359416644e-06, "loss": 0.6913, "step": 8134 }, { "epoch": 0.92, "learning_rate": 2.9637023071810153e-06, "loss": 0.6933, "step": 8135 }, { "epoch": 0.92, "learning_rate": 2.9548130285090625e-06, "loss": 0.5574, "step": 8136 }, { "epoch": 0.92, "learning_rate": 2.9459369011304193e-06, "loss": 0.6633, "step": 8137 }, { "epoch": 0.92, "learning_rate": 2.9370739262479908e-06, "loss": 0.6648, "step": 8138 }, { "epoch": 0.93, "learning_rate": 2.928224105062838e-06, "loss": 0.6463, "step": 8139 }, { "epoch": 0.93, "learning_rate": 2.9193874387742905e-06, "loss": 0.6664, "step": 8140 }, { "epoch": 0.93, "learning_rate": 2.910563928579835e-06, "loss": 0.616, "step": 8141 }, { "epoch": 0.93, "learning_rate": 2.9017535756752256e-06, "loss": 0.6005, "step": 8142 }, { "epoch": 0.93, "learning_rate": 2.89295638125443e-06, "loss": 0.6597, "step": 8143 }, { "epoch": 0.93, "learning_rate": 2.8841723465095836e-06, "loss": 0.6664, "step": 8144 }, { "epoch": 0.93, "learning_rate": 2.875401472631112e-06, "loss": 0.696, "step": 8145 }, { "epoch": 0.93, "learning_rate": 2.866643760807608e-06, "loss": 0.6777, "step": 8146 }, { "epoch": 0.93, "learning_rate": 2.8578992122258896e-06, "loss": 0.6427, "step": 8147 }, { "epoch": 0.93, "learning_rate": 2.8491678280709864e-06, "loss": 0.6488, "step": 8148 }, { "epoch": 0.93, "learning_rate": 2.8404496095261525e-06, "loss": 0.7175, "step": 8149 }, { "epoch": 0.93, "learning_rate": 2.831744557772864e-06, "loss": 0.6594, "step": 8150 }, { "epoch": 0.93, "learning_rate": 2.8230526739908116e-06, "loss": 0.6705, "step": 8151 }, { "epoch": 0.93, "learning_rate": 2.8143739593578856e-06, "loss": 0.6146, "step": 8152 }, { "epoch": 0.93, "learning_rate": 2.805708415050201e-06, "loss": 0.6726, "step": 8153 }, { "epoch": 0.93, "learning_rate": 2.7970560422420743e-06, "loss": 0.6271, "step": 8154 }, { "epoch": 0.93, "learning_rate": 2.7884168421060898e-06, "loss": 0.6644, "step": 8155 }, { "epoch": 0.93, "learning_rate": 2.779790815812966e-06, "loss": 0.6802, "step": 8156 }, { "epoch": 0.93, "learning_rate": 2.7711779645317016e-06, "loss": 0.6601, "step": 8157 }, { "epoch": 0.93, "learning_rate": 2.762578289429485e-06, "loss": 0.71, "step": 8158 }, { "epoch": 0.93, "learning_rate": 2.7539917916717172e-06, "loss": 0.6504, "step": 8159 }, { "epoch": 0.93, "learning_rate": 2.7454184724220012e-06, "loss": 0.6921, "step": 8160 }, { "epoch": 0.93, "learning_rate": 2.736858332842196e-06, "loss": 0.6498, "step": 8161 }, { "epoch": 0.93, "learning_rate": 2.7283113740923183e-06, "loss": 0.616, "step": 8162 }, { "epoch": 0.93, "learning_rate": 2.719777597330664e-06, "loss": 0.6219, "step": 8163 }, { "epoch": 0.93, "learning_rate": 2.711257003713685e-06, "loss": 0.6989, "step": 8164 }, { "epoch": 0.93, "learning_rate": 2.702749594396059e-06, "loss": 0.6437, "step": 8165 }, { "epoch": 0.93, "learning_rate": 2.694255370530718e-06, "loss": 0.7129, "step": 8166 }, { "epoch": 0.93, "learning_rate": 2.685774333268731e-06, "loss": 0.6838, "step": 8167 }, { "epoch": 0.93, "learning_rate": 2.6773064837594676e-06, "loss": 0.7077, "step": 8168 }, { "epoch": 0.93, "learning_rate": 2.668851823150453e-06, "loss": 0.6276, "step": 8169 }, { "epoch": 0.93, "learning_rate": 2.660410352587428e-06, "loss": 0.7083, "step": 8170 }, { "epoch": 0.93, "learning_rate": 2.6519820732143542e-06, "loss": 0.6482, "step": 8171 }, { "epoch": 0.93, "learning_rate": 2.64356698617344e-06, "loss": 0.6258, "step": 8172 }, { "epoch": 0.93, "learning_rate": 2.63516509260503e-06, "loss": 0.6408, "step": 8173 }, { "epoch": 0.93, "learning_rate": 2.6267763936477674e-06, "loss": 0.6416, "step": 8174 }, { "epoch": 0.93, "learning_rate": 2.618400890438444e-06, "loss": 0.6809, "step": 8175 }, { "epoch": 0.93, "learning_rate": 2.6100385841120843e-06, "loss": 0.6558, "step": 8176 }, { "epoch": 0.93, "learning_rate": 2.6016894758019162e-06, "loss": 0.7639, "step": 8177 }, { "epoch": 0.93, "learning_rate": 2.5933535666394226e-06, "loss": 0.6215, "step": 8178 }, { "epoch": 0.93, "learning_rate": 2.5850308577542115e-06, "loss": 0.6523, "step": 8179 }, { "epoch": 0.93, "learning_rate": 2.5767213502742138e-06, "loss": 0.64, "step": 8180 }, { "epoch": 0.93, "learning_rate": 2.568425045325451e-06, "loss": 0.6563, "step": 8181 }, { "epoch": 0.93, "learning_rate": 2.560141944032257e-06, "loss": 0.6219, "step": 8182 }, { "epoch": 0.93, "learning_rate": 2.551872047517112e-06, "loss": 0.6588, "step": 8183 }, { "epoch": 0.93, "learning_rate": 2.5436153569007415e-06, "loss": 0.6325, "step": 8184 }, { "epoch": 0.93, "learning_rate": 2.5353718733020615e-06, "loss": 0.7302, "step": 8185 }, { "epoch": 0.93, "learning_rate": 2.527141597838212e-06, "loss": 0.7028, "step": 8186 }, { "epoch": 0.93, "learning_rate": 2.5189245316245334e-06, "loss": 0.6137, "step": 8187 }, { "epoch": 0.93, "learning_rate": 2.5107206757745804e-06, "loss": 0.6378, "step": 8188 }, { "epoch": 0.93, "learning_rate": 2.502530031400119e-06, "loss": 0.6332, "step": 8189 }, { "epoch": 0.93, "learning_rate": 2.494352599611116e-06, "loss": 0.6482, "step": 8190 }, { "epoch": 0.93, "learning_rate": 2.486188381515764e-06, "loss": 0.7414, "step": 8191 }, { "epoch": 0.93, "learning_rate": 2.4780373782204434e-06, "loss": 0.6741, "step": 8192 }, { "epoch": 0.93, "learning_rate": 2.4698995908297715e-06, "loss": 0.654, "step": 8193 }, { "epoch": 0.93, "learning_rate": 2.461775020446533e-06, "loss": 0.6523, "step": 8194 }, { "epoch": 0.93, "learning_rate": 2.4536636681717794e-06, "loss": 0.6599, "step": 8195 }, { "epoch": 0.93, "learning_rate": 2.44556553510471e-06, "loss": 0.6646, "step": 8196 }, { "epoch": 0.93, "learning_rate": 2.4374806223427914e-06, "loss": 0.6777, "step": 8197 }, { "epoch": 0.93, "learning_rate": 2.4294089309816248e-06, "loss": 0.6658, "step": 8198 }, { "epoch": 0.93, "learning_rate": 2.421350462115102e-06, "loss": 0.6829, "step": 8199 }, { "epoch": 0.93, "learning_rate": 2.413305216835271e-06, "loss": 0.7671, "step": 8200 }, { "epoch": 0.93, "learning_rate": 2.405273196232394e-06, "loss": 0.6651, "step": 8201 }, { "epoch": 0.93, "learning_rate": 2.397254401394955e-06, "loss": 0.6342, "step": 8202 }, { "epoch": 0.93, "learning_rate": 2.389248833409663e-06, "loss": 0.6609, "step": 8203 }, { "epoch": 0.93, "learning_rate": 2.381256493361361e-06, "loss": 0.5783, "step": 8204 }, { "epoch": 0.93, "learning_rate": 2.3732773823331835e-06, "loss": 0.6781, "step": 8205 }, { "epoch": 0.93, "learning_rate": 2.3653115014064197e-06, "loss": 0.6739, "step": 8206 }, { "epoch": 0.93, "learning_rate": 2.357358851660596e-06, "loss": 0.6684, "step": 8207 }, { "epoch": 0.93, "learning_rate": 2.3494194341734167e-06, "loss": 0.6471, "step": 8208 }, { "epoch": 0.93, "learning_rate": 2.341493250020843e-06, "loss": 0.7089, "step": 8209 }, { "epoch": 0.93, "learning_rate": 2.333580300276983e-06, "loss": 0.627, "step": 8210 }, { "epoch": 0.93, "learning_rate": 2.325680586014178e-06, "loss": 0.6503, "step": 8211 }, { "epoch": 0.93, "learning_rate": 2.317794108302973e-06, "loss": 0.6546, "step": 8212 }, { "epoch": 0.93, "learning_rate": 2.3099208682121453e-06, "loss": 0.6715, "step": 8213 }, { "epoch": 0.93, "learning_rate": 2.3020608668086197e-06, "loss": 0.6663, "step": 8214 }, { "epoch": 0.93, "learning_rate": 2.294214105157588e-06, "loss": 0.657, "step": 8215 }, { "epoch": 0.93, "learning_rate": 2.2863805843224118e-06, "loss": 0.589, "step": 8216 }, { "epoch": 0.93, "learning_rate": 2.2785603053646633e-06, "loss": 0.6395, "step": 8217 }, { "epoch": 0.93, "learning_rate": 2.270753269344139e-06, "loss": 0.6833, "step": 8218 }, { "epoch": 0.93, "learning_rate": 2.2629594773188156e-06, "loss": 0.6435, "step": 8219 }, { "epoch": 0.93, "learning_rate": 2.2551789303449034e-06, "loss": 0.6642, "step": 8220 }, { "epoch": 0.93, "learning_rate": 2.24741162947677e-06, "loss": 0.6354, "step": 8221 }, { "epoch": 0.93, "learning_rate": 2.2396575757670403e-06, "loss": 0.6262, "step": 8222 }, { "epoch": 0.93, "learning_rate": 2.231916770266507e-06, "loss": 0.5966, "step": 8223 }, { "epoch": 0.93, "learning_rate": 2.224189214024197e-06, "loss": 0.6491, "step": 8224 }, { "epoch": 0.93, "learning_rate": 2.216474908087318e-06, "loss": 0.6852, "step": 8225 }, { "epoch": 0.93, "learning_rate": 2.208773853501311e-06, "loss": 0.6071, "step": 8226 }, { "epoch": 0.94, "learning_rate": 2.201086051309764e-06, "loss": 0.6068, "step": 8227 }, { "epoch": 0.94, "learning_rate": 2.193411502554543e-06, "loss": 0.6623, "step": 8228 }, { "epoch": 0.94, "learning_rate": 2.1857502082756496e-06, "loss": 0.632, "step": 8229 }, { "epoch": 0.94, "learning_rate": 2.1781021695113535e-06, "loss": 0.6509, "step": 8230 }, { "epoch": 0.94, "learning_rate": 2.17046738729807e-06, "loss": 0.6532, "step": 8231 }, { "epoch": 0.94, "learning_rate": 2.1628458626704706e-06, "loss": 0.663, "step": 8232 }, { "epoch": 0.94, "learning_rate": 2.1552375966613635e-06, "loss": 0.6745, "step": 8233 }, { "epoch": 0.94, "learning_rate": 2.147642590301846e-06, "loss": 0.6128, "step": 8234 }, { "epoch": 0.94, "learning_rate": 2.140060844621128e-06, "loss": 0.7048, "step": 8235 }, { "epoch": 0.94, "learning_rate": 2.1324923606466984e-06, "loss": 0.7035, "step": 8236 }, { "epoch": 0.94, "learning_rate": 2.124937139404204e-06, "loss": 0.6925, "step": 8237 }, { "epoch": 0.94, "learning_rate": 2.117395181917503e-06, "loss": 0.5964, "step": 8238 }, { "epoch": 0.94, "learning_rate": 2.109866489208667e-06, "loss": 0.7118, "step": 8239 }, { "epoch": 0.94, "learning_rate": 2.102351062297958e-06, "loss": 0.6315, "step": 8240 }, { "epoch": 0.94, "learning_rate": 2.094848902203861e-06, "loss": 0.6357, "step": 8241 }, { "epoch": 0.94, "learning_rate": 2.087360009943029e-06, "loss": 0.6435, "step": 8242 }, { "epoch": 0.94, "learning_rate": 2.0798843865303617e-06, "loss": 0.6903, "step": 8243 }, { "epoch": 0.94, "learning_rate": 2.0724220329789047e-06, "loss": 0.6635, "step": 8244 }, { "epoch": 0.94, "learning_rate": 2.0649729502999484e-06, "loss": 0.628, "step": 8245 }, { "epoch": 0.94, "learning_rate": 2.057537139502974e-06, "loss": 0.6149, "step": 8246 }, { "epoch": 0.94, "learning_rate": 2.050114601595654e-06, "loss": 0.6816, "step": 8247 }, { "epoch": 0.94, "learning_rate": 2.0427053375838722e-06, "loss": 0.6862, "step": 8248 }, { "epoch": 0.94, "learning_rate": 2.0353093484717366e-06, "loss": 0.5728, "step": 8249 }, { "epoch": 0.94, "learning_rate": 2.027926635261479e-06, "loss": 0.6676, "step": 8250 }, { "epoch": 0.94, "learning_rate": 2.020557198953632e-06, "loss": 0.6545, "step": 8251 }, { "epoch": 0.94, "learning_rate": 2.0132010405468525e-06, "loss": 0.6797, "step": 8252 }, { "epoch": 0.94, "learning_rate": 2.0058581610380545e-06, "loss": 0.67, "step": 8253 }, { "epoch": 0.94, "learning_rate": 1.998528561422297e-06, "loss": 0.6455, "step": 8254 }, { "epoch": 0.94, "learning_rate": 1.991212242692875e-06, "loss": 0.6675, "step": 8255 }, { "epoch": 0.94, "learning_rate": 1.9839092058412723e-06, "loss": 0.7128, "step": 8256 }, { "epoch": 0.94, "learning_rate": 1.976619451857198e-06, "loss": 0.6819, "step": 8257 }, { "epoch": 0.94, "learning_rate": 1.969342981728506e-06, "loss": 0.661, "step": 8258 }, { "epoch": 0.94, "learning_rate": 1.9620797964413073e-06, "loss": 0.6327, "step": 8259 }, { "epoch": 0.94, "learning_rate": 1.9548298969798815e-06, "loss": 0.7005, "step": 8260 }, { "epoch": 0.94, "learning_rate": 1.94759328432671e-06, "loss": 0.6503, "step": 8261 }, { "epoch": 0.94, "learning_rate": 1.9403699594624957e-06, "loss": 0.614, "step": 8262 }, { "epoch": 0.94, "learning_rate": 1.93315992336609e-06, "loss": 0.6177, "step": 8263 }, { "epoch": 0.94, "learning_rate": 1.9259631770146113e-06, "loss": 0.6422, "step": 8264 }, { "epoch": 0.94, "learning_rate": 1.9187797213833347e-06, "loss": 0.6636, "step": 8265 }, { "epoch": 0.94, "learning_rate": 1.911609557445726e-06, "loss": 0.6781, "step": 8266 }, { "epoch": 0.94, "learning_rate": 1.9044526861734745e-06, "loss": 0.6302, "step": 8267 }, { "epoch": 0.94, "learning_rate": 1.8973091085364713e-06, "loss": 0.6003, "step": 8268 }, { "epoch": 0.94, "learning_rate": 1.8901788255027753e-06, "loss": 0.6644, "step": 8269 }, { "epoch": 0.94, "learning_rate": 1.8830618380386688e-06, "loss": 0.7012, "step": 8270 }, { "epoch": 0.94, "learning_rate": 1.8759581471086362e-06, "loss": 0.6682, "step": 8271 }, { "epoch": 0.94, "learning_rate": 1.868867753675352e-06, "loss": 0.6893, "step": 8272 }, { "epoch": 0.94, "learning_rate": 1.861790658699658e-06, "loss": 0.6709, "step": 8273 }, { "epoch": 0.94, "learning_rate": 1.8547268631406434e-06, "loss": 0.6231, "step": 8274 }, { "epoch": 0.94, "learning_rate": 1.8476763679555754e-06, "loss": 0.6711, "step": 8275 }, { "epoch": 0.94, "learning_rate": 1.8406391740999118e-06, "loss": 0.6574, "step": 8276 }, { "epoch": 0.94, "learning_rate": 1.8336152825273234e-06, "loss": 0.6587, "step": 8277 }, { "epoch": 0.94, "learning_rate": 1.8266046941896597e-06, "loss": 0.6392, "step": 8278 }, { "epoch": 0.94, "learning_rate": 1.819607410036972e-06, "loss": 0.6986, "step": 8279 }, { "epoch": 0.94, "learning_rate": 1.8126234310175238e-06, "loss": 0.6387, "step": 8280 }, { "epoch": 0.94, "learning_rate": 1.8056527580777471e-06, "loss": 0.7065, "step": 8281 }, { "epoch": 0.94, "learning_rate": 1.7986953921623085e-06, "loss": 0.5649, "step": 8282 }, { "epoch": 0.94, "learning_rate": 1.7917513342140425e-06, "loss": 0.6779, "step": 8283 }, { "epoch": 0.94, "learning_rate": 1.784820585173974e-06, "loss": 0.6566, "step": 8284 }, { "epoch": 0.94, "learning_rate": 1.7779031459813633e-06, "loss": 0.6307, "step": 8285 }, { "epoch": 0.94, "learning_rate": 1.770999017573638e-06, "loss": 0.6398, "step": 8286 }, { "epoch": 0.94, "learning_rate": 1.7641082008864052e-06, "loss": 0.6235, "step": 8287 }, { "epoch": 0.94, "learning_rate": 1.7572306968535179e-06, "loss": 0.6463, "step": 8288 }, { "epoch": 0.94, "learning_rate": 1.7503665064069863e-06, "loss": 0.6313, "step": 8289 }, { "epoch": 0.94, "learning_rate": 1.7435156304769995e-06, "loss": 0.637, "step": 8290 }, { "epoch": 0.94, "learning_rate": 1.736678069992015e-06, "loss": 0.647, "step": 8291 }, { "epoch": 0.94, "learning_rate": 1.7298538258786023e-06, "loss": 0.6738, "step": 8292 }, { "epoch": 0.94, "learning_rate": 1.7230428990615888e-06, "loss": 0.6283, "step": 8293 }, { "epoch": 0.94, "learning_rate": 1.716245290463958e-06, "loss": 0.6394, "step": 8294 }, { "epoch": 0.94, "learning_rate": 1.7094610010069067e-06, "loss": 0.6663, "step": 8295 }, { "epoch": 0.94, "learning_rate": 1.7026900316098215e-06, "loss": 0.6538, "step": 8296 }, { "epoch": 0.94, "learning_rate": 1.6959323831902906e-06, "loss": 0.6008, "step": 8297 }, { "epoch": 0.94, "learning_rate": 1.6891880566640816e-06, "loss": 0.7192, "step": 8298 }, { "epoch": 0.94, "learning_rate": 1.6824570529451855e-06, "loss": 0.6726, "step": 8299 }, { "epoch": 0.94, "learning_rate": 1.6757393729457504e-06, "loss": 0.642, "step": 8300 }, { "epoch": 0.94, "learning_rate": 1.6690350175761483e-06, "loss": 0.7026, "step": 8301 }, { "epoch": 0.94, "learning_rate": 1.6623439877449186e-06, "loss": 0.6681, "step": 8302 }, { "epoch": 0.94, "learning_rate": 1.6556662843588366e-06, "loss": 0.5935, "step": 8303 }, { "epoch": 0.94, "learning_rate": 1.6490019083228226e-06, "loss": 0.6376, "step": 8304 }, { "epoch": 0.94, "learning_rate": 1.6423508605400318e-06, "loss": 0.5599, "step": 8305 }, { "epoch": 0.94, "learning_rate": 1.6357131419117878e-06, "loss": 0.6488, "step": 8306 }, { "epoch": 0.94, "learning_rate": 1.6290887533376154e-06, "loss": 0.6708, "step": 8307 }, { "epoch": 0.94, "learning_rate": 1.62247769571523e-06, "loss": 0.7205, "step": 8308 }, { "epoch": 0.94, "learning_rate": 1.615879969940559e-06, "loss": 0.6274, "step": 8309 }, { "epoch": 0.94, "learning_rate": 1.6092955769076767e-06, "loss": 0.6355, "step": 8310 }, { "epoch": 0.94, "learning_rate": 1.6027245175089133e-06, "loss": 0.693, "step": 8311 }, { "epoch": 0.94, "learning_rate": 1.5961667926347568e-06, "loss": 0.6293, "step": 8312 }, { "epoch": 0.94, "learning_rate": 1.5896224031738739e-06, "loss": 0.7003, "step": 8313 }, { "epoch": 0.94, "learning_rate": 1.583091350013155e-06, "loss": 0.7272, "step": 8314 }, { "epoch": 0.95, "learning_rate": 1.576573634037659e-06, "loss": 0.5947, "step": 8315 }, { "epoch": 0.95, "learning_rate": 1.5700692561306575e-06, "loss": 0.6529, "step": 8316 }, { "epoch": 0.95, "learning_rate": 1.5635782171736113e-06, "loss": 0.633, "step": 8317 }, { "epoch": 0.95, "learning_rate": 1.5571005180461729e-06, "loss": 0.643, "step": 8318 }, { "epoch": 0.95, "learning_rate": 1.550636159626151e-06, "loss": 0.6796, "step": 8319 }, { "epoch": 0.95, "learning_rate": 1.5441851427896004e-06, "loss": 0.6534, "step": 8320 }, { "epoch": 0.95, "learning_rate": 1.537747468410744e-06, "loss": 0.6033, "step": 8321 }, { "epoch": 0.95, "learning_rate": 1.5313231373619952e-06, "loss": 0.5973, "step": 8322 }, { "epoch": 0.95, "learning_rate": 1.5249121505139686e-06, "loss": 0.5987, "step": 8323 }, { "epoch": 0.95, "learning_rate": 1.5185145087354468e-06, "loss": 0.6142, "step": 8324 }, { "epoch": 0.95, "learning_rate": 1.5121302128934256e-06, "loss": 0.7024, "step": 8325 }, { "epoch": 0.95, "learning_rate": 1.5057592638531015e-06, "loss": 0.67, "step": 8326 }, { "epoch": 0.95, "learning_rate": 1.4994016624778285e-06, "loss": 0.6693, "step": 8327 }, { "epoch": 0.95, "learning_rate": 1.4930574096291838e-06, "loss": 0.6662, "step": 8328 }, { "epoch": 0.95, "learning_rate": 1.4867265061669245e-06, "loss": 0.6486, "step": 8329 }, { "epoch": 0.95, "learning_rate": 1.4804089529489862e-06, "loss": 0.6696, "step": 8330 }, { "epoch": 0.95, "learning_rate": 1.4741047508315065e-06, "loss": 0.6604, "step": 8331 }, { "epoch": 0.95, "learning_rate": 1.4678139006688242e-06, "loss": 0.6014, "step": 8332 }, { "epoch": 0.95, "learning_rate": 1.461536403313446e-06, "loss": 0.5961, "step": 8333 }, { "epoch": 0.95, "learning_rate": 1.4552722596160917e-06, "loss": 0.7052, "step": 8334 }, { "epoch": 0.95, "learning_rate": 1.4490214704256599e-06, "loss": 0.7288, "step": 8335 }, { "epoch": 0.95, "learning_rate": 1.4427840365892176e-06, "loss": 0.6099, "step": 8336 }, { "epoch": 0.95, "learning_rate": 1.4365599589520773e-06, "loss": 0.6958, "step": 8337 }, { "epoch": 0.95, "learning_rate": 1.4303492383576865e-06, "loss": 0.683, "step": 8338 }, { "epoch": 0.95, "learning_rate": 1.4241518756477169e-06, "loss": 0.6411, "step": 8339 }, { "epoch": 0.95, "learning_rate": 1.4179678716620181e-06, "loss": 0.6221, "step": 8340 }, { "epoch": 0.95, "learning_rate": 1.4117972272386204e-06, "loss": 0.7501, "step": 8341 }, { "epoch": 0.95, "learning_rate": 1.4056399432137546e-06, "loss": 0.635, "step": 8342 }, { "epoch": 0.95, "learning_rate": 1.399496020421831e-06, "loss": 0.6141, "step": 8343 }, { "epoch": 0.95, "learning_rate": 1.3933654596954725e-06, "loss": 0.5833, "step": 8344 }, { "epoch": 0.95, "learning_rate": 1.3872482618654704e-06, "loss": 0.66, "step": 8345 }, { "epoch": 0.95, "learning_rate": 1.3811444277608165e-06, "loss": 0.7165, "step": 8346 }, { "epoch": 0.95, "learning_rate": 1.3750539582086719e-06, "loss": 0.6813, "step": 8347 }, { "epoch": 0.95, "learning_rate": 1.3689768540343983e-06, "loss": 0.7011, "step": 8348 }, { "epoch": 0.95, "learning_rate": 1.3629131160615594e-06, "loss": 0.6348, "step": 8349 }, { "epoch": 0.95, "learning_rate": 1.3568627451118864e-06, "loss": 0.6875, "step": 8350 }, { "epoch": 0.95, "learning_rate": 1.3508257420053349e-06, "loss": 0.6153, "step": 8351 }, { "epoch": 0.95, "learning_rate": 1.3448021075599838e-06, "loss": 0.6677, "step": 8352 }, { "epoch": 0.95, "learning_rate": 1.3387918425921686e-06, "loss": 0.6388, "step": 8353 }, { "epoch": 0.95, "learning_rate": 1.3327949479163604e-06, "loss": 0.6866, "step": 8354 }, { "epoch": 0.95, "learning_rate": 1.3268114243452645e-06, "loss": 0.6197, "step": 8355 }, { "epoch": 0.95, "learning_rate": 1.3208412726897323e-06, "loss": 0.637, "step": 8356 }, { "epoch": 0.95, "learning_rate": 1.314884493758839e-06, "loss": 0.6327, "step": 8357 }, { "epoch": 0.95, "learning_rate": 1.3089410883598163e-06, "loss": 0.686, "step": 8358 }, { "epoch": 0.95, "learning_rate": 1.303011057298109e-06, "loss": 0.721, "step": 8359 }, { "epoch": 0.95, "learning_rate": 1.29709440137733e-06, "loss": 0.5868, "step": 8360 }, { "epoch": 0.95, "learning_rate": 1.2911911213992933e-06, "loss": 0.6946, "step": 8361 }, { "epoch": 0.95, "learning_rate": 1.2853012181639923e-06, "loss": 0.6347, "step": 8362 }, { "epoch": 0.95, "learning_rate": 1.2794246924696107e-06, "loss": 0.6179, "step": 8363 }, { "epoch": 0.95, "learning_rate": 1.2735615451125227e-06, "loss": 0.6779, "step": 8364 }, { "epoch": 0.95, "learning_rate": 1.2677117768872815e-06, "loss": 0.6166, "step": 8365 }, { "epoch": 0.95, "learning_rate": 1.2618753885866307e-06, "loss": 0.6375, "step": 8366 }, { "epoch": 0.95, "learning_rate": 1.2560523810014934e-06, "loss": 0.6525, "step": 8367 }, { "epoch": 0.95, "learning_rate": 1.250242754921016e-06, "loss": 0.643, "step": 8368 }, { "epoch": 0.95, "learning_rate": 1.2444465111324687e-06, "loss": 0.675, "step": 8369 }, { "epoch": 0.95, "learning_rate": 1.2386636504213677e-06, "loss": 0.6567, "step": 8370 }, { "epoch": 0.95, "learning_rate": 1.232894173571375e-06, "loss": 0.6713, "step": 8371 }, { "epoch": 0.95, "learning_rate": 1.227138081364354e-06, "loss": 0.675, "step": 8372 }, { "epoch": 0.95, "learning_rate": 1.2213953745803586e-06, "loss": 0.7357, "step": 8373 }, { "epoch": 0.95, "learning_rate": 1.215666053997644e-06, "loss": 0.681, "step": 8374 }, { "epoch": 0.95, "learning_rate": 1.209950120392589e-06, "loss": 0.6897, "step": 8375 }, { "epoch": 0.95, "learning_rate": 1.2042475745398408e-06, "loss": 0.689, "step": 8376 }, { "epoch": 0.95, "learning_rate": 1.19855841721217e-06, "loss": 0.6404, "step": 8377 }, { "epoch": 0.95, "learning_rate": 1.19288264918056e-06, "loss": 0.679, "step": 8378 }, { "epoch": 0.95, "learning_rate": 1.1872202712141733e-06, "loss": 0.6451, "step": 8379 }, { "epoch": 0.95, "learning_rate": 1.181571284080374e-06, "loss": 0.6808, "step": 8380 }, { "epoch": 0.95, "learning_rate": 1.1759356885446825e-06, "loss": 0.6386, "step": 8381 }, { "epoch": 0.95, "learning_rate": 1.170313485370822e-06, "loss": 0.66, "step": 8382 }, { "epoch": 0.95, "learning_rate": 1.1647046753206936e-06, "loss": 0.7014, "step": 8383 }, { "epoch": 0.95, "learning_rate": 1.1591092591543894e-06, "loss": 0.619, "step": 8384 }, { "epoch": 0.95, "learning_rate": 1.1535272376302032e-06, "loss": 0.6621, "step": 8385 }, { "epoch": 0.95, "learning_rate": 1.1479586115045627e-06, "loss": 0.7016, "step": 8386 }, { "epoch": 0.95, "learning_rate": 1.1424033815321423e-06, "loss": 0.6032, "step": 8387 }, { "epoch": 0.95, "learning_rate": 1.1368615484657397e-06, "loss": 0.6169, "step": 8388 }, { "epoch": 0.95, "learning_rate": 1.1313331130564097e-06, "loss": 0.7299, "step": 8389 }, { "epoch": 0.95, "learning_rate": 1.1258180760533089e-06, "loss": 0.6971, "step": 8390 }, { "epoch": 0.95, "learning_rate": 1.1203164382038611e-06, "loss": 0.6412, "step": 8391 }, { "epoch": 0.95, "learning_rate": 1.1148282002535927e-06, "loss": 0.6632, "step": 8392 }, { "epoch": 0.95, "learning_rate": 1.109353362946286e-06, "loss": 0.6786, "step": 8393 }, { "epoch": 0.95, "learning_rate": 1.103891927023848e-06, "loss": 0.662, "step": 8394 }, { "epoch": 0.95, "learning_rate": 1.0984438932264196e-06, "loss": 0.6466, "step": 8395 }, { "epoch": 0.95, "learning_rate": 1.0930092622922883e-06, "loss": 0.6486, "step": 8396 }, { "epoch": 0.95, "learning_rate": 1.0875880349579648e-06, "loss": 0.6731, "step": 8397 }, { "epoch": 0.95, "learning_rate": 1.0821802119580837e-06, "loss": 0.5569, "step": 8398 }, { "epoch": 0.95, "learning_rate": 1.0767857940255255e-06, "loss": 0.6863, "step": 8399 }, { "epoch": 0.95, "learning_rate": 1.0714047818913054e-06, "loss": 0.6858, "step": 8400 }, { "epoch": 0.95, "learning_rate": 1.0660371762846622e-06, "loss": 0.6585, "step": 8401 }, { "epoch": 0.95, "learning_rate": 1.0606829779329808e-06, "loss": 0.7023, "step": 8402 }, { "epoch": 0.96, "learning_rate": 1.0553421875618697e-06, "loss": 0.7058, "step": 8403 }, { "epoch": 0.96, "learning_rate": 1.0500148058950831e-06, "loss": 0.6795, "step": 8404 }, { "epoch": 0.96, "learning_rate": 1.0447008336545772e-06, "loss": 0.7043, "step": 8405 }, { "epoch": 0.96, "learning_rate": 1.0394002715604755e-06, "loss": 0.6463, "step": 8406 }, { "epoch": 0.96, "learning_rate": 1.0341131203311038e-06, "loss": 0.6656, "step": 8407 }, { "epoch": 0.96, "learning_rate": 1.0288393806829776e-06, "loss": 0.7312, "step": 8408 }, { "epoch": 0.96, "learning_rate": 1.0235790533307477e-06, "loss": 0.5978, "step": 8409 }, { "epoch": 0.96, "learning_rate": 1.0183321389873102e-06, "loss": 0.6562, "step": 8410 }, { "epoch": 0.96, "learning_rate": 1.0130986383636853e-06, "loss": 0.684, "step": 8411 }, { "epoch": 0.96, "learning_rate": 1.0078785521691282e-06, "loss": 0.6981, "step": 8412 }, { "epoch": 0.96, "learning_rate": 1.0026718811110281e-06, "loss": 0.692, "step": 8413 }, { "epoch": 0.96, "learning_rate": 9.974786258949986e-07, "loss": 0.6456, "step": 8414 }, { "epoch": 0.96, "learning_rate": 9.922987872247879e-07, "loss": 0.6726, "step": 8415 }, { "epoch": 0.96, "learning_rate": 9.8713236580239e-07, "loss": 0.6391, "step": 8416 }, { "epoch": 0.96, "learning_rate": 9.819793623279116e-07, "loss": 0.6753, "step": 8417 }, { "epoch": 0.96, "learning_rate": 9.768397774996828e-07, "loss": 0.5923, "step": 8418 }, { "epoch": 0.96, "learning_rate": 9.717136120142134e-07, "loss": 0.6411, "step": 8419 }, { "epoch": 0.96, "learning_rate": 9.66600866566192e-07, "loss": 0.5843, "step": 8420 }, { "epoch": 0.96, "learning_rate": 9.61501541848464e-07, "loss": 0.6757, "step": 8421 }, { "epoch": 0.96, "learning_rate": 9.564156385520883e-07, "loss": 0.7006, "step": 8422 }, { "epoch": 0.96, "learning_rate": 9.513431573662801e-07, "loss": 0.6653, "step": 8423 }, { "epoch": 0.96, "learning_rate": 9.462840989784671e-07, "loss": 0.7311, "step": 8424 }, { "epoch": 0.96, "learning_rate": 9.412384640742345e-07, "loss": 0.6804, "step": 8425 }, { "epoch": 0.96, "learning_rate": 9.362062533373462e-07, "loss": 0.6824, "step": 8426 }, { "epoch": 0.96, "learning_rate": 9.311874674497456e-07, "loss": 0.6755, "step": 8427 }, { "epoch": 0.96, "learning_rate": 9.261821070915777e-07, "loss": 0.6585, "step": 8428 }, { "epoch": 0.96, "learning_rate": 9.211901729411443e-07, "loss": 0.6595, "step": 8429 }, { "epoch": 0.96, "learning_rate": 9.162116656749598e-07, "loss": 0.6726, "step": 8430 }, { "epoch": 0.96, "learning_rate": 9.112465859676733e-07, "loss": 0.6043, "step": 8431 }, { "epoch": 0.96, "learning_rate": 9.062949344921467e-07, "loss": 0.6497, "step": 8432 }, { "epoch": 0.96, "learning_rate": 9.013567119194211e-07, "loss": 0.6915, "step": 8433 }, { "epoch": 0.96, "learning_rate": 8.964319189186942e-07, "loss": 0.6588, "step": 8434 }, { "epoch": 0.96, "learning_rate": 8.91520556157388e-07, "loss": 0.643, "step": 8435 }, { "epoch": 0.96, "learning_rate": 8.866226243010478e-07, "loss": 0.6725, "step": 8436 }, { "epoch": 0.96, "learning_rate": 8.817381240134426e-07, "loss": 0.7336, "step": 8437 }, { "epoch": 0.96, "learning_rate": 8.768670559564985e-07, "loss": 0.6885, "step": 8438 }, { "epoch": 0.96, "learning_rate": 8.720094207903429e-07, "loss": 0.6389, "step": 8439 }, { "epoch": 0.96, "learning_rate": 8.671652191732493e-07, "loss": 0.5884, "step": 8440 }, { "epoch": 0.96, "learning_rate": 8.623344517617149e-07, "loss": 0.6674, "step": 8441 }, { "epoch": 0.96, "learning_rate": 8.575171192103714e-07, "loss": 0.6817, "step": 8442 }, { "epoch": 0.96, "learning_rate": 8.527132221720524e-07, "loss": 0.5971, "step": 8443 }, { "epoch": 0.96, "learning_rate": 8.479227612977814e-07, "loss": 0.709, "step": 8444 }, { "epoch": 0.96, "learning_rate": 8.431457372367279e-07, "loss": 0.6661, "step": 8445 }, { "epoch": 0.96, "learning_rate": 8.383821506362855e-07, "loss": 0.6901, "step": 8446 }, { "epoch": 0.96, "learning_rate": 8.336320021419819e-07, "loss": 0.6767, "step": 8447 }, { "epoch": 0.96, "learning_rate": 8.28895292397558e-07, "loss": 0.6584, "step": 8448 }, { "epoch": 0.96, "learning_rate": 8.241720220449112e-07, "loss": 0.7545, "step": 8449 }, { "epoch": 0.96, "learning_rate": 8.194621917241185e-07, "loss": 0.6338, "step": 8450 }, { "epoch": 0.96, "learning_rate": 8.147658020734584e-07, "loss": 0.5826, "step": 8451 }, { "epoch": 0.96, "learning_rate": 8.100828537293659e-07, "loss": 0.6984, "step": 8452 }, { "epoch": 0.96, "learning_rate": 8.054133473264669e-07, "loss": 0.7205, "step": 8453 }, { "epoch": 0.96, "learning_rate": 8.007572834975552e-07, "loss": 0.6776, "step": 8454 }, { "epoch": 0.96, "learning_rate": 7.961146628736038e-07, "loss": 0.6497, "step": 8455 }, { "epoch": 0.96, "learning_rate": 7.914854860837762e-07, "loss": 0.6687, "step": 8456 }, { "epoch": 0.96, "learning_rate": 7.868697537553927e-07, "loss": 0.6285, "step": 8457 }, { "epoch": 0.96, "learning_rate": 7.822674665139751e-07, "loss": 0.6943, "step": 8458 }, { "epoch": 0.96, "learning_rate": 7.776786249832136e-07, "loss": 0.5833, "step": 8459 }, { "epoch": 0.96, "learning_rate": 7.731032297849661e-07, "loss": 0.6578, "step": 8460 }, { "epoch": 0.96, "learning_rate": 7.685412815392812e-07, "loss": 0.6339, "step": 8461 }, { "epoch": 0.96, "learning_rate": 7.639927808643865e-07, "loss": 0.6737, "step": 8462 }, { "epoch": 0.96, "learning_rate": 7.59457728376678e-07, "loss": 0.6422, "step": 8463 }, { "epoch": 0.96, "learning_rate": 7.549361246907305e-07, "loss": 0.7088, "step": 8464 }, { "epoch": 0.96, "learning_rate": 7.504279704193096e-07, "loss": 0.6396, "step": 8465 }, { "epoch": 0.96, "learning_rate": 7.459332661733376e-07, "loss": 0.6212, "step": 8466 }, { "epoch": 0.96, "learning_rate": 7.414520125619273e-07, "loss": 0.6197, "step": 8467 }, { "epoch": 0.96, "learning_rate": 7.369842101923596e-07, "loss": 0.6685, "step": 8468 }, { "epoch": 0.96, "learning_rate": 7.325298596701057e-07, "loss": 0.6683, "step": 8469 }, { "epoch": 0.96, "learning_rate": 7.280889615988162e-07, "loss": 0.6729, "step": 8470 }, { "epoch": 0.96, "learning_rate": 7.236615165802985e-07, "loss": 0.7257, "step": 8471 }, { "epoch": 0.96, "learning_rate": 7.192475252145392e-07, "loss": 0.6861, "step": 8472 }, { "epoch": 0.96, "learning_rate": 7.148469880997266e-07, "loss": 0.6535, "step": 8473 }, { "epoch": 0.96, "learning_rate": 7.104599058321948e-07, "loss": 0.6544, "step": 8474 }, { "epoch": 0.96, "learning_rate": 7.060862790064793e-07, "loss": 0.7451, "step": 8475 }, { "epoch": 0.96, "learning_rate": 7.017261082152726e-07, "loss": 0.6482, "step": 8476 }, { "epoch": 0.96, "learning_rate": 6.973793940494688e-07, "loss": 0.6777, "step": 8477 }, { "epoch": 0.96, "learning_rate": 6.930461370981078e-07, "loss": 0.6644, "step": 8478 }, { "epoch": 0.96, "learning_rate": 6.887263379484199e-07, "loss": 0.6811, "step": 8479 }, { "epoch": 0.96, "learning_rate": 6.844199971858257e-07, "loss": 0.7096, "step": 8480 }, { "epoch": 0.96, "learning_rate": 6.801271153938916e-07, "loss": 0.659, "step": 8481 }, { "epoch": 0.96, "learning_rate": 6.758476931543856e-07, "loss": 0.651, "step": 8482 }, { "epoch": 0.96, "learning_rate": 6.71581731047255e-07, "loss": 0.6699, "step": 8483 }, { "epoch": 0.96, "learning_rate": 6.673292296505818e-07, "loss": 0.6629, "step": 8484 }, { "epoch": 0.96, "learning_rate": 6.630901895406827e-07, "loss": 0.6238, "step": 8485 }, { "epoch": 0.96, "learning_rate": 6.588646112920094e-07, "loss": 0.5946, "step": 8486 }, { "epoch": 0.96, "learning_rate": 6.546524954771926e-07, "loss": 0.5967, "step": 8487 }, { "epoch": 0.96, "learning_rate": 6.504538426670537e-07, "loss": 0.6792, "step": 8488 }, { "epoch": 0.96, "learning_rate": 6.462686534305929e-07, "loss": 0.6173, "step": 8489 }, { "epoch": 0.96, "learning_rate": 6.420969283349453e-07, "loss": 0.6638, "step": 8490 }, { "epoch": 0.97, "learning_rate": 6.379386679454813e-07, "loss": 0.6518, "step": 8491 }, { "epoch": 0.97, "learning_rate": 6.337938728257054e-07, "loss": 0.6455, "step": 8492 }, { "epoch": 0.97, "learning_rate": 6.296625435373127e-07, "loss": 0.692, "step": 8493 }, { "epoch": 0.97, "learning_rate": 6.255446806401666e-07, "loss": 0.7065, "step": 8494 }, { "epoch": 0.97, "learning_rate": 6.214402846923096e-07, "loss": 0.7212, "step": 8495 }, { "epoch": 0.97, "learning_rate": 6.173493562499411e-07, "loss": 0.7199, "step": 8496 }, { "epoch": 0.97, "learning_rate": 6.132718958674844e-07, "loss": 0.6298, "step": 8497 }, { "epoch": 0.97, "learning_rate": 6.092079040974752e-07, "loss": 0.7083, "step": 8498 }, { "epoch": 0.97, "learning_rate": 6.051573814906841e-07, "loss": 0.6685, "step": 8499 }, { "epoch": 0.97, "learning_rate": 6.011203285959943e-07, "loss": 0.6604, "step": 8500 }, { "epoch": 0.97, "learning_rate": 5.970967459605236e-07, "loss": 0.6893, "step": 8501 }, { "epoch": 0.97, "learning_rate": 5.930866341295249e-07, "loss": 0.6722, "step": 8502 }, { "epoch": 0.97, "learning_rate": 5.8908999364643e-07, "loss": 0.6605, "step": 8503 }, { "epoch": 0.97, "learning_rate": 5.851068250528613e-07, "loss": 0.5764, "step": 8504 }, { "epoch": 0.97, "learning_rate": 5.811371288886092e-07, "loss": 0.6522, "step": 8505 }, { "epoch": 0.97, "learning_rate": 5.771809056916322e-07, "loss": 0.6089, "step": 8506 }, { "epoch": 0.97, "learning_rate": 5.732381559980571e-07, "loss": 0.6245, "step": 8507 }, { "epoch": 0.97, "learning_rate": 5.69308880342223e-07, "loss": 0.6186, "step": 8508 }, { "epoch": 0.97, "learning_rate": 5.653930792565821e-07, "loss": 0.6538, "step": 8509 }, { "epoch": 0.97, "learning_rate": 5.614907532718094e-07, "loss": 0.6412, "step": 8510 }, { "epoch": 0.97, "learning_rate": 5.576019029167268e-07, "loss": 0.627, "step": 8511 }, { "epoch": 0.97, "learning_rate": 5.537265287183569e-07, "loss": 0.6195, "step": 8512 }, { "epoch": 0.97, "learning_rate": 5.498646312018685e-07, "loss": 0.6884, "step": 8513 }, { "epoch": 0.97, "learning_rate": 5.460162108906208e-07, "loss": 0.6742, "step": 8514 }, { "epoch": 0.97, "learning_rate": 5.42181268306119e-07, "loss": 0.6645, "step": 8515 }, { "epoch": 0.97, "learning_rate": 5.383598039681026e-07, "loss": 0.6341, "step": 8516 }, { "epoch": 0.97, "learning_rate": 5.345518183944131e-07, "loss": 0.7243, "step": 8517 }, { "epoch": 0.97, "learning_rate": 5.307573121011266e-07, "loss": 0.7259, "step": 8518 }, { "epoch": 0.97, "learning_rate": 5.269762856024318e-07, "loss": 0.6825, "step": 8519 }, { "epoch": 0.97, "learning_rate": 5.23208739410741e-07, "loss": 0.6648, "step": 8520 }, { "epoch": 0.97, "learning_rate": 5.194546740366124e-07, "loss": 0.6764, "step": 8521 }, { "epoch": 0.97, "learning_rate": 5.157140899888169e-07, "loss": 0.6743, "step": 8522 }, { "epoch": 0.97, "learning_rate": 5.119869877742267e-07, "loss": 0.6314, "step": 8523 }, { "epoch": 0.97, "learning_rate": 5.08273367897949e-07, "loss": 0.7156, "step": 8524 }, { "epoch": 0.97, "learning_rate": 5.045732308632367e-07, "loss": 0.6531, "step": 8525 }, { "epoch": 0.97, "learning_rate": 5.008865771715221e-07, "loss": 0.6399, "step": 8526 }, { "epoch": 0.97, "learning_rate": 4.972134073224278e-07, "loss": 0.6614, "step": 8527 }, { "epoch": 0.97, "learning_rate": 4.93553721813711e-07, "loss": 0.6481, "step": 8528 }, { "epoch": 0.97, "learning_rate": 4.899075211413307e-07, "loss": 0.6427, "step": 8529 }, { "epoch": 0.97, "learning_rate": 4.862748057994027e-07, "loss": 0.6545, "step": 8530 }, { "epoch": 0.97, "learning_rate": 4.826555762802221e-07, "loss": 0.565, "step": 8531 }, { "epoch": 0.97, "learning_rate": 4.790498330742743e-07, "loss": 0.6463, "step": 8532 }, { "epoch": 0.97, "learning_rate": 4.7545757667017966e-07, "loss": 0.693, "step": 8533 }, { "epoch": 0.97, "learning_rate": 4.718788075547709e-07, "loss": 0.6772, "step": 8534 }, { "epoch": 0.97, "learning_rate": 4.683135262130045e-07, "loss": 0.6866, "step": 8535 }, { "epoch": 0.97, "learning_rate": 4.647617331280607e-07, "loss": 0.653, "step": 8536 }, { "epoch": 0.97, "learning_rate": 4.6122342878126554e-07, "loss": 0.6515, "step": 8537 }, { "epoch": 0.97, "learning_rate": 4.576986136521022e-07, "loss": 0.6515, "step": 8538 }, { "epoch": 0.97, "learning_rate": 4.541872882182774e-07, "loss": 0.6518, "step": 8539 }, { "epoch": 0.97, "learning_rate": 4.506894529555994e-07, "loss": 0.6238, "step": 8540 }, { "epoch": 0.97, "learning_rate": 4.4720510833811123e-07, "loss": 0.6565, "step": 8541 }, { "epoch": 0.97, "learning_rate": 4.437342548379908e-07, "loss": 0.6356, "step": 8542 }, { "epoch": 0.97, "learning_rate": 4.4027689292560624e-07, "loss": 0.6823, "step": 8543 }, { "epoch": 0.97, "learning_rate": 4.368330230694717e-07, "loss": 0.7119, "step": 8544 }, { "epoch": 0.97, "learning_rate": 4.3340264573631385e-07, "loss": 0.6253, "step": 8545 }, { "epoch": 0.97, "learning_rate": 4.29985761390983e-07, "loss": 0.7175, "step": 8546 }, { "epoch": 0.97, "learning_rate": 4.2658237049655323e-07, "loss": 0.659, "step": 8547 }, { "epoch": 0.97, "learning_rate": 4.231924735142223e-07, "loss": 0.7271, "step": 8548 }, { "epoch": 0.97, "learning_rate": 4.1981607090337826e-07, "loss": 0.703, "step": 8549 }, { "epoch": 0.97, "learning_rate": 4.1645316312159956e-07, "loss": 0.6217, "step": 8550 }, { "epoch": 0.97, "learning_rate": 4.1310375062461047e-07, "loss": 0.6266, "step": 8551 }, { "epoch": 0.97, "learning_rate": 4.0976783386630355e-07, "loss": 0.6636, "step": 8552 }, { "epoch": 0.97, "learning_rate": 4.0644541329877274e-07, "loss": 0.6531, "step": 8553 }, { "epoch": 0.97, "learning_rate": 4.031364893722356e-07, "loss": 0.7046, "step": 8554 }, { "epoch": 0.97, "learning_rate": 3.9984106253513345e-07, "loss": 0.6646, "step": 8555 }, { "epoch": 0.97, "learning_rate": 3.965591332340424e-07, "loss": 0.662, "step": 8556 }, { "epoch": 0.97, "learning_rate": 3.9329070191372885e-07, "loss": 0.6949, "step": 8557 }, { "epoch": 0.97, "learning_rate": 3.9003576901710527e-07, "loss": 0.6873, "step": 8558 }, { "epoch": 0.97, "learning_rate": 3.867943349852854e-07, "loss": 0.688, "step": 8559 }, { "epoch": 0.97, "learning_rate": 3.83566400257529e-07, "loss": 0.6635, "step": 8560 }, { "epoch": 0.97, "learning_rate": 3.8035196527128615e-07, "loss": 0.6726, "step": 8561 }, { "epoch": 0.97, "learning_rate": 3.7715103046217505e-07, "loss": 0.6746, "step": 8562 }, { "epoch": 0.97, "learning_rate": 3.739635962639487e-07, "loss": 0.59, "step": 8563 }, { "epoch": 0.97, "learning_rate": 3.7078966310858385e-07, "loss": 0.6697, "step": 8564 }, { "epoch": 0.97, "learning_rate": 3.676292314262031e-07, "loss": 0.6972, "step": 8565 }, { "epoch": 0.97, "learning_rate": 3.64482301645086e-07, "loss": 0.664, "step": 8566 }, { "epoch": 0.97, "learning_rate": 3.613488741917026e-07, "loss": 0.5822, "step": 8567 }, { "epoch": 0.97, "learning_rate": 3.5822894949069095e-07, "loss": 0.6085, "step": 8568 }, { "epoch": 0.97, "learning_rate": 3.5512252796484626e-07, "loss": 0.6905, "step": 8569 }, { "epoch": 0.97, "learning_rate": 3.520296100351428e-07, "loss": 0.6725, "step": 8570 }, { "epoch": 0.97, "learning_rate": 3.489501961207342e-07, "loss": 0.6809, "step": 8571 }, { "epoch": 0.97, "learning_rate": 3.4588428663892003e-07, "loss": 0.5868, "step": 8572 }, { "epoch": 0.97, "learning_rate": 3.428318820052012e-07, "loss": 0.6494, "step": 8573 }, { "epoch": 0.97, "learning_rate": 3.397929826332136e-07, "loss": 0.5982, "step": 8574 }, { "epoch": 0.97, "learning_rate": 3.3676758893478323e-07, "loss": 0.6738, "step": 8575 }, { "epoch": 0.97, "learning_rate": 3.337557013199155e-07, "loss": 0.6641, "step": 8576 }, { "epoch": 0.97, "learning_rate": 3.3075732019675066e-07, "loss": 0.6805, "step": 8577 }, { "epoch": 0.97, "learning_rate": 3.2777244597164135e-07, "loss": 0.644, "step": 8578 }, { "epoch": 0.98, "learning_rate": 3.248010790490974e-07, "loss": 0.6311, "step": 8579 }, { "epoch": 0.98, "learning_rate": 3.2184321983175227e-07, "loss": 0.6551, "step": 8580 }, { "epoch": 0.98, "learning_rate": 3.188988687204852e-07, "loss": 0.6492, "step": 8581 }, { "epoch": 0.98, "learning_rate": 3.1596802611428833e-07, "loss": 0.701, "step": 8582 }, { "epoch": 0.98, "learning_rate": 3.1305069241034377e-07, "loss": 0.6392, "step": 8583 }, { "epoch": 0.98, "learning_rate": 3.1014686800400205e-07, "loss": 0.668, "step": 8584 }, { "epoch": 0.98, "learning_rate": 3.0725655328878165e-07, "loss": 0.6953, "step": 8585 }, { "epoch": 0.98, "learning_rate": 3.043797486563693e-07, "loss": 0.6551, "step": 8586 }, { "epoch": 0.98, "learning_rate": 3.0151645449661983e-07, "loss": 0.6927, "step": 8587 }, { "epoch": 0.98, "learning_rate": 2.986666711975561e-07, "loss": 0.6784, "step": 8588 }, { "epoch": 0.98, "learning_rate": 2.9583039914538033e-07, "loss": 0.641, "step": 8589 }, { "epoch": 0.98, "learning_rate": 2.9300763872445183e-07, "loss": 0.6987, "step": 8590 }, { "epoch": 0.98, "learning_rate": 2.901983903173089e-07, "loss": 0.614, "step": 8591 }, { "epoch": 0.98, "learning_rate": 2.874026543046471e-07, "loss": 0.7599, "step": 8592 }, { "epoch": 0.98, "learning_rate": 2.8462043106534107e-07, "loss": 0.677, "step": 8593 }, { "epoch": 0.98, "learning_rate": 2.8185172097641156e-07, "loss": 0.688, "step": 8594 }, { "epoch": 0.98, "learning_rate": 2.7909652441309166e-07, "loss": 0.6222, "step": 8595 }, { "epoch": 0.98, "learning_rate": 2.763548417487494e-07, "loss": 0.5904, "step": 8596 }, { "epoch": 0.98, "learning_rate": 2.7362667335493195e-07, "loss": 0.6168, "step": 8597 }, { "epoch": 0.98, "learning_rate": 2.7091201960134374e-07, "loss": 0.6694, "step": 8598 }, { "epoch": 0.98, "learning_rate": 2.682108808558792e-07, "loss": 0.6332, "step": 8599 }, { "epoch": 0.98, "learning_rate": 2.655232574845679e-07, "loss": 0.6719, "step": 8600 }, { "epoch": 0.98, "learning_rate": 2.6284914985166276e-07, "loss": 0.7078, "step": 8601 }, { "epoch": 0.98, "learning_rate": 2.6018855831951847e-07, "loss": 0.7218, "step": 8602 }, { "epoch": 0.98, "learning_rate": 2.575414832487133e-07, "loss": 0.6475, "step": 8603 }, { "epoch": 0.98, "learning_rate": 2.5490792499796023e-07, "loss": 0.6416, "step": 8604 }, { "epoch": 0.98, "learning_rate": 2.522878839241516e-07, "loss": 0.6313, "step": 8605 }, { "epoch": 0.98, "learning_rate": 2.496813603823589e-07, "loss": 0.6581, "step": 8606 }, { "epoch": 0.98, "learning_rate": 2.470883547257996e-07, "loss": 0.5895, "step": 8607 }, { "epoch": 0.98, "learning_rate": 2.445088673058815e-07, "loss": 0.6803, "step": 8608 }, { "epoch": 0.98, "learning_rate": 2.419428984721472e-07, "loss": 0.6539, "step": 8609 }, { "epoch": 0.98, "learning_rate": 2.3939044857236304e-07, "loss": 0.6238, "step": 8610 }, { "epoch": 0.98, "learning_rate": 2.3685151795239668e-07, "loss": 0.6802, "step": 8611 }, { "epoch": 0.98, "learning_rate": 2.343261069563396e-07, "loss": 0.5813, "step": 8612 }, { "epoch": 0.98, "learning_rate": 2.3181421592641807e-07, "loss": 0.6724, "step": 8613 }, { "epoch": 0.98, "learning_rate": 2.293158452030486e-07, "loss": 0.6056, "step": 8614 }, { "epoch": 0.98, "learning_rate": 2.2683099512478268e-07, "loss": 0.7131, "step": 8615 }, { "epoch": 0.98, "learning_rate": 2.243596660283731e-07, "loss": 0.6369, "step": 8616 }, { "epoch": 0.98, "learning_rate": 2.2190185824872978e-07, "loss": 0.6238, "step": 8617 }, { "epoch": 0.98, "learning_rate": 2.194575721189307e-07, "loss": 0.6431, "step": 8618 }, { "epoch": 0.98, "learning_rate": 2.170268079701998e-07, "loss": 0.6145, "step": 8619 }, { "epoch": 0.98, "learning_rate": 2.1460956613197358e-07, "loss": 0.6521, "step": 8620 }, { "epoch": 0.98, "learning_rate": 2.1220584693180113e-07, "loss": 0.5957, "step": 8621 }, { "epoch": 0.98, "learning_rate": 2.0981565069545516e-07, "loss": 0.6635, "step": 8622 }, { "epoch": 0.98, "learning_rate": 2.0743897774683218e-07, "loss": 0.7254, "step": 8623 }, { "epoch": 0.98, "learning_rate": 2.05075828408019e-07, "loss": 0.6932, "step": 8624 }, { "epoch": 0.98, "learning_rate": 2.0272620299925938e-07, "loss": 0.6548, "step": 8625 }, { "epoch": 0.98, "learning_rate": 2.0039010183896533e-07, "loss": 0.6362, "step": 8626 }, { "epoch": 0.98, "learning_rate": 1.9806752524372806e-07, "loss": 0.6656, "step": 8627 }, { "epoch": 0.98, "learning_rate": 1.957584735282847e-07, "loss": 0.6666, "step": 8628 }, { "epoch": 0.98, "learning_rate": 1.9346294700556266e-07, "loss": 0.6872, "step": 8629 }, { "epoch": 0.98, "learning_rate": 1.911809459866354e-07, "loss": 0.6746, "step": 8630 }, { "epoch": 0.98, "learning_rate": 1.8891247078076657e-07, "loss": 0.6529, "step": 8631 }, { "epoch": 0.98, "learning_rate": 1.866575216953659e-07, "loss": 0.7074, "step": 8632 }, { "epoch": 0.98, "learning_rate": 1.844160990360111e-07, "loss": 0.615, "step": 8633 }, { "epoch": 0.98, "learning_rate": 1.8218820310645924e-07, "loss": 0.7076, "step": 8634 }, { "epoch": 0.98, "learning_rate": 1.7997383420863544e-07, "loss": 0.6314, "step": 8635 }, { "epoch": 0.98, "learning_rate": 1.7777299264261082e-07, "loss": 0.696, "step": 8636 }, { "epoch": 0.98, "learning_rate": 1.7558567870665787e-07, "loss": 0.6045, "step": 8637 }, { "epoch": 0.98, "learning_rate": 1.7341189269717283e-07, "loss": 0.6636, "step": 8638 }, { "epoch": 0.98, "learning_rate": 1.712516349087534e-07, "loss": 0.6431, "step": 8639 }, { "epoch": 0.98, "learning_rate": 1.6910490563414316e-07, "loss": 0.6888, "step": 8640 }, { "epoch": 0.98, "learning_rate": 1.6697170516427607e-07, "loss": 0.6815, "step": 8641 }, { "epoch": 0.98, "learning_rate": 1.648520337882209e-07, "loss": 0.6229, "step": 8642 }, { "epoch": 0.98, "learning_rate": 1.6274589179324783e-07, "loss": 0.6321, "step": 8643 }, { "epoch": 0.98, "learning_rate": 1.6065327946475084e-07, "loss": 0.6999, "step": 8644 }, { "epoch": 0.98, "learning_rate": 1.5857419708633638e-07, "loss": 0.6129, "step": 8645 }, { "epoch": 0.98, "learning_rate": 1.565086449397457e-07, "loss": 0.6935, "step": 8646 }, { "epoch": 0.98, "learning_rate": 1.544566233048994e-07, "loss": 0.6684, "step": 8647 }, { "epoch": 0.98, "learning_rate": 1.5241813245988612e-07, "loss": 0.6465, "step": 8648 }, { "epoch": 0.98, "learning_rate": 1.5039317268095155e-07, "loss": 0.6795, "step": 8649 }, { "epoch": 0.98, "learning_rate": 1.483817442424984e-07, "loss": 0.65, "step": 8650 }, { "epoch": 0.98, "learning_rate": 1.4638384741714194e-07, "loss": 0.6688, "step": 8651 }, { "epoch": 0.98, "learning_rate": 1.44399482475599e-07, "loss": 0.5971, "step": 8652 }, { "epoch": 0.98, "learning_rate": 1.4242864968680992e-07, "loss": 0.6857, "step": 8653 }, { "epoch": 0.98, "learning_rate": 1.4047134931785e-07, "loss": 0.6356, "step": 8654 }, { "epoch": 0.98, "learning_rate": 1.385275816339515e-07, "loss": 0.5891, "step": 8655 }, { "epoch": 0.98, "learning_rate": 1.365973468985482e-07, "loss": 0.5859, "step": 8656 }, { "epoch": 0.98, "learning_rate": 1.3468064537321968e-07, "loss": 0.6558, "step": 8657 }, { "epoch": 0.98, "learning_rate": 1.3277747731769152e-07, "loss": 0.6471, "step": 8658 }, { "epoch": 0.98, "learning_rate": 1.3088784298990187e-07, "loss": 0.5788, "step": 8659 }, { "epoch": 0.98, "learning_rate": 1.2901174264590143e-07, "loss": 0.6991, "step": 8660 }, { "epoch": 0.98, "learning_rate": 1.271491765399646e-07, "loss": 0.5754, "step": 8661 }, { "epoch": 0.98, "learning_rate": 1.2530014492446728e-07, "loss": 0.6171, "step": 8662 }, { "epoch": 0.98, "learning_rate": 1.2346464805002012e-07, "loss": 0.5808, "step": 8663 }, { "epoch": 0.98, "learning_rate": 1.2164268616533524e-07, "loss": 0.6565, "step": 8664 }, { "epoch": 0.98, "learning_rate": 1.198342595173374e-07, "loss": 0.6811, "step": 8665 }, { "epoch": 0.98, "learning_rate": 1.180393683510972e-07, "loss": 0.6374, "step": 8666 }, { "epoch": 0.99, "learning_rate": 1.1625801290984228e-07, "loss": 0.6561, "step": 8667 }, { "epoch": 0.99, "learning_rate": 1.1449019343499067e-07, "loss": 0.6567, "step": 8668 }, { "epoch": 0.99, "learning_rate": 1.127359101661063e-07, "loss": 0.6681, "step": 8669 }, { "epoch": 0.99, "learning_rate": 1.109951633409212e-07, "loss": 0.6655, "step": 8670 }, { "epoch": 0.99, "learning_rate": 1.0926795319534667e-07, "loss": 0.6782, "step": 8671 }, { "epoch": 0.99, "learning_rate": 1.0755427996343992e-07, "loss": 0.6709, "step": 8672 }, { "epoch": 0.99, "learning_rate": 1.0585414387743741e-07, "loss": 0.6074, "step": 8673 }, { "epoch": 0.99, "learning_rate": 1.0416754516773264e-07, "loss": 0.661, "step": 8674 }, { "epoch": 0.99, "learning_rate": 1.024944840628872e-07, "loss": 0.6231, "step": 8675 }, { "epoch": 0.99, "learning_rate": 1.0083496078964194e-07, "loss": 0.6668, "step": 8676 }, { "epoch": 0.99, "learning_rate": 9.918897557288364e-08, "loss": 0.7066, "step": 8677 }, { "epoch": 0.99, "learning_rate": 9.755652863567832e-08, "loss": 0.6007, "step": 8678 }, { "epoch": 0.99, "learning_rate": 9.59376201992268e-08, "loss": 0.5994, "step": 8679 }, { "epoch": 0.99, "learning_rate": 9.433225048294247e-08, "loss": 0.6295, "step": 8680 }, { "epoch": 0.99, "learning_rate": 9.274041970438462e-08, "loss": 0.7234, "step": 8681 }, { "epoch": 0.99, "learning_rate": 9.11621280792474e-08, "loss": 0.6759, "step": 8682 }, { "epoch": 0.99, "learning_rate": 8.959737582144856e-08, "loss": 0.6458, "step": 8683 }, { "epoch": 0.99, "learning_rate": 8.80461631430074e-08, "loss": 0.6039, "step": 8684 }, { "epoch": 0.99, "learning_rate": 8.650849025415574e-08, "loss": 0.5914, "step": 8685 }, { "epoch": 0.99, "learning_rate": 8.498435736328248e-08, "loss": 0.6316, "step": 8686 }, { "epoch": 0.99, "learning_rate": 8.347376467692236e-08, "loss": 0.6784, "step": 8687 }, { "epoch": 0.99, "learning_rate": 8.197671239978943e-08, "loss": 0.7747, "step": 8688 }, { "epoch": 0.99, "learning_rate": 8.049320073476585e-08, "loss": 0.6604, "step": 8689 }, { "epoch": 0.99, "learning_rate": 7.902322988287969e-08, "loss": 0.6674, "step": 8690 }, { "epoch": 0.99, "learning_rate": 7.756680004334937e-08, "loss": 0.6541, "step": 8691 }, { "epoch": 0.99, "learning_rate": 7.612391141353925e-08, "loss": 0.678, "step": 8692 }, { "epoch": 0.99, "learning_rate": 7.46945641889929e-08, "loss": 0.6233, "step": 8693 }, { "epoch": 0.99, "learning_rate": 7.327875856339984e-08, "loss": 0.6289, "step": 8694 }, { "epoch": 0.99, "learning_rate": 7.187649472863989e-08, "loss": 0.6325, "step": 8695 }, { "epoch": 0.99, "learning_rate": 7.048777287472774e-08, "loss": 0.6679, "step": 8696 }, { "epoch": 0.99, "learning_rate": 6.91125931898795e-08, "loss": 0.6369, "step": 8697 }, { "epoch": 0.99, "learning_rate": 6.775095586043501e-08, "loss": 0.6648, "step": 8698 }, { "epoch": 0.99, "learning_rate": 6.640286107093552e-08, "loss": 0.6123, "step": 8699 }, { "epoch": 0.99, "learning_rate": 6.506830900406824e-08, "loss": 0.6515, "step": 8700 }, { "epoch": 0.99, "learning_rate": 6.37472998406774e-08, "loss": 0.6114, "step": 8701 }, { "epoch": 0.99, "learning_rate": 6.243983375978646e-08, "loss": 0.6825, "step": 8702 }, { "epoch": 0.99, "learning_rate": 6.114591093859811e-08, "loss": 0.7108, "step": 8703 }, { "epoch": 0.99, "learning_rate": 5.98655315524277e-08, "loss": 0.6661, "step": 8704 }, { "epoch": 0.99, "learning_rate": 5.859869577481414e-08, "loss": 0.6665, "step": 8705 }, { "epoch": 0.99, "learning_rate": 5.734540377743125e-08, "loss": 0.5712, "step": 8706 }, { "epoch": 0.99, "learning_rate": 5.6105655730120946e-08, "loss": 0.6651, "step": 8707 }, { "epoch": 0.99, "learning_rate": 5.4879451800882165e-08, "loss": 0.7213, "step": 8708 }, { "epoch": 0.99, "learning_rate": 5.36667921558931e-08, "loss": 0.6891, "step": 8709 }, { "epoch": 0.99, "learning_rate": 5.246767695948895e-08, "loss": 0.659, "step": 8710 }, { "epoch": 0.99, "learning_rate": 5.1282106374173075e-08, "loss": 0.6734, "step": 8711 }, { "epoch": 0.99, "learning_rate": 5.011008056060584e-08, "loss": 0.6856, "step": 8712 }, { "epoch": 0.99, "learning_rate": 4.8951599677626856e-08, "loss": 0.5644, "step": 8713 }, { "epoch": 0.99, "learning_rate": 4.780666388222166e-08, "loss": 0.6733, "step": 8714 }, { "epoch": 0.99, "learning_rate": 4.667527332954391e-08, "loss": 0.6447, "step": 8715 }, { "epoch": 0.99, "learning_rate": 4.555742817292652e-08, "loss": 0.6156, "step": 8716 }, { "epoch": 0.99, "learning_rate": 4.4453128563848315e-08, "loss": 0.6096, "step": 8717 }, { "epoch": 0.99, "learning_rate": 4.336237465196735e-08, "loss": 0.6283, "step": 8718 }, { "epoch": 0.99, "learning_rate": 4.228516658509873e-08, "loss": 0.6597, "step": 8719 }, { "epoch": 0.99, "learning_rate": 4.1221504509225684e-08, "loss": 0.7024, "step": 8720 }, { "epoch": 0.99, "learning_rate": 4.017138856848845e-08, "loss": 0.6448, "step": 8721 }, { "epoch": 0.99, "learning_rate": 3.913481890519544e-08, "loss": 0.7014, "step": 8722 }, { "epoch": 0.99, "learning_rate": 3.8111795659812045e-08, "loss": 0.6617, "step": 8723 }, { "epoch": 0.99, "learning_rate": 3.7102318970994034e-08, "loss": 0.672, "step": 8724 }, { "epoch": 0.99, "learning_rate": 3.6106388975520874e-08, "loss": 0.649, "step": 8725 }, { "epoch": 0.99, "learning_rate": 3.5124005808384596e-08, "loss": 0.7047, "step": 8726 }, { "epoch": 0.99, "learning_rate": 3.415516960268983e-08, "loss": 0.6717, "step": 8727 }, { "epoch": 0.99, "learning_rate": 3.319988048974265e-08, "loss": 0.6298, "step": 8728 }, { "epoch": 0.99, "learning_rate": 3.225813859900617e-08, "loss": 0.6472, "step": 8729 }, { "epoch": 0.99, "learning_rate": 3.132994405808942e-08, "loss": 0.7099, "step": 8730 }, { "epoch": 0.99, "learning_rate": 3.041529699279177e-08, "loss": 0.6154, "step": 8731 }, { "epoch": 0.99, "learning_rate": 2.9514197527047427e-08, "loss": 0.6319, "step": 8732 }, { "epoch": 0.99, "learning_rate": 2.8626645782992014e-08, "loss": 0.6752, "step": 8733 }, { "epoch": 0.99, "learning_rate": 2.775264188088489e-08, "loss": 0.6455, "step": 8734 }, { "epoch": 0.99, "learning_rate": 2.6892185939186853e-08, "loss": 0.7575, "step": 8735 }, { "epoch": 0.99, "learning_rate": 2.6045278074482428e-08, "loss": 0.6362, "step": 8736 }, { "epoch": 0.99, "learning_rate": 2.5211918401557566e-08, "loss": 0.6689, "step": 8737 }, { "epoch": 0.99, "learning_rate": 2.439210703334416e-08, "loss": 0.6905, "step": 8738 }, { "epoch": 0.99, "learning_rate": 2.358584408094222e-08, "loss": 0.6234, "step": 8739 }, { "epoch": 0.99, "learning_rate": 2.2793129653608804e-08, "loss": 0.6968, "step": 8740 }, { "epoch": 0.99, "learning_rate": 2.2013963858780185e-08, "loss": 0.6704, "step": 8741 }, { "epoch": 0.99, "learning_rate": 2.1248346802027473e-08, "loss": 0.6649, "step": 8742 }, { "epoch": 0.99, "learning_rate": 2.049627858712322e-08, "loss": 0.6284, "step": 8743 }, { "epoch": 0.99, "learning_rate": 1.9757759315985892e-08, "loss": 0.6337, "step": 8744 }, { "epoch": 0.99, "learning_rate": 1.9032789088690995e-08, "loss": 0.6418, "step": 8745 }, { "epoch": 0.99, "learning_rate": 1.8321368003482163e-08, "loss": 0.6697, "step": 8746 }, { "epoch": 0.99, "learning_rate": 1.762349615677117e-08, "loss": 0.6849, "step": 8747 }, { "epoch": 0.99, "learning_rate": 1.6939173643126804e-08, "loss": 0.7017, "step": 8748 }, { "epoch": 0.99, "learning_rate": 1.6268400555297104e-08, "loss": 0.6994, "step": 8749 }, { "epoch": 0.99, "learning_rate": 1.5611176984187126e-08, "loss": 0.7292, "step": 8750 }, { "epoch": 0.99, "learning_rate": 1.4967503018836758e-08, "loss": 0.6799, "step": 8751 }, { "epoch": 0.99, "learning_rate": 1.4337378746509533e-08, "loss": 0.6092, "step": 8752 }, { "epoch": 0.99, "learning_rate": 1.3720804252570496e-08, "loss": 0.7272, "step": 8753 }, { "epoch": 0.99, "learning_rate": 1.3117779620586135e-08, "loss": 0.5801, "step": 8754 }, { "epoch": 1.0, "learning_rate": 1.2528304932279967e-08, "loss": 0.6782, "step": 8755 }, { "epoch": 1.0, "learning_rate": 1.1952380267521435e-08, "loss": 0.6911, "step": 8756 }, { "epoch": 1.0, "learning_rate": 1.1390005704381423e-08, "loss": 0.6657, "step": 8757 }, { "epoch": 1.0, "learning_rate": 1.0841181319054538e-08, "loss": 0.5865, "step": 8758 }, { "epoch": 1.0, "learning_rate": 1.0305907185925722e-08, "loss": 0.6555, "step": 8759 }, { "epoch": 1.0, "learning_rate": 9.784183377514743e-09, "loss": 0.6376, "step": 8760 }, { "epoch": 1.0, "learning_rate": 9.276009964553911e-09, "loss": 0.6571, "step": 8761 }, { "epoch": 1.0, "learning_rate": 8.781387015888155e-09, "loss": 0.6787, "step": 8762 }, { "epoch": 1.0, "learning_rate": 8.30031459855274e-09, "loss": 0.6683, "step": 8763 }, { "epoch": 1.0, "learning_rate": 7.83279277773996e-09, "loss": 0.5895, "step": 8764 }, { "epoch": 1.0, "learning_rate": 7.3788216168102494e-09, "loss": 0.6449, "step": 8765 }, { "epoch": 1.0, "learning_rate": 6.938401177281062e-09, "loss": 0.7192, "step": 8766 }, { "epoch": 1.0, "learning_rate": 6.511531518837987e-09, "loss": 0.6624, "step": 8767 }, { "epoch": 1.0, "learning_rate": 6.098212699323647e-09, "loss": 0.6798, "step": 8768 }, { "epoch": 1.0, "learning_rate": 5.698444774770995e-09, "loss": 0.6035, "step": 8769 }, { "epoch": 1.0, "learning_rate": 5.3122277993256084e-09, "loss": 0.6486, "step": 8770 }, { "epoch": 1.0, "learning_rate": 4.939561825356709e-09, "loss": 0.7015, "step": 8771 }, { "epoch": 1.0, "learning_rate": 4.580446903335034e-09, "loss": 0.6261, "step": 8772 }, { "epoch": 1.0, "learning_rate": 4.234883081954966e-09, "loss": 0.653, "step": 8773 }, { "epoch": 1.0, "learning_rate": 3.902870408034609e-09, "loss": 0.676, "step": 8774 }, { "epoch": 1.0, "learning_rate": 3.584408926560201e-09, "loss": 0.6602, "step": 8775 }, { "epoch": 1.0, "learning_rate": 3.279498680708315e-09, "loss": 0.6523, "step": 8776 }, { "epoch": 1.0, "learning_rate": 2.9881397117792474e-09, "loss": 0.7025, "step": 8777 }, { "epoch": 1.0, "learning_rate": 2.7103320592636316e-09, "loss": 0.669, "step": 8778 }, { "epoch": 1.0, "learning_rate": 2.44607576080913e-09, "loss": 0.6536, "step": 8779 }, { "epoch": 1.0, "learning_rate": 2.1953708522426396e-09, "loss": 0.6529, "step": 8780 }, { "epoch": 1.0, "learning_rate": 1.958217367514781e-09, "loss": 0.6102, "step": 8781 }, { "epoch": 1.0, "learning_rate": 1.7346153387665098e-09, "loss": 0.677, "step": 8782 }, { "epoch": 1.0, "learning_rate": 1.5245647963180177e-09, "loss": 0.683, "step": 8783 }, { "epoch": 1.0, "learning_rate": 1.3280657686243204e-09, "loss": 0.6703, "step": 8784 }, { "epoch": 1.0, "learning_rate": 1.1451182823196682e-09, "loss": 0.658, "step": 8785 }, { "epoch": 1.0, "learning_rate": 9.757223621842393e-10, "loss": 0.6475, "step": 8786 }, { "epoch": 1.0, "learning_rate": 8.198780311774457e-10, "loss": 0.701, "step": 8787 }, { "epoch": 1.0, "learning_rate": 6.775853104268315e-10, "loss": 0.6674, "step": 8788 }, { "epoch": 1.0, "learning_rate": 5.488442192058685e-10, "loss": 0.7218, "step": 8789 }, { "epoch": 1.0, "learning_rate": 4.336547749783648e-10, "loss": 0.6315, "step": 8790 }, { "epoch": 1.0, "learning_rate": 3.3201699333185175e-10, "loss": 0.6759, "step": 8791 }, { "epoch": 1.0, "learning_rate": 2.439308880552993e-10, "loss": 0.6052, "step": 8792 }, { "epoch": 1.0, "learning_rate": 1.693964710836049e-10, "loss": 0.6549, "step": 8793 }, { "epoch": 1.0, "learning_rate": 1.084137525086959e-10, "loss": 0.7087, "step": 8794 }, { "epoch": 1.0, "learning_rate": 6.098274061283604e-11, "loss": 0.6304, "step": 8795 }, { "epoch": 1.0, "learning_rate": 2.7103441802012186e-11, "loss": 0.6025, "step": 8796 }, { "epoch": 1.0, "learning_rate": 6.7758606836498815e-12, "loss": 0.6254, "step": 8797 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 0.5865, "step": 8798 }, { "epoch": 1.0, "step": 8798, "total_flos": 2316807981268992.0, "train_loss": 0.682436441881978, "train_runtime": 66237.035, "train_samples_per_second": 17.001, "train_steps_per_second": 0.133 } ], "logging_steps": 1.0, "max_steps": 8798, "num_input_tokens_seen": 0, "num_train_epochs": 1, "save_steps": 500000, "total_flos": 2316807981268992.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }