{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "eval_steps": 500, "global_step": 9607, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 6.920415224913496e-07, "loss": 1.5756, "step": 1 }, { "epoch": 0.0, "learning_rate": 1.3840830449826992e-06, "loss": 1.7067, "step": 2 }, { "epoch": 0.0, "learning_rate": 2.0761245674740485e-06, "loss": 1.6699, "step": 3 }, { "epoch": 0.0, "learning_rate": 2.7681660899653983e-06, "loss": 1.6, "step": 4 }, { "epoch": 0.0, "learning_rate": 3.4602076124567477e-06, "loss": 1.7595, "step": 5 }, { "epoch": 0.0, "learning_rate": 4.152249134948097e-06, "loss": 1.6476, "step": 6 }, { "epoch": 0.0, "learning_rate": 4.8442906574394464e-06, "loss": 0.8283, "step": 7 }, { "epoch": 0.0, "learning_rate": 5.536332179930797e-06, "loss": 1.752, "step": 8 }, { "epoch": 0.0, "learning_rate": 6.228373702422145e-06, "loss": 1.6863, "step": 9 }, { "epoch": 0.0, "learning_rate": 6.920415224913495e-06, "loss": 1.5247, "step": 10 }, { "epoch": 0.0, "learning_rate": 7.612456747404845e-06, "loss": 1.6156, "step": 11 }, { "epoch": 0.0, "learning_rate": 8.304498269896194e-06, "loss": 1.5633, "step": 12 }, { "epoch": 0.0, "learning_rate": 8.996539792387544e-06, "loss": 1.6062, "step": 13 }, { "epoch": 0.0, "learning_rate": 9.688581314878893e-06, "loss": 1.6622, "step": 14 }, { "epoch": 0.0, "learning_rate": 1.0380622837370241e-05, "loss": 1.5888, "step": 15 }, { "epoch": 0.0, "learning_rate": 1.1072664359861593e-05, "loss": 1.6098, "step": 16 }, { "epoch": 0.0, "learning_rate": 1.1764705882352942e-05, "loss": 1.6436, "step": 17 }, { "epoch": 0.0, "learning_rate": 1.245674740484429e-05, "loss": 1.564, "step": 18 }, { "epoch": 0.0, "learning_rate": 1.3148788927335639e-05, "loss": 1.6281, "step": 19 }, { "epoch": 0.0, "learning_rate": 1.384083044982699e-05, "loss": 1.6813, "step": 20 }, { "epoch": 0.0, "learning_rate": 1.4532871972318341e-05, "loss": 1.674, "step": 21 }, { "epoch": 0.0, "learning_rate": 1.522491349480969e-05, "loss": 1.4708, "step": 22 }, { "epoch": 0.0, "learning_rate": 1.5916955017301038e-05, "loss": 1.5834, "step": 23 }, { "epoch": 0.0, "learning_rate": 1.6608996539792388e-05, "loss": 1.5959, "step": 24 }, { "epoch": 0.0, "learning_rate": 1.7301038062283735e-05, "loss": 1.4941, "step": 25 }, { "epoch": 0.0, "learning_rate": 1.799307958477509e-05, "loss": 1.4331, "step": 26 }, { "epoch": 0.0, "learning_rate": 1.868512110726644e-05, "loss": 1.5224, "step": 27 }, { "epoch": 0.0, "learning_rate": 1.9377162629757786e-05, "loss": 1.4801, "step": 28 }, { "epoch": 0.0, "learning_rate": 2.0069204152249136e-05, "loss": 1.4038, "step": 29 }, { "epoch": 0.0, "learning_rate": 2.0761245674740483e-05, "loss": 1.4422, "step": 30 }, { "epoch": 0.0, "learning_rate": 2.1453287197231836e-05, "loss": 1.3538, "step": 31 }, { "epoch": 0.0, "learning_rate": 2.2145328719723187e-05, "loss": 1.3676, "step": 32 }, { "epoch": 0.0, "learning_rate": 2.2837370242214533e-05, "loss": 1.3479, "step": 33 }, { "epoch": 0.0, "learning_rate": 2.3529411764705884e-05, "loss": 1.3279, "step": 34 }, { "epoch": 0.0, "learning_rate": 2.422145328719723e-05, "loss": 0.7623, "step": 35 }, { "epoch": 0.0, "learning_rate": 2.491349480968858e-05, "loss": 1.2703, "step": 36 }, { "epoch": 0.0, "learning_rate": 2.560553633217993e-05, "loss": 1.2462, "step": 37 }, { "epoch": 0.0, "learning_rate": 2.6297577854671278e-05, "loss": 1.2904, "step": 38 }, { "epoch": 0.0, "learning_rate": 2.6989619377162635e-05, "loss": 1.344, "step": 39 }, { "epoch": 0.0, "learning_rate": 2.768166089965398e-05, "loss": 1.3277, "step": 40 }, { "epoch": 0.0, "learning_rate": 2.8373702422145332e-05, "loss": 1.1892, "step": 41 }, { "epoch": 0.0, "learning_rate": 2.9065743944636682e-05, "loss": 1.1929, "step": 42 }, { "epoch": 0.0, "learning_rate": 2.975778546712803e-05, "loss": 1.3186, "step": 43 }, { "epoch": 0.0, "learning_rate": 3.044982698961938e-05, "loss": 1.2677, "step": 44 }, { "epoch": 0.0, "learning_rate": 3.1141868512110726e-05, "loss": 1.2097, "step": 45 }, { "epoch": 0.0, "learning_rate": 3.1833910034602076e-05, "loss": 0.7291, "step": 46 }, { "epoch": 0.0, "learning_rate": 3.2525951557093426e-05, "loss": 1.0898, "step": 47 }, { "epoch": 0.0, "learning_rate": 3.3217993079584777e-05, "loss": 1.1903, "step": 48 }, { "epoch": 0.01, "learning_rate": 3.391003460207613e-05, "loss": 1.1518, "step": 49 }, { "epoch": 0.01, "learning_rate": 3.460207612456747e-05, "loss": 1.0948, "step": 50 }, { "epoch": 0.01, "learning_rate": 3.529411764705883e-05, "loss": 1.1216, "step": 51 }, { "epoch": 0.01, "learning_rate": 3.598615916955018e-05, "loss": 1.064, "step": 52 }, { "epoch": 0.01, "learning_rate": 3.667820069204153e-05, "loss": 1.0863, "step": 53 }, { "epoch": 0.01, "learning_rate": 3.737024221453288e-05, "loss": 1.159, "step": 54 }, { "epoch": 0.01, "learning_rate": 3.806228373702422e-05, "loss": 1.0899, "step": 55 }, { "epoch": 0.01, "learning_rate": 3.875432525951557e-05, "loss": 1.082, "step": 56 }, { "epoch": 0.01, "learning_rate": 3.944636678200692e-05, "loss": 1.0012, "step": 57 }, { "epoch": 0.01, "learning_rate": 4.013840830449827e-05, "loss": 1.0879, "step": 58 }, { "epoch": 0.01, "learning_rate": 4.083044982698962e-05, "loss": 0.9668, "step": 59 }, { "epoch": 0.01, "learning_rate": 4.1522491349480966e-05, "loss": 1.0142, "step": 60 }, { "epoch": 0.01, "learning_rate": 4.2214532871972316e-05, "loss": 0.965, "step": 61 }, { "epoch": 0.01, "learning_rate": 4.290657439446367e-05, "loss": 0.9798, "step": 62 }, { "epoch": 0.01, "learning_rate": 4.359861591695502e-05, "loss": 0.982, "step": 63 }, { "epoch": 0.01, "learning_rate": 4.429065743944637e-05, "loss": 1.0172, "step": 64 }, { "epoch": 0.01, "learning_rate": 4.498269896193772e-05, "loss": 0.9597, "step": 65 }, { "epoch": 0.01, "learning_rate": 4.567474048442907e-05, "loss": 0.9419, "step": 66 }, { "epoch": 0.01, "learning_rate": 4.636678200692042e-05, "loss": 0.9833, "step": 67 }, { "epoch": 0.01, "learning_rate": 4.705882352941177e-05, "loss": 0.9569, "step": 68 }, { "epoch": 0.01, "learning_rate": 4.775086505190312e-05, "loss": 0.9785, "step": 69 }, { "epoch": 0.01, "learning_rate": 4.844290657439446e-05, "loss": 0.9788, "step": 70 }, { "epoch": 0.01, "learning_rate": 4.913494809688581e-05, "loss": 0.9815, "step": 71 }, { "epoch": 0.01, "learning_rate": 4.982698961937716e-05, "loss": 0.9228, "step": 72 }, { "epoch": 0.01, "learning_rate": 5.051903114186851e-05, "loss": 0.9157, "step": 73 }, { "epoch": 0.01, "learning_rate": 5.121107266435986e-05, "loss": 0.9122, "step": 74 }, { "epoch": 0.01, "learning_rate": 5.190311418685121e-05, "loss": 0.9131, "step": 75 }, { "epoch": 0.01, "learning_rate": 5.2595155709342556e-05, "loss": 0.9536, "step": 76 }, { "epoch": 0.01, "learning_rate": 5.3287197231833906e-05, "loss": 0.8817, "step": 77 }, { "epoch": 0.01, "learning_rate": 5.397923875432527e-05, "loss": 0.9106, "step": 78 }, { "epoch": 0.01, "learning_rate": 5.467128027681662e-05, "loss": 0.8643, "step": 79 }, { "epoch": 0.01, "learning_rate": 5.536332179930796e-05, "loss": 0.9068, "step": 80 }, { "epoch": 0.01, "learning_rate": 5.6055363321799313e-05, "loss": 0.9017, "step": 81 }, { "epoch": 0.01, "learning_rate": 5.6747404844290664e-05, "loss": 0.9056, "step": 82 }, { "epoch": 0.01, "learning_rate": 5.7439446366782014e-05, "loss": 0.9051, "step": 83 }, { "epoch": 0.01, "learning_rate": 5.8131487889273364e-05, "loss": 0.8899, "step": 84 }, { "epoch": 0.01, "learning_rate": 5.882352941176471e-05, "loss": 0.8886, "step": 85 }, { "epoch": 0.01, "learning_rate": 5.951557093425606e-05, "loss": 0.8989, "step": 86 }, { "epoch": 0.01, "learning_rate": 6.020761245674741e-05, "loss": 0.7904, "step": 87 }, { "epoch": 0.01, "learning_rate": 6.089965397923876e-05, "loss": 0.8167, "step": 88 }, { "epoch": 0.01, "learning_rate": 6.15916955017301e-05, "loss": 0.8805, "step": 89 }, { "epoch": 0.01, "learning_rate": 6.228373702422145e-05, "loss": 0.8169, "step": 90 }, { "epoch": 0.01, "learning_rate": 6.29757785467128e-05, "loss": 0.8548, "step": 91 }, { "epoch": 0.01, "learning_rate": 6.366782006920415e-05, "loss": 0.8482, "step": 92 }, { "epoch": 0.01, "learning_rate": 6.43598615916955e-05, "loss": 0.8343, "step": 93 }, { "epoch": 0.01, "learning_rate": 6.505190311418685e-05, "loss": 0.8783, "step": 94 }, { "epoch": 0.01, "learning_rate": 6.57439446366782e-05, "loss": 0.8813, "step": 95 }, { "epoch": 0.01, "learning_rate": 6.643598615916955e-05, "loss": 0.9045, "step": 96 }, { "epoch": 0.01, "learning_rate": 6.71280276816609e-05, "loss": 0.9161, "step": 97 }, { "epoch": 0.01, "learning_rate": 6.782006920415225e-05, "loss": 0.8357, "step": 98 }, { "epoch": 0.01, "learning_rate": 6.851211072664359e-05, "loss": 0.8466, "step": 99 }, { "epoch": 0.01, "learning_rate": 6.920415224913494e-05, "loss": 0.8599, "step": 100 }, { "epoch": 0.01, "learning_rate": 6.98961937716263e-05, "loss": 0.8354, "step": 101 }, { "epoch": 0.01, "learning_rate": 7.058823529411765e-05, "loss": 0.802, "step": 102 }, { "epoch": 0.01, "learning_rate": 7.1280276816609e-05, "loss": 0.7284, "step": 103 }, { "epoch": 0.01, "learning_rate": 7.197231833910035e-05, "loss": 0.821, "step": 104 }, { "epoch": 0.01, "learning_rate": 7.26643598615917e-05, "loss": 0.8195, "step": 105 }, { "epoch": 0.01, "learning_rate": 7.335640138408306e-05, "loss": 0.8026, "step": 106 }, { "epoch": 0.01, "learning_rate": 7.40484429065744e-05, "loss": 0.7941, "step": 107 }, { "epoch": 0.01, "learning_rate": 7.474048442906576e-05, "loss": 0.8737, "step": 108 }, { "epoch": 0.01, "learning_rate": 7.543252595155709e-05, "loss": 0.7969, "step": 109 }, { "epoch": 0.01, "learning_rate": 7.612456747404844e-05, "loss": 0.8375, "step": 110 }, { "epoch": 0.01, "learning_rate": 7.681660899653979e-05, "loss": 0.8132, "step": 111 }, { "epoch": 0.01, "learning_rate": 7.750865051903114e-05, "loss": 0.8231, "step": 112 }, { "epoch": 0.01, "learning_rate": 7.82006920415225e-05, "loss": 0.82, "step": 113 }, { "epoch": 0.01, "learning_rate": 7.889273356401384e-05, "loss": 0.8111, "step": 114 }, { "epoch": 0.01, "learning_rate": 7.95847750865052e-05, "loss": 0.8375, "step": 115 }, { "epoch": 0.01, "learning_rate": 8.027681660899654e-05, "loss": 0.8355, "step": 116 }, { "epoch": 0.01, "learning_rate": 8.09688581314879e-05, "loss": 0.7848, "step": 117 }, { "epoch": 0.01, "learning_rate": 8.166089965397924e-05, "loss": 0.8401, "step": 118 }, { "epoch": 0.01, "learning_rate": 8.23529411764706e-05, "loss": 0.7801, "step": 119 }, { "epoch": 0.01, "learning_rate": 8.304498269896193e-05, "loss": 0.887, "step": 120 }, { "epoch": 0.01, "learning_rate": 8.373702422145328e-05, "loss": 0.7932, "step": 121 }, { "epoch": 0.01, "learning_rate": 8.442906574394463e-05, "loss": 0.8263, "step": 122 }, { "epoch": 0.01, "learning_rate": 8.5121107266436e-05, "loss": 0.8153, "step": 123 }, { "epoch": 0.01, "learning_rate": 8.581314878892735e-05, "loss": 0.7902, "step": 124 }, { "epoch": 0.01, "learning_rate": 8.65051903114187e-05, "loss": 0.8852, "step": 125 }, { "epoch": 0.01, "learning_rate": 8.719723183391005e-05, "loss": 0.7502, "step": 126 }, { "epoch": 0.01, "learning_rate": 8.78892733564014e-05, "loss": 0.8386, "step": 127 }, { "epoch": 0.01, "learning_rate": 8.858131487889275e-05, "loss": 0.793, "step": 128 }, { "epoch": 0.01, "learning_rate": 8.927335640138408e-05, "loss": 0.8201, "step": 129 }, { "epoch": 0.01, "learning_rate": 8.996539792387543e-05, "loss": 0.7758, "step": 130 }, { "epoch": 0.01, "learning_rate": 9.065743944636678e-05, "loss": 0.8069, "step": 131 }, { "epoch": 0.01, "learning_rate": 9.134948096885813e-05, "loss": 0.7826, "step": 132 }, { "epoch": 0.01, "learning_rate": 9.204152249134948e-05, "loss": 0.8095, "step": 133 }, { "epoch": 0.01, "learning_rate": 9.273356401384083e-05, "loss": 0.8316, "step": 134 }, { "epoch": 0.01, "learning_rate": 9.342560553633218e-05, "loss": 0.8095, "step": 135 }, { "epoch": 0.01, "learning_rate": 9.411764705882353e-05, "loss": 0.8318, "step": 136 }, { "epoch": 0.01, "learning_rate": 9.480968858131488e-05, "loss": 0.8247, "step": 137 }, { "epoch": 0.01, "learning_rate": 9.550173010380624e-05, "loss": 0.8473, "step": 138 }, { "epoch": 0.01, "learning_rate": 9.619377162629759e-05, "loss": 0.7577, "step": 139 }, { "epoch": 0.01, "learning_rate": 9.688581314878892e-05, "loss": 0.6995, "step": 140 }, { "epoch": 0.01, "learning_rate": 9.757785467128027e-05, "loss": 0.8283, "step": 141 }, { "epoch": 0.01, "learning_rate": 9.826989619377162e-05, "loss": 0.8317, "step": 142 }, { "epoch": 0.01, "learning_rate": 9.896193771626297e-05, "loss": 0.799, "step": 143 }, { "epoch": 0.01, "learning_rate": 9.965397923875432e-05, "loss": 0.8288, "step": 144 }, { "epoch": 0.02, "learning_rate": 0.00010034602076124569, "loss": 0.7851, "step": 145 }, { "epoch": 0.02, "learning_rate": 0.00010103806228373702, "loss": 0.788, "step": 146 }, { "epoch": 0.02, "learning_rate": 0.00010173010380622839, "loss": 0.7923, "step": 147 }, { "epoch": 0.02, "learning_rate": 0.00010242214532871972, "loss": 0.8438, "step": 148 }, { "epoch": 0.02, "learning_rate": 0.00010311418685121109, "loss": 0.801, "step": 149 }, { "epoch": 0.02, "learning_rate": 0.00010380622837370242, "loss": 0.7785, "step": 150 }, { "epoch": 0.02, "learning_rate": 0.00010449826989619377, "loss": 0.7677, "step": 151 }, { "epoch": 0.02, "learning_rate": 0.00010519031141868511, "loss": 0.7733, "step": 152 }, { "epoch": 0.02, "learning_rate": 0.00010588235294117647, "loss": 0.7888, "step": 153 }, { "epoch": 0.02, "learning_rate": 0.00010657439446366781, "loss": 0.8875, "step": 154 }, { "epoch": 0.02, "learning_rate": 0.00010726643598615918, "loss": 0.7939, "step": 155 }, { "epoch": 0.02, "learning_rate": 0.00010795847750865054, "loss": 0.838, "step": 156 }, { "epoch": 0.02, "learning_rate": 0.00010865051903114188, "loss": 0.8589, "step": 157 }, { "epoch": 0.02, "learning_rate": 0.00010934256055363324, "loss": 0.8112, "step": 158 }, { "epoch": 0.02, "learning_rate": 0.00011003460207612458, "loss": 0.7312, "step": 159 }, { "epoch": 0.02, "learning_rate": 0.00011072664359861593, "loss": 0.7749, "step": 160 }, { "epoch": 0.02, "learning_rate": 0.00011141868512110726, "loss": 0.7849, "step": 161 }, { "epoch": 0.02, "learning_rate": 0.00011211072664359863, "loss": 0.7377, "step": 162 }, { "epoch": 0.02, "learning_rate": 0.00011280276816608996, "loss": 0.6824, "step": 163 }, { "epoch": 0.02, "learning_rate": 0.00011349480968858133, "loss": 0.7894, "step": 164 }, { "epoch": 0.02, "learning_rate": 0.00011418685121107266, "loss": 0.8152, "step": 165 }, { "epoch": 0.02, "learning_rate": 0.00011487889273356403, "loss": 0.854, "step": 166 }, { "epoch": 0.02, "learning_rate": 0.00011557093425605536, "loss": 0.8046, "step": 167 }, { "epoch": 0.02, "learning_rate": 0.00011626297577854673, "loss": 0.7674, "step": 168 }, { "epoch": 0.02, "learning_rate": 0.00011695501730103806, "loss": 0.8161, "step": 169 }, { "epoch": 0.02, "learning_rate": 0.00011764705882352942, "loss": 0.7405, "step": 170 }, { "epoch": 0.02, "learning_rate": 0.00011833910034602077, "loss": 0.7981, "step": 171 }, { "epoch": 0.02, "learning_rate": 0.00011903114186851212, "loss": 0.738, "step": 172 }, { "epoch": 0.02, "learning_rate": 0.00011972318339100345, "loss": 0.8147, "step": 173 }, { "epoch": 0.02, "learning_rate": 0.00012041522491349482, "loss": 0.7774, "step": 174 }, { "epoch": 0.02, "learning_rate": 0.00012110726643598615, "loss": 0.7962, "step": 175 }, { "epoch": 0.02, "learning_rate": 0.00012179930795847752, "loss": 0.7311, "step": 176 }, { "epoch": 0.02, "learning_rate": 0.00012249134948096887, "loss": 0.8084, "step": 177 }, { "epoch": 0.02, "learning_rate": 0.0001231833910034602, "loss": 0.7478, "step": 178 }, { "epoch": 0.02, "learning_rate": 0.00012387543252595157, "loss": 0.7398, "step": 179 }, { "epoch": 0.02, "learning_rate": 0.0001245674740484429, "loss": 0.821, "step": 180 }, { "epoch": 0.02, "learning_rate": 0.00012525951557093427, "loss": 0.7988, "step": 181 }, { "epoch": 0.02, "learning_rate": 0.0001259515570934256, "loss": 0.8507, "step": 182 }, { "epoch": 0.02, "learning_rate": 0.00012664359861591697, "loss": 0.706, "step": 183 }, { "epoch": 0.02, "learning_rate": 0.0001273356401384083, "loss": 0.7377, "step": 184 }, { "epoch": 0.02, "learning_rate": 0.00012802768166089967, "loss": 0.7555, "step": 185 }, { "epoch": 0.02, "learning_rate": 0.000128719723183391, "loss": 0.8172, "step": 186 }, { "epoch": 0.02, "learning_rate": 0.00012941176470588237, "loss": 0.7994, "step": 187 }, { "epoch": 0.02, "learning_rate": 0.0001301038062283737, "loss": 0.7693, "step": 188 }, { "epoch": 0.02, "learning_rate": 0.00013079584775086507, "loss": 0.7493, "step": 189 }, { "epoch": 0.02, "learning_rate": 0.0001314878892733564, "loss": 0.7881, "step": 190 }, { "epoch": 0.02, "learning_rate": 0.00013217993079584777, "loss": 0.7729, "step": 191 }, { "epoch": 0.02, "learning_rate": 0.0001328719723183391, "loss": 0.7372, "step": 192 }, { "epoch": 0.02, "learning_rate": 0.00013356401384083047, "loss": 0.7523, "step": 193 }, { "epoch": 0.02, "learning_rate": 0.0001342560553633218, "loss": 0.7808, "step": 194 }, { "epoch": 0.02, "learning_rate": 0.00013494809688581317, "loss": 0.7995, "step": 195 }, { "epoch": 0.02, "learning_rate": 0.0001356401384083045, "loss": 0.7242, "step": 196 }, { "epoch": 0.02, "learning_rate": 0.00013633217993079584, "loss": 0.7649, "step": 197 }, { "epoch": 0.02, "learning_rate": 0.00013702422145328718, "loss": 0.773, "step": 198 }, { "epoch": 0.02, "learning_rate": 0.00013771626297577854, "loss": 0.7576, "step": 199 }, { "epoch": 0.02, "learning_rate": 0.00013840830449826988, "loss": 0.7743, "step": 200 }, { "epoch": 0.02, "learning_rate": 0.00013910034602076124, "loss": 0.7408, "step": 201 }, { "epoch": 0.02, "learning_rate": 0.0001397923875432526, "loss": 0.7476, "step": 202 }, { "epoch": 0.02, "learning_rate": 0.00014048442906574395, "loss": 0.7156, "step": 203 }, { "epoch": 0.02, "learning_rate": 0.0001411764705882353, "loss": 0.7921, "step": 204 }, { "epoch": 0.02, "learning_rate": 0.00014186851211072665, "loss": 0.6979, "step": 205 }, { "epoch": 0.02, "learning_rate": 0.000142560553633218, "loss": 0.7851, "step": 206 }, { "epoch": 0.02, "learning_rate": 0.00014325259515570935, "loss": 0.7682, "step": 207 }, { "epoch": 0.02, "learning_rate": 0.0001439446366782007, "loss": 0.734, "step": 208 }, { "epoch": 0.02, "learning_rate": 0.00014463667820069205, "loss": 0.7336, "step": 209 }, { "epoch": 0.02, "learning_rate": 0.0001453287197231834, "loss": 0.7888, "step": 210 }, { "epoch": 0.02, "learning_rate": 0.00014602076124567475, "loss": 0.8122, "step": 211 }, { "epoch": 0.02, "learning_rate": 0.0001467128027681661, "loss": 0.7552, "step": 212 }, { "epoch": 0.02, "learning_rate": 0.00014740484429065745, "loss": 0.7723, "step": 213 }, { "epoch": 0.02, "learning_rate": 0.0001480968858131488, "loss": 0.7356, "step": 214 }, { "epoch": 0.02, "learning_rate": 0.00014878892733564015, "loss": 0.7852, "step": 215 }, { "epoch": 0.02, "learning_rate": 0.0001494809688581315, "loss": 0.814, "step": 216 }, { "epoch": 0.02, "learning_rate": 0.00015017301038062285, "loss": 0.7445, "step": 217 }, { "epoch": 0.02, "learning_rate": 0.00015086505190311418, "loss": 0.753, "step": 218 }, { "epoch": 0.02, "learning_rate": 0.00015155709342560552, "loss": 0.807, "step": 219 }, { "epoch": 0.02, "learning_rate": 0.00015224913494809689, "loss": 0.733, "step": 220 }, { "epoch": 0.02, "learning_rate": 0.00015294117647058822, "loss": 0.7763, "step": 221 }, { "epoch": 0.02, "learning_rate": 0.00015363321799307959, "loss": 0.7521, "step": 222 }, { "epoch": 0.02, "learning_rate": 0.00015432525951557095, "loss": 0.7773, "step": 223 }, { "epoch": 0.02, "learning_rate": 0.00015501730103806229, "loss": 0.7306, "step": 224 }, { "epoch": 0.02, "learning_rate": 0.00015570934256055365, "loss": 0.7851, "step": 225 }, { "epoch": 0.02, "learning_rate": 0.000156401384083045, "loss": 0.7558, "step": 226 }, { "epoch": 0.02, "learning_rate": 0.00015709342560553635, "loss": 0.7714, "step": 227 }, { "epoch": 0.02, "learning_rate": 0.0001577854671280277, "loss": 0.7542, "step": 228 }, { "epoch": 0.02, "learning_rate": 0.00015847750865051905, "loss": 0.7883, "step": 229 }, { "epoch": 0.02, "learning_rate": 0.0001591695501730104, "loss": 0.8085, "step": 230 }, { "epoch": 0.02, "learning_rate": 0.00015986159169550175, "loss": 0.7918, "step": 231 }, { "epoch": 0.02, "learning_rate": 0.0001605536332179931, "loss": 0.7412, "step": 232 }, { "epoch": 0.02, "learning_rate": 0.00016124567474048445, "loss": 0.7494, "step": 233 }, { "epoch": 0.02, "learning_rate": 0.0001619377162629758, "loss": 0.7948, "step": 234 }, { "epoch": 0.02, "learning_rate": 0.00016262975778546715, "loss": 0.7624, "step": 235 }, { "epoch": 0.02, "learning_rate": 0.0001633217993079585, "loss": 0.7879, "step": 236 }, { "epoch": 0.02, "learning_rate": 0.00016401384083044983, "loss": 0.6687, "step": 237 }, { "epoch": 0.02, "learning_rate": 0.0001647058823529412, "loss": 0.7921, "step": 238 }, { "epoch": 0.02, "learning_rate": 0.00016539792387543253, "loss": 0.7718, "step": 239 }, { "epoch": 0.02, "learning_rate": 0.00016608996539792386, "loss": 0.8175, "step": 240 }, { "epoch": 0.03, "learning_rate": 0.00016678200692041523, "loss": 0.7641, "step": 241 }, { "epoch": 0.03, "learning_rate": 0.00016747404844290656, "loss": 0.7365, "step": 242 }, { "epoch": 0.03, "learning_rate": 0.00016816608996539793, "loss": 0.7783, "step": 243 }, { "epoch": 0.03, "learning_rate": 0.00016885813148788926, "loss": 0.7782, "step": 244 }, { "epoch": 0.03, "learning_rate": 0.00016955017301038063, "loss": 0.7467, "step": 245 }, { "epoch": 0.03, "learning_rate": 0.000170242214532872, "loss": 0.7744, "step": 246 }, { "epoch": 0.03, "learning_rate": 0.00017093425605536333, "loss": 0.7601, "step": 247 }, { "epoch": 0.03, "learning_rate": 0.0001716262975778547, "loss": 0.753, "step": 248 }, { "epoch": 0.03, "learning_rate": 0.00017231833910034603, "loss": 0.7693, "step": 249 }, { "epoch": 0.03, "learning_rate": 0.0001730103806228374, "loss": 0.7802, "step": 250 }, { "epoch": 0.03, "learning_rate": 0.00017370242214532873, "loss": 0.7404, "step": 251 }, { "epoch": 0.03, "learning_rate": 0.0001743944636678201, "loss": 0.7461, "step": 252 }, { "epoch": 0.03, "learning_rate": 0.00017508650519031143, "loss": 0.7732, "step": 253 }, { "epoch": 0.03, "learning_rate": 0.0001757785467128028, "loss": 0.7545, "step": 254 }, { "epoch": 0.03, "learning_rate": 0.00017647058823529413, "loss": 0.6823, "step": 255 }, { "epoch": 0.03, "learning_rate": 0.0001771626297577855, "loss": 0.7592, "step": 256 }, { "epoch": 0.03, "learning_rate": 0.00017785467128027683, "loss": 0.7983, "step": 257 }, { "epoch": 0.03, "learning_rate": 0.00017854671280276817, "loss": 0.7253, "step": 258 }, { "epoch": 0.03, "learning_rate": 0.00017923875432525953, "loss": 0.747, "step": 259 }, { "epoch": 0.03, "learning_rate": 0.00017993079584775087, "loss": 0.7753, "step": 260 }, { "epoch": 0.03, "learning_rate": 0.0001806228373702422, "loss": 0.7307, "step": 261 }, { "epoch": 0.03, "learning_rate": 0.00018131487889273357, "loss": 0.772, "step": 262 }, { "epoch": 0.03, "learning_rate": 0.0001820069204152249, "loss": 0.8157, "step": 263 }, { "epoch": 0.03, "learning_rate": 0.00018269896193771627, "loss": 0.7587, "step": 264 }, { "epoch": 0.03, "learning_rate": 0.0001833910034602076, "loss": 0.7346, "step": 265 }, { "epoch": 0.03, "learning_rate": 0.00018408304498269897, "loss": 0.7856, "step": 266 }, { "epoch": 0.03, "learning_rate": 0.00018477508650519033, "loss": 0.7481, "step": 267 }, { "epoch": 0.03, "learning_rate": 0.00018546712802768167, "loss": 0.7324, "step": 268 }, { "epoch": 0.03, "learning_rate": 0.00018615916955017303, "loss": 0.7412, "step": 269 }, { "epoch": 0.03, "learning_rate": 0.00018685121107266437, "loss": 0.8052, "step": 270 }, { "epoch": 0.03, "learning_rate": 0.00018754325259515573, "loss": 0.7778, "step": 271 }, { "epoch": 0.03, "learning_rate": 0.00018823529411764707, "loss": 0.7256, "step": 272 }, { "epoch": 0.03, "learning_rate": 0.00018892733564013843, "loss": 0.8078, "step": 273 }, { "epoch": 0.03, "learning_rate": 0.00018961937716262977, "loss": 0.7127, "step": 274 }, { "epoch": 0.03, "learning_rate": 0.00019031141868512113, "loss": 0.8016, "step": 275 }, { "epoch": 0.03, "learning_rate": 0.00019100346020761247, "loss": 0.7391, "step": 276 }, { "epoch": 0.03, "learning_rate": 0.00019169550173010383, "loss": 0.7675, "step": 277 }, { "epoch": 0.03, "learning_rate": 0.00019238754325259517, "loss": 0.7877, "step": 278 }, { "epoch": 0.03, "learning_rate": 0.0001930795847750865, "loss": 0.75, "step": 279 }, { "epoch": 0.03, "learning_rate": 0.00019377162629757784, "loss": 0.7548, "step": 280 }, { "epoch": 0.03, "learning_rate": 0.0001944636678200692, "loss": 0.6957, "step": 281 }, { "epoch": 0.03, "learning_rate": 0.00019515570934256054, "loss": 0.7529, "step": 282 }, { "epoch": 0.03, "learning_rate": 0.0001958477508650519, "loss": 0.7668, "step": 283 }, { "epoch": 0.03, "learning_rate": 0.00019653979238754324, "loss": 0.7635, "step": 284 }, { "epoch": 0.03, "learning_rate": 0.0001972318339100346, "loss": 0.6895, "step": 285 }, { "epoch": 0.03, "learning_rate": 0.00019792387543252595, "loss": 0.8123, "step": 286 }, { "epoch": 0.03, "learning_rate": 0.0001986159169550173, "loss": 0.7032, "step": 287 }, { "epoch": 0.03, "learning_rate": 0.00019930795847750865, "loss": 0.789, "step": 288 }, { "epoch": 0.03, "learning_rate": 0.0002, "loss": 0.7557, "step": 289 }, { "epoch": 0.03, "learning_rate": 0.00019999999431638917, "loss": 0.7724, "step": 290 }, { "epoch": 0.03, "learning_rate": 0.00019999997726555732, "loss": 0.7964, "step": 291 }, { "epoch": 0.03, "learning_rate": 0.0001999999488475064, "loss": 0.7349, "step": 292 }, { "epoch": 0.03, "learning_rate": 0.0001999999090622396, "loss": 0.7139, "step": 293 }, { "epoch": 0.03, "learning_rate": 0.00019999985790976148, "loss": 0.7533, "step": 294 }, { "epoch": 0.03, "learning_rate": 0.00019999979539007785, "loss": 0.8029, "step": 295 }, { "epoch": 0.03, "learning_rate": 0.0001999997215031958, "loss": 0.6681, "step": 296 }, { "epoch": 0.03, "learning_rate": 0.00019999963624912375, "loss": 0.7892, "step": 297 }, { "epoch": 0.03, "learning_rate": 0.00019999953962787138, "loss": 0.8056, "step": 298 }, { "epoch": 0.03, "learning_rate": 0.00019999943163944968, "loss": 0.7907, "step": 299 }, { "epoch": 0.03, "learning_rate": 0.0001999993122838709, "loss": 0.7353, "step": 300 }, { "epoch": 0.03, "learning_rate": 0.00019999918156114865, "loss": 0.7301, "step": 301 }, { "epoch": 0.03, "learning_rate": 0.00019999903947129775, "loss": 0.6696, "step": 302 }, { "epoch": 0.03, "learning_rate": 0.0001999988860143344, "loss": 0.7268, "step": 303 }, { "epoch": 0.03, "learning_rate": 0.000199998721190276, "loss": 0.795, "step": 304 }, { "epoch": 0.03, "learning_rate": 0.00019999854499914125, "loss": 0.7503, "step": 305 }, { "epoch": 0.03, "learning_rate": 0.00019999835744095027, "loss": 0.772, "step": 306 }, { "epoch": 0.03, "learning_rate": 0.00019999815851572434, "loss": 0.7774, "step": 307 }, { "epoch": 0.03, "learning_rate": 0.00019999794822348605, "loss": 0.7567, "step": 308 }, { "epoch": 0.03, "learning_rate": 0.00019999772656425932, "loss": 0.7636, "step": 309 }, { "epoch": 0.03, "learning_rate": 0.00019999749353806937, "loss": 0.7178, "step": 310 }, { "epoch": 0.03, "learning_rate": 0.00019999724914494268, "loss": 0.7833, "step": 311 }, { "epoch": 0.03, "learning_rate": 0.000199996993384907, "loss": 0.6905, "step": 312 }, { "epoch": 0.03, "learning_rate": 0.0001999967262579914, "loss": 0.7179, "step": 313 }, { "epoch": 0.03, "learning_rate": 0.0001999964477642263, "loss": 0.7007, "step": 314 }, { "epoch": 0.03, "learning_rate": 0.0001999961579036433, "loss": 0.761, "step": 315 }, { "epoch": 0.03, "learning_rate": 0.0001999958566762754, "loss": 0.7806, "step": 316 }, { "epoch": 0.03, "learning_rate": 0.00019999554408215678, "loss": 0.6682, "step": 317 }, { "epoch": 0.03, "learning_rate": 0.00019999522012132304, "loss": 0.7772, "step": 318 }, { "epoch": 0.03, "learning_rate": 0.00019999488479381094, "loss": 0.792, "step": 319 }, { "epoch": 0.03, "learning_rate": 0.00019999453809965866, "loss": 0.7541, "step": 320 }, { "epoch": 0.03, "learning_rate": 0.00019999418003890557, "loss": 0.6801, "step": 321 }, { "epoch": 0.03, "learning_rate": 0.0001999938106115924, "loss": 0.7478, "step": 322 }, { "epoch": 0.03, "learning_rate": 0.0001999934298177611, "loss": 0.7755, "step": 323 }, { "epoch": 0.03, "learning_rate": 0.00019999303765745496, "loss": 0.7561, "step": 324 }, { "epoch": 0.03, "learning_rate": 0.0001999926341307186, "loss": 0.7084, "step": 325 }, { "epoch": 0.03, "learning_rate": 0.00019999221923759788, "loss": 0.7018, "step": 326 }, { "epoch": 0.03, "learning_rate": 0.00019999179297813994, "loss": 0.7529, "step": 327 }, { "epoch": 0.03, "learning_rate": 0.00019999135535239324, "loss": 0.7473, "step": 328 }, { "epoch": 0.03, "learning_rate": 0.0001999909063604075, "loss": 0.8573, "step": 329 }, { "epoch": 0.03, "learning_rate": 0.00019999044600223386, "loss": 0.7168, "step": 330 }, { "epoch": 0.03, "learning_rate": 0.00019998997427792453, "loss": 0.736, "step": 331 }, { "epoch": 0.03, "learning_rate": 0.0001999894911875332, "loss": 0.741, "step": 332 }, { "epoch": 0.03, "learning_rate": 0.00019998899673111473, "loss": 0.729, "step": 333 }, { "epoch": 0.03, "learning_rate": 0.00019998849090872538, "loss": 0.736, "step": 334 }, { "epoch": 0.03, "learning_rate": 0.00019998797372042262, "loss": 0.7754, "step": 335 }, { "epoch": 0.03, "learning_rate": 0.00019998744516626525, "loss": 0.7994, "step": 336 }, { "epoch": 0.04, "learning_rate": 0.00019998690524631335, "loss": 0.7808, "step": 337 }, { "epoch": 0.04, "learning_rate": 0.0001999863539606283, "loss": 0.695, "step": 338 }, { "epoch": 0.04, "learning_rate": 0.00019998579130927276, "loss": 0.7603, "step": 339 }, { "epoch": 0.04, "learning_rate": 0.00019998521729231068, "loss": 0.7789, "step": 340 }, { "epoch": 0.04, "learning_rate": 0.0001999846319098073, "loss": 0.7374, "step": 341 }, { "epoch": 0.04, "learning_rate": 0.0001999840351618292, "loss": 0.7159, "step": 342 }, { "epoch": 0.04, "learning_rate": 0.0001999834270484442, "loss": 0.7624, "step": 343 }, { "epoch": 0.04, "learning_rate": 0.00019998280756972138, "loss": 0.7049, "step": 344 }, { "epoch": 0.04, "learning_rate": 0.00019998217672573124, "loss": 0.7001, "step": 345 }, { "epoch": 0.04, "learning_rate": 0.0001999815345165454, "loss": 0.7195, "step": 346 }, { "epoch": 0.04, "learning_rate": 0.00019998088094223696, "loss": 0.6878, "step": 347 }, { "epoch": 0.04, "learning_rate": 0.00019998021600288007, "loss": 0.7454, "step": 348 }, { "epoch": 0.04, "learning_rate": 0.00019997953969855048, "loss": 0.6974, "step": 349 }, { "epoch": 0.04, "learning_rate": 0.00019997885202932498, "loss": 0.6954, "step": 350 }, { "epoch": 0.04, "learning_rate": 0.00019997815299528174, "loss": 0.7753, "step": 351 }, { "epoch": 0.04, "learning_rate": 0.00019997744259650025, "loss": 0.7668, "step": 352 }, { "epoch": 0.04, "learning_rate": 0.0001999767208330612, "loss": 0.7067, "step": 353 }, { "epoch": 0.04, "learning_rate": 0.0001999759877050467, "loss": 0.7356, "step": 354 }, { "epoch": 0.04, "learning_rate": 0.00019997524321254008, "loss": 0.7421, "step": 355 }, { "epoch": 0.04, "learning_rate": 0.00019997448735562591, "loss": 0.718, "step": 356 }, { "epoch": 0.04, "learning_rate": 0.0001999737201343902, "loss": 0.7267, "step": 357 }, { "epoch": 0.04, "learning_rate": 0.00019997294154892008, "loss": 0.7541, "step": 358 }, { "epoch": 0.04, "learning_rate": 0.0001999721515993041, "loss": 0.7271, "step": 359 }, { "epoch": 0.04, "learning_rate": 0.00019997135028563206, "loss": 0.7452, "step": 360 }, { "epoch": 0.04, "learning_rate": 0.000199970537607995, "loss": 0.8085, "step": 361 }, { "epoch": 0.04, "learning_rate": 0.00019996971356648534, "loss": 0.6929, "step": 362 }, { "epoch": 0.04, "learning_rate": 0.00019996887816119675, "loss": 0.7307, "step": 363 }, { "epoch": 0.04, "learning_rate": 0.00019996803139222418, "loss": 0.6872, "step": 364 }, { "epoch": 0.04, "learning_rate": 0.00019996717325966386, "loss": 0.7108, "step": 365 }, { "epoch": 0.04, "learning_rate": 0.00019996630376361337, "loss": 0.7747, "step": 366 }, { "epoch": 0.04, "learning_rate": 0.00019996542290417156, "loss": 0.8031, "step": 367 }, { "epoch": 0.04, "learning_rate": 0.00019996453068143856, "loss": 0.751, "step": 368 }, { "epoch": 0.04, "learning_rate": 0.00019996362709551573, "loss": 0.6838, "step": 369 }, { "epoch": 0.04, "learning_rate": 0.0001999627121465058, "loss": 0.7668, "step": 370 }, { "epoch": 0.04, "learning_rate": 0.00019996178583451285, "loss": 0.6897, "step": 371 }, { "epoch": 0.04, "learning_rate": 0.00019996084815964208, "loss": 0.7446, "step": 372 }, { "epoch": 0.04, "learning_rate": 0.00019995989912200015, "loss": 0.6586, "step": 373 }, { "epoch": 0.04, "learning_rate": 0.00019995893872169488, "loss": 0.7794, "step": 374 }, { "epoch": 0.04, "learning_rate": 0.0001999579669588355, "loss": 0.7027, "step": 375 }, { "epoch": 0.04, "learning_rate": 0.0001999569838335324, "loss": 0.7662, "step": 376 }, { "epoch": 0.04, "learning_rate": 0.00019995598934589742, "loss": 0.6531, "step": 377 }, { "epoch": 0.04, "learning_rate": 0.00019995498349604355, "loss": 0.6892, "step": 378 }, { "epoch": 0.04, "learning_rate": 0.0001999539662840851, "loss": 0.7139, "step": 379 }, { "epoch": 0.04, "learning_rate": 0.00019995293771013782, "loss": 0.6756, "step": 380 }, { "epoch": 0.04, "learning_rate": 0.00019995189777431848, "loss": 0.7343, "step": 381 }, { "epoch": 0.04, "learning_rate": 0.00019995084647674537, "loss": 0.7959, "step": 382 }, { "epoch": 0.04, "learning_rate": 0.000199949783817538, "loss": 0.674, "step": 383 }, { "epoch": 0.04, "learning_rate": 0.0001999487097968171, "loss": 0.8256, "step": 384 }, { "epoch": 0.04, "learning_rate": 0.00019994762441470488, "loss": 0.7806, "step": 385 }, { "epoch": 0.04, "learning_rate": 0.0001999465276713246, "loss": 0.6757, "step": 386 }, { "epoch": 0.04, "learning_rate": 0.000199945419566801, "loss": 0.7378, "step": 387 }, { "epoch": 0.04, "learning_rate": 0.00019994430010125997, "loss": 0.7495, "step": 388 }, { "epoch": 0.04, "learning_rate": 0.0001999431692748288, "loss": 0.674, "step": 389 }, { "epoch": 0.04, "learning_rate": 0.00019994202708763608, "loss": 0.7389, "step": 390 }, { "epoch": 0.04, "learning_rate": 0.0001999408735398116, "loss": 0.7113, "step": 391 }, { "epoch": 0.04, "learning_rate": 0.00019993970863148647, "loss": 0.6797, "step": 392 }, { "epoch": 0.04, "learning_rate": 0.00019993853236279313, "loss": 0.7514, "step": 393 }, { "epoch": 0.04, "learning_rate": 0.00019993734473386528, "loss": 0.8108, "step": 394 }, { "epoch": 0.04, "learning_rate": 0.00019993614574483792, "loss": 0.7549, "step": 395 }, { "epoch": 0.04, "learning_rate": 0.00019993493539584737, "loss": 0.7432, "step": 396 }, { "epoch": 0.04, "learning_rate": 0.00019993371368703117, "loss": 0.7751, "step": 397 }, { "epoch": 0.04, "learning_rate": 0.00019993248061852823, "loss": 0.8186, "step": 398 }, { "epoch": 0.04, "learning_rate": 0.0001999312361904787, "loss": 0.7922, "step": 399 }, { "epoch": 0.04, "learning_rate": 0.00019992998040302404, "loss": 0.7719, "step": 400 }, { "epoch": 0.04, "learning_rate": 0.00019992871325630698, "loss": 0.7163, "step": 401 }, { "epoch": 0.04, "learning_rate": 0.0001999274347504716, "loss": 0.7302, "step": 402 }, { "epoch": 0.04, "learning_rate": 0.00019992614488566316, "loss": 0.7639, "step": 403 }, { "epoch": 0.04, "learning_rate": 0.00019992484366202837, "loss": 0.7684, "step": 404 }, { "epoch": 0.04, "learning_rate": 0.00019992353107971508, "loss": 0.6883, "step": 405 }, { "epoch": 0.04, "learning_rate": 0.00019992220713887254, "loss": 0.7082, "step": 406 }, { "epoch": 0.04, "learning_rate": 0.0001999208718396512, "loss": 0.7718, "step": 407 }, { "epoch": 0.04, "learning_rate": 0.00019991952518220288, "loss": 0.7777, "step": 408 }, { "epoch": 0.04, "learning_rate": 0.00019991816716668064, "loss": 0.7143, "step": 409 }, { "epoch": 0.04, "learning_rate": 0.00019991679779323885, "loss": 0.6927, "step": 410 }, { "epoch": 0.04, "learning_rate": 0.00019991541706203316, "loss": 0.8027, "step": 411 }, { "epoch": 0.04, "learning_rate": 0.00019991402497322052, "loss": 0.7403, "step": 412 }, { "epoch": 0.04, "learning_rate": 0.00019991262152695925, "loss": 0.7598, "step": 413 }, { "epoch": 0.04, "learning_rate": 0.00019991120672340875, "loss": 0.6629, "step": 414 }, { "epoch": 0.04, "learning_rate": 0.00019990978056272994, "loss": 0.7343, "step": 415 }, { "epoch": 0.04, "learning_rate": 0.0001999083430450849, "loss": 0.7591, "step": 416 }, { "epoch": 0.04, "learning_rate": 0.00019990689417063705, "loss": 0.7271, "step": 417 }, { "epoch": 0.04, "learning_rate": 0.00019990543393955107, "loss": 0.7226, "step": 418 }, { "epoch": 0.04, "learning_rate": 0.000199903962351993, "loss": 0.6831, "step": 419 }, { "epoch": 0.04, "learning_rate": 0.00019990247940813, "loss": 0.7523, "step": 420 }, { "epoch": 0.04, "learning_rate": 0.0001999009851081308, "loss": 0.7764, "step": 421 }, { "epoch": 0.04, "learning_rate": 0.00019989947945216508, "loss": 0.712, "step": 422 }, { "epoch": 0.04, "learning_rate": 0.00019989796244040416, "loss": 0.7959, "step": 423 }, { "epoch": 0.04, "learning_rate": 0.00019989643407302036, "loss": 0.7325, "step": 424 }, { "epoch": 0.04, "learning_rate": 0.0001998948943501875, "loss": 0.741, "step": 425 }, { "epoch": 0.04, "learning_rate": 0.00019989334327208055, "loss": 0.7837, "step": 426 }, { "epoch": 0.04, "learning_rate": 0.00019989178083887582, "loss": 0.7575, "step": 427 }, { "epoch": 0.04, "learning_rate": 0.000199890207050751, "loss": 0.7531, "step": 428 }, { "epoch": 0.04, "learning_rate": 0.00019988862190788487, "loss": 0.7563, "step": 429 }, { "epoch": 0.04, "learning_rate": 0.00019988702541045767, "loss": 0.6884, "step": 430 }, { "epoch": 0.04, "learning_rate": 0.00019988541755865087, "loss": 0.7338, "step": 431 }, { "epoch": 0.04, "learning_rate": 0.00019988379835264727, "loss": 0.7769, "step": 432 }, { "epoch": 0.05, "learning_rate": 0.00019988216779263086, "loss": 0.7212, "step": 433 }, { "epoch": 0.05, "learning_rate": 0.00019988052587878707, "loss": 0.6968, "step": 434 }, { "epoch": 0.05, "learning_rate": 0.00019987887261130248, "loss": 0.7511, "step": 435 }, { "epoch": 0.05, "learning_rate": 0.00019987720799036505, "loss": 0.6989, "step": 436 }, { "epoch": 0.05, "learning_rate": 0.000199875532016164, "loss": 0.6795, "step": 437 }, { "epoch": 0.05, "learning_rate": 0.00019987384468888984, "loss": 0.7351, "step": 438 }, { "epoch": 0.05, "learning_rate": 0.00019987214600873435, "loss": 0.7762, "step": 439 }, { "epoch": 0.05, "learning_rate": 0.00019987043597589064, "loss": 0.74, "step": 440 }, { "epoch": 0.05, "learning_rate": 0.00019986871459055306, "loss": 0.752, "step": 441 }, { "epoch": 0.05, "learning_rate": 0.0001998669818529174, "loss": 0.6729, "step": 442 }, { "epoch": 0.05, "learning_rate": 0.00019986523776318048, "loss": 0.774, "step": 443 }, { "epoch": 0.05, "learning_rate": 0.0001998634823215406, "loss": 0.789, "step": 444 }, { "epoch": 0.05, "learning_rate": 0.0001998617155281974, "loss": 0.7417, "step": 445 }, { "epoch": 0.05, "learning_rate": 0.0001998599373833516, "loss": 0.7163, "step": 446 }, { "epoch": 0.05, "learning_rate": 0.00019985814788720533, "loss": 0.728, "step": 447 }, { "epoch": 0.05, "learning_rate": 0.00019985634703996203, "loss": 0.7458, "step": 448 }, { "epoch": 0.05, "learning_rate": 0.00019985453484182647, "loss": 0.7936, "step": 449 }, { "epoch": 0.05, "learning_rate": 0.00019985271129300454, "loss": 0.6654, "step": 450 }, { "epoch": 0.05, "learning_rate": 0.0001998508763937036, "loss": 0.7177, "step": 451 }, { "epoch": 0.05, "learning_rate": 0.0001998490301441322, "loss": 0.7068, "step": 452 }, { "epoch": 0.05, "learning_rate": 0.00019984717254450018, "loss": 0.748, "step": 453 }, { "epoch": 0.05, "learning_rate": 0.0001998453035950188, "loss": 0.7484, "step": 454 }, { "epoch": 0.05, "learning_rate": 0.00019984342329590037, "loss": 0.7942, "step": 455 }, { "epoch": 0.05, "learning_rate": 0.00019984153164735873, "loss": 0.6937, "step": 456 }, { "epoch": 0.05, "learning_rate": 0.00019983962864960885, "loss": 0.6737, "step": 457 }, { "epoch": 0.05, "learning_rate": 0.0001998377143028671, "loss": 0.6977, "step": 458 }, { "epoch": 0.05, "learning_rate": 0.000199835788607351, "loss": 0.6934, "step": 459 }, { "epoch": 0.05, "learning_rate": 0.00019983385156327956, "loss": 0.6662, "step": 460 }, { "epoch": 0.05, "learning_rate": 0.0001998319031708729, "loss": 0.6753, "step": 461 }, { "epoch": 0.05, "learning_rate": 0.00019982994343035253, "loss": 0.7301, "step": 462 }, { "epoch": 0.05, "learning_rate": 0.00019982797234194117, "loss": 0.7397, "step": 463 }, { "epoch": 0.05, "learning_rate": 0.00019982598990586295, "loss": 0.779, "step": 464 }, { "epoch": 0.05, "learning_rate": 0.00019982399612234313, "loss": 0.7401, "step": 465 }, { "epoch": 0.05, "learning_rate": 0.00019982199099160842, "loss": 0.7649, "step": 466 }, { "epoch": 0.05, "learning_rate": 0.00019981997451388672, "loss": 0.7105, "step": 467 }, { "epoch": 0.05, "learning_rate": 0.00019981794668940723, "loss": 0.7674, "step": 468 }, { "epoch": 0.05, "learning_rate": 0.00019981590751840049, "loss": 0.7546, "step": 469 }, { "epoch": 0.05, "learning_rate": 0.00019981385700109828, "loss": 0.7589, "step": 470 }, { "epoch": 0.05, "learning_rate": 0.0001998117951377337, "loss": 0.7062, "step": 471 }, { "epoch": 0.05, "learning_rate": 0.0001998097219285411, "loss": 0.7157, "step": 472 }, { "epoch": 0.05, "learning_rate": 0.00019980763737375618, "loss": 0.7493, "step": 473 }, { "epoch": 0.05, "learning_rate": 0.00019980554147361587, "loss": 0.7249, "step": 474 }, { "epoch": 0.05, "learning_rate": 0.00019980343422835843, "loss": 0.7167, "step": 475 }, { "epoch": 0.05, "learning_rate": 0.00019980131563822337, "loss": 0.7678, "step": 476 }, { "epoch": 0.05, "learning_rate": 0.00019979918570345157, "loss": 0.719, "step": 477 }, { "epoch": 0.05, "learning_rate": 0.00019979704442428512, "loss": 0.7345, "step": 478 }, { "epoch": 0.05, "learning_rate": 0.00019979489180096737, "loss": 0.7072, "step": 479 }, { "epoch": 0.05, "learning_rate": 0.00019979272783374308, "loss": 0.7208, "step": 480 }, { "epoch": 0.05, "learning_rate": 0.00019979055252285818, "loss": 0.7372, "step": 481 }, { "epoch": 0.05, "learning_rate": 0.00019978836586856, "loss": 0.7258, "step": 482 }, { "epoch": 0.05, "learning_rate": 0.00019978616787109704, "loss": 0.7352, "step": 483 }, { "epoch": 0.05, "learning_rate": 0.00019978395853071924, "loss": 0.7219, "step": 484 }, { "epoch": 0.05, "learning_rate": 0.00019978173784767765, "loss": 0.7073, "step": 485 }, { "epoch": 0.05, "learning_rate": 0.00019977950582222476, "loss": 0.7456, "step": 486 }, { "epoch": 0.05, "learning_rate": 0.00019977726245461424, "loss": 0.7521, "step": 487 }, { "epoch": 0.05, "learning_rate": 0.00019977500774510113, "loss": 0.7422, "step": 488 }, { "epoch": 0.05, "learning_rate": 0.00019977274169394172, "loss": 0.765, "step": 489 }, { "epoch": 0.05, "learning_rate": 0.0001997704643013936, "loss": 0.7923, "step": 490 }, { "epoch": 0.05, "learning_rate": 0.00019976817556771565, "loss": 0.7378, "step": 491 }, { "epoch": 0.05, "learning_rate": 0.00019976587549316806, "loss": 0.7152, "step": 492 }, { "epoch": 0.05, "learning_rate": 0.0001997635640780122, "loss": 0.7177, "step": 493 }, { "epoch": 0.05, "learning_rate": 0.0001997612413225109, "loss": 0.7221, "step": 494 }, { "epoch": 0.05, "learning_rate": 0.00019975890722692815, "loss": 0.7175, "step": 495 }, { "epoch": 0.05, "learning_rate": 0.0001997565617915293, "loss": 0.7001, "step": 496 }, { "epoch": 0.05, "learning_rate": 0.00019975420501658093, "loss": 0.7455, "step": 497 }, { "epoch": 0.05, "learning_rate": 0.00019975183690235096, "loss": 0.727, "step": 498 }, { "epoch": 0.05, "learning_rate": 0.00019974945744910856, "loss": 0.7407, "step": 499 }, { "epoch": 0.05, "learning_rate": 0.00019974706665712422, "loss": 0.6986, "step": 500 }, { "epoch": 0.05, "learning_rate": 0.0001997446645266697, "loss": 0.6962, "step": 501 }, { "epoch": 0.05, "learning_rate": 0.0001997422510580181, "loss": 0.7097, "step": 502 }, { "epoch": 0.05, "learning_rate": 0.0001997398262514437, "loss": 0.7452, "step": 503 }, { "epoch": 0.05, "learning_rate": 0.00019973739010722218, "loss": 0.7364, "step": 504 }, { "epoch": 0.05, "learning_rate": 0.0001997349426256304, "loss": 0.7615, "step": 505 }, { "epoch": 0.05, "learning_rate": 0.00019973248380694664, "loss": 0.709, "step": 506 }, { "epoch": 0.05, "learning_rate": 0.0001997300136514504, "loss": 0.7065, "step": 507 }, { "epoch": 0.05, "learning_rate": 0.0001997275321594224, "loss": 0.744, "step": 508 }, { "epoch": 0.05, "learning_rate": 0.00019972503933114478, "loss": 0.7344, "step": 509 }, { "epoch": 0.05, "learning_rate": 0.00019972253516690084, "loss": 0.7649, "step": 510 }, { "epoch": 0.05, "learning_rate": 0.0001997200196669753, "loss": 0.7007, "step": 511 }, { "epoch": 0.05, "learning_rate": 0.0001997174928316541, "loss": 0.7779, "step": 512 }, { "epoch": 0.05, "learning_rate": 0.00019971495466122443, "loss": 0.7287, "step": 513 }, { "epoch": 0.05, "learning_rate": 0.0001997124051559748, "loss": 0.6507, "step": 514 }, { "epoch": 0.05, "learning_rate": 0.0001997098443161951, "loss": 0.7491, "step": 515 }, { "epoch": 0.05, "learning_rate": 0.00019970727214217634, "loss": 0.7633, "step": 516 }, { "epoch": 0.05, "learning_rate": 0.00019970468863421095, "loss": 0.7223, "step": 517 }, { "epoch": 0.05, "learning_rate": 0.0001997020937925926, "loss": 0.7364, "step": 518 }, { "epoch": 0.05, "learning_rate": 0.00019969948761761622, "loss": 0.7496, "step": 519 }, { "epoch": 0.05, "learning_rate": 0.0001996968701095781, "loss": 0.6715, "step": 520 }, { "epoch": 0.05, "learning_rate": 0.00019969424126877573, "loss": 0.7324, "step": 521 }, { "epoch": 0.05, "learning_rate": 0.000199691601095508, "loss": 0.6539, "step": 522 }, { "epoch": 0.05, "learning_rate": 0.00019968894959007498, "loss": 0.6775, "step": 523 }, { "epoch": 0.05, "learning_rate": 0.00019968628675277807, "loss": 0.7047, "step": 524 }, { "epoch": 0.05, "learning_rate": 0.00019968361258391998, "loss": 0.7196, "step": 525 }, { "epoch": 0.05, "learning_rate": 0.0001996809270838047, "loss": 0.6976, "step": 526 }, { "epoch": 0.05, "learning_rate": 0.00019967823025273743, "loss": 0.7286, "step": 527 }, { "epoch": 0.05, "learning_rate": 0.00019967552209102483, "loss": 0.7213, "step": 528 }, { "epoch": 0.06, "learning_rate": 0.00019967280259897466, "loss": 0.7086, "step": 529 }, { "epoch": 0.06, "learning_rate": 0.0001996700717768961, "loss": 0.769, "step": 530 }, { "epoch": 0.06, "learning_rate": 0.0001996673296250995, "loss": 0.6838, "step": 531 }, { "epoch": 0.06, "learning_rate": 0.00019966457614389667, "loss": 0.7291, "step": 532 }, { "epoch": 0.06, "learning_rate": 0.0001996618113336005, "loss": 0.758, "step": 533 }, { "epoch": 0.06, "learning_rate": 0.00019965903519452533, "loss": 0.7227, "step": 534 }, { "epoch": 0.06, "learning_rate": 0.00019965624772698672, "loss": 0.6976, "step": 535 }, { "epoch": 0.06, "learning_rate": 0.00019965344893130152, "loss": 0.7305, "step": 536 }, { "epoch": 0.06, "learning_rate": 0.0001996506388077879, "loss": 0.7354, "step": 537 }, { "epoch": 0.06, "learning_rate": 0.00019964781735676526, "loss": 0.7565, "step": 538 }, { "epoch": 0.06, "learning_rate": 0.00019964498457855433, "loss": 0.7287, "step": 539 }, { "epoch": 0.06, "learning_rate": 0.00019964214047347713, "loss": 0.7399, "step": 540 }, { "epoch": 0.06, "learning_rate": 0.00019963928504185697, "loss": 0.7447, "step": 541 }, { "epoch": 0.06, "learning_rate": 0.00019963641828401837, "loss": 0.7468, "step": 542 }, { "epoch": 0.06, "learning_rate": 0.00019963354020028728, "loss": 0.7405, "step": 543 }, { "epoch": 0.06, "learning_rate": 0.00019963065079099082, "loss": 0.685, "step": 544 }, { "epoch": 0.06, "learning_rate": 0.0001996277500564574, "loss": 0.6787, "step": 545 }, { "epoch": 0.06, "learning_rate": 0.00019962483799701683, "loss": 0.6607, "step": 546 }, { "epoch": 0.06, "learning_rate": 0.00019962191461300006, "loss": 0.7291, "step": 547 }, { "epoch": 0.06, "learning_rate": 0.00019961897990473942, "loss": 0.7539, "step": 548 }, { "epoch": 0.06, "learning_rate": 0.00019961603387256855, "loss": 0.744, "step": 549 }, { "epoch": 0.06, "learning_rate": 0.00019961307651682227, "loss": 0.7179, "step": 550 }, { "epoch": 0.06, "learning_rate": 0.00019961010783783677, "loss": 0.7192, "step": 551 }, { "epoch": 0.06, "learning_rate": 0.00019960712783594954, "loss": 0.7515, "step": 552 }, { "epoch": 0.06, "learning_rate": 0.00019960413651149924, "loss": 0.7565, "step": 553 }, { "epoch": 0.06, "learning_rate": 0.000199601133864826, "loss": 0.6478, "step": 554 }, { "epoch": 0.06, "learning_rate": 0.00019959811989627108, "loss": 0.7083, "step": 555 }, { "epoch": 0.06, "learning_rate": 0.0001995950946061771, "loss": 0.7374, "step": 556 }, { "epoch": 0.06, "learning_rate": 0.00019959205799488793, "loss": 0.6909, "step": 557 }, { "epoch": 0.06, "learning_rate": 0.00019958901006274877, "loss": 0.7503, "step": 558 }, { "epoch": 0.06, "learning_rate": 0.00019958595081010606, "loss": 0.736, "step": 559 }, { "epoch": 0.06, "learning_rate": 0.0001995828802373076, "loss": 0.6861, "step": 560 }, { "epoch": 0.06, "learning_rate": 0.0001995797983447024, "loss": 0.6981, "step": 561 }, { "epoch": 0.06, "learning_rate": 0.00019957670513264078, "loss": 0.6902, "step": 562 }, { "epoch": 0.06, "learning_rate": 0.00019957360060147438, "loss": 0.7816, "step": 563 }, { "epoch": 0.06, "learning_rate": 0.00019957048475155605, "loss": 0.7221, "step": 564 }, { "epoch": 0.06, "learning_rate": 0.00019956735758324, "loss": 0.7387, "step": 565 }, { "epoch": 0.06, "learning_rate": 0.00019956421909688175, "loss": 0.6554, "step": 566 }, { "epoch": 0.06, "learning_rate": 0.00019956106929283797, "loss": 0.7306, "step": 567 }, { "epoch": 0.06, "learning_rate": 0.00019955790817146677, "loss": 0.7425, "step": 568 }, { "epoch": 0.06, "learning_rate": 0.00019955473573312745, "loss": 0.6661, "step": 569 }, { "epoch": 0.06, "learning_rate": 0.00019955155197818063, "loss": 0.6886, "step": 570 }, { "epoch": 0.06, "learning_rate": 0.00019954835690698825, "loss": 0.665, "step": 571 }, { "epoch": 0.06, "learning_rate": 0.00019954515051991348, "loss": 0.7033, "step": 572 }, { "epoch": 0.06, "learning_rate": 0.00019954193281732075, "loss": 0.7415, "step": 573 }, { "epoch": 0.06, "learning_rate": 0.00019953870379957588, "loss": 0.7293, "step": 574 }, { "epoch": 0.06, "learning_rate": 0.00019953546346704592, "loss": 0.7162, "step": 575 }, { "epoch": 0.06, "learning_rate": 0.0001995322118200992, "loss": 0.7295, "step": 576 }, { "epoch": 0.06, "learning_rate": 0.0001995289488591053, "loss": 0.739, "step": 577 }, { "epoch": 0.06, "learning_rate": 0.00019952567458443517, "loss": 0.7188, "step": 578 }, { "epoch": 0.06, "learning_rate": 0.00019952238899646104, "loss": 0.7364, "step": 579 }, { "epoch": 0.06, "learning_rate": 0.00019951909209555628, "loss": 0.7695, "step": 580 }, { "epoch": 0.06, "learning_rate": 0.00019951578388209575, "loss": 0.7717, "step": 581 }, { "epoch": 0.06, "learning_rate": 0.00019951246435645547, "loss": 0.6947, "step": 582 }, { "epoch": 0.06, "learning_rate": 0.00019950913351901277, "loss": 0.7568, "step": 583 }, { "epoch": 0.06, "learning_rate": 0.0001995057913701463, "loss": 0.7656, "step": 584 }, { "epoch": 0.06, "learning_rate": 0.00019950243791023596, "loss": 0.7698, "step": 585 }, { "epoch": 0.06, "learning_rate": 0.00019949907313966293, "loss": 0.7068, "step": 586 }, { "epoch": 0.06, "learning_rate": 0.00019949569705880968, "loss": 0.7339, "step": 587 }, { "epoch": 0.06, "learning_rate": 0.00019949230966806, "loss": 0.6746, "step": 588 }, { "epoch": 0.06, "learning_rate": 0.00019948891096779897, "loss": 0.7314, "step": 589 }, { "epoch": 0.06, "learning_rate": 0.0001994855009584129, "loss": 0.6505, "step": 590 }, { "epoch": 0.06, "learning_rate": 0.00019948207964028938, "loss": 0.6779, "step": 591 }, { "epoch": 0.06, "learning_rate": 0.00019947864701381734, "loss": 0.7577, "step": 592 }, { "epoch": 0.06, "learning_rate": 0.00019947520307938698, "loss": 0.6915, "step": 593 }, { "epoch": 0.06, "learning_rate": 0.00019947174783738983, "loss": 0.7671, "step": 594 }, { "epoch": 0.06, "learning_rate": 0.00019946828128821858, "loss": 0.7036, "step": 595 }, { "epoch": 0.06, "learning_rate": 0.0001994648034322673, "loss": 0.7572, "step": 596 }, { "epoch": 0.06, "learning_rate": 0.00019946131426993132, "loss": 0.6901, "step": 597 }, { "epoch": 0.06, "learning_rate": 0.00019945781380160732, "loss": 0.6987, "step": 598 }, { "epoch": 0.06, "learning_rate": 0.00019945430202769312, "loss": 0.7038, "step": 599 }, { "epoch": 0.06, "learning_rate": 0.00019945077894858797, "loss": 0.7511, "step": 600 }, { "epoch": 0.06, "learning_rate": 0.0001994472445646923, "loss": 0.6822, "step": 601 }, { "epoch": 0.06, "learning_rate": 0.00019944369887640794, "loss": 0.6257, "step": 602 }, { "epoch": 0.06, "learning_rate": 0.00019944014188413788, "loss": 0.7533, "step": 603 }, { "epoch": 0.06, "learning_rate": 0.00019943657358828648, "loss": 0.7116, "step": 604 }, { "epoch": 0.06, "learning_rate": 0.00019943299398925932, "loss": 0.7356, "step": 605 }, { "epoch": 0.06, "learning_rate": 0.00019942940308746333, "loss": 0.6927, "step": 606 }, { "epoch": 0.06, "learning_rate": 0.00019942580088330668, "loss": 0.7182, "step": 607 }, { "epoch": 0.06, "learning_rate": 0.00019942218737719884, "loss": 0.8033, "step": 608 }, { "epoch": 0.06, "learning_rate": 0.0001994185625695506, "loss": 0.7427, "step": 609 }, { "epoch": 0.06, "learning_rate": 0.00019941492646077395, "loss": 0.7055, "step": 610 }, { "epoch": 0.06, "learning_rate": 0.00019941127905128228, "loss": 0.7365, "step": 611 }, { "epoch": 0.06, "learning_rate": 0.00019940762034149011, "loss": 0.6891, "step": 612 }, { "epoch": 0.06, "learning_rate": 0.00019940395033181342, "loss": 0.7408, "step": 613 }, { "epoch": 0.06, "learning_rate": 0.00019940026902266932, "loss": 0.7011, "step": 614 }, { "epoch": 0.06, "learning_rate": 0.00019939657641447633, "loss": 0.7087, "step": 615 }, { "epoch": 0.06, "learning_rate": 0.00019939287250765416, "loss": 0.7693, "step": 616 }, { "epoch": 0.06, "learning_rate": 0.00019938915730262387, "loss": 0.7579, "step": 617 }, { "epoch": 0.06, "learning_rate": 0.00019938543079980772, "loss": 0.7134, "step": 618 }, { "epoch": 0.06, "learning_rate": 0.00019938169299962936, "loss": 0.7315, "step": 619 }, { "epoch": 0.06, "learning_rate": 0.00019937794390251367, "loss": 0.6784, "step": 620 }, { "epoch": 0.06, "learning_rate": 0.0001993741835088868, "loss": 0.6948, "step": 621 }, { "epoch": 0.06, "learning_rate": 0.00019937041181917618, "loss": 0.6635, "step": 622 }, { "epoch": 0.06, "learning_rate": 0.00019936662883381065, "loss": 0.6747, "step": 623 }, { "epoch": 0.06, "learning_rate": 0.00019936283455322012, "loss": 0.7203, "step": 624 }, { "epoch": 0.07, "learning_rate": 0.00019935902897783592, "loss": 0.7157, "step": 625 }, { "epoch": 0.07, "learning_rate": 0.00019935521210809066, "loss": 0.6976, "step": 626 }, { "epoch": 0.07, "learning_rate": 0.00019935138394441818, "loss": 0.7311, "step": 627 }, { "epoch": 0.07, "learning_rate": 0.0001993475444872537, "loss": 0.6794, "step": 628 }, { "epoch": 0.07, "learning_rate": 0.0001993436937370336, "loss": 0.6812, "step": 629 }, { "epoch": 0.07, "learning_rate": 0.00019933983169419562, "loss": 0.7361, "step": 630 }, { "epoch": 0.07, "learning_rate": 0.00019933595835917877, "loss": 0.6988, "step": 631 }, { "epoch": 0.07, "learning_rate": 0.0001993320737324233, "loss": 0.8148, "step": 632 }, { "epoch": 0.07, "learning_rate": 0.00019932817781437087, "loss": 0.7468, "step": 633 }, { "epoch": 0.07, "learning_rate": 0.00019932427060546427, "loss": 0.6644, "step": 634 }, { "epoch": 0.07, "learning_rate": 0.0001993203521061477, "loss": 0.7087, "step": 635 }, { "epoch": 0.07, "learning_rate": 0.0001993164223168665, "loss": 0.6577, "step": 636 }, { "epoch": 0.07, "learning_rate": 0.00019931248123806743, "loss": 0.7131, "step": 637 }, { "epoch": 0.07, "learning_rate": 0.00019930852887019849, "loss": 0.7126, "step": 638 }, { "epoch": 0.07, "learning_rate": 0.00019930456521370893, "loss": 0.6877, "step": 639 }, { "epoch": 0.07, "learning_rate": 0.00019930059026904932, "loss": 0.7031, "step": 640 }, { "epoch": 0.07, "learning_rate": 0.0001992966040366715, "loss": 0.7265, "step": 641 }, { "epoch": 0.07, "learning_rate": 0.00019929260651702858, "loss": 0.7128, "step": 642 }, { "epoch": 0.07, "learning_rate": 0.000199288597710575, "loss": 0.7398, "step": 643 }, { "epoch": 0.07, "learning_rate": 0.0001992845776177664, "loss": 0.7302, "step": 644 }, { "epoch": 0.07, "learning_rate": 0.00019928054623905982, "loss": 0.7021, "step": 645 }, { "epoch": 0.07, "learning_rate": 0.00019927650357491343, "loss": 0.6798, "step": 646 }, { "epoch": 0.07, "learning_rate": 0.00019927244962578684, "loss": 0.6775, "step": 647 }, { "epoch": 0.07, "learning_rate": 0.00019926838439214084, "loss": 0.6984, "step": 648 }, { "epoch": 0.07, "learning_rate": 0.00019926430787443755, "loss": 0.7092, "step": 649 }, { "epoch": 0.07, "learning_rate": 0.00019926022007314033, "loss": 0.7095, "step": 650 }, { "epoch": 0.07, "learning_rate": 0.00019925612098871393, "loss": 0.7667, "step": 651 }, { "epoch": 0.07, "learning_rate": 0.00019925201062162415, "loss": 0.7653, "step": 652 }, { "epoch": 0.07, "learning_rate": 0.00019924788897233837, "loss": 0.6998, "step": 653 }, { "epoch": 0.07, "learning_rate": 0.00019924375604132505, "loss": 0.6172, "step": 654 }, { "epoch": 0.07, "learning_rate": 0.00019923961182905395, "loss": 0.7017, "step": 655 }, { "epoch": 0.07, "learning_rate": 0.00019923545633599622, "loss": 0.7206, "step": 656 }, { "epoch": 0.07, "learning_rate": 0.0001992312895626242, "loss": 0.7797, "step": 657 }, { "epoch": 0.07, "learning_rate": 0.00019922711150941152, "loss": 0.6875, "step": 658 }, { "epoch": 0.07, "learning_rate": 0.00019922292217683314, "loss": 0.7414, "step": 659 }, { "epoch": 0.07, "learning_rate": 0.00019921872156536524, "loss": 0.7249, "step": 660 }, { "epoch": 0.07, "learning_rate": 0.00019921450967548532, "loss": 0.7214, "step": 661 }, { "epoch": 0.07, "learning_rate": 0.00019921028650767215, "loss": 0.6794, "step": 662 }, { "epoch": 0.07, "learning_rate": 0.00019920605206240582, "loss": 0.7031, "step": 663 }, { "epoch": 0.07, "learning_rate": 0.00019920180634016763, "loss": 0.733, "step": 664 }, { "epoch": 0.07, "learning_rate": 0.00019919754934144023, "loss": 0.6875, "step": 665 }, { "epoch": 0.07, "learning_rate": 0.0001991932810667075, "loss": 0.6672, "step": 666 }, { "epoch": 0.07, "learning_rate": 0.00019918900151645464, "loss": 0.7433, "step": 667 }, { "epoch": 0.07, "learning_rate": 0.0001991847106911681, "loss": 0.7321, "step": 668 }, { "epoch": 0.07, "learning_rate": 0.00019918040859133562, "loss": 0.7572, "step": 669 }, { "epoch": 0.07, "learning_rate": 0.00019917609521744628, "loss": 0.677, "step": 670 }, { "epoch": 0.07, "learning_rate": 0.00019917177056999032, "loss": 0.7287, "step": 671 }, { "epoch": 0.07, "learning_rate": 0.00019916743464945937, "loss": 0.7081, "step": 672 }, { "epoch": 0.07, "learning_rate": 0.00019916308745634634, "loss": 0.7172, "step": 673 }, { "epoch": 0.07, "learning_rate": 0.00019915872899114531, "loss": 0.7366, "step": 674 }, { "epoch": 0.07, "learning_rate": 0.00019915435925435177, "loss": 0.6758, "step": 675 }, { "epoch": 0.07, "learning_rate": 0.00019914997824646243, "loss": 0.714, "step": 676 }, { "epoch": 0.07, "learning_rate": 0.00019914558596797525, "loss": 0.6967, "step": 677 }, { "epoch": 0.07, "learning_rate": 0.00019914118241938958, "loss": 0.721, "step": 678 }, { "epoch": 0.07, "learning_rate": 0.00019913676760120592, "loss": 0.6928, "step": 679 }, { "epoch": 0.07, "learning_rate": 0.0001991323415139261, "loss": 0.6747, "step": 680 }, { "epoch": 0.07, "learning_rate": 0.00019912790415805334, "loss": 0.6754, "step": 681 }, { "epoch": 0.07, "learning_rate": 0.00019912345553409194, "loss": 0.6462, "step": 682 }, { "epoch": 0.07, "learning_rate": 0.00019911899564254766, "loss": 0.7791, "step": 683 }, { "epoch": 0.07, "learning_rate": 0.0001991145244839274, "loss": 0.6768, "step": 684 }, { "epoch": 0.07, "learning_rate": 0.00019911004205873948, "loss": 0.7374, "step": 685 }, { "epoch": 0.07, "learning_rate": 0.00019910554836749333, "loss": 0.7248, "step": 686 }, { "epoch": 0.07, "learning_rate": 0.00019910104341069982, "loss": 0.7036, "step": 687 }, { "epoch": 0.07, "learning_rate": 0.00019909652718887104, "loss": 0.6955, "step": 688 }, { "epoch": 0.07, "learning_rate": 0.00019909199970252037, "loss": 0.6767, "step": 689 }, { "epoch": 0.07, "learning_rate": 0.00019908746095216243, "loss": 0.6999, "step": 690 }, { "epoch": 0.07, "learning_rate": 0.00019908291093831315, "loss": 0.7773, "step": 691 }, { "epoch": 0.07, "learning_rate": 0.00019907834966148978, "loss": 0.701, "step": 692 }, { "epoch": 0.07, "learning_rate": 0.00019907377712221074, "loss": 0.6829, "step": 693 }, { "epoch": 0.07, "learning_rate": 0.00019906919332099586, "loss": 0.7461, "step": 694 }, { "epoch": 0.07, "learning_rate": 0.00019906459825836615, "loss": 0.7051, "step": 695 }, { "epoch": 0.07, "learning_rate": 0.000199059991934844, "loss": 0.7185, "step": 696 }, { "epoch": 0.07, "learning_rate": 0.00019905537435095294, "loss": 0.7856, "step": 697 }, { "epoch": 0.07, "learning_rate": 0.00019905074550721793, "loss": 0.7315, "step": 698 }, { "epoch": 0.07, "learning_rate": 0.00019904610540416514, "loss": 0.7203, "step": 699 }, { "epoch": 0.07, "learning_rate": 0.00019904145404232195, "loss": 0.713, "step": 700 }, { "epoch": 0.07, "learning_rate": 0.00019903679142221716, "loss": 0.7946, "step": 701 }, { "epoch": 0.07, "learning_rate": 0.00019903211754438075, "loss": 0.7173, "step": 702 }, { "epoch": 0.07, "learning_rate": 0.00019902743240934404, "loss": 0.7525, "step": 703 }, { "epoch": 0.07, "learning_rate": 0.00019902273601763956, "loss": 0.6838, "step": 704 }, { "epoch": 0.07, "learning_rate": 0.00019901802836980116, "loss": 0.7413, "step": 705 }, { "epoch": 0.07, "learning_rate": 0.000199013309466364, "loss": 0.6833, "step": 706 }, { "epoch": 0.07, "learning_rate": 0.00019900857930786449, "loss": 0.7158, "step": 707 }, { "epoch": 0.07, "learning_rate": 0.00019900383789484027, "loss": 0.7323, "step": 708 }, { "epoch": 0.07, "learning_rate": 0.00019899908522783038, "loss": 0.6787, "step": 709 }, { "epoch": 0.07, "learning_rate": 0.00019899432130737497, "loss": 0.7187, "step": 710 }, { "epoch": 0.07, "learning_rate": 0.00019898954613401567, "loss": 0.7592, "step": 711 }, { "epoch": 0.07, "learning_rate": 0.00019898475970829516, "loss": 0.7162, "step": 712 }, { "epoch": 0.07, "learning_rate": 0.00019897996203075766, "loss": 0.6892, "step": 713 }, { "epoch": 0.07, "learning_rate": 0.00019897515310194846, "loss": 0.6782, "step": 714 }, { "epoch": 0.07, "learning_rate": 0.00019897033292241422, "loss": 0.7115, "step": 715 }, { "epoch": 0.07, "learning_rate": 0.00019896550149270286, "loss": 0.6716, "step": 716 }, { "epoch": 0.07, "learning_rate": 0.00019896065881336354, "loss": 0.7041, "step": 717 }, { "epoch": 0.07, "learning_rate": 0.0001989558048849468, "loss": 0.6605, "step": 718 }, { "epoch": 0.07, "learning_rate": 0.00019895093970800435, "loss": 0.7312, "step": 719 }, { "epoch": 0.07, "learning_rate": 0.00019894606328308922, "loss": 0.7505, "step": 720 }, { "epoch": 0.08, "learning_rate": 0.00019894117561075576, "loss": 0.7807, "step": 721 }, { "epoch": 0.08, "learning_rate": 0.00019893627669155956, "loss": 0.7064, "step": 722 }, { "epoch": 0.08, "learning_rate": 0.00019893136652605748, "loss": 0.7284, "step": 723 }, { "epoch": 0.08, "learning_rate": 0.00019892644511480768, "loss": 0.7004, "step": 724 }, { "epoch": 0.08, "learning_rate": 0.00019892151245836956, "loss": 0.711, "step": 725 }, { "epoch": 0.08, "learning_rate": 0.00019891656855730382, "loss": 0.7655, "step": 726 }, { "epoch": 0.08, "learning_rate": 0.0001989116134121725, "loss": 0.7427, "step": 727 }, { "epoch": 0.08, "learning_rate": 0.00019890664702353883, "loss": 0.6857, "step": 728 }, { "epoch": 0.08, "learning_rate": 0.00019890166939196734, "loss": 0.7707, "step": 729 }, { "epoch": 0.08, "learning_rate": 0.00019889668051802385, "loss": 0.7258, "step": 730 }, { "epoch": 0.08, "learning_rate": 0.0001988916804022755, "loss": 0.6849, "step": 731 }, { "epoch": 0.08, "learning_rate": 0.00019888666904529058, "loss": 0.7169, "step": 732 }, { "epoch": 0.08, "learning_rate": 0.0001988816464476388, "loss": 0.7753, "step": 733 }, { "epoch": 0.08, "learning_rate": 0.0001988766126098911, "loss": 0.6879, "step": 734 }, { "epoch": 0.08, "learning_rate": 0.00019887156753261963, "loss": 0.7098, "step": 735 }, { "epoch": 0.08, "learning_rate": 0.00019886651121639798, "loss": 0.7309, "step": 736 }, { "epoch": 0.08, "learning_rate": 0.00019886144366180078, "loss": 0.6489, "step": 737 }, { "epoch": 0.08, "learning_rate": 0.0001988563648694042, "loss": 0.7447, "step": 738 }, { "epoch": 0.08, "learning_rate": 0.00019885127483978545, "loss": 0.7818, "step": 739 }, { "epoch": 0.08, "learning_rate": 0.00019884617357352315, "loss": 0.6816, "step": 740 }, { "epoch": 0.08, "learning_rate": 0.00019884106107119723, "loss": 0.744, "step": 741 }, { "epoch": 0.08, "learning_rate": 0.0001988359373333888, "loss": 0.6904, "step": 742 }, { "epoch": 0.08, "learning_rate": 0.00019883080236068025, "loss": 0.7317, "step": 743 }, { "epoch": 0.08, "learning_rate": 0.00019882565615365536, "loss": 0.6918, "step": 744 }, { "epoch": 0.08, "learning_rate": 0.00019882049871289905, "loss": 0.7482, "step": 745 }, { "epoch": 0.08, "learning_rate": 0.00019881533003899762, "loss": 0.7139, "step": 746 }, { "epoch": 0.08, "learning_rate": 0.00019881015013253856, "loss": 0.7768, "step": 747 }, { "epoch": 0.08, "learning_rate": 0.0001988049589941107, "loss": 0.7319, "step": 748 }, { "epoch": 0.08, "learning_rate": 0.00019879975662430414, "loss": 0.6762, "step": 749 }, { "epoch": 0.08, "learning_rate": 0.00019879454302371025, "loss": 0.7143, "step": 750 }, { "epoch": 0.08, "learning_rate": 0.00019878931819292166, "loss": 0.7344, "step": 751 }, { "epoch": 0.08, "learning_rate": 0.00019878408213253227, "loss": 0.7047, "step": 752 }, { "epoch": 0.08, "learning_rate": 0.00019877883484313734, "loss": 0.6799, "step": 753 }, { "epoch": 0.08, "learning_rate": 0.00019877357632533323, "loss": 0.6873, "step": 754 }, { "epoch": 0.08, "learning_rate": 0.0001987683065797178, "loss": 0.7001, "step": 755 }, { "epoch": 0.08, "learning_rate": 0.00019876302560689, "loss": 0.6702, "step": 756 }, { "epoch": 0.08, "learning_rate": 0.00019875773340745015, "loss": 0.7218, "step": 757 }, { "epoch": 0.08, "learning_rate": 0.00019875242998199983, "loss": 0.7876, "step": 758 }, { "epoch": 0.08, "learning_rate": 0.0001987471153311419, "loss": 0.6963, "step": 759 }, { "epoch": 0.08, "learning_rate": 0.00019874178945548048, "loss": 0.7407, "step": 760 }, { "epoch": 0.08, "learning_rate": 0.00019873645235562098, "loss": 0.6957, "step": 761 }, { "epoch": 0.08, "learning_rate": 0.0001987311040321701, "loss": 0.6534, "step": 762 }, { "epoch": 0.08, "learning_rate": 0.00019872574448573572, "loss": 0.6624, "step": 763 }, { "epoch": 0.08, "learning_rate": 0.00019872037371692716, "loss": 0.7265, "step": 764 }, { "epoch": 0.08, "learning_rate": 0.00019871499172635485, "loss": 0.7269, "step": 765 }, { "epoch": 0.08, "learning_rate": 0.00019870959851463064, "loss": 0.7629, "step": 766 }, { "epoch": 0.08, "learning_rate": 0.00019870419408236757, "loss": 0.7531, "step": 767 }, { "epoch": 0.08, "learning_rate": 0.00019869877843017994, "loss": 0.7445, "step": 768 }, { "epoch": 0.08, "learning_rate": 0.00019869335155868337, "loss": 0.7632, "step": 769 }, { "epoch": 0.08, "learning_rate": 0.0001986879134684948, "loss": 0.719, "step": 770 }, { "epoch": 0.08, "learning_rate": 0.00019868246416023232, "loss": 0.612, "step": 771 }, { "epoch": 0.08, "learning_rate": 0.0001986770036345154, "loss": 0.7025, "step": 772 }, { "epoch": 0.08, "learning_rate": 0.00019867153189196475, "loss": 0.7312, "step": 773 }, { "epoch": 0.08, "learning_rate": 0.00019866604893320236, "loss": 0.7694, "step": 774 }, { "epoch": 0.08, "learning_rate": 0.00019866055475885146, "loss": 0.6534, "step": 775 }, { "epoch": 0.08, "learning_rate": 0.0001986550493695366, "loss": 0.7737, "step": 776 }, { "epoch": 0.08, "learning_rate": 0.0001986495327658836, "loss": 0.6728, "step": 777 }, { "epoch": 0.08, "learning_rate": 0.0001986440049485195, "loss": 0.7264, "step": 778 }, { "epoch": 0.08, "learning_rate": 0.00019863846591807276, "loss": 0.73, "step": 779 }, { "epoch": 0.08, "learning_rate": 0.0001986329156751729, "loss": 0.7238, "step": 780 }, { "epoch": 0.08, "learning_rate": 0.00019862735422045093, "loss": 0.7001, "step": 781 }, { "epoch": 0.08, "learning_rate": 0.00019862178155453892, "loss": 0.693, "step": 782 }, { "epoch": 0.08, "learning_rate": 0.0001986161976780704, "loss": 0.7247, "step": 783 }, { "epoch": 0.08, "learning_rate": 0.0001986106025916801, "loss": 0.7157, "step": 784 }, { "epoch": 0.08, "learning_rate": 0.00019860499629600407, "loss": 0.6786, "step": 785 }, { "epoch": 0.08, "learning_rate": 0.00019859937879167946, "loss": 0.693, "step": 786 }, { "epoch": 0.08, "learning_rate": 0.00019859375007934494, "loss": 0.7521, "step": 787 }, { "epoch": 0.08, "learning_rate": 0.00019858811015964028, "loss": 0.7201, "step": 788 }, { "epoch": 0.08, "learning_rate": 0.00019858245903320662, "loss": 0.6963, "step": 789 }, { "epoch": 0.08, "learning_rate": 0.00019857679670068633, "loss": 0.6632, "step": 790 }, { "epoch": 0.08, "learning_rate": 0.00019857112316272303, "loss": 0.7401, "step": 791 }, { "epoch": 0.08, "learning_rate": 0.00019856543841996165, "loss": 0.7471, "step": 792 }, { "epoch": 0.08, "learning_rate": 0.0001985597424730484, "loss": 0.6759, "step": 793 }, { "epoch": 0.08, "learning_rate": 0.00019855403532263076, "loss": 0.7483, "step": 794 }, { "epoch": 0.08, "learning_rate": 0.00019854831696935742, "loss": 0.7131, "step": 795 }, { "epoch": 0.08, "learning_rate": 0.0001985425874138785, "loss": 0.7161, "step": 796 }, { "epoch": 0.08, "learning_rate": 0.00019853684665684522, "loss": 0.6559, "step": 797 }, { "epoch": 0.08, "learning_rate": 0.00019853109469891015, "loss": 0.7421, "step": 798 }, { "epoch": 0.08, "learning_rate": 0.00019852533154072712, "loss": 0.6598, "step": 799 }, { "epoch": 0.08, "learning_rate": 0.00019851955718295128, "loss": 0.7626, "step": 800 }, { "epoch": 0.08, "learning_rate": 0.00019851377162623897, "loss": 0.7455, "step": 801 }, { "epoch": 0.08, "learning_rate": 0.00019850797487124786, "loss": 0.7254, "step": 802 }, { "epoch": 0.08, "learning_rate": 0.00019850216691863693, "loss": 0.7502, "step": 803 }, { "epoch": 0.08, "learning_rate": 0.0001984963477690663, "loss": 0.7023, "step": 804 }, { "epoch": 0.08, "learning_rate": 0.00019849051742319747, "loss": 0.6663, "step": 805 }, { "epoch": 0.08, "learning_rate": 0.00019848467588169327, "loss": 0.7846, "step": 806 }, { "epoch": 0.08, "learning_rate": 0.0001984788231452176, "loss": 0.7965, "step": 807 }, { "epoch": 0.08, "learning_rate": 0.00019847295921443582, "loss": 0.7009, "step": 808 }, { "epoch": 0.08, "learning_rate": 0.00019846708409001446, "loss": 0.7442, "step": 809 }, { "epoch": 0.08, "learning_rate": 0.00019846119777262145, "loss": 0.6917, "step": 810 }, { "epoch": 0.08, "learning_rate": 0.0001984553002629258, "loss": 0.7339, "step": 811 }, { "epoch": 0.08, "learning_rate": 0.0001984493915615979, "loss": 0.7123, "step": 812 }, { "epoch": 0.08, "learning_rate": 0.00019844347166930946, "loss": 0.6998, "step": 813 }, { "epoch": 0.08, "learning_rate": 0.00019843754058673337, "loss": 0.6976, "step": 814 }, { "epoch": 0.08, "learning_rate": 0.00019843159831454382, "loss": 0.6855, "step": 815 }, { "epoch": 0.08, "learning_rate": 0.0001984256448534163, "loss": 0.7515, "step": 816 }, { "epoch": 0.09, "learning_rate": 0.0001984196802040276, "loss": 0.6539, "step": 817 }, { "epoch": 0.09, "learning_rate": 0.00019841370436705563, "loss": 0.7912, "step": 818 }, { "epoch": 0.09, "learning_rate": 0.00019840771734317978, "loss": 0.6798, "step": 819 }, { "epoch": 0.09, "learning_rate": 0.00019840171913308054, "loss": 0.7295, "step": 820 }, { "epoch": 0.09, "learning_rate": 0.00019839570973743977, "loss": 0.6827, "step": 821 }, { "epoch": 0.09, "learning_rate": 0.00019838968915694057, "loss": 0.6979, "step": 822 }, { "epoch": 0.09, "learning_rate": 0.00019838365739226728, "loss": 0.7822, "step": 823 }, { "epoch": 0.09, "learning_rate": 0.00019837761444410558, "loss": 0.7691, "step": 824 }, { "epoch": 0.09, "learning_rate": 0.00019837156031314238, "loss": 0.6986, "step": 825 }, { "epoch": 0.09, "learning_rate": 0.00019836549500006588, "loss": 0.6876, "step": 826 }, { "epoch": 0.09, "learning_rate": 0.0001983594185055655, "loss": 0.7874, "step": 827 }, { "epoch": 0.09, "learning_rate": 0.00019835333083033198, "loss": 0.6985, "step": 828 }, { "epoch": 0.09, "learning_rate": 0.00019834723197505733, "loss": 0.6632, "step": 829 }, { "epoch": 0.09, "learning_rate": 0.00019834112194043485, "loss": 0.6888, "step": 830 }, { "epoch": 0.09, "learning_rate": 0.00019833500072715903, "loss": 0.7076, "step": 831 }, { "epoch": 0.09, "learning_rate": 0.00019832886833592568, "loss": 0.7683, "step": 832 }, { "epoch": 0.09, "learning_rate": 0.00019832272476743193, "loss": 0.7231, "step": 833 }, { "epoch": 0.09, "learning_rate": 0.0001983165700223761, "loss": 0.6877, "step": 834 }, { "epoch": 0.09, "learning_rate": 0.0001983104041014578, "loss": 0.7341, "step": 835 }, { "epoch": 0.09, "learning_rate": 0.00019830422700537796, "loss": 0.6821, "step": 836 }, { "epoch": 0.09, "learning_rate": 0.00019829803873483873, "loss": 0.6601, "step": 837 }, { "epoch": 0.09, "learning_rate": 0.00019829183929054355, "loss": 0.7185, "step": 838 }, { "epoch": 0.09, "learning_rate": 0.0001982856286731971, "loss": 0.7392, "step": 839 }, { "epoch": 0.09, "learning_rate": 0.0001982794068835054, "loss": 0.7311, "step": 840 }, { "epoch": 0.09, "learning_rate": 0.00019827317392217566, "loss": 0.6923, "step": 841 }, { "epoch": 0.09, "learning_rate": 0.00019826692978991637, "loss": 0.7429, "step": 842 }, { "epoch": 0.09, "learning_rate": 0.00019826067448743738, "loss": 0.7204, "step": 843 }, { "epoch": 0.09, "learning_rate": 0.0001982544080154497, "loss": 0.7149, "step": 844 }, { "epoch": 0.09, "learning_rate": 0.00019824813037466564, "loss": 0.7208, "step": 845 }, { "epoch": 0.09, "learning_rate": 0.00019824184156579886, "loss": 0.7032, "step": 846 }, { "epoch": 0.09, "learning_rate": 0.00019823554158956413, "loss": 0.7443, "step": 847 }, { "epoch": 0.09, "learning_rate": 0.00019822923044667768, "loss": 0.7083, "step": 848 }, { "epoch": 0.09, "learning_rate": 0.0001982229081378568, "loss": 0.7379, "step": 849 }, { "epoch": 0.09, "learning_rate": 0.0001982165746638203, "loss": 0.7227, "step": 850 }, { "epoch": 0.09, "learning_rate": 0.00019821023002528803, "loss": 0.7537, "step": 851 }, { "epoch": 0.09, "learning_rate": 0.00019820387422298116, "loss": 0.6819, "step": 852 }, { "epoch": 0.09, "learning_rate": 0.00019819750725762227, "loss": 0.7063, "step": 853 }, { "epoch": 0.09, "learning_rate": 0.00019819112912993506, "loss": 0.6718, "step": 854 }, { "epoch": 0.09, "learning_rate": 0.00019818473984064452, "loss": 0.7308, "step": 855 }, { "epoch": 0.09, "learning_rate": 0.00019817833939047696, "loss": 0.7331, "step": 856 }, { "epoch": 0.09, "learning_rate": 0.00019817192778015993, "loss": 0.6897, "step": 857 }, { "epoch": 0.09, "learning_rate": 0.00019816550501042227, "loss": 0.6691, "step": 858 }, { "epoch": 0.09, "learning_rate": 0.00019815907108199405, "loss": 0.7007, "step": 859 }, { "epoch": 0.09, "learning_rate": 0.00019815262599560664, "loss": 0.7019, "step": 860 }, { "epoch": 0.09, "learning_rate": 0.00019814616975199266, "loss": 0.6962, "step": 861 }, { "epoch": 0.09, "learning_rate": 0.00019813970235188602, "loss": 0.6924, "step": 862 }, { "epoch": 0.09, "learning_rate": 0.00019813322379602183, "loss": 0.6033, "step": 863 }, { "epoch": 0.09, "learning_rate": 0.00019812673408513658, "loss": 0.7038, "step": 864 }, { "epoch": 0.09, "learning_rate": 0.00019812023321996795, "loss": 0.6958, "step": 865 }, { "epoch": 0.09, "learning_rate": 0.00019811372120125494, "loss": 0.7213, "step": 866 }, { "epoch": 0.09, "learning_rate": 0.00019810719802973773, "loss": 0.7303, "step": 867 }, { "epoch": 0.09, "learning_rate": 0.00019810066370615784, "loss": 0.7126, "step": 868 }, { "epoch": 0.09, "learning_rate": 0.00019809411823125807, "loss": 0.7276, "step": 869 }, { "epoch": 0.09, "learning_rate": 0.00019808756160578242, "loss": 0.723, "step": 870 }, { "epoch": 0.09, "learning_rate": 0.00019808099383047622, "loss": 0.7578, "step": 871 }, { "epoch": 0.09, "learning_rate": 0.00019807441490608607, "loss": 0.8037, "step": 872 }, { "epoch": 0.09, "learning_rate": 0.00019806782483335975, "loss": 0.7403, "step": 873 }, { "epoch": 0.09, "learning_rate": 0.0001980612236130464, "loss": 0.6929, "step": 874 }, { "epoch": 0.09, "learning_rate": 0.0001980546112458964, "loss": 0.737, "step": 875 }, { "epoch": 0.09, "learning_rate": 0.00019804798773266136, "loss": 0.7432, "step": 876 }, { "epoch": 0.09, "learning_rate": 0.00019804135307409425, "loss": 0.6916, "step": 877 }, { "epoch": 0.09, "learning_rate": 0.00019803470727094917, "loss": 0.6846, "step": 878 }, { "epoch": 0.09, "learning_rate": 0.00019802805032398163, "loss": 0.7368, "step": 879 }, { "epoch": 0.09, "learning_rate": 0.00019802138223394832, "loss": 0.7789, "step": 880 }, { "epoch": 0.09, "learning_rate": 0.0001980147030016072, "loss": 0.7209, "step": 881 }, { "epoch": 0.09, "learning_rate": 0.0001980080126277175, "loss": 0.6994, "step": 882 }, { "epoch": 0.09, "learning_rate": 0.0001980013111130398, "loss": 0.7157, "step": 883 }, { "epoch": 0.09, "learning_rate": 0.0001979945984583358, "loss": 0.7118, "step": 884 }, { "epoch": 0.09, "learning_rate": 0.00019798787466436858, "loss": 0.7035, "step": 885 }, { "epoch": 0.09, "learning_rate": 0.00019798113973190241, "loss": 0.7201, "step": 886 }, { "epoch": 0.09, "learning_rate": 0.00019797439366170294, "loss": 0.7151, "step": 887 }, { "epoch": 0.09, "learning_rate": 0.00019796763645453695, "loss": 0.6512, "step": 888 }, { "epoch": 0.09, "learning_rate": 0.00019796086811117256, "loss": 0.683, "step": 889 }, { "epoch": 0.09, "learning_rate": 0.00019795408863237916, "loss": 0.7467, "step": 890 }, { "epoch": 0.09, "learning_rate": 0.00019794729801892737, "loss": 0.6992, "step": 891 }, { "epoch": 0.09, "learning_rate": 0.00019794049627158908, "loss": 0.6766, "step": 892 }, { "epoch": 0.09, "learning_rate": 0.00019793368339113748, "loss": 0.6861, "step": 893 }, { "epoch": 0.09, "learning_rate": 0.000197926859378347, "loss": 0.6484, "step": 894 }, { "epoch": 0.09, "learning_rate": 0.00019792002423399337, "loss": 0.6286, "step": 895 }, { "epoch": 0.09, "learning_rate": 0.0001979131779588535, "loss": 0.7602, "step": 896 }, { "epoch": 0.09, "learning_rate": 0.00019790632055370565, "loss": 0.6996, "step": 897 }, { "epoch": 0.09, "learning_rate": 0.00019789945201932935, "loss": 0.789, "step": 898 }, { "epoch": 0.09, "learning_rate": 0.0001978925723565053, "loss": 0.7215, "step": 899 }, { "epoch": 0.09, "learning_rate": 0.00019788568156601553, "loss": 0.7058, "step": 900 }, { "epoch": 0.09, "learning_rate": 0.0001978787796486434, "loss": 0.6394, "step": 901 }, { "epoch": 0.09, "learning_rate": 0.00019787186660517344, "loss": 0.7937, "step": 902 }, { "epoch": 0.09, "learning_rate": 0.00019786494243639142, "loss": 0.7383, "step": 903 }, { "epoch": 0.09, "learning_rate": 0.00019785800714308444, "loss": 0.7096, "step": 904 }, { "epoch": 0.09, "learning_rate": 0.00019785106072604092, "loss": 0.663, "step": 905 }, { "epoch": 0.09, "learning_rate": 0.0001978441031860504, "loss": 0.7107, "step": 906 }, { "epoch": 0.09, "learning_rate": 0.00019783713452390376, "loss": 0.7481, "step": 907 }, { "epoch": 0.09, "learning_rate": 0.00019783015474039318, "loss": 0.6682, "step": 908 }, { "epoch": 0.09, "learning_rate": 0.00019782316383631205, "loss": 0.7288, "step": 909 }, { "epoch": 0.09, "learning_rate": 0.00019781616181245505, "loss": 0.7093, "step": 910 }, { "epoch": 0.09, "learning_rate": 0.00019780914866961814, "loss": 0.653, "step": 911 }, { "epoch": 0.09, "learning_rate": 0.00019780212440859846, "loss": 0.6624, "step": 912 }, { "epoch": 0.1, "learning_rate": 0.0001977950890301945, "loss": 0.6837, "step": 913 }, { "epoch": 0.1, "learning_rate": 0.00019778804253520597, "loss": 0.7499, "step": 914 }, { "epoch": 0.1, "learning_rate": 0.00019778098492443394, "loss": 0.7623, "step": 915 }, { "epoch": 0.1, "learning_rate": 0.00019777391619868055, "loss": 0.7356, "step": 916 }, { "epoch": 0.1, "learning_rate": 0.00019776683635874942, "loss": 0.6854, "step": 917 }, { "epoch": 0.1, "learning_rate": 0.00019775974540544526, "loss": 0.7388, "step": 918 }, { "epoch": 0.1, "learning_rate": 0.00019775264333957412, "loss": 0.7214, "step": 919 }, { "epoch": 0.1, "learning_rate": 0.00019774553016194338, "loss": 0.6708, "step": 920 }, { "epoch": 0.1, "learning_rate": 0.00019773840587336151, "loss": 0.6714, "step": 921 }, { "epoch": 0.1, "learning_rate": 0.0001977312704746384, "loss": 0.7013, "step": 922 }, { "epoch": 0.1, "learning_rate": 0.00019772412396658516, "loss": 0.7151, "step": 923 }, { "epoch": 0.1, "learning_rate": 0.0001977169663500141, "loss": 0.6916, "step": 924 }, { "epoch": 0.1, "learning_rate": 0.00019770979762573888, "loss": 0.669, "step": 925 }, { "epoch": 0.1, "learning_rate": 0.00019770261779457438, "loss": 0.7389, "step": 926 }, { "epoch": 0.1, "learning_rate": 0.00019769542685733673, "loss": 0.6633, "step": 927 }, { "epoch": 0.1, "learning_rate": 0.00019768822481484335, "loss": 0.7515, "step": 928 }, { "epoch": 0.1, "learning_rate": 0.0001976810116679129, "loss": 0.7636, "step": 929 }, { "epoch": 0.1, "learning_rate": 0.00019767378741736535, "loss": 0.723, "step": 930 }, { "epoch": 0.1, "learning_rate": 0.00019766655206402187, "loss": 0.6623, "step": 931 }, { "epoch": 0.1, "learning_rate": 0.00019765930560870494, "loss": 0.7004, "step": 932 }, { "epoch": 0.1, "learning_rate": 0.00019765204805223822, "loss": 0.6819, "step": 933 }, { "epoch": 0.1, "learning_rate": 0.00019764477939544678, "loss": 0.7251, "step": 934 }, { "epoch": 0.1, "learning_rate": 0.00019763749963915678, "loss": 0.673, "step": 935 }, { "epoch": 0.1, "learning_rate": 0.00019763020878419581, "loss": 0.7354, "step": 936 }, { "epoch": 0.1, "learning_rate": 0.00019762290683139258, "loss": 0.6972, "step": 937 }, { "epoch": 0.1, "learning_rate": 0.0001976155937815771, "loss": 0.7387, "step": 938 }, { "epoch": 0.1, "learning_rate": 0.00019760826963558073, "loss": 0.6755, "step": 939 }, { "epoch": 0.1, "learning_rate": 0.00019760093439423595, "loss": 0.7616, "step": 940 }, { "epoch": 0.1, "learning_rate": 0.00019759358805837666, "loss": 0.7534, "step": 941 }, { "epoch": 0.1, "learning_rate": 0.00019758623062883783, "loss": 0.6975, "step": 942 }, { "epoch": 0.1, "learning_rate": 0.00019757886210645587, "loss": 0.706, "step": 943 }, { "epoch": 0.1, "learning_rate": 0.00019757148249206836, "loss": 0.7605, "step": 944 }, { "epoch": 0.1, "learning_rate": 0.00019756409178651416, "loss": 0.6622, "step": 945 }, { "epoch": 0.1, "learning_rate": 0.00019755668999063336, "loss": 0.7732, "step": 946 }, { "epoch": 0.1, "learning_rate": 0.00019754927710526735, "loss": 0.6993, "step": 947 }, { "epoch": 0.1, "learning_rate": 0.00019754185313125878, "loss": 0.704, "step": 948 }, { "epoch": 0.1, "learning_rate": 0.00019753441806945156, "loss": 0.6642, "step": 949 }, { "epoch": 0.1, "learning_rate": 0.00019752697192069085, "loss": 0.7124, "step": 950 }, { "epoch": 0.1, "learning_rate": 0.00019751951468582304, "loss": 0.7139, "step": 951 }, { "epoch": 0.1, "learning_rate": 0.00019751204636569582, "loss": 0.7255, "step": 952 }, { "epoch": 0.1, "learning_rate": 0.00019750456696115815, "loss": 0.759, "step": 953 }, { "epoch": 0.1, "learning_rate": 0.0001974970764730602, "loss": 0.7417, "step": 954 }, { "epoch": 0.1, "learning_rate": 0.00019748957490225348, "loss": 0.6396, "step": 955 }, { "epoch": 0.1, "learning_rate": 0.00019748206224959067, "loss": 0.7516, "step": 956 }, { "epoch": 0.1, "learning_rate": 0.00019747453851592575, "loss": 0.6818, "step": 957 }, { "epoch": 0.1, "learning_rate": 0.00019746700370211397, "loss": 0.7117, "step": 958 }, { "epoch": 0.1, "learning_rate": 0.00019745945780901182, "loss": 0.7067, "step": 959 }, { "epoch": 0.1, "learning_rate": 0.00019745190083747706, "loss": 0.6933, "step": 960 }, { "epoch": 0.1, "learning_rate": 0.00019744433278836874, "loss": 0.6973, "step": 961 }, { "epoch": 0.1, "learning_rate": 0.00019743675366254708, "loss": 0.7383, "step": 962 }, { "epoch": 0.1, "learning_rate": 0.00019742916346087369, "loss": 0.6998, "step": 963 }, { "epoch": 0.1, "learning_rate": 0.00019742156218421127, "loss": 0.714, "step": 964 }, { "epoch": 0.1, "learning_rate": 0.00019741394983342395, "loss": 0.73, "step": 965 }, { "epoch": 0.1, "learning_rate": 0.00019740632640937703, "loss": 0.6762, "step": 966 }, { "epoch": 0.1, "learning_rate": 0.00019739869191293702, "loss": 0.7703, "step": 967 }, { "epoch": 0.1, "learning_rate": 0.00019739104634497183, "loss": 0.733, "step": 968 }, { "epoch": 0.1, "learning_rate": 0.00019738338970635053, "loss": 0.7032, "step": 969 }, { "epoch": 0.1, "learning_rate": 0.00019737572199794346, "loss": 0.7063, "step": 970 }, { "epoch": 0.1, "learning_rate": 0.0001973680432206222, "loss": 0.7438, "step": 971 }, { "epoch": 0.1, "learning_rate": 0.00019736035337525963, "loss": 0.6619, "step": 972 }, { "epoch": 0.1, "learning_rate": 0.00019735265246272993, "loss": 0.75, "step": 973 }, { "epoch": 0.1, "learning_rate": 0.00019734494048390838, "loss": 0.7241, "step": 974 }, { "epoch": 0.1, "learning_rate": 0.00019733721743967167, "loss": 0.6864, "step": 975 }, { "epoch": 0.1, "learning_rate": 0.00019732948333089768, "loss": 0.7173, "step": 976 }, { "epoch": 0.1, "learning_rate": 0.00019732173815846556, "loss": 0.7032, "step": 977 }, { "epoch": 0.1, "learning_rate": 0.00019731398192325577, "loss": 0.711, "step": 978 }, { "epoch": 0.1, "learning_rate": 0.0001973062146261499, "loss": 0.7384, "step": 979 }, { "epoch": 0.1, "learning_rate": 0.00019729843626803097, "loss": 0.6585, "step": 980 }, { "epoch": 0.1, "learning_rate": 0.00019729064684978308, "loss": 0.739, "step": 981 }, { "epoch": 0.1, "learning_rate": 0.0001972828463722917, "loss": 0.7502, "step": 982 }, { "epoch": 0.1, "learning_rate": 0.00019727503483644353, "loss": 0.6602, "step": 983 }, { "epoch": 0.1, "learning_rate": 0.00019726721224312655, "loss": 0.7288, "step": 984 }, { "epoch": 0.1, "learning_rate": 0.0001972593785932299, "loss": 0.6987, "step": 985 }, { "epoch": 0.1, "learning_rate": 0.00019725153388764412, "loss": 0.7363, "step": 986 }, { "epoch": 0.1, "learning_rate": 0.0001972436781272609, "loss": 0.7887, "step": 987 }, { "epoch": 0.1, "learning_rate": 0.00019723581131297327, "loss": 0.7035, "step": 988 }, { "epoch": 0.1, "learning_rate": 0.00019722793344567537, "loss": 0.8023, "step": 989 }, { "epoch": 0.1, "learning_rate": 0.00019722004452626276, "loss": 0.7493, "step": 990 }, { "epoch": 0.1, "learning_rate": 0.00019721214455563222, "loss": 0.6917, "step": 991 }, { "epoch": 0.1, "learning_rate": 0.00019720423353468172, "loss": 0.7132, "step": 992 }, { "epoch": 0.1, "learning_rate": 0.0001971963114643105, "loss": 0.721, "step": 993 }, { "epoch": 0.1, "learning_rate": 0.0001971883783454191, "loss": 0.6973, "step": 994 }, { "epoch": 0.1, "learning_rate": 0.00019718043417890933, "loss": 0.717, "step": 995 }, { "epoch": 0.1, "learning_rate": 0.00019717247896568416, "loss": 0.7531, "step": 996 }, { "epoch": 0.1, "learning_rate": 0.00019716451270664794, "loss": 0.7203, "step": 997 }, { "epoch": 0.1, "learning_rate": 0.00019715653540270615, "loss": 0.7231, "step": 998 }, { "epoch": 0.1, "learning_rate": 0.0001971485470547656, "loss": 0.7107, "step": 999 }, { "epoch": 0.1, "learning_rate": 0.0001971405476637344, "loss": 0.7733, "step": 1000 }, { "epoch": 0.1, "learning_rate": 0.0001971325372305218, "loss": 0.7615, "step": 1001 }, { "epoch": 0.1, "learning_rate": 0.00019712451575603837, "loss": 0.7383, "step": 1002 }, { "epoch": 0.1, "learning_rate": 0.00019711648324119597, "loss": 0.7659, "step": 1003 }, { "epoch": 0.1, "learning_rate": 0.0001971084396869076, "loss": 0.7287, "step": 1004 }, { "epoch": 0.1, "learning_rate": 0.00019710038509408771, "loss": 0.7392, "step": 1005 }, { "epoch": 0.1, "learning_rate": 0.00019709231946365177, "loss": 0.7314, "step": 1006 }, { "epoch": 0.1, "learning_rate": 0.00019708424279651663, "loss": 0.7778, "step": 1007 }, { "epoch": 0.1, "learning_rate": 0.00019707615509360042, "loss": 0.7176, "step": 1008 }, { "epoch": 0.11, "learning_rate": 0.0001970680563558225, "loss": 0.7411, "step": 1009 }, { "epoch": 0.11, "learning_rate": 0.00019705994658410342, "loss": 0.7105, "step": 1010 }, { "epoch": 0.11, "learning_rate": 0.00019705182577936506, "loss": 0.6774, "step": 1011 }, { "epoch": 0.11, "learning_rate": 0.00019704369394253054, "loss": 0.6844, "step": 1012 }, { "epoch": 0.11, "learning_rate": 0.00019703555107452423, "loss": 0.6846, "step": 1013 }, { "epoch": 0.11, "learning_rate": 0.0001970273971762717, "loss": 0.7374, "step": 1014 }, { "epoch": 0.11, "learning_rate": 0.00019701923224869986, "loss": 0.6932, "step": 1015 }, { "epoch": 0.11, "learning_rate": 0.00019701105629273686, "loss": 0.7123, "step": 1016 }, { "epoch": 0.11, "learning_rate": 0.00019700286930931203, "loss": 0.7116, "step": 1017 }, { "epoch": 0.11, "learning_rate": 0.00019699467129935606, "loss": 0.7378, "step": 1018 }, { "epoch": 0.11, "learning_rate": 0.00019698646226380074, "loss": 0.7147, "step": 1019 }, { "epoch": 0.11, "learning_rate": 0.0001969782422035793, "loss": 0.7711, "step": 1020 }, { "epoch": 0.11, "learning_rate": 0.0001969700111196261, "loss": 0.7213, "step": 1021 }, { "epoch": 0.11, "learning_rate": 0.00019696176901287676, "loss": 0.7283, "step": 1022 }, { "epoch": 0.11, "learning_rate": 0.00019695351588426823, "loss": 0.7354, "step": 1023 }, { "epoch": 0.11, "learning_rate": 0.00019694525173473862, "loss": 0.6392, "step": 1024 }, { "epoch": 0.11, "learning_rate": 0.00019693697656522735, "loss": 0.6818, "step": 1025 }, { "epoch": 0.11, "learning_rate": 0.00019692869037667512, "loss": 0.6435, "step": 1026 }, { "epoch": 0.11, "learning_rate": 0.00019692039317002375, "loss": 0.685, "step": 1027 }, { "epoch": 0.11, "learning_rate": 0.00019691208494621644, "loss": 0.7316, "step": 1028 }, { "epoch": 0.11, "learning_rate": 0.00019690376570619767, "loss": 0.6929, "step": 1029 }, { "epoch": 0.11, "learning_rate": 0.00019689543545091298, "loss": 0.7048, "step": 1030 }, { "epoch": 0.11, "learning_rate": 0.00019688709418130943, "loss": 0.7118, "step": 1031 }, { "epoch": 0.11, "learning_rate": 0.00019687874189833505, "loss": 0.6683, "step": 1032 }, { "epoch": 0.11, "learning_rate": 0.00019687037860293934, "loss": 0.7128, "step": 1033 }, { "epoch": 0.11, "learning_rate": 0.00019686200429607298, "loss": 0.702, "step": 1034 }, { "epoch": 0.11, "learning_rate": 0.0001968536189786879, "loss": 0.7315, "step": 1035 }, { "epoch": 0.11, "learning_rate": 0.00019684522265173723, "loss": 0.6492, "step": 1036 }, { "epoch": 0.11, "learning_rate": 0.00019683681531617545, "loss": 0.6689, "step": 1037 }, { "epoch": 0.11, "learning_rate": 0.00019682839697295821, "loss": 0.7013, "step": 1038 }, { "epoch": 0.11, "learning_rate": 0.00019681996762304244, "loss": 0.7347, "step": 1039 }, { "epoch": 0.11, "learning_rate": 0.00019681152726738632, "loss": 0.7558, "step": 1040 }, { "epoch": 0.11, "learning_rate": 0.00019680307590694932, "loss": 0.6597, "step": 1041 }, { "epoch": 0.11, "learning_rate": 0.00019679461354269207, "loss": 0.7612, "step": 1042 }, { "epoch": 0.11, "learning_rate": 0.0001967861401755766, "loss": 0.6596, "step": 1043 }, { "epoch": 0.11, "learning_rate": 0.00019677765580656598, "loss": 0.7198, "step": 1044 }, { "epoch": 0.11, "learning_rate": 0.00019676916043662472, "loss": 0.7366, "step": 1045 }, { "epoch": 0.11, "learning_rate": 0.0001967606540667185, "loss": 0.7194, "step": 1046 }, { "epoch": 0.11, "learning_rate": 0.00019675213669781422, "loss": 0.7767, "step": 1047 }, { "epoch": 0.11, "learning_rate": 0.0001967436083308801, "loss": 0.699, "step": 1048 }, { "epoch": 0.11, "learning_rate": 0.00019673506896688558, "loss": 0.7716, "step": 1049 }, { "epoch": 0.11, "learning_rate": 0.00019672651860680134, "loss": 0.7257, "step": 1050 }, { "epoch": 0.11, "learning_rate": 0.0001967179572515993, "loss": 0.6917, "step": 1051 }, { "epoch": 0.11, "learning_rate": 0.0001967093849022527, "loss": 0.7329, "step": 1052 }, { "epoch": 0.11, "learning_rate": 0.00019670080155973594, "loss": 0.614, "step": 1053 }, { "epoch": 0.11, "learning_rate": 0.0001966922072250247, "loss": 0.7039, "step": 1054 }, { "epoch": 0.11, "learning_rate": 0.00019668360189909593, "loss": 0.7115, "step": 1055 }, { "epoch": 0.11, "learning_rate": 0.00019667498558292783, "loss": 0.6576, "step": 1056 }, { "epoch": 0.11, "learning_rate": 0.0001966663582774998, "loss": 0.7614, "step": 1057 }, { "epoch": 0.11, "learning_rate": 0.00019665771998379257, "loss": 0.741, "step": 1058 }, { "epoch": 0.11, "learning_rate": 0.00019664907070278802, "loss": 0.6586, "step": 1059 }, { "epoch": 0.11, "learning_rate": 0.00019664041043546943, "loss": 0.7637, "step": 1060 }, { "epoch": 0.11, "learning_rate": 0.0001966317391828211, "loss": 0.7148, "step": 1061 }, { "epoch": 0.11, "learning_rate": 0.0001966230569458288, "loss": 0.6467, "step": 1062 }, { "epoch": 0.11, "learning_rate": 0.0001966143637254794, "loss": 0.7071, "step": 1063 }, { "epoch": 0.11, "learning_rate": 0.00019660565952276117, "loss": 0.7036, "step": 1064 }, { "epoch": 0.11, "learning_rate": 0.00019659694433866345, "loss": 0.71, "step": 1065 }, { "epoch": 0.11, "learning_rate": 0.00019658821817417695, "loss": 0.6783, "step": 1066 }, { "epoch": 0.11, "learning_rate": 0.0001965794810302936, "loss": 0.7097, "step": 1067 }, { "epoch": 0.11, "learning_rate": 0.00019657073290800652, "loss": 0.6714, "step": 1068 }, { "epoch": 0.11, "learning_rate": 0.0001965619738083102, "loss": 0.6868, "step": 1069 }, { "epoch": 0.11, "learning_rate": 0.00019655320373220025, "loss": 0.6492, "step": 1070 }, { "epoch": 0.11, "learning_rate": 0.00019654442268067363, "loss": 0.7248, "step": 1071 }, { "epoch": 0.11, "learning_rate": 0.00019653563065472843, "loss": 0.7157, "step": 1072 }, { "epoch": 0.11, "learning_rate": 0.00019652682765536417, "loss": 0.7125, "step": 1073 }, { "epoch": 0.11, "learning_rate": 0.0001965180136835814, "loss": 0.6921, "step": 1074 }, { "epoch": 0.11, "learning_rate": 0.00019650918874038209, "loss": 0.6652, "step": 1075 }, { "epoch": 0.11, "learning_rate": 0.00019650035282676935, "loss": 0.7576, "step": 1076 }, { "epoch": 0.11, "learning_rate": 0.0001964915059437476, "loss": 0.6893, "step": 1077 }, { "epoch": 0.11, "learning_rate": 0.00019648264809232248, "loss": 0.7557, "step": 1078 }, { "epoch": 0.11, "learning_rate": 0.00019647377927350089, "loss": 0.7106, "step": 1079 }, { "epoch": 0.11, "learning_rate": 0.00019646489948829093, "loss": 0.7346, "step": 1080 }, { "epoch": 0.11, "learning_rate": 0.000196456008737702, "loss": 0.678, "step": 1081 }, { "epoch": 0.11, "learning_rate": 0.0001964471070227448, "loss": 0.7205, "step": 1082 }, { "epoch": 0.11, "learning_rate": 0.00019643819434443112, "loss": 0.7654, "step": 1083 }, { "epoch": 0.11, "learning_rate": 0.00019642927070377415, "loss": 0.6543, "step": 1084 }, { "epoch": 0.11, "learning_rate": 0.0001964203361017882, "loss": 0.7158, "step": 1085 }, { "epoch": 0.11, "learning_rate": 0.00019641139053948892, "loss": 0.7239, "step": 1086 }, { "epoch": 0.11, "learning_rate": 0.00019640243401789317, "loss": 0.6759, "step": 1087 }, { "epoch": 0.11, "learning_rate": 0.00019639346653801907, "loss": 0.7289, "step": 1088 }, { "epoch": 0.11, "learning_rate": 0.00019638448810088593, "loss": 0.7106, "step": 1089 }, { "epoch": 0.11, "learning_rate": 0.00019637549870751437, "loss": 0.6821, "step": 1090 }, { "epoch": 0.11, "learning_rate": 0.00019636649835892624, "loss": 0.7142, "step": 1091 }, { "epoch": 0.11, "learning_rate": 0.00019635748705614466, "loss": 0.7485, "step": 1092 }, { "epoch": 0.11, "learning_rate": 0.0001963484648001939, "loss": 0.6693, "step": 1093 }, { "epoch": 0.11, "learning_rate": 0.0001963394315920996, "loss": 0.7822, "step": 1094 }, { "epoch": 0.11, "learning_rate": 0.00019633038743288852, "loss": 0.7697, "step": 1095 }, { "epoch": 0.11, "learning_rate": 0.0001963213323235888, "loss": 0.7375, "step": 1096 }, { "epoch": 0.11, "learning_rate": 0.0001963122662652297, "loss": 0.7231, "step": 1097 }, { "epoch": 0.11, "learning_rate": 0.00019630318925884183, "loss": 0.7146, "step": 1098 }, { "epoch": 0.11, "learning_rate": 0.00019629410130545693, "loss": 0.6788, "step": 1099 }, { "epoch": 0.11, "learning_rate": 0.00019628500240610812, "loss": 0.7346, "step": 1100 }, { "epoch": 0.11, "learning_rate": 0.00019627589256182964, "loss": 0.728, "step": 1101 }, { "epoch": 0.11, "learning_rate": 0.00019626677177365703, "loss": 0.6988, "step": 1102 }, { "epoch": 0.11, "learning_rate": 0.00019625764004262708, "loss": 0.7457, "step": 1103 }, { "epoch": 0.11, "learning_rate": 0.00019624849736977785, "loss": 0.6518, "step": 1104 }, { "epoch": 0.12, "learning_rate": 0.00019623934375614854, "loss": 0.7409, "step": 1105 }, { "epoch": 0.12, "learning_rate": 0.0001962301792027797, "loss": 0.6941, "step": 1106 }, { "epoch": 0.12, "learning_rate": 0.00019622100371071306, "loss": 0.7251, "step": 1107 }, { "epoch": 0.12, "learning_rate": 0.00019621181728099167, "loss": 0.688, "step": 1108 }, { "epoch": 0.12, "learning_rate": 0.00019620261991465973, "loss": 0.7405, "step": 1109 }, { "epoch": 0.12, "learning_rate": 0.00019619341161276275, "loss": 0.7337, "step": 1110 }, { "epoch": 0.12, "learning_rate": 0.0001961841923763474, "loss": 0.6896, "step": 1111 }, { "epoch": 0.12, "learning_rate": 0.00019617496220646175, "loss": 0.701, "step": 1112 }, { "epoch": 0.12, "learning_rate": 0.0001961657211041549, "loss": 0.6685, "step": 1113 }, { "epoch": 0.12, "learning_rate": 0.0001961564690704774, "loss": 0.699, "step": 1114 }, { "epoch": 0.12, "learning_rate": 0.00019614720610648093, "loss": 0.6631, "step": 1115 }, { "epoch": 0.12, "learning_rate": 0.00019613793221321836, "loss": 0.7258, "step": 1116 }, { "epoch": 0.12, "learning_rate": 0.000196128647391744, "loss": 0.7543, "step": 1117 }, { "epoch": 0.12, "learning_rate": 0.00019611935164311314, "loss": 0.7118, "step": 1118 }, { "epoch": 0.12, "learning_rate": 0.00019611004496838255, "loss": 0.7318, "step": 1119 }, { "epoch": 0.12, "learning_rate": 0.00019610072736861008, "loss": 0.7098, "step": 1120 }, { "epoch": 0.12, "learning_rate": 0.00019609139884485495, "loss": 0.7217, "step": 1121 }, { "epoch": 0.12, "learning_rate": 0.00019608205939817747, "loss": 0.7072, "step": 1122 }, { "epoch": 0.12, "learning_rate": 0.00019607270902963935, "loss": 0.701, "step": 1123 }, { "epoch": 0.12, "learning_rate": 0.00019606334774030339, "loss": 0.7152, "step": 1124 }, { "epoch": 0.12, "learning_rate": 0.0001960539755312338, "loss": 0.7037, "step": 1125 }, { "epoch": 0.12, "learning_rate": 0.00019604459240349584, "loss": 0.7295, "step": 1126 }, { "epoch": 0.12, "learning_rate": 0.00019603519835815618, "loss": 0.6611, "step": 1127 }, { "epoch": 0.12, "learning_rate": 0.00019602579339628265, "loss": 0.7061, "step": 1128 }, { "epoch": 0.12, "learning_rate": 0.00019601637751894436, "loss": 0.678, "step": 1129 }, { "epoch": 0.12, "learning_rate": 0.00019600695072721156, "loss": 0.7389, "step": 1130 }, { "epoch": 0.12, "learning_rate": 0.00019599751302215584, "loss": 0.7342, "step": 1131 }, { "epoch": 0.12, "learning_rate": 0.00019598806440485007, "loss": 0.7321, "step": 1132 }, { "epoch": 0.12, "learning_rate": 0.00019597860487636823, "loss": 0.7062, "step": 1133 }, { "epoch": 0.12, "learning_rate": 0.0001959691344377856, "loss": 0.7071, "step": 1134 }, { "epoch": 0.12, "learning_rate": 0.00019595965309017875, "loss": 0.7289, "step": 1135 }, { "epoch": 0.12, "learning_rate": 0.0001959501608346254, "loss": 0.7109, "step": 1136 }, { "epoch": 0.12, "learning_rate": 0.0001959406576722046, "loss": 0.7055, "step": 1137 }, { "epoch": 0.12, "learning_rate": 0.00019593114360399655, "loss": 0.6918, "step": 1138 }, { "epoch": 0.12, "learning_rate": 0.00019592161863108277, "loss": 0.7189, "step": 1139 }, { "epoch": 0.12, "learning_rate": 0.000195912082754546, "loss": 0.7102, "step": 1140 }, { "epoch": 0.12, "learning_rate": 0.00019590253597547014, "loss": 0.7147, "step": 1141 }, { "epoch": 0.12, "learning_rate": 0.00019589297829494045, "loss": 0.705, "step": 1142 }, { "epoch": 0.12, "learning_rate": 0.00019588340971404334, "loss": 0.6855, "step": 1143 }, { "epoch": 0.12, "learning_rate": 0.00019587383023386652, "loss": 0.7349, "step": 1144 }, { "epoch": 0.12, "learning_rate": 0.0001958642398554989, "loss": 0.6825, "step": 1145 }, { "epoch": 0.12, "learning_rate": 0.00019585463858003062, "loss": 0.693, "step": 1146 }, { "epoch": 0.12, "learning_rate": 0.00019584502640855313, "loss": 0.6424, "step": 1147 }, { "epoch": 0.12, "learning_rate": 0.00019583540334215899, "loss": 0.6885, "step": 1148 }, { "epoch": 0.12, "learning_rate": 0.00019582576938194214, "loss": 0.6957, "step": 1149 }, { "epoch": 0.12, "learning_rate": 0.00019581612452899765, "loss": 0.753, "step": 1150 }, { "epoch": 0.12, "learning_rate": 0.00019580646878442193, "loss": 0.7328, "step": 1151 }, { "epoch": 0.12, "learning_rate": 0.00019579680214931248, "loss": 0.6961, "step": 1152 }, { "epoch": 0.12, "learning_rate": 0.00019578712462476822, "loss": 0.6898, "step": 1153 }, { "epoch": 0.12, "learning_rate": 0.00019577743621188915, "loss": 0.7415, "step": 1154 }, { "epoch": 0.12, "learning_rate": 0.00019576773691177662, "loss": 0.7502, "step": 1155 }, { "epoch": 0.12, "learning_rate": 0.00019575802672553314, "loss": 0.7088, "step": 1156 }, { "epoch": 0.12, "learning_rate": 0.00019574830565426252, "loss": 0.7779, "step": 1157 }, { "epoch": 0.12, "learning_rate": 0.00019573857369906974, "loss": 0.6599, "step": 1158 }, { "epoch": 0.12, "learning_rate": 0.00019572883086106104, "loss": 0.6934, "step": 1159 }, { "epoch": 0.12, "learning_rate": 0.00019571907714134397, "loss": 0.6927, "step": 1160 }, { "epoch": 0.12, "learning_rate": 0.0001957093125410272, "loss": 0.7702, "step": 1161 }, { "epoch": 0.12, "learning_rate": 0.00019569953706122072, "loss": 0.7053, "step": 1162 }, { "epoch": 0.12, "learning_rate": 0.00019568975070303573, "loss": 0.6805, "step": 1163 }, { "epoch": 0.12, "learning_rate": 0.0001956799534675847, "loss": 0.6958, "step": 1164 }, { "epoch": 0.12, "learning_rate": 0.00019567014535598121, "loss": 0.6727, "step": 1165 }, { "epoch": 0.12, "learning_rate": 0.00019566032636934028, "loss": 0.7001, "step": 1166 }, { "epoch": 0.12, "learning_rate": 0.00019565049650877798, "loss": 0.6899, "step": 1167 }, { "epoch": 0.12, "learning_rate": 0.00019564065577541172, "loss": 0.7551, "step": 1168 }, { "epoch": 0.12, "learning_rate": 0.00019563080417036013, "loss": 0.766, "step": 1169 }, { "epoch": 0.12, "learning_rate": 0.00019562094169474305, "loss": 0.6491, "step": 1170 }, { "epoch": 0.12, "learning_rate": 0.0001956110683496815, "loss": 0.6753, "step": 1171 }, { "epoch": 0.12, "learning_rate": 0.00019560118413629795, "loss": 0.6994, "step": 1172 }, { "epoch": 0.12, "learning_rate": 0.00019559128905571584, "loss": 0.6823, "step": 1173 }, { "epoch": 0.12, "learning_rate": 0.00019558138310906006, "loss": 0.7613, "step": 1174 }, { "epoch": 0.12, "learning_rate": 0.00019557146629745655, "loss": 0.7433, "step": 1175 }, { "epoch": 0.12, "learning_rate": 0.0001955615386220326, "loss": 0.7294, "step": 1176 }, { "epoch": 0.12, "learning_rate": 0.00019555160008391675, "loss": 0.6899, "step": 1177 }, { "epoch": 0.12, "learning_rate": 0.00019554165068423873, "loss": 0.7381, "step": 1178 }, { "epoch": 0.12, "learning_rate": 0.00019553169042412947, "loss": 0.6979, "step": 1179 }, { "epoch": 0.12, "learning_rate": 0.0001955217193047212, "loss": 0.7207, "step": 1180 }, { "epoch": 0.12, "learning_rate": 0.00019551173732714733, "loss": 0.6966, "step": 1181 }, { "epoch": 0.12, "learning_rate": 0.00019550174449254262, "loss": 0.7393, "step": 1182 }, { "epoch": 0.12, "learning_rate": 0.00019549174080204287, "loss": 0.6807, "step": 1183 }, { "epoch": 0.12, "learning_rate": 0.00019548172625678527, "loss": 0.7172, "step": 1184 }, { "epoch": 0.12, "learning_rate": 0.0001954717008579082, "loss": 0.6922, "step": 1185 }, { "epoch": 0.12, "learning_rate": 0.0001954616646065513, "loss": 0.666, "step": 1186 }, { "epoch": 0.12, "learning_rate": 0.00019545161750385534, "loss": 0.7455, "step": 1187 }, { "epoch": 0.12, "learning_rate": 0.00019544155955096245, "loss": 0.6749, "step": 1188 }, { "epoch": 0.12, "learning_rate": 0.00019543149074901592, "loss": 0.6947, "step": 1189 }, { "epoch": 0.12, "learning_rate": 0.0001954214110991603, "loss": 0.6608, "step": 1190 }, { "epoch": 0.12, "learning_rate": 0.00019541132060254136, "loss": 0.6785, "step": 1191 }, { "epoch": 0.12, "learning_rate": 0.0001954012192603061, "loss": 0.7524, "step": 1192 }, { "epoch": 0.12, "learning_rate": 0.00019539110707360278, "loss": 0.67, "step": 1193 }, { "epoch": 0.12, "learning_rate": 0.00019538098404358088, "loss": 0.6461, "step": 1194 }, { "epoch": 0.12, "learning_rate": 0.00019537085017139107, "loss": 0.7088, "step": 1195 }, { "epoch": 0.12, "learning_rate": 0.00019536070545818533, "loss": 0.7793, "step": 1196 }, { "epoch": 0.12, "learning_rate": 0.00019535054990511684, "loss": 0.703, "step": 1197 }, { "epoch": 0.12, "learning_rate": 0.00019534038351333996, "loss": 0.7024, "step": 1198 }, { "epoch": 0.12, "learning_rate": 0.00019533020628401034, "loss": 0.6405, "step": 1199 }, { "epoch": 0.12, "learning_rate": 0.00019532001821828487, "loss": 0.728, "step": 1200 }, { "epoch": 0.13, "learning_rate": 0.00019530981931732165, "loss": 0.6815, "step": 1201 }, { "epoch": 0.13, "learning_rate": 0.00019529960958227996, "loss": 0.6984, "step": 1202 }, { "epoch": 0.13, "learning_rate": 0.00019528938901432042, "loss": 0.6991, "step": 1203 }, { "epoch": 0.13, "learning_rate": 0.0001952791576146048, "loss": 0.7409, "step": 1204 }, { "epoch": 0.13, "learning_rate": 0.00019526891538429616, "loss": 0.7476, "step": 1205 }, { "epoch": 0.13, "learning_rate": 0.0001952586623245587, "loss": 0.6497, "step": 1206 }, { "epoch": 0.13, "learning_rate": 0.00019524839843655794, "loss": 0.7052, "step": 1207 }, { "epoch": 0.13, "learning_rate": 0.0001952381237214606, "loss": 0.722, "step": 1208 }, { "epoch": 0.13, "learning_rate": 0.0001952278381804346, "loss": 0.6903, "step": 1209 }, { "epoch": 0.13, "learning_rate": 0.00019521754181464916, "loss": 0.7167, "step": 1210 }, { "epoch": 0.13, "learning_rate": 0.00019520723462527472, "loss": 0.6616, "step": 1211 }, { "epoch": 0.13, "learning_rate": 0.00019519691661348283, "loss": 0.7088, "step": 1212 }, { "epoch": 0.13, "learning_rate": 0.00019518658778044644, "loss": 0.7163, "step": 1213 }, { "epoch": 0.13, "learning_rate": 0.0001951762481273396, "loss": 0.646, "step": 1214 }, { "epoch": 0.13, "learning_rate": 0.00019516589765533767, "loss": 0.6493, "step": 1215 }, { "epoch": 0.13, "learning_rate": 0.00019515553636561717, "loss": 0.7269, "step": 1216 }, { "epoch": 0.13, "learning_rate": 0.00019514516425935596, "loss": 0.6758, "step": 1217 }, { "epoch": 0.13, "learning_rate": 0.00019513478133773303, "loss": 0.6327, "step": 1218 }, { "epoch": 0.13, "learning_rate": 0.0001951243876019286, "loss": 0.6973, "step": 1219 }, { "epoch": 0.13, "learning_rate": 0.00019511398305312416, "loss": 0.7159, "step": 1220 }, { "epoch": 0.13, "learning_rate": 0.00019510356769250245, "loss": 0.6785, "step": 1221 }, { "epoch": 0.13, "learning_rate": 0.0001950931415212474, "loss": 0.7034, "step": 1222 }, { "epoch": 0.13, "learning_rate": 0.00019508270454054414, "loss": 0.6981, "step": 1223 }, { "epoch": 0.13, "learning_rate": 0.0001950722567515791, "loss": 0.7291, "step": 1224 }, { "epoch": 0.13, "learning_rate": 0.00019506179815553988, "loss": 0.7568, "step": 1225 }, { "epoch": 0.13, "learning_rate": 0.00019505132875361535, "loss": 0.6964, "step": 1226 }, { "epoch": 0.13, "learning_rate": 0.00019504084854699558, "loss": 0.7063, "step": 1227 }, { "epoch": 0.13, "learning_rate": 0.0001950303575368719, "loss": 0.7442, "step": 1228 }, { "epoch": 0.13, "learning_rate": 0.00019501985572443678, "loss": 0.739, "step": 1229 }, { "epoch": 0.13, "learning_rate": 0.0001950093431108841, "loss": 0.7421, "step": 1230 }, { "epoch": 0.13, "learning_rate": 0.00019499881969740874, "loss": 0.6924, "step": 1231 }, { "epoch": 0.13, "learning_rate": 0.00019498828548520698, "loss": 0.7285, "step": 1232 }, { "epoch": 0.13, "learning_rate": 0.00019497774047547622, "loss": 0.7077, "step": 1233 }, { "epoch": 0.13, "learning_rate": 0.00019496718466941522, "loss": 0.7908, "step": 1234 }, { "epoch": 0.13, "learning_rate": 0.00019495661806822378, "loss": 0.7103, "step": 1235 }, { "epoch": 0.13, "learning_rate": 0.00019494604067310308, "loss": 0.7985, "step": 1236 }, { "epoch": 0.13, "learning_rate": 0.0001949354524852555, "loss": 0.6538, "step": 1237 }, { "epoch": 0.13, "learning_rate": 0.0001949248535058846, "loss": 0.6757, "step": 1238 }, { "epoch": 0.13, "learning_rate": 0.00019491424373619518, "loss": 0.7171, "step": 1239 }, { "epoch": 0.13, "learning_rate": 0.00019490362317739325, "loss": 0.7343, "step": 1240 }, { "epoch": 0.13, "learning_rate": 0.00019489299183068613, "loss": 0.7412, "step": 1241 }, { "epoch": 0.13, "learning_rate": 0.00019488234969728226, "loss": 0.6594, "step": 1242 }, { "epoch": 0.13, "learning_rate": 0.0001948716967783914, "loss": 0.7089, "step": 1243 }, { "epoch": 0.13, "learning_rate": 0.00019486103307522447, "loss": 0.6663, "step": 1244 }, { "epoch": 0.13, "learning_rate": 0.00019485035858899364, "loss": 0.701, "step": 1245 }, { "epoch": 0.13, "learning_rate": 0.00019483967332091227, "loss": 0.7201, "step": 1246 }, { "epoch": 0.13, "learning_rate": 0.00019482897727219502, "loss": 0.6856, "step": 1247 }, { "epoch": 0.13, "learning_rate": 0.00019481827044405772, "loss": 0.7432, "step": 1248 }, { "epoch": 0.13, "learning_rate": 0.00019480755283771744, "loss": 0.7081, "step": 1249 }, { "epoch": 0.13, "learning_rate": 0.00019479682445439246, "loss": 0.6807, "step": 1250 }, { "epoch": 0.13, "learning_rate": 0.00019478608529530233, "loss": 0.6685, "step": 1251 }, { "epoch": 0.13, "learning_rate": 0.00019477533536166778, "loss": 0.6735, "step": 1252 }, { "epoch": 0.13, "learning_rate": 0.00019476457465471075, "loss": 0.7522, "step": 1253 }, { "epoch": 0.13, "learning_rate": 0.00019475380317565447, "loss": 0.6571, "step": 1254 }, { "epoch": 0.13, "learning_rate": 0.00019474302092572333, "loss": 0.6806, "step": 1255 }, { "epoch": 0.13, "learning_rate": 0.000194732227906143, "loss": 0.8219, "step": 1256 }, { "epoch": 0.13, "learning_rate": 0.00019472142411814031, "loss": 0.7318, "step": 1257 }, { "epoch": 0.13, "learning_rate": 0.0001947106095629434, "loss": 0.6676, "step": 1258 }, { "epoch": 0.13, "learning_rate": 0.00019469978424178157, "loss": 0.7096, "step": 1259 }, { "epoch": 0.13, "learning_rate": 0.00019468894815588534, "loss": 0.6888, "step": 1260 }, { "epoch": 0.13, "learning_rate": 0.00019467810130648647, "loss": 0.6093, "step": 1261 }, { "epoch": 0.13, "learning_rate": 0.00019466724369481794, "loss": 0.6445, "step": 1262 }, { "epoch": 0.13, "learning_rate": 0.000194656375322114, "loss": 0.7542, "step": 1263 }, { "epoch": 0.13, "learning_rate": 0.00019464549618961006, "loss": 0.7204, "step": 1264 }, { "epoch": 0.13, "learning_rate": 0.00019463460629854274, "loss": 0.7131, "step": 1265 }, { "epoch": 0.13, "learning_rate": 0.00019462370565015, "loss": 0.6448, "step": 1266 }, { "epoch": 0.13, "learning_rate": 0.00019461279424567082, "loss": 0.6638, "step": 1267 }, { "epoch": 0.13, "learning_rate": 0.00019460187208634563, "loss": 0.6933, "step": 1268 }, { "epoch": 0.13, "learning_rate": 0.00019459093917341592, "loss": 0.7186, "step": 1269 }, { "epoch": 0.13, "learning_rate": 0.0001945799955081245, "loss": 0.8006, "step": 1270 }, { "epoch": 0.13, "learning_rate": 0.00019456904109171533, "loss": 0.7181, "step": 1271 }, { "epoch": 0.13, "learning_rate": 0.00019455807592543364, "loss": 0.7344, "step": 1272 }, { "epoch": 0.13, "learning_rate": 0.00019454710001052584, "loss": 0.7032, "step": 1273 }, { "epoch": 0.13, "learning_rate": 0.00019453611334823963, "loss": 0.7005, "step": 1274 }, { "epoch": 0.13, "learning_rate": 0.00019452511593982382, "loss": 0.6812, "step": 1275 }, { "epoch": 0.13, "learning_rate": 0.00019451410778652858, "loss": 0.6232, "step": 1276 }, { "epoch": 0.13, "learning_rate": 0.0001945030888896052, "loss": 0.6531, "step": 1277 }, { "epoch": 0.13, "learning_rate": 0.0001944920592503062, "loss": 0.6693, "step": 1278 }, { "epoch": 0.13, "learning_rate": 0.0001944810188698854, "loss": 0.7159, "step": 1279 }, { "epoch": 0.13, "learning_rate": 0.00019446996774959773, "loss": 0.6733, "step": 1280 }, { "epoch": 0.13, "learning_rate": 0.00019445890589069942, "loss": 0.6886, "step": 1281 }, { "epoch": 0.13, "learning_rate": 0.0001944478332944479, "loss": 0.6574, "step": 1282 }, { "epoch": 0.13, "learning_rate": 0.0001944367499621018, "loss": 0.7506, "step": 1283 }, { "epoch": 0.13, "learning_rate": 0.000194425655894921, "loss": 0.6995, "step": 1284 }, { "epoch": 0.13, "learning_rate": 0.0001944145510941666, "loss": 0.7219, "step": 1285 }, { "epoch": 0.13, "learning_rate": 0.0001944034355611009, "loss": 0.6553, "step": 1286 }, { "epoch": 0.13, "learning_rate": 0.00019439230929698737, "loss": 0.8095, "step": 1287 }, { "epoch": 0.13, "learning_rate": 0.00019438117230309083, "loss": 0.7006, "step": 1288 }, { "epoch": 0.13, "learning_rate": 0.00019437002458067723, "loss": 0.7271, "step": 1289 }, { "epoch": 0.13, "learning_rate": 0.00019435886613101375, "loss": 0.7053, "step": 1290 }, { "epoch": 0.13, "learning_rate": 0.00019434769695536878, "loss": 0.7809, "step": 1291 }, { "epoch": 0.13, "learning_rate": 0.00019433651705501198, "loss": 0.6258, "step": 1292 }, { "epoch": 0.13, "learning_rate": 0.00019432532643121414, "loss": 0.7267, "step": 1293 }, { "epoch": 0.13, "learning_rate": 0.0001943141250852474, "loss": 0.7222, "step": 1294 }, { "epoch": 0.13, "learning_rate": 0.00019430291301838497, "loss": 0.6663, "step": 1295 }, { "epoch": 0.13, "learning_rate": 0.0001942916902319014, "loss": 0.7294, "step": 1296 }, { "epoch": 0.14, "learning_rate": 0.00019428045672707236, "loss": 0.6829, "step": 1297 }, { "epoch": 0.14, "learning_rate": 0.0001942692125051748, "loss": 0.7061, "step": 1298 }, { "epoch": 0.14, "learning_rate": 0.00019425795756748695, "loss": 0.6932, "step": 1299 }, { "epoch": 0.14, "learning_rate": 0.0001942466919152881, "loss": 0.7022, "step": 1300 }, { "epoch": 0.14, "learning_rate": 0.00019423541554985886, "loss": 0.7138, "step": 1301 }, { "epoch": 0.14, "learning_rate": 0.00019422412847248106, "loss": 0.762, "step": 1302 }, { "epoch": 0.14, "learning_rate": 0.0001942128306844377, "loss": 0.6947, "step": 1303 }, { "epoch": 0.14, "learning_rate": 0.00019420152218701305, "loss": 0.6909, "step": 1304 }, { "epoch": 0.14, "learning_rate": 0.00019419020298149252, "loss": 0.7224, "step": 1305 }, { "epoch": 0.14, "learning_rate": 0.00019417887306916285, "loss": 0.6945, "step": 1306 }, { "epoch": 0.14, "learning_rate": 0.0001941675324513119, "loss": 0.7333, "step": 1307 }, { "epoch": 0.14, "learning_rate": 0.00019415618112922885, "loss": 0.724, "step": 1308 }, { "epoch": 0.14, "learning_rate": 0.00019414481910420394, "loss": 0.7221, "step": 1309 }, { "epoch": 0.14, "learning_rate": 0.00019413344637752875, "loss": 0.7277, "step": 1310 }, { "epoch": 0.14, "learning_rate": 0.00019412206295049608, "loss": 0.6813, "step": 1311 }, { "epoch": 0.14, "learning_rate": 0.00019411066882439983, "loss": 0.6905, "step": 1312 }, { "epoch": 0.14, "learning_rate": 0.00019409926400053529, "loss": 0.7067, "step": 1313 }, { "epoch": 0.14, "learning_rate": 0.00019408784848019882, "loss": 0.7139, "step": 1314 }, { "epoch": 0.14, "learning_rate": 0.000194076422264688, "loss": 0.6786, "step": 1315 }, { "epoch": 0.14, "learning_rate": 0.00019406498535530178, "loss": 0.7586, "step": 1316 }, { "epoch": 0.14, "learning_rate": 0.00019405353775334011, "loss": 0.7267, "step": 1317 }, { "epoch": 0.14, "learning_rate": 0.00019404207946010439, "loss": 0.7342, "step": 1318 }, { "epoch": 0.14, "learning_rate": 0.00019403061047689696, "loss": 0.7349, "step": 1319 }, { "epoch": 0.14, "learning_rate": 0.00019401913080502165, "loss": 0.7161, "step": 1320 }, { "epoch": 0.14, "learning_rate": 0.00019400764044578335, "loss": 0.7349, "step": 1321 }, { "epoch": 0.14, "learning_rate": 0.00019399613940048813, "loss": 0.7721, "step": 1322 }, { "epoch": 0.14, "learning_rate": 0.00019398462767044342, "loss": 0.7239, "step": 1323 }, { "epoch": 0.14, "learning_rate": 0.00019397310525695773, "loss": 0.8144, "step": 1324 }, { "epoch": 0.14, "learning_rate": 0.00019396157216134086, "loss": 0.7362, "step": 1325 }, { "epoch": 0.14, "learning_rate": 0.0001939500283849038, "loss": 0.6928, "step": 1326 }, { "epoch": 0.14, "learning_rate": 0.00019393847392895877, "loss": 0.7721, "step": 1327 }, { "epoch": 0.14, "learning_rate": 0.00019392690879481916, "loss": 0.6994, "step": 1328 }, { "epoch": 0.14, "learning_rate": 0.00019391533298379962, "loss": 0.669, "step": 1329 }, { "epoch": 0.14, "learning_rate": 0.00019390374649721603, "loss": 0.6967, "step": 1330 }, { "epoch": 0.14, "learning_rate": 0.0001938921493363854, "loss": 0.6519, "step": 1331 }, { "epoch": 0.14, "learning_rate": 0.00019388054150262606, "loss": 0.7199, "step": 1332 }, { "epoch": 0.14, "learning_rate": 0.0001938689229972574, "loss": 0.6998, "step": 1333 }, { "epoch": 0.14, "learning_rate": 0.00019385729382160024, "loss": 0.7252, "step": 1334 }, { "epoch": 0.14, "learning_rate": 0.0001938456539769764, "loss": 0.6953, "step": 1335 }, { "epoch": 0.14, "learning_rate": 0.00019383400346470908, "loss": 0.7061, "step": 1336 }, { "epoch": 0.14, "learning_rate": 0.00019382234228612258, "loss": 0.6732, "step": 1337 }, { "epoch": 0.14, "learning_rate": 0.00019381067044254246, "loss": 0.7115, "step": 1338 }, { "epoch": 0.14, "learning_rate": 0.0001937989879352955, "loss": 0.6992, "step": 1339 }, { "epoch": 0.14, "learning_rate": 0.00019378729476570965, "loss": 0.7476, "step": 1340 }, { "epoch": 0.14, "learning_rate": 0.00019377559093511408, "loss": 0.7882, "step": 1341 }, { "epoch": 0.14, "learning_rate": 0.00019376387644483924, "loss": 0.7144, "step": 1342 }, { "epoch": 0.14, "learning_rate": 0.00019375215129621674, "loss": 0.697, "step": 1343 }, { "epoch": 0.14, "learning_rate": 0.00019374041549057936, "loss": 0.6451, "step": 1344 }, { "epoch": 0.14, "learning_rate": 0.00019372866902926116, "loss": 0.7347, "step": 1345 }, { "epoch": 0.14, "learning_rate": 0.0001937169119135974, "loss": 0.6517, "step": 1346 }, { "epoch": 0.14, "learning_rate": 0.0001937051441449245, "loss": 0.7169, "step": 1347 }, { "epoch": 0.14, "learning_rate": 0.00019369336572458017, "loss": 0.6502, "step": 1348 }, { "epoch": 0.14, "learning_rate": 0.0001936815766539033, "loss": 0.671, "step": 1349 }, { "epoch": 0.14, "learning_rate": 0.0001936697769342339, "loss": 0.6872, "step": 1350 }, { "epoch": 0.14, "learning_rate": 0.00019365796656691333, "loss": 0.6837, "step": 1351 }, { "epoch": 0.14, "learning_rate": 0.00019364614555328414, "loss": 0.6362, "step": 1352 }, { "epoch": 0.14, "learning_rate": 0.00019363431389468993, "loss": 0.7156, "step": 1353 }, { "epoch": 0.14, "learning_rate": 0.00019362247159247575, "loss": 0.7278, "step": 1354 }, { "epoch": 0.14, "learning_rate": 0.00019361061864798767, "loss": 0.6711, "step": 1355 }, { "epoch": 0.14, "learning_rate": 0.00019359875506257308, "loss": 0.6811, "step": 1356 }, { "epoch": 0.14, "learning_rate": 0.00019358688083758051, "loss": 0.6923, "step": 1357 }, { "epoch": 0.14, "learning_rate": 0.00019357499597435978, "loss": 0.7263, "step": 1358 }, { "epoch": 0.14, "learning_rate": 0.0001935631004742618, "loss": 0.7046, "step": 1359 }, { "epoch": 0.14, "learning_rate": 0.0001935511943386388, "loss": 0.6721, "step": 1360 }, { "epoch": 0.14, "learning_rate": 0.0001935392775688442, "loss": 0.7432, "step": 1361 }, { "epoch": 0.14, "learning_rate": 0.00019352735016623252, "loss": 0.702, "step": 1362 }, { "epoch": 0.14, "learning_rate": 0.00019351541213215962, "loss": 0.7102, "step": 1363 }, { "epoch": 0.14, "learning_rate": 0.00019350346346798256, "loss": 0.7282, "step": 1364 }, { "epoch": 0.14, "learning_rate": 0.00019349150417505954, "loss": 0.686, "step": 1365 }, { "epoch": 0.14, "learning_rate": 0.00019347953425475, "loss": 0.6906, "step": 1366 }, { "epoch": 0.14, "learning_rate": 0.0001934675537084146, "loss": 0.67, "step": 1367 }, { "epoch": 0.14, "learning_rate": 0.00019345556253741518, "loss": 0.6975, "step": 1368 }, { "epoch": 0.14, "learning_rate": 0.0001934435607431148, "loss": 0.6413, "step": 1369 }, { "epoch": 0.14, "learning_rate": 0.00019343154832687773, "loss": 0.7696, "step": 1370 }, { "epoch": 0.14, "learning_rate": 0.00019341952529006946, "loss": 0.7051, "step": 1371 }, { "epoch": 0.14, "learning_rate": 0.00019340749163405664, "loss": 0.6607, "step": 1372 }, { "epoch": 0.14, "learning_rate": 0.00019339544736020722, "loss": 0.696, "step": 1373 }, { "epoch": 0.14, "learning_rate": 0.0001933833924698903, "loss": 0.6931, "step": 1374 }, { "epoch": 0.14, "learning_rate": 0.00019337132696447613, "loss": 0.7768, "step": 1375 }, { "epoch": 0.14, "learning_rate": 0.00019335925084533627, "loss": 0.7112, "step": 1376 }, { "epoch": 0.14, "learning_rate": 0.00019334716411384338, "loss": 0.6843, "step": 1377 }, { "epoch": 0.14, "learning_rate": 0.00019333506677137146, "loss": 0.681, "step": 1378 }, { "epoch": 0.14, "learning_rate": 0.00019332295881929558, "loss": 0.7044, "step": 1379 }, { "epoch": 0.14, "learning_rate": 0.00019331084025899214, "loss": 0.7106, "step": 1380 }, { "epoch": 0.14, "learning_rate": 0.0001932987110918386, "loss": 0.6577, "step": 1381 }, { "epoch": 0.14, "learning_rate": 0.00019328657131921379, "loss": 0.6849, "step": 1382 }, { "epoch": 0.14, "learning_rate": 0.00019327442094249764, "loss": 0.7418, "step": 1383 }, { "epoch": 0.14, "learning_rate": 0.0001932622599630713, "loss": 0.731, "step": 1384 }, { "epoch": 0.14, "learning_rate": 0.00019325008838231713, "loss": 0.6864, "step": 1385 }, { "epoch": 0.14, "learning_rate": 0.0001932379062016187, "loss": 0.7272, "step": 1386 }, { "epoch": 0.14, "learning_rate": 0.00019322571342236079, "loss": 0.7359, "step": 1387 }, { "epoch": 0.14, "learning_rate": 0.0001932135100459294, "loss": 0.7614, "step": 1388 }, { "epoch": 0.14, "learning_rate": 0.0001932012960737117, "loss": 0.6946, "step": 1389 }, { "epoch": 0.14, "learning_rate": 0.00019318907150709608, "loss": 0.7065, "step": 1390 }, { "epoch": 0.14, "learning_rate": 0.00019317683634747213, "loss": 0.6954, "step": 1391 }, { "epoch": 0.14, "learning_rate": 0.00019316459059623068, "loss": 0.7119, "step": 1392 }, { "epoch": 0.14, "learning_rate": 0.00019315233425476363, "loss": 0.6826, "step": 1393 }, { "epoch": 0.15, "learning_rate": 0.00019314006732446432, "loss": 0.7217, "step": 1394 }, { "epoch": 0.15, "learning_rate": 0.00019312778980672707, "loss": 0.7514, "step": 1395 }, { "epoch": 0.15, "learning_rate": 0.00019311550170294752, "loss": 0.716, "step": 1396 }, { "epoch": 0.15, "learning_rate": 0.0001931032030145225, "loss": 0.7246, "step": 1397 }, { "epoch": 0.15, "learning_rate": 0.00019309089374285, "loss": 0.6817, "step": 1398 }, { "epoch": 0.15, "learning_rate": 0.00019307857388932927, "loss": 0.7052, "step": 1399 }, { "epoch": 0.15, "learning_rate": 0.0001930662434553607, "loss": 0.6731, "step": 1400 }, { "epoch": 0.15, "learning_rate": 0.00019305390244234595, "loss": 0.6772, "step": 1401 }, { "epoch": 0.15, "learning_rate": 0.00019304155085168786, "loss": 0.7322, "step": 1402 }, { "epoch": 0.15, "learning_rate": 0.00019302918868479042, "loss": 0.6694, "step": 1403 }, { "epoch": 0.15, "learning_rate": 0.0001930168159430589, "loss": 0.6691, "step": 1404 }, { "epoch": 0.15, "learning_rate": 0.00019300443262789972, "loss": 0.7032, "step": 1405 }, { "epoch": 0.15, "learning_rate": 0.00019299203874072052, "loss": 0.6368, "step": 1406 }, { "epoch": 0.15, "learning_rate": 0.00019297963428293013, "loss": 0.7043, "step": 1407 }, { "epoch": 0.15, "learning_rate": 0.00019296721925593862, "loss": 0.6947, "step": 1408 }, { "epoch": 0.15, "learning_rate": 0.00019295479366115723, "loss": 0.6905, "step": 1409 }, { "epoch": 0.15, "learning_rate": 0.00019294235749999837, "loss": 0.7033, "step": 1410 }, { "epoch": 0.15, "learning_rate": 0.00019292991077387572, "loss": 0.728, "step": 1411 }, { "epoch": 0.15, "learning_rate": 0.00019291745348420412, "loss": 0.6968, "step": 1412 }, { "epoch": 0.15, "learning_rate": 0.00019290498563239963, "loss": 0.6624, "step": 1413 }, { "epoch": 0.15, "learning_rate": 0.00019289250721987947, "loss": 0.6813, "step": 1414 }, { "epoch": 0.15, "learning_rate": 0.0001928800182480621, "loss": 0.7198, "step": 1415 }, { "epoch": 0.15, "learning_rate": 0.0001928675187183672, "loss": 0.7056, "step": 1416 }, { "epoch": 0.15, "learning_rate": 0.00019285500863221552, "loss": 0.6636, "step": 1417 }, { "epoch": 0.15, "learning_rate": 0.00019284248799102924, "loss": 0.7078, "step": 1418 }, { "epoch": 0.15, "learning_rate": 0.00019282995679623154, "loss": 0.7166, "step": 1419 }, { "epoch": 0.15, "learning_rate": 0.00019281741504924686, "loss": 0.7012, "step": 1420 }, { "epoch": 0.15, "learning_rate": 0.0001928048627515009, "loss": 0.7474, "step": 1421 }, { "epoch": 0.15, "learning_rate": 0.00019279229990442045, "loss": 0.7238, "step": 1422 }, { "epoch": 0.15, "learning_rate": 0.00019277972650943358, "loss": 0.694, "step": 1423 }, { "epoch": 0.15, "learning_rate": 0.00019276714256796952, "loss": 0.6926, "step": 1424 }, { "epoch": 0.15, "learning_rate": 0.00019275454808145878, "loss": 0.7327, "step": 1425 }, { "epoch": 0.15, "learning_rate": 0.0001927419430513329, "loss": 0.6838, "step": 1426 }, { "epoch": 0.15, "learning_rate": 0.0001927293274790248, "loss": 0.6685, "step": 1427 }, { "epoch": 0.15, "learning_rate": 0.00019271670136596848, "loss": 0.6741, "step": 1428 }, { "epoch": 0.15, "learning_rate": 0.0001927040647135992, "loss": 0.6814, "step": 1429 }, { "epoch": 0.15, "learning_rate": 0.0001926914175233534, "loss": 0.6845, "step": 1430 }, { "epoch": 0.15, "learning_rate": 0.0001926787597966687, "loss": 0.7155, "step": 1431 }, { "epoch": 0.15, "learning_rate": 0.00019266609153498394, "loss": 0.7342, "step": 1432 }, { "epoch": 0.15, "learning_rate": 0.00019265341273973913, "loss": 0.741, "step": 1433 }, { "epoch": 0.15, "learning_rate": 0.00019264072341237555, "loss": 0.7147, "step": 1434 }, { "epoch": 0.15, "learning_rate": 0.00019262802355433554, "loss": 0.7004, "step": 1435 }, { "epoch": 0.15, "learning_rate": 0.0001926153131670628, "loss": 0.6842, "step": 1436 }, { "epoch": 0.15, "learning_rate": 0.0001926025922520021, "loss": 0.7091, "step": 1437 }, { "epoch": 0.15, "learning_rate": 0.00019258986081059946, "loss": 0.7262, "step": 1438 }, { "epoch": 0.15, "learning_rate": 0.00019257711884430208, "loss": 0.6324, "step": 1439 }, { "epoch": 0.15, "learning_rate": 0.00019256436635455845, "loss": 0.7488, "step": 1440 }, { "epoch": 0.15, "learning_rate": 0.00019255160334281807, "loss": 0.7159, "step": 1441 }, { "epoch": 0.15, "learning_rate": 0.0001925388298105318, "loss": 0.674, "step": 1442 }, { "epoch": 0.15, "learning_rate": 0.00019252604575915161, "loss": 0.7233, "step": 1443 }, { "epoch": 0.15, "learning_rate": 0.00019251325119013069, "loss": 0.6881, "step": 1444 }, { "epoch": 0.15, "learning_rate": 0.00019250044610492345, "loss": 0.7604, "step": 1445 }, { "epoch": 0.15, "learning_rate": 0.00019248763050498546, "loss": 0.6918, "step": 1446 }, { "epoch": 0.15, "learning_rate": 0.00019247480439177347, "loss": 0.639, "step": 1447 }, { "epoch": 0.15, "learning_rate": 0.0001924619677667455, "loss": 0.6304, "step": 1448 }, { "epoch": 0.15, "learning_rate": 0.0001924491206313607, "loss": 0.7367, "step": 1449 }, { "epoch": 0.15, "learning_rate": 0.00019243626298707942, "loss": 0.7108, "step": 1450 }, { "epoch": 0.15, "learning_rate": 0.0001924233948353632, "loss": 0.6914, "step": 1451 }, { "epoch": 0.15, "learning_rate": 0.00019241051617767486, "loss": 0.6761, "step": 1452 }, { "epoch": 0.15, "learning_rate": 0.00019239762701547832, "loss": 0.6884, "step": 1453 }, { "epoch": 0.15, "learning_rate": 0.00019238472735023864, "loss": 0.6878, "step": 1454 }, { "epoch": 0.15, "learning_rate": 0.00019237181718342224, "loss": 0.7273, "step": 1455 }, { "epoch": 0.15, "learning_rate": 0.00019235889651649662, "loss": 0.6536, "step": 1456 }, { "epoch": 0.15, "learning_rate": 0.00019234596535093056, "loss": 0.7017, "step": 1457 }, { "epoch": 0.15, "learning_rate": 0.00019233302368819387, "loss": 0.6104, "step": 1458 }, { "epoch": 0.15, "learning_rate": 0.00019232007152975768, "loss": 0.6387, "step": 1459 }, { "epoch": 0.15, "learning_rate": 0.00019230710887709437, "loss": 0.7382, "step": 1460 }, { "epoch": 0.15, "learning_rate": 0.00019229413573167733, "loss": 0.7427, "step": 1461 }, { "epoch": 0.15, "learning_rate": 0.00019228115209498134, "loss": 0.7439, "step": 1462 }, { "epoch": 0.15, "learning_rate": 0.00019226815796848218, "loss": 0.7033, "step": 1463 }, { "epoch": 0.15, "learning_rate": 0.00019225515335365704, "loss": 0.6407, "step": 1464 }, { "epoch": 0.15, "learning_rate": 0.00019224213825198407, "loss": 0.599, "step": 1465 }, { "epoch": 0.15, "learning_rate": 0.00019222911266494278, "loss": 0.6822, "step": 1466 }, { "epoch": 0.15, "learning_rate": 0.00019221607659401384, "loss": 0.7013, "step": 1467 }, { "epoch": 0.15, "learning_rate": 0.00019220303004067907, "loss": 0.7739, "step": 1468 }, { "epoch": 0.15, "learning_rate": 0.00019218997300642145, "loss": 0.679, "step": 1469 }, { "epoch": 0.15, "learning_rate": 0.00019217690549272525, "loss": 0.7343, "step": 1470 }, { "epoch": 0.15, "learning_rate": 0.00019216382750107588, "loss": 0.6975, "step": 1471 }, { "epoch": 0.15, "learning_rate": 0.00019215073903295997, "loss": 0.7247, "step": 1472 }, { "epoch": 0.15, "learning_rate": 0.00019213764008986525, "loss": 0.7422, "step": 1473 }, { "epoch": 0.15, "learning_rate": 0.00019212453067328077, "loss": 0.6757, "step": 1474 }, { "epoch": 0.15, "learning_rate": 0.00019211141078469667, "loss": 0.7283, "step": 1475 }, { "epoch": 0.15, "learning_rate": 0.00019209828042560432, "loss": 0.7175, "step": 1476 }, { "epoch": 0.15, "learning_rate": 0.0001920851395974963, "loss": 0.6978, "step": 1477 }, { "epoch": 0.15, "learning_rate": 0.00019207198830186633, "loss": 0.752, "step": 1478 }, { "epoch": 0.15, "learning_rate": 0.00019205882654020932, "loss": 0.7421, "step": 1479 }, { "epoch": 0.15, "learning_rate": 0.00019204565431402148, "loss": 0.6869, "step": 1480 }, { "epoch": 0.15, "learning_rate": 0.00019203247162480008, "loss": 0.6096, "step": 1481 }, { "epoch": 0.15, "learning_rate": 0.0001920192784740436, "loss": 0.682, "step": 1482 }, { "epoch": 0.15, "learning_rate": 0.00019200607486325176, "loss": 0.6386, "step": 1483 }, { "epoch": 0.15, "learning_rate": 0.00019199286079392547, "loss": 0.6635, "step": 1484 }, { "epoch": 0.15, "learning_rate": 0.00019197963626756676, "loss": 0.7099, "step": 1485 }, { "epoch": 0.15, "learning_rate": 0.0001919664012856789, "loss": 0.6568, "step": 1486 }, { "epoch": 0.15, "learning_rate": 0.00019195315584976633, "loss": 0.6967, "step": 1487 }, { "epoch": 0.15, "learning_rate": 0.00019193989996133475, "loss": 0.7101, "step": 1488 }, { "epoch": 0.15, "learning_rate": 0.0001919266336218909, "loss": 0.7378, "step": 1489 }, { "epoch": 0.16, "learning_rate": 0.00019191335683294288, "loss": 0.6783, "step": 1490 }, { "epoch": 0.16, "learning_rate": 0.0001919000695959998, "loss": 0.741, "step": 1491 }, { "epoch": 0.16, "learning_rate": 0.00019188677191257214, "loss": 0.7118, "step": 1492 }, { "epoch": 0.16, "learning_rate": 0.0001918734637841714, "loss": 0.7568, "step": 1493 }, { "epoch": 0.16, "learning_rate": 0.0001918601452123104, "loss": 0.7162, "step": 1494 }, { "epoch": 0.16, "learning_rate": 0.00019184681619850306, "loss": 0.7309, "step": 1495 }, { "epoch": 0.16, "learning_rate": 0.00019183347674426454, "loss": 0.7178, "step": 1496 }, { "epoch": 0.16, "learning_rate": 0.00019182012685111112, "loss": 0.6439, "step": 1497 }, { "epoch": 0.16, "learning_rate": 0.0001918067665205604, "loss": 0.7075, "step": 1498 }, { "epoch": 0.16, "learning_rate": 0.00019179339575413096, "loss": 0.7748, "step": 1499 }, { "epoch": 0.16, "learning_rate": 0.0001917800145533428, "loss": 0.718, "step": 1500 }, { "epoch": 0.16, "learning_rate": 0.00019176662291971693, "loss": 0.7624, "step": 1501 }, { "epoch": 0.16, "learning_rate": 0.0001917532208547756, "loss": 0.7661, "step": 1502 }, { "epoch": 0.16, "learning_rate": 0.00019173980836004228, "loss": 0.7024, "step": 1503 }, { "epoch": 0.16, "learning_rate": 0.0001917263854370416, "loss": 0.6946, "step": 1504 }, { "epoch": 0.16, "learning_rate": 0.00019171295208729932, "loss": 0.6955, "step": 1505 }, { "epoch": 0.16, "learning_rate": 0.0001916995083123425, "loss": 0.6664, "step": 1506 }, { "epoch": 0.16, "learning_rate": 0.00019168605411369933, "loss": 0.6814, "step": 1507 }, { "epoch": 0.16, "learning_rate": 0.00019167258949289912, "loss": 0.7762, "step": 1508 }, { "epoch": 0.16, "learning_rate": 0.00019165911445147247, "loss": 0.7546, "step": 1509 }, { "epoch": 0.16, "learning_rate": 0.0001916456289909511, "loss": 0.722, "step": 1510 }, { "epoch": 0.16, "learning_rate": 0.0001916321331128679, "loss": 0.72, "step": 1511 }, { "epoch": 0.16, "learning_rate": 0.00019161862681875706, "loss": 0.7181, "step": 1512 }, { "epoch": 0.16, "learning_rate": 0.00019160511011015382, "loss": 0.5985, "step": 1513 }, { "epoch": 0.16, "learning_rate": 0.00019159158298859464, "loss": 0.6968, "step": 1514 }, { "epoch": 0.16, "learning_rate": 0.00019157804545561716, "loss": 0.7313, "step": 1515 }, { "epoch": 0.16, "learning_rate": 0.00019156449751276032, "loss": 0.7484, "step": 1516 }, { "epoch": 0.16, "learning_rate": 0.00019155093916156405, "loss": 0.6896, "step": 1517 }, { "epoch": 0.16, "learning_rate": 0.00019153737040356958, "loss": 0.7127, "step": 1518 }, { "epoch": 0.16, "learning_rate": 0.0001915237912403193, "loss": 0.6923, "step": 1519 }, { "epoch": 0.16, "learning_rate": 0.0001915102016733568, "loss": 0.6519, "step": 1520 }, { "epoch": 0.16, "learning_rate": 0.00019149660170422682, "loss": 0.6797, "step": 1521 }, { "epoch": 0.16, "learning_rate": 0.00019148299133447535, "loss": 0.7522, "step": 1522 }, { "epoch": 0.16, "learning_rate": 0.00019146937056564945, "loss": 0.7296, "step": 1523 }, { "epoch": 0.16, "learning_rate": 0.00019145573939929742, "loss": 0.6689, "step": 1524 }, { "epoch": 0.16, "learning_rate": 0.00019144209783696875, "loss": 0.6714, "step": 1525 }, { "epoch": 0.16, "learning_rate": 0.00019142844588021415, "loss": 0.6697, "step": 1526 }, { "epoch": 0.16, "learning_rate": 0.00019141478353058543, "loss": 0.6542, "step": 1527 }, { "epoch": 0.16, "learning_rate": 0.00019140111078963566, "loss": 0.7121, "step": 1528 }, { "epoch": 0.16, "learning_rate": 0.00019138742765891897, "loss": 0.7754, "step": 1529 }, { "epoch": 0.16, "learning_rate": 0.00019137373413999085, "loss": 0.726, "step": 1530 }, { "epoch": 0.16, "learning_rate": 0.00019136003023440782, "loss": 0.782, "step": 1531 }, { "epoch": 0.16, "learning_rate": 0.0001913463159437276, "loss": 0.7017, "step": 1532 }, { "epoch": 0.16, "learning_rate": 0.0001913325912695092, "loss": 0.6776, "step": 1533 }, { "epoch": 0.16, "learning_rate": 0.00019131885621331268, "loss": 0.723, "step": 1534 }, { "epoch": 0.16, "learning_rate": 0.00019130511077669935, "loss": 0.7165, "step": 1535 }, { "epoch": 0.16, "learning_rate": 0.00019129135496123167, "loss": 0.7298, "step": 1536 }, { "epoch": 0.16, "learning_rate": 0.00019127758876847333, "loss": 0.6897, "step": 1537 }, { "epoch": 0.16, "learning_rate": 0.00019126381219998912, "loss": 0.7488, "step": 1538 }, { "epoch": 0.16, "learning_rate": 0.0001912500252573451, "loss": 0.7065, "step": 1539 }, { "epoch": 0.16, "learning_rate": 0.00019123622794210842, "loss": 0.6566, "step": 1540 }, { "epoch": 0.16, "learning_rate": 0.0001912224202558475, "loss": 0.6925, "step": 1541 }, { "epoch": 0.16, "learning_rate": 0.0001912086022001318, "loss": 0.7105, "step": 1542 }, { "epoch": 0.16, "learning_rate": 0.0001911947737765322, "loss": 0.675, "step": 1543 }, { "epoch": 0.16, "learning_rate": 0.00019118093498662043, "loss": 0.6449, "step": 1544 }, { "epoch": 0.16, "learning_rate": 0.0001911670858319697, "loss": 0.6981, "step": 1545 }, { "epoch": 0.16, "learning_rate": 0.00019115322631415424, "loss": 0.7166, "step": 1546 }, { "epoch": 0.16, "learning_rate": 0.0001911393564347495, "loss": 0.7068, "step": 1547 }, { "epoch": 0.16, "learning_rate": 0.00019112547619533205, "loss": 0.7596, "step": 1548 }, { "epoch": 0.16, "learning_rate": 0.00019111158559747974, "loss": 0.7242, "step": 1549 }, { "epoch": 0.16, "learning_rate": 0.00019109768464277153, "loss": 0.681, "step": 1550 }, { "epoch": 0.16, "learning_rate": 0.00019108377333278758, "loss": 0.7295, "step": 1551 }, { "epoch": 0.16, "learning_rate": 0.00019106985166910922, "loss": 0.6982, "step": 1552 }, { "epoch": 0.16, "learning_rate": 0.00019105591965331895, "loss": 0.72, "step": 1553 }, { "epoch": 0.16, "learning_rate": 0.00019104197728700043, "loss": 0.7121, "step": 1554 }, { "epoch": 0.16, "learning_rate": 0.00019102802457173857, "loss": 0.7385, "step": 1555 }, { "epoch": 0.16, "learning_rate": 0.00019101406150911937, "loss": 0.6976, "step": 1556 }, { "epoch": 0.16, "learning_rate": 0.00019100008810073003, "loss": 0.673, "step": 1557 }, { "epoch": 0.16, "learning_rate": 0.00019098610434815897, "loss": 0.66, "step": 1558 }, { "epoch": 0.16, "learning_rate": 0.00019097211025299573, "loss": 0.6995, "step": 1559 }, { "epoch": 0.16, "learning_rate": 0.0001909581058168311, "loss": 0.7238, "step": 1560 }, { "epoch": 0.16, "learning_rate": 0.0001909440910412569, "loss": 0.7223, "step": 1561 }, { "epoch": 0.16, "learning_rate": 0.00019093006592786632, "loss": 0.6445, "step": 1562 }, { "epoch": 0.16, "learning_rate": 0.0001909160304782536, "loss": 0.7526, "step": 1563 }, { "epoch": 0.16, "learning_rate": 0.00019090198469401415, "loss": 0.7048, "step": 1564 }, { "epoch": 0.16, "learning_rate": 0.0001908879285767446, "loss": 0.652, "step": 1565 }, { "epoch": 0.16, "learning_rate": 0.00019087386212804272, "loss": 0.7104, "step": 1566 }, { "epoch": 0.16, "learning_rate": 0.0001908597853495075, "loss": 0.7232, "step": 1567 }, { "epoch": 0.16, "learning_rate": 0.00019084569824273908, "loss": 0.6398, "step": 1568 }, { "epoch": 0.16, "learning_rate": 0.00019083160080933878, "loss": 0.7533, "step": 1569 }, { "epoch": 0.16, "learning_rate": 0.00019081749305090905, "loss": 0.7252, "step": 1570 }, { "epoch": 0.16, "learning_rate": 0.00019080337496905358, "loss": 0.6775, "step": 1571 }, { "epoch": 0.16, "learning_rate": 0.0001907892465653772, "loss": 0.7255, "step": 1572 }, { "epoch": 0.16, "learning_rate": 0.00019077510784148592, "loss": 0.7608, "step": 1573 }, { "epoch": 0.16, "learning_rate": 0.0001907609587989869, "loss": 0.6897, "step": 1574 }, { "epoch": 0.16, "learning_rate": 0.00019074679943948853, "loss": 0.6911, "step": 1575 }, { "epoch": 0.16, "learning_rate": 0.0001907326297646003, "loss": 0.7129, "step": 1576 }, { "epoch": 0.16, "learning_rate": 0.0001907184497759329, "loss": 0.709, "step": 1577 }, { "epoch": 0.16, "learning_rate": 0.00019070425947509824, "loss": 0.687, "step": 1578 }, { "epoch": 0.16, "learning_rate": 0.00019069005886370932, "loss": 0.7393, "step": 1579 }, { "epoch": 0.16, "learning_rate": 0.0001906758479433804, "loss": 0.7091, "step": 1580 }, { "epoch": 0.16, "learning_rate": 0.00019066162671572685, "loss": 0.7127, "step": 1581 }, { "epoch": 0.16, "learning_rate": 0.00019064739518236522, "loss": 0.6656, "step": 1582 }, { "epoch": 0.16, "learning_rate": 0.00019063315334491324, "loss": 0.6618, "step": 1583 }, { "epoch": 0.16, "learning_rate": 0.00019061890120498982, "loss": 0.6748, "step": 1584 }, { "epoch": 0.16, "learning_rate": 0.00019060463876421503, "loss": 0.7502, "step": 1585 }, { "epoch": 0.17, "learning_rate": 0.0001905903660242101, "loss": 0.7493, "step": 1586 }, { "epoch": 0.17, "learning_rate": 0.00019057608298659747, "loss": 0.6883, "step": 1587 }, { "epoch": 0.17, "learning_rate": 0.0001905617896530007, "loss": 0.6729, "step": 1588 }, { "epoch": 0.17, "learning_rate": 0.00019054748602504454, "loss": 0.6715, "step": 1589 }, { "epoch": 0.17, "learning_rate": 0.00019053317210435496, "loss": 0.7077, "step": 1590 }, { "epoch": 0.17, "learning_rate": 0.00019051884789255901, "loss": 0.6561, "step": 1591 }, { "epoch": 0.17, "learning_rate": 0.000190504513391285, "loss": 0.7201, "step": 1592 }, { "epoch": 0.17, "learning_rate": 0.0001904901686021623, "loss": 0.6164, "step": 1593 }, { "epoch": 0.17, "learning_rate": 0.00019047581352682155, "loss": 0.7023, "step": 1594 }, { "epoch": 0.17, "learning_rate": 0.00019046144816689452, "loss": 0.6971, "step": 1595 }, { "epoch": 0.17, "learning_rate": 0.00019044707252401417, "loss": 0.7264, "step": 1596 }, { "epoch": 0.17, "learning_rate": 0.00019043268659981458, "loss": 0.6402, "step": 1597 }, { "epoch": 0.17, "learning_rate": 0.00019041829039593105, "loss": 0.7021, "step": 1598 }, { "epoch": 0.17, "learning_rate": 0.000190403883914, "loss": 0.763, "step": 1599 }, { "epoch": 0.17, "learning_rate": 0.0001903894671556591, "loss": 0.7043, "step": 1600 }, { "epoch": 0.17, "learning_rate": 0.0001903750401225471, "loss": 0.6864, "step": 1601 }, { "epoch": 0.17, "learning_rate": 0.00019036060281630397, "loss": 0.6708, "step": 1602 }, { "epoch": 0.17, "learning_rate": 0.0001903461552385708, "loss": 0.7346, "step": 1603 }, { "epoch": 0.17, "learning_rate": 0.00019033169739098992, "loss": 0.7281, "step": 1604 }, { "epoch": 0.17, "learning_rate": 0.0001903172292752047, "loss": 0.693, "step": 1605 }, { "epoch": 0.17, "learning_rate": 0.0001903027508928599, "loss": 0.6222, "step": 1606 }, { "epoch": 0.17, "learning_rate": 0.0001902882622456012, "loss": 0.7592, "step": 1607 }, { "epoch": 0.17, "learning_rate": 0.0001902737633350756, "loss": 0.6649, "step": 1608 }, { "epoch": 0.17, "learning_rate": 0.0001902592541629312, "loss": 0.7474, "step": 1609 }, { "epoch": 0.17, "learning_rate": 0.00019024473473081731, "loss": 0.6833, "step": 1610 }, { "epoch": 0.17, "learning_rate": 0.0001902302050403844, "loss": 0.6712, "step": 1611 }, { "epoch": 0.17, "learning_rate": 0.00019021566509328403, "loss": 0.7234, "step": 1612 }, { "epoch": 0.17, "learning_rate": 0.00019020111489116907, "loss": 0.717, "step": 1613 }, { "epoch": 0.17, "learning_rate": 0.0001901865544356934, "loss": 0.6604, "step": 1614 }, { "epoch": 0.17, "learning_rate": 0.00019017198372851222, "loss": 0.657, "step": 1615 }, { "epoch": 0.17, "learning_rate": 0.00019015740277128176, "loss": 0.6996, "step": 1616 }, { "epoch": 0.17, "learning_rate": 0.00019014281156565945, "loss": 0.7413, "step": 1617 }, { "epoch": 0.17, "learning_rate": 0.00019012821011330395, "loss": 0.7124, "step": 1618 }, { "epoch": 0.17, "learning_rate": 0.000190113598415875, "loss": 0.6843, "step": 1619 }, { "epoch": 0.17, "learning_rate": 0.0001900989764750336, "loss": 0.7273, "step": 1620 }, { "epoch": 0.17, "learning_rate": 0.00019008434429244178, "loss": 0.7071, "step": 1621 }, { "epoch": 0.17, "learning_rate": 0.0001900697018697629, "loss": 0.7404, "step": 1622 }, { "epoch": 0.17, "learning_rate": 0.00019005504920866132, "loss": 0.6165, "step": 1623 }, { "epoch": 0.17, "learning_rate": 0.00019004038631080273, "loss": 0.6338, "step": 1624 }, { "epoch": 0.17, "learning_rate": 0.0001900257131778538, "loss": 0.679, "step": 1625 }, { "epoch": 0.17, "learning_rate": 0.00019001102981148246, "loss": 0.6764, "step": 1626 }, { "epoch": 0.17, "learning_rate": 0.00018999633621335788, "loss": 0.7308, "step": 1627 }, { "epoch": 0.17, "learning_rate": 0.00018998163238515028, "loss": 0.7345, "step": 1628 }, { "epoch": 0.17, "learning_rate": 0.00018996691832853105, "loss": 0.7159, "step": 1629 }, { "epoch": 0.17, "learning_rate": 0.00018995219404517277, "loss": 0.6764, "step": 1630 }, { "epoch": 0.17, "learning_rate": 0.00018993745953674922, "loss": 0.6279, "step": 1631 }, { "epoch": 0.17, "learning_rate": 0.0001899227148049353, "loss": 0.7246, "step": 1632 }, { "epoch": 0.17, "learning_rate": 0.00018990795985140703, "loss": 0.6597, "step": 1633 }, { "epoch": 0.17, "learning_rate": 0.00018989319467784167, "loss": 0.6722, "step": 1634 }, { "epoch": 0.17, "learning_rate": 0.00018987841928591763, "loss": 0.7617, "step": 1635 }, { "epoch": 0.17, "learning_rate": 0.0001898636336773144, "loss": 0.7307, "step": 1636 }, { "epoch": 0.17, "learning_rate": 0.00018984883785371274, "loss": 0.6906, "step": 1637 }, { "epoch": 0.17, "learning_rate": 0.00018983403181679456, "loss": 0.7243, "step": 1638 }, { "epoch": 0.17, "learning_rate": 0.00018981921556824281, "loss": 0.685, "step": 1639 }, { "epoch": 0.17, "learning_rate": 0.00018980438910974173, "loss": 0.7222, "step": 1640 }, { "epoch": 0.17, "learning_rate": 0.0001897895524429767, "loss": 0.7002, "step": 1641 }, { "epoch": 0.17, "learning_rate": 0.0001897747055696342, "loss": 0.7367, "step": 1642 }, { "epoch": 0.17, "learning_rate": 0.0001897598484914019, "loss": 0.7308, "step": 1643 }, { "epoch": 0.17, "learning_rate": 0.00018974498120996865, "loss": 0.64, "step": 1644 }, { "epoch": 0.17, "learning_rate": 0.0001897301037270245, "loss": 0.7257, "step": 1645 }, { "epoch": 0.17, "learning_rate": 0.00018971521604426047, "loss": 0.6166, "step": 1646 }, { "epoch": 0.17, "learning_rate": 0.00018970031816336903, "loss": 0.757, "step": 1647 }, { "epoch": 0.17, "learning_rate": 0.00018968541008604358, "loss": 0.7555, "step": 1648 }, { "epoch": 0.17, "learning_rate": 0.00018967049181397875, "loss": 0.6752, "step": 1649 }, { "epoch": 0.17, "learning_rate": 0.00018965556334887035, "loss": 0.7065, "step": 1650 }, { "epoch": 0.17, "learning_rate": 0.00018964062469241534, "loss": 0.6943, "step": 1651 }, { "epoch": 0.17, "learning_rate": 0.00018962567584631182, "loss": 0.6915, "step": 1652 }, { "epoch": 0.17, "learning_rate": 0.00018961071681225904, "loss": 0.6473, "step": 1653 }, { "epoch": 0.17, "learning_rate": 0.00018959574759195745, "loss": 0.6682, "step": 1654 }, { "epoch": 0.17, "learning_rate": 0.0001895807681871086, "loss": 0.6567, "step": 1655 }, { "epoch": 0.17, "learning_rate": 0.0001895657785994153, "loss": 0.6907, "step": 1656 }, { "epoch": 0.17, "learning_rate": 0.00018955077883058138, "loss": 0.7115, "step": 1657 }, { "epoch": 0.17, "learning_rate": 0.00018953576888231194, "loss": 0.7173, "step": 1658 }, { "epoch": 0.17, "learning_rate": 0.00018952074875631318, "loss": 0.7085, "step": 1659 }, { "epoch": 0.17, "learning_rate": 0.00018950571845429245, "loss": 0.7039, "step": 1660 }, { "epoch": 0.17, "learning_rate": 0.00018949067797795834, "loss": 0.7543, "step": 1661 }, { "epoch": 0.17, "learning_rate": 0.0001894756273290205, "loss": 0.7266, "step": 1662 }, { "epoch": 0.17, "learning_rate": 0.0001894605665091897, "loss": 0.7347, "step": 1663 }, { "epoch": 0.17, "learning_rate": 0.00018944549552017806, "loss": 0.7068, "step": 1664 }, { "epoch": 0.17, "learning_rate": 0.00018943041436369863, "loss": 0.6884, "step": 1665 }, { "epoch": 0.17, "learning_rate": 0.0001894153230414658, "loss": 0.7005, "step": 1666 }, { "epoch": 0.17, "learning_rate": 0.00018940022155519498, "loss": 0.7486, "step": 1667 }, { "epoch": 0.17, "learning_rate": 0.00018938510990660276, "loss": 0.6877, "step": 1668 }, { "epoch": 0.17, "learning_rate": 0.000189369988097407, "loss": 0.7481, "step": 1669 }, { "epoch": 0.17, "learning_rate": 0.00018935485612932661, "loss": 0.7503, "step": 1670 }, { "epoch": 0.17, "learning_rate": 0.00018933971400408162, "loss": 0.6648, "step": 1671 }, { "epoch": 0.17, "learning_rate": 0.00018932456172339332, "loss": 0.6923, "step": 1672 }, { "epoch": 0.17, "learning_rate": 0.0001893093992889841, "loss": 0.7769, "step": 1673 }, { "epoch": 0.17, "learning_rate": 0.00018929422670257745, "loss": 0.6967, "step": 1674 }, { "epoch": 0.17, "learning_rate": 0.00018927904396589816, "loss": 0.6867, "step": 1675 }, { "epoch": 0.17, "learning_rate": 0.00018926385108067198, "loss": 0.7185, "step": 1676 }, { "epoch": 0.17, "learning_rate": 0.00018924864804862606, "loss": 0.7785, "step": 1677 }, { "epoch": 0.17, "learning_rate": 0.00018923343487148842, "loss": 0.7655, "step": 1678 }, { "epoch": 0.17, "learning_rate": 0.00018921821155098845, "loss": 0.6952, "step": 1679 }, { "epoch": 0.17, "learning_rate": 0.00018920297808885662, "loss": 0.717, "step": 1680 }, { "epoch": 0.17, "learning_rate": 0.00018918773448682455, "loss": 0.7278, "step": 1681 }, { "epoch": 0.18, "learning_rate": 0.000189172480746625, "loss": 0.6256, "step": 1682 }, { "epoch": 0.18, "learning_rate": 0.00018915721686999187, "loss": 0.7127, "step": 1683 }, { "epoch": 0.18, "learning_rate": 0.00018914194285866027, "loss": 0.7244, "step": 1684 }, { "epoch": 0.18, "learning_rate": 0.00018912665871436644, "loss": 0.7277, "step": 1685 }, { "epoch": 0.18, "learning_rate": 0.00018911136443884775, "loss": 0.7512, "step": 1686 }, { "epoch": 0.18, "learning_rate": 0.00018909606003384273, "loss": 0.6696, "step": 1687 }, { "epoch": 0.18, "learning_rate": 0.00018908074550109106, "loss": 0.6839, "step": 1688 }, { "epoch": 0.18, "learning_rate": 0.0001890654208423336, "loss": 0.7755, "step": 1689 }, { "epoch": 0.18, "learning_rate": 0.0001890500860593123, "loss": 0.6819, "step": 1690 }, { "epoch": 0.18, "learning_rate": 0.00018903474115377033, "loss": 0.7422, "step": 1691 }, { "epoch": 0.18, "learning_rate": 0.000189019386127452, "loss": 0.666, "step": 1692 }, { "epoch": 0.18, "learning_rate": 0.00018900402098210271, "loss": 0.6688, "step": 1693 }, { "epoch": 0.18, "learning_rate": 0.00018898864571946904, "loss": 0.7448, "step": 1694 }, { "epoch": 0.18, "learning_rate": 0.00018897326034129878, "loss": 0.7855, "step": 1695 }, { "epoch": 0.18, "learning_rate": 0.00018895786484934078, "loss": 0.6429, "step": 1696 }, { "epoch": 0.18, "learning_rate": 0.00018894245924534512, "loss": 0.7082, "step": 1697 }, { "epoch": 0.18, "learning_rate": 0.00018892704353106293, "loss": 0.6926, "step": 1698 }, { "epoch": 0.18, "learning_rate": 0.00018891161770824658, "loss": 0.712, "step": 1699 }, { "epoch": 0.18, "learning_rate": 0.00018889618177864956, "loss": 0.7087, "step": 1700 }, { "epoch": 0.18, "learning_rate": 0.00018888073574402652, "loss": 0.7467, "step": 1701 }, { "epoch": 0.18, "learning_rate": 0.0001888652796061332, "loss": 0.722, "step": 1702 }, { "epoch": 0.18, "learning_rate": 0.0001888498133667266, "loss": 0.6412, "step": 1703 }, { "epoch": 0.18, "learning_rate": 0.00018883433702756474, "loss": 0.7117, "step": 1704 }, { "epoch": 0.18, "learning_rate": 0.00018881885059040689, "loss": 0.7502, "step": 1705 }, { "epoch": 0.18, "learning_rate": 0.0001888033540570134, "loss": 0.6875, "step": 1706 }, { "epoch": 0.18, "learning_rate": 0.00018878784742914578, "loss": 0.6191, "step": 1707 }, { "epoch": 0.18, "learning_rate": 0.0001887723307085668, "loss": 0.7368, "step": 1708 }, { "epoch": 0.18, "learning_rate": 0.00018875680389704013, "loss": 0.806, "step": 1709 }, { "epoch": 0.18, "learning_rate": 0.0001887412669963309, "loss": 0.6899, "step": 1710 }, { "epoch": 0.18, "learning_rate": 0.00018872572000820504, "loss": 0.7251, "step": 1711 }, { "epoch": 0.18, "learning_rate": 0.00018871016293442997, "loss": 0.6556, "step": 1712 }, { "epoch": 0.18, "learning_rate": 0.00018869459577677407, "loss": 0.7638, "step": 1713 }, { "epoch": 0.18, "learning_rate": 0.0001886790185370068, "loss": 0.7052, "step": 1714 }, { "epoch": 0.18, "learning_rate": 0.00018866343121689893, "loss": 0.723, "step": 1715 }, { "epoch": 0.18, "learning_rate": 0.00018864783381822232, "loss": 0.702, "step": 1716 }, { "epoch": 0.18, "learning_rate": 0.00018863222634274993, "loss": 0.7414, "step": 1717 }, { "epoch": 0.18, "learning_rate": 0.0001886166087922559, "loss": 0.7035, "step": 1718 }, { "epoch": 0.18, "learning_rate": 0.00018860098116851552, "loss": 0.6885, "step": 1719 }, { "epoch": 0.18, "learning_rate": 0.0001885853434733052, "loss": 0.6848, "step": 1720 }, { "epoch": 0.18, "learning_rate": 0.00018856969570840254, "loss": 0.7276, "step": 1721 }, { "epoch": 0.18, "learning_rate": 0.00018855403787558622, "loss": 0.7019, "step": 1722 }, { "epoch": 0.18, "learning_rate": 0.00018853836997663614, "loss": 0.6763, "step": 1723 }, { "epoch": 0.18, "learning_rate": 0.00018852269201333327, "loss": 0.689, "step": 1724 }, { "epoch": 0.18, "learning_rate": 0.00018850700398745978, "loss": 0.7596, "step": 1725 }, { "epoch": 0.18, "learning_rate": 0.00018849130590079896, "loss": 0.7253, "step": 1726 }, { "epoch": 0.18, "learning_rate": 0.00018847559775513523, "loss": 0.6833, "step": 1727 }, { "epoch": 0.18, "learning_rate": 0.0001884598795522542, "loss": 0.6669, "step": 1728 }, { "epoch": 0.18, "learning_rate": 0.00018844415129394256, "loss": 0.6007, "step": 1729 }, { "epoch": 0.18, "learning_rate": 0.00018842841298198819, "loss": 0.7182, "step": 1730 }, { "epoch": 0.18, "learning_rate": 0.0001884126646181801, "loss": 0.6684, "step": 1731 }, { "epoch": 0.18, "learning_rate": 0.00018839690620430844, "loss": 0.7324, "step": 1732 }, { "epoch": 0.18, "learning_rate": 0.00018838113774216451, "loss": 0.7164, "step": 1733 }, { "epoch": 0.18, "learning_rate": 0.00018836535923354074, "loss": 0.6853, "step": 1734 }, { "epoch": 0.18, "learning_rate": 0.00018834957068023073, "loss": 0.7036, "step": 1735 }, { "epoch": 0.18, "learning_rate": 0.00018833377208402917, "loss": 0.7431, "step": 1736 }, { "epoch": 0.18, "learning_rate": 0.0001883179634467319, "loss": 0.6851, "step": 1737 }, { "epoch": 0.18, "learning_rate": 0.00018830214477013598, "loss": 0.6127, "step": 1738 }, { "epoch": 0.18, "learning_rate": 0.00018828631605603951, "loss": 0.6896, "step": 1739 }, { "epoch": 0.18, "learning_rate": 0.0001882704773062418, "loss": 0.722, "step": 1740 }, { "epoch": 0.18, "learning_rate": 0.0001882546285225433, "loss": 0.6646, "step": 1741 }, { "epoch": 0.18, "learning_rate": 0.0001882387697067455, "loss": 0.6757, "step": 1742 }, { "epoch": 0.18, "learning_rate": 0.00018822290086065117, "loss": 0.6797, "step": 1743 }, { "epoch": 0.18, "learning_rate": 0.00018820702198606414, "loss": 0.7283, "step": 1744 }, { "epoch": 0.18, "learning_rate": 0.0001881911330847894, "loss": 0.681, "step": 1745 }, { "epoch": 0.18, "learning_rate": 0.00018817523415863306, "loss": 0.7235, "step": 1746 }, { "epoch": 0.18, "learning_rate": 0.0001881593252094024, "loss": 0.6856, "step": 1747 }, { "epoch": 0.18, "learning_rate": 0.00018814340623890581, "loss": 0.6574, "step": 1748 }, { "epoch": 0.18, "learning_rate": 0.00018812747724895288, "loss": 0.6751, "step": 1749 }, { "epoch": 0.18, "learning_rate": 0.00018811153824135424, "loss": 0.7039, "step": 1750 }, { "epoch": 0.18, "learning_rate": 0.00018809558921792174, "loss": 0.6969, "step": 1751 }, { "epoch": 0.18, "learning_rate": 0.00018807963018046831, "loss": 0.7453, "step": 1752 }, { "epoch": 0.18, "learning_rate": 0.00018806366113080812, "loss": 0.7096, "step": 1753 }, { "epoch": 0.18, "learning_rate": 0.00018804768207075634, "loss": 0.7537, "step": 1754 }, { "epoch": 0.18, "learning_rate": 0.00018803169300212936, "loss": 0.6738, "step": 1755 }, { "epoch": 0.18, "learning_rate": 0.0001880156939267447, "loss": 0.7567, "step": 1756 }, { "epoch": 0.18, "learning_rate": 0.00018799968484642103, "loss": 0.7487, "step": 1757 }, { "epoch": 0.18, "learning_rate": 0.0001879836657629781, "loss": 0.6518, "step": 1758 }, { "epoch": 0.18, "learning_rate": 0.00018796763667823684, "loss": 0.7145, "step": 1759 }, { "epoch": 0.18, "learning_rate": 0.00018795159759401936, "loss": 0.6908, "step": 1760 }, { "epoch": 0.18, "learning_rate": 0.00018793554851214878, "loss": 0.6888, "step": 1761 }, { "epoch": 0.18, "learning_rate": 0.0001879194894344495, "loss": 0.6805, "step": 1762 }, { "epoch": 0.18, "learning_rate": 0.00018790342036274695, "loss": 0.6763, "step": 1763 }, { "epoch": 0.18, "learning_rate": 0.00018788734129886777, "loss": 0.7017, "step": 1764 }, { "epoch": 0.18, "learning_rate": 0.00018787125224463972, "loss": 0.6814, "step": 1765 }, { "epoch": 0.18, "learning_rate": 0.00018785515320189159, "loss": 0.6965, "step": 1766 }, { "epoch": 0.18, "learning_rate": 0.00018783904417245348, "loss": 0.7217, "step": 1767 }, { "epoch": 0.18, "learning_rate": 0.0001878229251581565, "loss": 0.686, "step": 1768 }, { "epoch": 0.18, "learning_rate": 0.00018780679616083292, "loss": 0.7078, "step": 1769 }, { "epoch": 0.18, "learning_rate": 0.0001877906571823162, "loss": 0.6661, "step": 1770 }, { "epoch": 0.18, "learning_rate": 0.00018777450822444092, "loss": 0.6985, "step": 1771 }, { "epoch": 0.18, "learning_rate": 0.00018775834928904268, "loss": 0.7533, "step": 1772 }, { "epoch": 0.18, "learning_rate": 0.00018774218037795833, "loss": 0.7007, "step": 1773 }, { "epoch": 0.18, "learning_rate": 0.00018772600149302585, "loss": 0.703, "step": 1774 }, { "epoch": 0.18, "learning_rate": 0.00018770981263608433, "loss": 0.7409, "step": 1775 }, { "epoch": 0.18, "learning_rate": 0.00018769361380897398, "loss": 0.692, "step": 1776 }, { "epoch": 0.18, "learning_rate": 0.0001876774050135362, "loss": 0.7079, "step": 1777 }, { "epoch": 0.19, "learning_rate": 0.00018766118625161338, "loss": 0.7068, "step": 1778 }, { "epoch": 0.19, "learning_rate": 0.00018764495752504923, "loss": 0.7062, "step": 1779 }, { "epoch": 0.19, "learning_rate": 0.0001876287188356885, "loss": 0.6941, "step": 1780 }, { "epoch": 0.19, "learning_rate": 0.00018761247018537702, "loss": 0.596, "step": 1781 }, { "epoch": 0.19, "learning_rate": 0.00018759621157596185, "loss": 0.714, "step": 1782 }, { "epoch": 0.19, "learning_rate": 0.00018757994300929115, "loss": 0.7272, "step": 1783 }, { "epoch": 0.19, "learning_rate": 0.00018756366448721421, "loss": 0.6925, "step": 1784 }, { "epoch": 0.19, "learning_rate": 0.0001875473760115814, "loss": 0.7304, "step": 1785 }, { "epoch": 0.19, "learning_rate": 0.00018753107758424432, "loss": 0.6584, "step": 1786 }, { "epoch": 0.19, "learning_rate": 0.00018751476920705556, "loss": 0.7467, "step": 1787 }, { "epoch": 0.19, "learning_rate": 0.00018749845088186906, "loss": 0.6833, "step": 1788 }, { "epoch": 0.19, "learning_rate": 0.0001874821226105397, "loss": 0.676, "step": 1789 }, { "epoch": 0.19, "learning_rate": 0.0001874657843949235, "loss": 0.7005, "step": 1790 }, { "epoch": 0.19, "learning_rate": 0.00018744943623687772, "loss": 0.6957, "step": 1791 }, { "epoch": 0.19, "learning_rate": 0.00018743307813826068, "loss": 0.6894, "step": 1792 }, { "epoch": 0.19, "learning_rate": 0.00018741671010093181, "loss": 0.6813, "step": 1793 }, { "epoch": 0.19, "learning_rate": 0.00018740033212675178, "loss": 0.7411, "step": 1794 }, { "epoch": 0.19, "learning_rate": 0.00018738394421758222, "loss": 0.6867, "step": 1795 }, { "epoch": 0.19, "learning_rate": 0.00018736754637528608, "loss": 0.7238, "step": 1796 }, { "epoch": 0.19, "learning_rate": 0.00018735113860172723, "loss": 0.7409, "step": 1797 }, { "epoch": 0.19, "learning_rate": 0.0001873347208987708, "loss": 0.711, "step": 1798 }, { "epoch": 0.19, "learning_rate": 0.0001873182932682831, "loss": 0.686, "step": 1799 }, { "epoch": 0.19, "learning_rate": 0.0001873018557121314, "loss": 0.6538, "step": 1800 }, { "epoch": 0.19, "learning_rate": 0.0001872854082321843, "loss": 0.6635, "step": 1801 }, { "epoch": 0.19, "learning_rate": 0.00018726895083031133, "loss": 0.6781, "step": 1802 }, { "epoch": 0.19, "learning_rate": 0.00018725248350838326, "loss": 0.692, "step": 1803 }, { "epoch": 0.19, "learning_rate": 0.00018723600626827203, "loss": 0.7581, "step": 1804 }, { "epoch": 0.19, "learning_rate": 0.00018721951911185056, "loss": 0.7728, "step": 1805 }, { "epoch": 0.19, "learning_rate": 0.00018720302204099302, "loss": 0.7553, "step": 1806 }, { "epoch": 0.19, "learning_rate": 0.00018718651505757468, "loss": 0.7202, "step": 1807 }, { "epoch": 0.19, "learning_rate": 0.00018716999816347188, "loss": 0.6829, "step": 1808 }, { "epoch": 0.19, "learning_rate": 0.00018715347136056217, "loss": 0.6295, "step": 1809 }, { "epoch": 0.19, "learning_rate": 0.00018713693465072419, "loss": 0.6681, "step": 1810 }, { "epoch": 0.19, "learning_rate": 0.00018712038803583768, "loss": 0.6664, "step": 1811 }, { "epoch": 0.19, "learning_rate": 0.00018710383151778357, "loss": 0.7412, "step": 1812 }, { "epoch": 0.19, "learning_rate": 0.00018708726509844383, "loss": 0.7104, "step": 1813 }, { "epoch": 0.19, "learning_rate": 0.00018707068877970163, "loss": 0.7215, "step": 1814 }, { "epoch": 0.19, "learning_rate": 0.00018705410256344122, "loss": 0.7131, "step": 1815 }, { "epoch": 0.19, "learning_rate": 0.00018703750645154802, "loss": 0.6967, "step": 1816 }, { "epoch": 0.19, "learning_rate": 0.00018702090044590852, "loss": 0.6992, "step": 1817 }, { "epoch": 0.19, "learning_rate": 0.00018700428454841036, "loss": 0.6856, "step": 1818 }, { "epoch": 0.19, "learning_rate": 0.00018698765876094234, "loss": 0.6624, "step": 1819 }, { "epoch": 0.19, "learning_rate": 0.00018697102308539432, "loss": 0.7144, "step": 1820 }, { "epoch": 0.19, "learning_rate": 0.0001869543775236573, "loss": 0.6895, "step": 1821 }, { "epoch": 0.19, "learning_rate": 0.00018693772207762345, "loss": 0.696, "step": 1822 }, { "epoch": 0.19, "learning_rate": 0.00018692105674918602, "loss": 0.7127, "step": 1823 }, { "epoch": 0.19, "learning_rate": 0.00018690438154023937, "loss": 0.719, "step": 1824 }, { "epoch": 0.19, "learning_rate": 0.00018688769645267908, "loss": 0.7321, "step": 1825 }, { "epoch": 0.19, "learning_rate": 0.00018687100148840168, "loss": 0.7292, "step": 1826 }, { "epoch": 0.19, "learning_rate": 0.00018685429664930503, "loss": 0.7302, "step": 1827 }, { "epoch": 0.19, "learning_rate": 0.0001868375819372879, "loss": 0.7675, "step": 1828 }, { "epoch": 0.19, "learning_rate": 0.0001868208573542504, "loss": 0.6792, "step": 1829 }, { "epoch": 0.19, "learning_rate": 0.00018680412290209355, "loss": 0.5977, "step": 1830 }, { "epoch": 0.19, "learning_rate": 0.00018678737858271962, "loss": 0.7451, "step": 1831 }, { "epoch": 0.19, "learning_rate": 0.000186770624398032, "loss": 0.6623, "step": 1832 }, { "epoch": 0.19, "learning_rate": 0.00018675386034993518, "loss": 0.6393, "step": 1833 }, { "epoch": 0.19, "learning_rate": 0.00018673708644033473, "loss": 0.6705, "step": 1834 }, { "epoch": 0.19, "learning_rate": 0.00018672030267113745, "loss": 0.6826, "step": 1835 }, { "epoch": 0.19, "learning_rate": 0.00018670350904425106, "loss": 0.6993, "step": 1836 }, { "epoch": 0.19, "learning_rate": 0.00018668670556158464, "loss": 0.7076, "step": 1837 }, { "epoch": 0.19, "learning_rate": 0.00018666989222504828, "loss": 0.6927, "step": 1838 }, { "epoch": 0.19, "learning_rate": 0.0001866530690365531, "loss": 0.6893, "step": 1839 }, { "epoch": 0.19, "learning_rate": 0.00018663623599801148, "loss": 0.6644, "step": 1840 }, { "epoch": 0.19, "learning_rate": 0.0001866193931113369, "loss": 0.7134, "step": 1841 }, { "epoch": 0.19, "learning_rate": 0.00018660254037844388, "loss": 0.6948, "step": 1842 }, { "epoch": 0.19, "learning_rate": 0.00018658567780124811, "loss": 0.6663, "step": 1843 }, { "epoch": 0.19, "learning_rate": 0.00018656880538166646, "loss": 0.6713, "step": 1844 }, { "epoch": 0.19, "learning_rate": 0.00018655192312161677, "loss": 0.7146, "step": 1845 }, { "epoch": 0.19, "learning_rate": 0.00018653503102301813, "loss": 0.6582, "step": 1846 }, { "epoch": 0.19, "learning_rate": 0.0001865181290877907, "loss": 0.7585, "step": 1847 }, { "epoch": 0.19, "learning_rate": 0.00018650121731785574, "loss": 0.7392, "step": 1848 }, { "epoch": 0.19, "learning_rate": 0.00018648429571513567, "loss": 0.7384, "step": 1849 }, { "epoch": 0.19, "learning_rate": 0.00018646736428155403, "loss": 0.6576, "step": 1850 }, { "epoch": 0.19, "learning_rate": 0.00018645042301903536, "loss": 0.7206, "step": 1851 }, { "epoch": 0.19, "learning_rate": 0.00018643347192950552, "loss": 0.7015, "step": 1852 }, { "epoch": 0.19, "learning_rate": 0.00018641651101489133, "loss": 0.6908, "step": 1853 }, { "epoch": 0.19, "learning_rate": 0.00018639954027712077, "loss": 0.7047, "step": 1854 }, { "epoch": 0.19, "learning_rate": 0.00018638255971812294, "loss": 0.7155, "step": 1855 }, { "epoch": 0.19, "learning_rate": 0.00018636556933982807, "loss": 0.7004, "step": 1856 }, { "epoch": 0.19, "learning_rate": 0.0001863485691441675, "loss": 0.6675, "step": 1857 }, { "epoch": 0.19, "learning_rate": 0.00018633155913307366, "loss": 0.7457, "step": 1858 }, { "epoch": 0.19, "learning_rate": 0.0001863145393084801, "loss": 0.7278, "step": 1859 }, { "epoch": 0.19, "learning_rate": 0.00018629750967232158, "loss": 0.7246, "step": 1860 }, { "epoch": 0.19, "learning_rate": 0.0001862804702265338, "loss": 0.7518, "step": 1861 }, { "epoch": 0.19, "learning_rate": 0.00018626342097305374, "loss": 0.7631, "step": 1862 }, { "epoch": 0.19, "learning_rate": 0.00018624636191381938, "loss": 0.7098, "step": 1863 }, { "epoch": 0.19, "learning_rate": 0.00018622929305076987, "loss": 0.7309, "step": 1864 }, { "epoch": 0.19, "learning_rate": 0.0001862122143858455, "loss": 0.6882, "step": 1865 }, { "epoch": 0.19, "learning_rate": 0.00018619512592098761, "loss": 0.7431, "step": 1866 }, { "epoch": 0.19, "learning_rate": 0.00018617802765813872, "loss": 0.6822, "step": 1867 }, { "epoch": 0.19, "learning_rate": 0.00018616091959924234, "loss": 0.6714, "step": 1868 }, { "epoch": 0.19, "learning_rate": 0.00018614380174624328, "loss": 0.71, "step": 1869 }, { "epoch": 0.19, "learning_rate": 0.00018612667410108734, "loss": 0.662, "step": 1870 }, { "epoch": 0.19, "learning_rate": 0.0001861095366657214, "loss": 0.7039, "step": 1871 }, { "epoch": 0.19, "learning_rate": 0.00018609238944209354, "loss": 0.692, "step": 1872 }, { "epoch": 0.19, "learning_rate": 0.000186075232432153, "loss": 0.7122, "step": 1873 }, { "epoch": 0.2, "learning_rate": 0.00018605806563784993, "loss": 0.6775, "step": 1874 }, { "epoch": 0.2, "learning_rate": 0.00018604088906113577, "loss": 0.7077, "step": 1875 }, { "epoch": 0.2, "learning_rate": 0.00018602370270396308, "loss": 0.6994, "step": 1876 }, { "epoch": 0.2, "learning_rate": 0.00018600650656828537, "loss": 0.6776, "step": 1877 }, { "epoch": 0.2, "learning_rate": 0.00018598930065605743, "loss": 0.6854, "step": 1878 }, { "epoch": 0.2, "learning_rate": 0.00018597208496923509, "loss": 0.7009, "step": 1879 }, { "epoch": 0.2, "learning_rate": 0.00018595485950977526, "loss": 0.7012, "step": 1880 }, { "epoch": 0.2, "learning_rate": 0.00018593762427963602, "loss": 0.6348, "step": 1881 }, { "epoch": 0.2, "learning_rate": 0.00018592037928077653, "loss": 0.7415, "step": 1882 }, { "epoch": 0.2, "learning_rate": 0.00018590312451515707, "loss": 0.6294, "step": 1883 }, { "epoch": 0.2, "learning_rate": 0.00018588585998473902, "loss": 0.7159, "step": 1884 }, { "epoch": 0.2, "learning_rate": 0.0001858685856914849, "loss": 0.717, "step": 1885 }, { "epoch": 0.2, "learning_rate": 0.0001858513016373583, "loss": 0.6949, "step": 1886 }, { "epoch": 0.2, "learning_rate": 0.00018583400782432394, "loss": 0.6497, "step": 1887 }, { "epoch": 0.2, "learning_rate": 0.00018581670425434763, "loss": 0.7453, "step": 1888 }, { "epoch": 0.2, "learning_rate": 0.00018579939092939633, "loss": 0.6729, "step": 1889 }, { "epoch": 0.2, "learning_rate": 0.0001857820678514381, "loss": 0.6608, "step": 1890 }, { "epoch": 0.2, "learning_rate": 0.00018576473502244202, "loss": 0.7258, "step": 1891 }, { "epoch": 0.2, "learning_rate": 0.00018574739244437845, "loss": 0.6243, "step": 1892 }, { "epoch": 0.2, "learning_rate": 0.00018573004011921866, "loss": 0.6787, "step": 1893 }, { "epoch": 0.2, "learning_rate": 0.0001857126780489352, "loss": 0.7036, "step": 1894 }, { "epoch": 0.2, "learning_rate": 0.00018569530623550163, "loss": 0.7765, "step": 1895 }, { "epoch": 0.2, "learning_rate": 0.00018567792468089262, "loss": 0.6595, "step": 1896 }, { "epoch": 0.2, "learning_rate": 0.000185660533387084, "loss": 0.6617, "step": 1897 }, { "epoch": 0.2, "learning_rate": 0.00018564313235605267, "loss": 0.7149, "step": 1898 }, { "epoch": 0.2, "learning_rate": 0.00018562572158977667, "loss": 0.7008, "step": 1899 }, { "epoch": 0.2, "learning_rate": 0.00018560830109023505, "loss": 0.7301, "step": 1900 }, { "epoch": 0.2, "learning_rate": 0.00018559087085940812, "loss": 0.7061, "step": 1901 }, { "epoch": 0.2, "learning_rate": 0.00018557343089927714, "loss": 0.6918, "step": 1902 }, { "epoch": 0.2, "learning_rate": 0.0001855559812118246, "loss": 0.6646, "step": 1903 }, { "epoch": 0.2, "learning_rate": 0.000185538521799034, "loss": 0.6618, "step": 1904 }, { "epoch": 0.2, "learning_rate": 0.00018552105266289007, "loss": 0.7334, "step": 1905 }, { "epoch": 0.2, "learning_rate": 0.00018550357380537849, "loss": 0.7131, "step": 1906 }, { "epoch": 0.2, "learning_rate": 0.0001854860852284861, "loss": 0.6842, "step": 1907 }, { "epoch": 0.2, "learning_rate": 0.00018546858693420094, "loss": 0.6357, "step": 1908 }, { "epoch": 0.2, "learning_rate": 0.00018545107892451208, "loss": 0.7568, "step": 1909 }, { "epoch": 0.2, "learning_rate": 0.00018543356120140963, "loss": 0.6846, "step": 1910 }, { "epoch": 0.2, "learning_rate": 0.00018541603376688487, "loss": 0.6565, "step": 1911 }, { "epoch": 0.2, "learning_rate": 0.00018539849662293025, "loss": 0.7409, "step": 1912 }, { "epoch": 0.2, "learning_rate": 0.0001853809497715392, "loss": 0.6901, "step": 1913 }, { "epoch": 0.2, "learning_rate": 0.00018536339321470634, "loss": 0.7521, "step": 1914 }, { "epoch": 0.2, "learning_rate": 0.00018534582695442736, "loss": 0.7109, "step": 1915 }, { "epoch": 0.2, "learning_rate": 0.00018532825099269905, "loss": 0.6766, "step": 1916 }, { "epoch": 0.2, "learning_rate": 0.00018531066533151932, "loss": 0.6598, "step": 1917 }, { "epoch": 0.2, "learning_rate": 0.0001852930699728871, "loss": 0.6696, "step": 1918 }, { "epoch": 0.2, "learning_rate": 0.00018527546491880256, "loss": 0.645, "step": 1919 }, { "epoch": 0.2, "learning_rate": 0.00018525785017126694, "loss": 0.6998, "step": 1920 }, { "epoch": 0.2, "learning_rate": 0.00018524022573228248, "loss": 0.7192, "step": 1921 }, { "epoch": 0.2, "learning_rate": 0.0001852225916038526, "loss": 0.7435, "step": 1922 }, { "epoch": 0.2, "learning_rate": 0.00018520494778798184, "loss": 0.7205, "step": 1923 }, { "epoch": 0.2, "learning_rate": 0.00018518729428667577, "loss": 0.7763, "step": 1924 }, { "epoch": 0.2, "learning_rate": 0.00018516963110194116, "loss": 0.7604, "step": 1925 }, { "epoch": 0.2, "learning_rate": 0.00018515195823578577, "loss": 0.742, "step": 1926 }, { "epoch": 0.2, "learning_rate": 0.00018513427569021853, "loss": 0.7398, "step": 1927 }, { "epoch": 0.2, "learning_rate": 0.00018511658346724946, "loss": 0.6264, "step": 1928 }, { "epoch": 0.2, "learning_rate": 0.00018509888156888966, "loss": 0.6928, "step": 1929 }, { "epoch": 0.2, "learning_rate": 0.0001850811699971514, "loss": 0.7072, "step": 1930 }, { "epoch": 0.2, "learning_rate": 0.0001850634487540479, "loss": 0.6649, "step": 1931 }, { "epoch": 0.2, "learning_rate": 0.00018504571784159362, "loss": 0.6731, "step": 1932 }, { "epoch": 0.2, "learning_rate": 0.00018502797726180413, "loss": 0.704, "step": 1933 }, { "epoch": 0.2, "learning_rate": 0.00018501022701669593, "loss": 0.7038, "step": 1934 }, { "epoch": 0.2, "learning_rate": 0.00018499246710828682, "loss": 0.7077, "step": 1935 }, { "epoch": 0.2, "learning_rate": 0.00018497469753859556, "loss": 0.6921, "step": 1936 }, { "epoch": 0.2, "learning_rate": 0.0001849569183096421, "loss": 0.6128, "step": 1937 }, { "epoch": 0.2, "learning_rate": 0.00018493912942344737, "loss": 0.7057, "step": 1938 }, { "epoch": 0.2, "learning_rate": 0.00018492133088203355, "loss": 0.7097, "step": 1939 }, { "epoch": 0.2, "learning_rate": 0.0001849035226874238, "loss": 0.6596, "step": 1940 }, { "epoch": 0.2, "learning_rate": 0.00018488570484164238, "loss": 0.7389, "step": 1941 }, { "epoch": 0.2, "learning_rate": 0.00018486787734671477, "loss": 0.7247, "step": 1942 }, { "epoch": 0.2, "learning_rate": 0.0001848500402046674, "loss": 0.6437, "step": 1943 }, { "epoch": 0.2, "learning_rate": 0.00018483219341752788, "loss": 0.7375, "step": 1944 }, { "epoch": 0.2, "learning_rate": 0.0001848143369873249, "loss": 0.7009, "step": 1945 }, { "epoch": 0.2, "learning_rate": 0.00018479647091608823, "loss": 0.682, "step": 1946 }, { "epoch": 0.2, "learning_rate": 0.00018477859520584872, "loss": 0.6333, "step": 1947 }, { "epoch": 0.2, "learning_rate": 0.0001847607098586384, "loss": 0.7076, "step": 1948 }, { "epoch": 0.2, "learning_rate": 0.0001847428148764903, "loss": 0.7294, "step": 1949 }, { "epoch": 0.2, "learning_rate": 0.00018472491026143856, "loss": 0.7293, "step": 1950 }, { "epoch": 0.2, "learning_rate": 0.00018470699601551846, "loss": 0.692, "step": 1951 }, { "epoch": 0.2, "learning_rate": 0.0001846890721407664, "loss": 0.705, "step": 1952 }, { "epoch": 0.2, "learning_rate": 0.00018467113863921975, "loss": 0.6683, "step": 1953 }, { "epoch": 0.2, "learning_rate": 0.0001846531955129171, "loss": 0.7302, "step": 1954 }, { "epoch": 0.2, "learning_rate": 0.00018463524276389804, "loss": 0.6321, "step": 1955 }, { "epoch": 0.2, "learning_rate": 0.00018461728039420336, "loss": 0.7712, "step": 1956 }, { "epoch": 0.2, "learning_rate": 0.00018459930840587484, "loss": 0.6769, "step": 1957 }, { "epoch": 0.2, "learning_rate": 0.0001845813268009554, "loss": 0.6927, "step": 1958 }, { "epoch": 0.2, "learning_rate": 0.00018456333558148903, "loss": 0.7274, "step": 1959 }, { "epoch": 0.2, "learning_rate": 0.00018454533474952087, "loss": 0.7423, "step": 1960 }, { "epoch": 0.2, "learning_rate": 0.0001845273243070971, "loss": 0.7203, "step": 1961 }, { "epoch": 0.2, "learning_rate": 0.00018450930425626503, "loss": 0.6683, "step": 1962 }, { "epoch": 0.2, "learning_rate": 0.000184491274599073, "loss": 0.6934, "step": 1963 }, { "epoch": 0.2, "learning_rate": 0.0001844732353375705, "loss": 0.6987, "step": 1964 }, { "epoch": 0.2, "learning_rate": 0.00018445518647380808, "loss": 0.7285, "step": 1965 }, { "epoch": 0.2, "learning_rate": 0.0001844371280098374, "loss": 0.6845, "step": 1966 }, { "epoch": 0.2, "learning_rate": 0.00018441905994771125, "loss": 0.6981, "step": 1967 }, { "epoch": 0.2, "learning_rate": 0.0001844009822894834, "loss": 0.6647, "step": 1968 }, { "epoch": 0.2, "learning_rate": 0.00018438289503720881, "loss": 0.6498, "step": 1969 }, { "epoch": 0.21, "learning_rate": 0.00018436479819294345, "loss": 0.7261, "step": 1970 }, { "epoch": 0.21, "learning_rate": 0.00018434669175874452, "loss": 0.7423, "step": 1971 }, { "epoch": 0.21, "learning_rate": 0.00018432857573667019, "loss": 0.7129, "step": 1972 }, { "epoch": 0.21, "learning_rate": 0.00018431045012877966, "loss": 0.7014, "step": 1973 }, { "epoch": 0.21, "learning_rate": 0.0001842923149371334, "loss": 0.7165, "step": 1974 }, { "epoch": 0.21, "learning_rate": 0.00018427417016379286, "loss": 0.7063, "step": 1975 }, { "epoch": 0.21, "learning_rate": 0.00018425601581082058, "loss": 0.6886, "step": 1976 }, { "epoch": 0.21, "learning_rate": 0.00018423785188028026, "loss": 0.7247, "step": 1977 }, { "epoch": 0.21, "learning_rate": 0.00018421967837423654, "loss": 0.7507, "step": 1978 }, { "epoch": 0.21, "learning_rate": 0.00018420149529475532, "loss": 0.6879, "step": 1979 }, { "epoch": 0.21, "learning_rate": 0.00018418330264390346, "loss": 0.6727, "step": 1980 }, { "epoch": 0.21, "learning_rate": 0.00018416510042374898, "loss": 0.6792, "step": 1981 }, { "epoch": 0.21, "learning_rate": 0.000184146888636361, "loss": 0.745, "step": 1982 }, { "epoch": 0.21, "learning_rate": 0.00018412866728380965, "loss": 0.692, "step": 1983 }, { "epoch": 0.21, "learning_rate": 0.00018411043636816618, "loss": 0.7354, "step": 1984 }, { "epoch": 0.21, "learning_rate": 0.00018409219589150298, "loss": 0.7377, "step": 1985 }, { "epoch": 0.21, "learning_rate": 0.00018407394585589346, "loss": 0.6624, "step": 1986 }, { "epoch": 0.21, "learning_rate": 0.0001840556862634122, "loss": 0.716, "step": 1987 }, { "epoch": 0.21, "learning_rate": 0.00018403741711613472, "loss": 0.7292, "step": 1988 }, { "epoch": 0.21, "learning_rate": 0.00018401913841613774, "loss": 0.6981, "step": 1989 }, { "epoch": 0.21, "learning_rate": 0.00018400085016549906, "loss": 0.7069, "step": 1990 }, { "epoch": 0.21, "learning_rate": 0.00018398255236629755, "loss": 0.7714, "step": 1991 }, { "epoch": 0.21, "learning_rate": 0.00018396424502061312, "loss": 0.6806, "step": 1992 }, { "epoch": 0.21, "learning_rate": 0.00018394592813052686, "loss": 0.7556, "step": 1993 }, { "epoch": 0.21, "learning_rate": 0.0001839276016981209, "loss": 0.7199, "step": 1994 }, { "epoch": 0.21, "learning_rate": 0.0001839092657254784, "loss": 0.7382, "step": 1995 }, { "epoch": 0.21, "learning_rate": 0.00018389092021468364, "loss": 0.7036, "step": 1996 }, { "epoch": 0.21, "learning_rate": 0.00018387256516782204, "loss": 0.697, "step": 1997 }, { "epoch": 0.21, "learning_rate": 0.00018385420058698003, "loss": 0.7635, "step": 1998 }, { "epoch": 0.21, "learning_rate": 0.00018383582647424517, "loss": 0.7217, "step": 1999 }, { "epoch": 0.21, "learning_rate": 0.00018381744283170608, "loss": 0.7324, "step": 2000 }, { "epoch": 0.21, "learning_rate": 0.00018379904966145247, "loss": 0.7126, "step": 2001 }, { "epoch": 0.21, "learning_rate": 0.0001837806469655751, "loss": 0.6805, "step": 2002 }, { "epoch": 0.21, "learning_rate": 0.0001837622347461659, "loss": 0.7141, "step": 2003 }, { "epoch": 0.21, "learning_rate": 0.00018374381300531782, "loss": 0.7326, "step": 2004 }, { "epoch": 0.21, "learning_rate": 0.00018372538174512486, "loss": 0.7134, "step": 2005 }, { "epoch": 0.21, "learning_rate": 0.00018370694096768217, "loss": 0.6655, "step": 2006 }, { "epoch": 0.21, "learning_rate": 0.00018368849067508595, "loss": 0.7578, "step": 2007 }, { "epoch": 0.21, "learning_rate": 0.0001836700308694335, "loss": 0.6773, "step": 2008 }, { "epoch": 0.21, "learning_rate": 0.00018365156155282316, "loss": 0.7223, "step": 2009 }, { "epoch": 0.21, "learning_rate": 0.00018363308272735437, "loss": 0.7567, "step": 2010 }, { "epoch": 0.21, "learning_rate": 0.0001836145943951277, "loss": 0.6829, "step": 2011 }, { "epoch": 0.21, "learning_rate": 0.00018359609655824475, "loss": 0.6462, "step": 2012 }, { "epoch": 0.21, "learning_rate": 0.0001835775892188082, "loss": 0.7302, "step": 2013 }, { "epoch": 0.21, "learning_rate": 0.0001835590723789218, "loss": 0.7276, "step": 2014 }, { "epoch": 0.21, "learning_rate": 0.00018354054604069041, "loss": 0.7592, "step": 2015 }, { "epoch": 0.21, "learning_rate": 0.00018352201020622, "loss": 0.7092, "step": 2016 }, { "epoch": 0.21, "learning_rate": 0.00018350346487761753, "loss": 0.6902, "step": 2017 }, { "epoch": 0.21, "learning_rate": 0.00018348491005699114, "loss": 0.6765, "step": 2018 }, { "epoch": 0.21, "learning_rate": 0.0001834663457464499, "loss": 0.6844, "step": 2019 }, { "epoch": 0.21, "learning_rate": 0.00018344777194810417, "loss": 0.7494, "step": 2020 }, { "epoch": 0.21, "learning_rate": 0.00018342918866406525, "loss": 0.7404, "step": 2021 }, { "epoch": 0.21, "learning_rate": 0.00018341059589644548, "loss": 0.7017, "step": 2022 }, { "epoch": 0.21, "learning_rate": 0.00018339199364735838, "loss": 0.7267, "step": 2023 }, { "epoch": 0.21, "learning_rate": 0.0001833733819189185, "loss": 0.7356, "step": 2024 }, { "epoch": 0.21, "learning_rate": 0.00018335476071324152, "loss": 0.6662, "step": 2025 }, { "epoch": 0.21, "learning_rate": 0.0001833361300324441, "loss": 0.7137, "step": 2026 }, { "epoch": 0.21, "learning_rate": 0.00018331748987864406, "loss": 0.753, "step": 2027 }, { "epoch": 0.21, "learning_rate": 0.00018329884025396025, "loss": 0.704, "step": 2028 }, { "epoch": 0.21, "learning_rate": 0.0001832801811605126, "loss": 0.7074, "step": 2029 }, { "epoch": 0.21, "learning_rate": 0.00018326151260042223, "loss": 0.6399, "step": 2030 }, { "epoch": 0.21, "learning_rate": 0.0001832428345758111, "loss": 0.6991, "step": 2031 }, { "epoch": 0.21, "learning_rate": 0.00018322414708880243, "loss": 0.6757, "step": 2032 }, { "epoch": 0.21, "learning_rate": 0.00018320545014152053, "loss": 0.6588, "step": 2033 }, { "epoch": 0.21, "learning_rate": 0.00018318674373609062, "loss": 0.7063, "step": 2034 }, { "epoch": 0.21, "learning_rate": 0.0001831680278746392, "loss": 0.7074, "step": 2035 }, { "epoch": 0.21, "learning_rate": 0.00018314930255929366, "loss": 0.6974, "step": 2036 }, { "epoch": 0.21, "learning_rate": 0.0001831305677921826, "loss": 0.6642, "step": 2037 }, { "epoch": 0.21, "learning_rate": 0.00018311182357543562, "loss": 0.7037, "step": 2038 }, { "epoch": 0.21, "learning_rate": 0.00018309306991118343, "loss": 0.7183, "step": 2039 }, { "epoch": 0.21, "learning_rate": 0.00018307430680155777, "loss": 0.6735, "step": 2040 }, { "epoch": 0.21, "learning_rate": 0.00018305553424869154, "loss": 0.7359, "step": 2041 }, { "epoch": 0.21, "learning_rate": 0.0001830367522547186, "loss": 0.6793, "step": 2042 }, { "epoch": 0.21, "learning_rate": 0.00018301796082177395, "loss": 0.7451, "step": 2043 }, { "epoch": 0.21, "learning_rate": 0.00018299915995199372, "loss": 0.7345, "step": 2044 }, { "epoch": 0.21, "learning_rate": 0.00018298034964751495, "loss": 0.6481, "step": 2045 }, { "epoch": 0.21, "learning_rate": 0.00018296152991047594, "loss": 0.7095, "step": 2046 }, { "epoch": 0.21, "learning_rate": 0.00018294270074301593, "loss": 0.6994, "step": 2047 }, { "epoch": 0.21, "learning_rate": 0.0001829238621472752, "loss": 0.6599, "step": 2048 }, { "epoch": 0.21, "learning_rate": 0.00018290501412539532, "loss": 0.6484, "step": 2049 }, { "epoch": 0.21, "learning_rate": 0.00018288615667951867, "loss": 0.7233, "step": 2050 }, { "epoch": 0.21, "learning_rate": 0.00018286728981178888, "loss": 0.6356, "step": 2051 }, { "epoch": 0.21, "learning_rate": 0.00018284841352435055, "loss": 0.7332, "step": 2052 }, { "epoch": 0.21, "learning_rate": 0.00018282952781934945, "loss": 0.7469, "step": 2053 }, { "epoch": 0.21, "learning_rate": 0.00018281063269893225, "loss": 0.6876, "step": 2054 }, { "epoch": 0.21, "learning_rate": 0.00018279172816524692, "loss": 0.672, "step": 2055 }, { "epoch": 0.21, "learning_rate": 0.0001827728142204423, "loss": 0.6809, "step": 2056 }, { "epoch": 0.21, "learning_rate": 0.00018275389086666843, "loss": 0.685, "step": 2057 }, { "epoch": 0.21, "learning_rate": 0.00018273495810607632, "loss": 0.6957, "step": 2058 }, { "epoch": 0.21, "learning_rate": 0.00018271601594081814, "loss": 0.6998, "step": 2059 }, { "epoch": 0.21, "learning_rate": 0.00018269706437304707, "loss": 0.6894, "step": 2060 }, { "epoch": 0.21, "learning_rate": 0.0001826781034049174, "loss": 0.6104, "step": 2061 }, { "epoch": 0.21, "learning_rate": 0.0001826591330385844, "loss": 0.7259, "step": 2062 }, { "epoch": 0.21, "learning_rate": 0.00018264015327620458, "loss": 0.6594, "step": 2063 }, { "epoch": 0.21, "learning_rate": 0.0001826211641199353, "loss": 0.6988, "step": 2064 }, { "epoch": 0.21, "learning_rate": 0.0001826021655719352, "loss": 0.6982, "step": 2065 }, { "epoch": 0.22, "learning_rate": 0.0001825831576343638, "loss": 0.661, "step": 2066 }, { "epoch": 0.22, "learning_rate": 0.00018256414030938184, "loss": 0.7675, "step": 2067 }, { "epoch": 0.22, "learning_rate": 0.000182545113599151, "loss": 0.7057, "step": 2068 }, { "epoch": 0.22, "learning_rate": 0.00018252607750583413, "loss": 0.6747, "step": 2069 }, { "epoch": 0.22, "learning_rate": 0.00018250703203159512, "loss": 0.71, "step": 2070 }, { "epoch": 0.22, "learning_rate": 0.00018248797717859886, "loss": 0.7119, "step": 2071 }, { "epoch": 0.22, "learning_rate": 0.0001824689129490114, "loss": 0.7107, "step": 2072 }, { "epoch": 0.22, "learning_rate": 0.0001824498393449998, "loss": 0.7127, "step": 2073 }, { "epoch": 0.22, "learning_rate": 0.00018243075636873219, "loss": 0.6168, "step": 2074 }, { "epoch": 0.22, "learning_rate": 0.0001824116640223778, "loss": 0.6797, "step": 2075 }, { "epoch": 0.22, "learning_rate": 0.00018239256230810687, "loss": 0.66, "step": 2076 }, { "epoch": 0.22, "learning_rate": 0.00018237345122809075, "loss": 0.7218, "step": 2077 }, { "epoch": 0.22, "learning_rate": 0.0001823543307845018, "loss": 0.7307, "step": 2078 }, { "epoch": 0.22, "learning_rate": 0.00018233520097951357, "loss": 0.6991, "step": 2079 }, { "epoch": 0.22, "learning_rate": 0.00018231606181530049, "loss": 0.6206, "step": 2080 }, { "epoch": 0.22, "learning_rate": 0.00018229691329403825, "loss": 0.7334, "step": 2081 }, { "epoch": 0.22, "learning_rate": 0.0001822777554179034, "loss": 0.6832, "step": 2082 }, { "epoch": 0.22, "learning_rate": 0.0001822585881890737, "loss": 0.646, "step": 2083 }, { "epoch": 0.22, "learning_rate": 0.000182239411609728, "loss": 0.7353, "step": 2084 }, { "epoch": 0.22, "learning_rate": 0.00018222022568204605, "loss": 0.6838, "step": 2085 }, { "epoch": 0.22, "learning_rate": 0.00018220103040820877, "loss": 0.7583, "step": 2086 }, { "epoch": 0.22, "learning_rate": 0.00018218182579039818, "loss": 0.6778, "step": 2087 }, { "epoch": 0.22, "learning_rate": 0.0001821626118307973, "loss": 0.6878, "step": 2088 }, { "epoch": 0.22, "learning_rate": 0.00018214338853159018, "loss": 0.7691, "step": 2089 }, { "epoch": 0.22, "learning_rate": 0.00018212415589496199, "loss": 0.6765, "step": 2090 }, { "epoch": 0.22, "learning_rate": 0.00018210491392309897, "loss": 0.7297, "step": 2091 }, { "epoch": 0.22, "learning_rate": 0.0001820856626181884, "loss": 0.7211, "step": 2092 }, { "epoch": 0.22, "learning_rate": 0.00018206640198241859, "loss": 0.6789, "step": 2093 }, { "epoch": 0.22, "learning_rate": 0.00018204713201797895, "loss": 0.719, "step": 2094 }, { "epoch": 0.22, "learning_rate": 0.00018202785272705994, "loss": 0.6609, "step": 2095 }, { "epoch": 0.22, "learning_rate": 0.0001820085641118531, "loss": 0.6293, "step": 2096 }, { "epoch": 0.22, "learning_rate": 0.00018198926617455096, "loss": 0.643, "step": 2097 }, { "epoch": 0.22, "learning_rate": 0.00018196995891734723, "loss": 0.7138, "step": 2098 }, { "epoch": 0.22, "learning_rate": 0.00018195064234243654, "loss": 0.7118, "step": 2099 }, { "epoch": 0.22, "learning_rate": 0.00018193131645201466, "loss": 0.7254, "step": 2100 }, { "epoch": 0.22, "learning_rate": 0.00018191198124827847, "loss": 0.7061, "step": 2101 }, { "epoch": 0.22, "learning_rate": 0.0001818926367334258, "loss": 0.7222, "step": 2102 }, { "epoch": 0.22, "learning_rate": 0.00018187328290965554, "loss": 0.6858, "step": 2103 }, { "epoch": 0.22, "learning_rate": 0.00018185391977916778, "loss": 0.772, "step": 2104 }, { "epoch": 0.22, "learning_rate": 0.00018183454734416348, "loss": 0.7433, "step": 2105 }, { "epoch": 0.22, "learning_rate": 0.00018181516560684477, "loss": 0.7539, "step": 2106 }, { "epoch": 0.22, "learning_rate": 0.00018179577456941485, "loss": 0.7899, "step": 2107 }, { "epoch": 0.22, "learning_rate": 0.00018177637423407792, "loss": 0.7075, "step": 2108 }, { "epoch": 0.22, "learning_rate": 0.00018175696460303925, "loss": 0.6699, "step": 2109 }, { "epoch": 0.22, "learning_rate": 0.00018173754567850521, "loss": 0.7071, "step": 2110 }, { "epoch": 0.22, "learning_rate": 0.00018171811746268315, "loss": 0.6851, "step": 2111 }, { "epoch": 0.22, "learning_rate": 0.0001816986799577815, "loss": 0.6573, "step": 2112 }, { "epoch": 0.22, "learning_rate": 0.00018167923316600985, "loss": 0.7155, "step": 2113 }, { "epoch": 0.22, "learning_rate": 0.0001816597770895787, "loss": 0.7428, "step": 2114 }, { "epoch": 0.22, "learning_rate": 0.0001816403117306997, "loss": 0.6689, "step": 2115 }, { "epoch": 0.22, "learning_rate": 0.00018162083709158546, "loss": 0.6827, "step": 2116 }, { "epoch": 0.22, "learning_rate": 0.00018160135317444974, "loss": 0.7528, "step": 2117 }, { "epoch": 0.22, "learning_rate": 0.00018158185998150733, "loss": 0.6723, "step": 2118 }, { "epoch": 0.22, "learning_rate": 0.00018156235751497408, "loss": 0.7234, "step": 2119 }, { "epoch": 0.22, "learning_rate": 0.00018154284577706685, "loss": 0.6518, "step": 2120 }, { "epoch": 0.22, "learning_rate": 0.00018152332477000354, "loss": 0.7073, "step": 2121 }, { "epoch": 0.22, "learning_rate": 0.00018150379449600323, "loss": 0.7288, "step": 2122 }, { "epoch": 0.22, "learning_rate": 0.00018148425495728593, "loss": 0.7058, "step": 2123 }, { "epoch": 0.22, "learning_rate": 0.00018146470615607274, "loss": 0.6925, "step": 2124 }, { "epoch": 0.22, "learning_rate": 0.00018144514809458582, "loss": 0.7347, "step": 2125 }, { "epoch": 0.22, "learning_rate": 0.00018142558077504837, "loss": 0.6787, "step": 2126 }, { "epoch": 0.22, "learning_rate": 0.00018140600419968469, "loss": 0.7012, "step": 2127 }, { "epoch": 0.22, "learning_rate": 0.00018138641837072003, "loss": 0.7051, "step": 2128 }, { "epoch": 0.22, "learning_rate": 0.00018136682329038083, "loss": 0.6932, "step": 2129 }, { "epoch": 0.22, "learning_rate": 0.00018134721896089442, "loss": 0.743, "step": 2130 }, { "epoch": 0.22, "learning_rate": 0.00018132760538448932, "loss": 0.6865, "step": 2131 }, { "epoch": 0.22, "learning_rate": 0.00018130798256339503, "loss": 0.6422, "step": 2132 }, { "epoch": 0.22, "learning_rate": 0.00018128835049984217, "loss": 0.7144, "step": 2133 }, { "epoch": 0.22, "learning_rate": 0.00018126870919606228, "loss": 0.7915, "step": 2134 }, { "epoch": 0.22, "learning_rate": 0.00018124905865428808, "loss": 0.7157, "step": 2135 }, { "epoch": 0.22, "learning_rate": 0.00018122939887675328, "loss": 0.7046, "step": 2136 }, { "epoch": 0.22, "learning_rate": 0.00018120972986569264, "loss": 0.7226, "step": 2137 }, { "epoch": 0.22, "learning_rate": 0.000181190051623342, "loss": 0.7396, "step": 2138 }, { "epoch": 0.22, "learning_rate": 0.00018117036415193823, "loss": 0.7218, "step": 2139 }, { "epoch": 0.22, "learning_rate": 0.00018115066745371926, "loss": 0.7131, "step": 2140 }, { "epoch": 0.22, "learning_rate": 0.000181130961530924, "loss": 0.6888, "step": 2141 }, { "epoch": 0.22, "learning_rate": 0.00018111124638579251, "loss": 0.7039, "step": 2142 }, { "epoch": 0.22, "learning_rate": 0.00018109152202056586, "loss": 0.6735, "step": 2143 }, { "epoch": 0.22, "learning_rate": 0.00018107178843748613, "loss": 0.6914, "step": 2144 }, { "epoch": 0.22, "learning_rate": 0.00018105204563879652, "loss": 0.7105, "step": 2145 }, { "epoch": 0.22, "learning_rate": 0.0001810322936267412, "loss": 0.6757, "step": 2146 }, { "epoch": 0.22, "learning_rate": 0.00018101253240356547, "loss": 0.7271, "step": 2147 }, { "epoch": 0.22, "learning_rate": 0.00018099276197151555, "loss": 0.6962, "step": 2148 }, { "epoch": 0.22, "learning_rate": 0.00018097298233283888, "loss": 0.7213, "step": 2149 }, { "epoch": 0.22, "learning_rate": 0.00018095319348978382, "loss": 0.7122, "step": 2150 }, { "epoch": 0.22, "learning_rate": 0.0001809333954445998, "loss": 0.6302, "step": 2151 }, { "epoch": 0.22, "learning_rate": 0.00018091358819953733, "loss": 0.6956, "step": 2152 }, { "epoch": 0.22, "learning_rate": 0.00018089377175684789, "loss": 0.6972, "step": 2153 }, { "epoch": 0.22, "learning_rate": 0.00018087394611878414, "loss": 0.6811, "step": 2154 }, { "epoch": 0.22, "learning_rate": 0.00018085411128759965, "loss": 0.7014, "step": 2155 }, { "epoch": 0.22, "learning_rate": 0.0001808342672655491, "loss": 0.66, "step": 2156 }, { "epoch": 0.22, "learning_rate": 0.0001808144140548882, "loss": 0.7318, "step": 2157 }, { "epoch": 0.22, "learning_rate": 0.00018079455165787372, "loss": 0.7007, "step": 2158 }, { "epoch": 0.22, "learning_rate": 0.00018077468007676351, "loss": 0.7183, "step": 2159 }, { "epoch": 0.22, "learning_rate": 0.0001807547993138163, "loss": 0.7151, "step": 2160 }, { "epoch": 0.22, "learning_rate": 0.00018073490937129208, "loss": 0.7083, "step": 2161 }, { "epoch": 0.23, "learning_rate": 0.00018071501025145175, "loss": 0.6601, "step": 2162 }, { "epoch": 0.23, "learning_rate": 0.00018069510195655727, "loss": 0.6799, "step": 2163 }, { "epoch": 0.23, "learning_rate": 0.00018067518448887165, "loss": 0.6635, "step": 2164 }, { "epoch": 0.23, "learning_rate": 0.000180655257850659, "loss": 0.7174, "step": 2165 }, { "epoch": 0.23, "learning_rate": 0.00018063532204418443, "loss": 0.6736, "step": 2166 }, { "epoch": 0.23, "learning_rate": 0.00018061537707171404, "loss": 0.6951, "step": 2167 }, { "epoch": 0.23, "learning_rate": 0.00018059542293551503, "loss": 0.6996, "step": 2168 }, { "epoch": 0.23, "learning_rate": 0.00018057545963785567, "loss": 0.674, "step": 2169 }, { "epoch": 0.23, "learning_rate": 0.0001805554871810052, "loss": 0.6951, "step": 2170 }, { "epoch": 0.23, "learning_rate": 0.00018053550556723394, "loss": 0.6717, "step": 2171 }, { "epoch": 0.23, "learning_rate": 0.0001805155147988132, "loss": 0.6777, "step": 2172 }, { "epoch": 0.23, "learning_rate": 0.00018049551487801547, "loss": 0.6601, "step": 2173 }, { "epoch": 0.23, "learning_rate": 0.0001804755058071141, "loss": 0.6977, "step": 2174 }, { "epoch": 0.23, "learning_rate": 0.0001804554875883836, "loss": 0.6878, "step": 2175 }, { "epoch": 0.23, "learning_rate": 0.0001804354602240995, "loss": 0.7448, "step": 2176 }, { "epoch": 0.23, "learning_rate": 0.0001804154237165383, "loss": 0.7325, "step": 2177 }, { "epoch": 0.23, "learning_rate": 0.0001803953780679777, "loss": 0.7313, "step": 2178 }, { "epoch": 0.23, "learning_rate": 0.0001803753232806962, "loss": 0.7603, "step": 2179 }, { "epoch": 0.23, "learning_rate": 0.00018035525935697355, "loss": 0.6555, "step": 2180 }, { "epoch": 0.23, "learning_rate": 0.00018033518629909044, "loss": 0.6927, "step": 2181 }, { "epoch": 0.23, "learning_rate": 0.00018031510410932867, "loss": 0.733, "step": 2182 }, { "epoch": 0.23, "learning_rate": 0.00018029501278997095, "loss": 0.6903, "step": 2183 }, { "epoch": 0.23, "learning_rate": 0.00018027491234330113, "loss": 0.6484, "step": 2184 }, { "epoch": 0.23, "learning_rate": 0.00018025480277160413, "loss": 0.6685, "step": 2185 }, { "epoch": 0.23, "learning_rate": 0.00018023468407716575, "loss": 0.7063, "step": 2186 }, { "epoch": 0.23, "learning_rate": 0.000180214556262273, "loss": 0.7618, "step": 2187 }, { "epoch": 0.23, "learning_rate": 0.00018019441932921382, "loss": 0.7151, "step": 2188 }, { "epoch": 0.23, "learning_rate": 0.00018017427328027722, "loss": 0.7326, "step": 2189 }, { "epoch": 0.23, "learning_rate": 0.0001801541181177533, "loss": 0.7751, "step": 2190 }, { "epoch": 0.23, "learning_rate": 0.00018013395384393306, "loss": 0.7615, "step": 2191 }, { "epoch": 0.23, "learning_rate": 0.00018011378046110867, "loss": 0.6834, "step": 2192 }, { "epoch": 0.23, "learning_rate": 0.00018009359797157326, "loss": 0.6875, "step": 2193 }, { "epoch": 0.23, "learning_rate": 0.00018007340637762106, "loss": 0.7007, "step": 2194 }, { "epoch": 0.23, "learning_rate": 0.0001800532056815472, "loss": 0.6325, "step": 2195 }, { "epoch": 0.23, "learning_rate": 0.00018003299588564806, "loss": 0.7317, "step": 2196 }, { "epoch": 0.23, "learning_rate": 0.00018001277699222085, "loss": 0.6952, "step": 2197 }, { "epoch": 0.23, "learning_rate": 0.0001799925490035639, "loss": 0.6832, "step": 2198 }, { "epoch": 0.23, "learning_rate": 0.0001799723119219766, "loss": 0.7411, "step": 2199 }, { "epoch": 0.23, "learning_rate": 0.00017995206574975933, "loss": 0.7323, "step": 2200 }, { "epoch": 0.23, "learning_rate": 0.0001799318104892135, "loss": 0.7112, "step": 2201 }, { "epoch": 0.23, "learning_rate": 0.00017991154614264163, "loss": 0.6772, "step": 2202 }, { "epoch": 0.23, "learning_rate": 0.00017989127271234715, "loss": 0.7041, "step": 2203 }, { "epoch": 0.23, "learning_rate": 0.00017987099020063462, "loss": 0.7338, "step": 2204 }, { "epoch": 0.23, "learning_rate": 0.00017985069860980958, "loss": 0.67, "step": 2205 }, { "epoch": 0.23, "learning_rate": 0.00017983039794217863, "loss": 0.6783, "step": 2206 }, { "epoch": 0.23, "learning_rate": 0.0001798100882000494, "loss": 0.6903, "step": 2207 }, { "epoch": 0.23, "learning_rate": 0.0001797897693857305, "loss": 0.7463, "step": 2208 }, { "epoch": 0.23, "learning_rate": 0.00017976944150153166, "loss": 0.6913, "step": 2209 }, { "epoch": 0.23, "learning_rate": 0.00017974910454976358, "loss": 0.7501, "step": 2210 }, { "epoch": 0.23, "learning_rate": 0.00017972875853273802, "loss": 0.6911, "step": 2211 }, { "epoch": 0.23, "learning_rate": 0.00017970840345276772, "loss": 0.6982, "step": 2212 }, { "epoch": 0.23, "learning_rate": 0.00017968803931216654, "loss": 0.7032, "step": 2213 }, { "epoch": 0.23, "learning_rate": 0.00017966766611324928, "loss": 0.7371, "step": 2214 }, { "epoch": 0.23, "learning_rate": 0.00017964728385833181, "loss": 0.7463, "step": 2215 }, { "epoch": 0.23, "learning_rate": 0.00017962689254973104, "loss": 0.7016, "step": 2216 }, { "epoch": 0.23, "learning_rate": 0.0001796064921897649, "loss": 0.7201, "step": 2217 }, { "epoch": 0.23, "learning_rate": 0.00017958608278075228, "loss": 0.7257, "step": 2218 }, { "epoch": 0.23, "learning_rate": 0.00017956566432501326, "loss": 0.6854, "step": 2219 }, { "epoch": 0.23, "learning_rate": 0.0001795452368248688, "loss": 0.733, "step": 2220 }, { "epoch": 0.23, "learning_rate": 0.00017952480028264093, "loss": 0.6644, "step": 2221 }, { "epoch": 0.23, "learning_rate": 0.00017950435470065275, "loss": 0.6467, "step": 2222 }, { "epoch": 0.23, "learning_rate": 0.00017948390008122833, "loss": 0.6552, "step": 2223 }, { "epoch": 0.23, "learning_rate": 0.0001794634364266928, "loss": 0.7045, "step": 2224 }, { "epoch": 0.23, "learning_rate": 0.0001794429637393723, "loss": 0.6799, "step": 2225 }, { "epoch": 0.23, "learning_rate": 0.00017942248202159402, "loss": 0.7327, "step": 2226 }, { "epoch": 0.23, "learning_rate": 0.00017940199127568614, "loss": 0.6393, "step": 2227 }, { "epoch": 0.23, "learning_rate": 0.00017938149150397795, "loss": 0.7055, "step": 2228 }, { "epoch": 0.23, "learning_rate": 0.0001793609827087996, "loss": 0.6409, "step": 2229 }, { "epoch": 0.23, "learning_rate": 0.00017934046489248248, "loss": 0.7373, "step": 2230 }, { "epoch": 0.23, "learning_rate": 0.00017931993805735878, "loss": 0.7162, "step": 2231 }, { "epoch": 0.23, "learning_rate": 0.00017929940220576195, "loss": 0.6623, "step": 2232 }, { "epoch": 0.23, "learning_rate": 0.00017927885734002628, "loss": 0.6896, "step": 2233 }, { "epoch": 0.23, "learning_rate": 0.00017925830346248716, "loss": 0.6549, "step": 2234 }, { "epoch": 0.23, "learning_rate": 0.00017923774057548096, "loss": 0.669, "step": 2235 }, { "epoch": 0.23, "learning_rate": 0.0001792171686813452, "loss": 0.677, "step": 2236 }, { "epoch": 0.23, "learning_rate": 0.00017919658778241826, "loss": 0.7093, "step": 2237 }, { "epoch": 0.23, "learning_rate": 0.00017917599788103963, "loss": 0.7149, "step": 2238 }, { "epoch": 0.23, "learning_rate": 0.0001791553989795498, "loss": 0.6797, "step": 2239 }, { "epoch": 0.23, "learning_rate": 0.0001791347910802903, "loss": 0.7291, "step": 2240 }, { "epoch": 0.23, "learning_rate": 0.00017911417418560373, "loss": 0.6829, "step": 2241 }, { "epoch": 0.23, "learning_rate": 0.00017909354829783358, "loss": 0.6869, "step": 2242 }, { "epoch": 0.23, "learning_rate": 0.00017907291341932443, "loss": 0.7037, "step": 2243 }, { "epoch": 0.23, "learning_rate": 0.00017905226955242202, "loss": 0.6895, "step": 2244 }, { "epoch": 0.23, "learning_rate": 0.00017903161669947283, "loss": 0.7033, "step": 2245 }, { "epoch": 0.23, "learning_rate": 0.00017901095486282461, "loss": 0.7669, "step": 2246 }, { "epoch": 0.23, "learning_rate": 0.000178990284044826, "loss": 0.6559, "step": 2247 }, { "epoch": 0.23, "learning_rate": 0.00017896960424782673, "loss": 0.7853, "step": 2248 }, { "epoch": 0.23, "learning_rate": 0.00017894891547417746, "loss": 0.7468, "step": 2249 }, { "epoch": 0.23, "learning_rate": 0.00017892821772623, "loss": 0.6851, "step": 2250 }, { "epoch": 0.23, "learning_rate": 0.00017890751100633706, "loss": 0.7566, "step": 2251 }, { "epoch": 0.23, "learning_rate": 0.0001788867953168524, "loss": 0.6988, "step": 2252 }, { "epoch": 0.23, "learning_rate": 0.00017886607066013087, "loss": 0.6762, "step": 2253 }, { "epoch": 0.23, "learning_rate": 0.0001788453370385283, "loss": 0.6772, "step": 2254 }, { "epoch": 0.23, "learning_rate": 0.00017882459445440146, "loss": 0.6882, "step": 2255 }, { "epoch": 0.23, "learning_rate": 0.00017880384291010825, "loss": 0.676, "step": 2256 }, { "epoch": 0.23, "learning_rate": 0.00017878308240800754, "loss": 0.7251, "step": 2257 }, { "epoch": 0.24, "learning_rate": 0.0001787623129504592, "loss": 0.7012, "step": 2258 }, { "epoch": 0.24, "learning_rate": 0.0001787415345398242, "loss": 0.7606, "step": 2259 }, { "epoch": 0.24, "learning_rate": 0.0001787207471784644, "loss": 0.7169, "step": 2260 }, { "epoch": 0.24, "learning_rate": 0.00017869995086874273, "loss": 0.6525, "step": 2261 }, { "epoch": 0.24, "learning_rate": 0.00017867914561302324, "loss": 0.6841, "step": 2262 }, { "epoch": 0.24, "learning_rate": 0.00017865833141367086, "loss": 0.738, "step": 2263 }, { "epoch": 0.24, "learning_rate": 0.00017863750827305157, "loss": 0.7504, "step": 2264 }, { "epoch": 0.24, "learning_rate": 0.0001786166761935324, "loss": 0.6534, "step": 2265 }, { "epoch": 0.24, "learning_rate": 0.0001785958351774814, "loss": 0.7361, "step": 2266 }, { "epoch": 0.24, "learning_rate": 0.00017857498522726758, "loss": 0.6567, "step": 2267 }, { "epoch": 0.24, "learning_rate": 0.00017855412634526103, "loss": 0.6951, "step": 2268 }, { "epoch": 0.24, "learning_rate": 0.0001785332585338328, "loss": 0.6582, "step": 2269 }, { "epoch": 0.24, "learning_rate": 0.000178512381795355, "loss": 0.7105, "step": 2270 }, { "epoch": 0.24, "learning_rate": 0.00017849149613220072, "loss": 0.7025, "step": 2271 }, { "epoch": 0.24, "learning_rate": 0.00017847060154674407, "loss": 0.6244, "step": 2272 }, { "epoch": 0.24, "learning_rate": 0.00017844969804136021, "loss": 0.7053, "step": 2273 }, { "epoch": 0.24, "learning_rate": 0.00017842878561842527, "loss": 0.6664, "step": 2274 }, { "epoch": 0.24, "learning_rate": 0.00017840786428031642, "loss": 0.6626, "step": 2275 }, { "epoch": 0.24, "learning_rate": 0.00017838693402941183, "loss": 0.6495, "step": 2276 }, { "epoch": 0.24, "learning_rate": 0.0001783659948680907, "loss": 0.6712, "step": 2277 }, { "epoch": 0.24, "learning_rate": 0.00017834504679873324, "loss": 0.7506, "step": 2278 }, { "epoch": 0.24, "learning_rate": 0.00017832408982372061, "loss": 0.6655, "step": 2279 }, { "epoch": 0.24, "learning_rate": 0.0001783031239454351, "loss": 0.7203, "step": 2280 }, { "epoch": 0.24, "learning_rate": 0.0001782821491662599, "loss": 0.7074, "step": 2281 }, { "epoch": 0.24, "learning_rate": 0.00017826116548857928, "loss": 0.7064, "step": 2282 }, { "epoch": 0.24, "learning_rate": 0.0001782401729147785, "loss": 0.5952, "step": 2283 }, { "epoch": 0.24, "learning_rate": 0.00017821917144724382, "loss": 0.7328, "step": 2284 }, { "epoch": 0.24, "learning_rate": 0.00017819816108836256, "loss": 0.692, "step": 2285 }, { "epoch": 0.24, "learning_rate": 0.00017817714184052298, "loss": 0.7219, "step": 2286 }, { "epoch": 0.24, "learning_rate": 0.00017815611370611444, "loss": 0.7067, "step": 2287 }, { "epoch": 0.24, "learning_rate": 0.00017813507668752713, "loss": 0.7044, "step": 2288 }, { "epoch": 0.24, "learning_rate": 0.0001781140307871525, "loss": 0.743, "step": 2289 }, { "epoch": 0.24, "learning_rate": 0.00017809297600738283, "loss": 0.7301, "step": 2290 }, { "epoch": 0.24, "learning_rate": 0.00017807191235061145, "loss": 0.6705, "step": 2291 }, { "epoch": 0.24, "learning_rate": 0.00017805083981923273, "loss": 0.7016, "step": 2292 }, { "epoch": 0.24, "learning_rate": 0.00017802975841564207, "loss": 0.6961, "step": 2293 }, { "epoch": 0.24, "learning_rate": 0.0001780086681422358, "loss": 0.7626, "step": 2294 }, { "epoch": 0.24, "learning_rate": 0.00017798756900141128, "loss": 0.6996, "step": 2295 }, { "epoch": 0.24, "learning_rate": 0.00017796646099556697, "loss": 0.6774, "step": 2296 }, { "epoch": 0.24, "learning_rate": 0.00017794534412710213, "loss": 0.6745, "step": 2297 }, { "epoch": 0.24, "learning_rate": 0.00017792421839841728, "loss": 0.6822, "step": 2298 }, { "epoch": 0.24, "learning_rate": 0.00017790308381191382, "loss": 0.6723, "step": 2299 }, { "epoch": 0.24, "learning_rate": 0.00017788194036999413, "loss": 0.7666, "step": 2300 }, { "epoch": 0.24, "learning_rate": 0.00017786078807506162, "loss": 0.5848, "step": 2301 }, { "epoch": 0.24, "learning_rate": 0.00017783962692952075, "loss": 0.7252, "step": 2302 }, { "epoch": 0.24, "learning_rate": 0.00017781845693577695, "loss": 0.6936, "step": 2303 }, { "epoch": 0.24, "learning_rate": 0.00017779727809623662, "loss": 0.6659, "step": 2304 }, { "epoch": 0.24, "learning_rate": 0.00017777609041330728, "loss": 0.6946, "step": 2305 }, { "epoch": 0.24, "learning_rate": 0.0001777548938893973, "loss": 0.7265, "step": 2306 }, { "epoch": 0.24, "learning_rate": 0.00017773368852691621, "loss": 0.699, "step": 2307 }, { "epoch": 0.24, "learning_rate": 0.0001777124743282744, "loss": 0.6931, "step": 2308 }, { "epoch": 0.24, "learning_rate": 0.0001776912512958834, "loss": 0.7767, "step": 2309 }, { "epoch": 0.24, "learning_rate": 0.00017767001943215562, "loss": 0.7175, "step": 2310 }, { "epoch": 0.24, "learning_rate": 0.0001776487787395046, "loss": 0.7658, "step": 2311 }, { "epoch": 0.24, "learning_rate": 0.00017762752922034474, "loss": 0.7409, "step": 2312 }, { "epoch": 0.24, "learning_rate": 0.00017760627087709158, "loss": 0.7128, "step": 2313 }, { "epoch": 0.24, "learning_rate": 0.0001775850037121616, "loss": 0.6952, "step": 2314 }, { "epoch": 0.24, "learning_rate": 0.00017756372772797225, "loss": 0.692, "step": 2315 }, { "epoch": 0.24, "learning_rate": 0.00017754244292694202, "loss": 0.6412, "step": 2316 }, { "epoch": 0.24, "learning_rate": 0.00017752114931149046, "loss": 0.6837, "step": 2317 }, { "epoch": 0.24, "learning_rate": 0.00017749984688403796, "loss": 0.7221, "step": 2318 }, { "epoch": 0.24, "learning_rate": 0.00017747853564700612, "loss": 0.6853, "step": 2319 }, { "epoch": 0.24, "learning_rate": 0.00017745721560281737, "loss": 0.7186, "step": 2320 }, { "epoch": 0.24, "learning_rate": 0.00017743588675389523, "loss": 0.6759, "step": 2321 }, { "epoch": 0.24, "learning_rate": 0.0001774145491026642, "loss": 0.7583, "step": 2322 }, { "epoch": 0.24, "learning_rate": 0.00017739320265154973, "loss": 0.7171, "step": 2323 }, { "epoch": 0.24, "learning_rate": 0.00017737184740297841, "loss": 0.5724, "step": 2324 }, { "epoch": 0.24, "learning_rate": 0.00017735048335937767, "loss": 0.6459, "step": 2325 }, { "epoch": 0.24, "learning_rate": 0.00017732911052317603, "loss": 0.7604, "step": 2326 }, { "epoch": 0.24, "learning_rate": 0.00017730772889680297, "loss": 0.6541, "step": 2327 }, { "epoch": 0.24, "learning_rate": 0.000177286338482689, "loss": 0.6646, "step": 2328 }, { "epoch": 0.24, "learning_rate": 0.00017726493928326564, "loss": 0.7979, "step": 2329 }, { "epoch": 0.24, "learning_rate": 0.00017724353130096535, "loss": 0.701, "step": 2330 }, { "epoch": 0.24, "learning_rate": 0.00017722211453822162, "loss": 0.6552, "step": 2331 }, { "epoch": 0.24, "learning_rate": 0.00017720068899746897, "loss": 0.7123, "step": 2332 }, { "epoch": 0.24, "learning_rate": 0.00017717925468114287, "loss": 0.6344, "step": 2333 }, { "epoch": 0.24, "learning_rate": 0.0001771578115916798, "loss": 0.7348, "step": 2334 }, { "epoch": 0.24, "learning_rate": 0.00017713635973151724, "loss": 0.6894, "step": 2335 }, { "epoch": 0.24, "learning_rate": 0.0001771148991030937, "loss": 0.6572, "step": 2336 }, { "epoch": 0.24, "learning_rate": 0.00017709342970884868, "loss": 0.6609, "step": 2337 }, { "epoch": 0.24, "learning_rate": 0.00017707195155122258, "loss": 0.6948, "step": 2338 }, { "epoch": 0.24, "learning_rate": 0.00017705046463265691, "loss": 0.7095, "step": 2339 }, { "epoch": 0.24, "learning_rate": 0.00017702896895559412, "loss": 0.723, "step": 2340 }, { "epoch": 0.24, "learning_rate": 0.0001770074645224777, "loss": 0.7244, "step": 2341 }, { "epoch": 0.24, "learning_rate": 0.00017698595133575204, "loss": 0.6995, "step": 2342 }, { "epoch": 0.24, "learning_rate": 0.0001769644293978627, "loss": 0.6912, "step": 2343 }, { "epoch": 0.24, "learning_rate": 0.00017694289871125602, "loss": 0.6981, "step": 2344 }, { "epoch": 0.24, "learning_rate": 0.0001769213592783795, "loss": 0.7241, "step": 2345 }, { "epoch": 0.24, "learning_rate": 0.00017689981110168156, "loss": 0.6746, "step": 2346 }, { "epoch": 0.24, "learning_rate": 0.00017687825418361165, "loss": 0.6518, "step": 2347 }, { "epoch": 0.24, "learning_rate": 0.00017685668852662016, "loss": 0.7403, "step": 2348 }, { "epoch": 0.24, "learning_rate": 0.00017683511413315851, "loss": 0.6865, "step": 2349 }, { "epoch": 0.24, "learning_rate": 0.00017681353100567915, "loss": 0.688, "step": 2350 }, { "epoch": 0.24, "learning_rate": 0.00017679193914663541, "loss": 0.6416, "step": 2351 }, { "epoch": 0.24, "learning_rate": 0.00017677033855848176, "loss": 0.6631, "step": 2352 }, { "epoch": 0.24, "learning_rate": 0.00017674872924367354, "loss": 0.6759, "step": 2353 }, { "epoch": 0.25, "learning_rate": 0.00017672711120466711, "loss": 0.7444, "step": 2354 }, { "epoch": 0.25, "learning_rate": 0.0001767054844439199, "loss": 0.6737, "step": 2355 }, { "epoch": 0.25, "learning_rate": 0.00017668384896389025, "loss": 0.6804, "step": 2356 }, { "epoch": 0.25, "learning_rate": 0.0001766622047670375, "loss": 0.7241, "step": 2357 }, { "epoch": 0.25, "learning_rate": 0.000176640551855822, "loss": 0.7074, "step": 2358 }, { "epoch": 0.25, "learning_rate": 0.00017661889023270507, "loss": 0.6771, "step": 2359 }, { "epoch": 0.25, "learning_rate": 0.00017659721990014905, "loss": 0.7109, "step": 2360 }, { "epoch": 0.25, "learning_rate": 0.00017657554086061725, "loss": 0.7452, "step": 2361 }, { "epoch": 0.25, "learning_rate": 0.00017655385311657402, "loss": 0.6956, "step": 2362 }, { "epoch": 0.25, "learning_rate": 0.00017653215667048455, "loss": 0.6233, "step": 2363 }, { "epoch": 0.25, "learning_rate": 0.00017651045152481523, "loss": 0.7288, "step": 2364 }, { "epoch": 0.25, "learning_rate": 0.00017648873768203328, "loss": 0.6294, "step": 2365 }, { "epoch": 0.25, "learning_rate": 0.00017646701514460693, "loss": 0.7234, "step": 2366 }, { "epoch": 0.25, "learning_rate": 0.00017644528391500553, "loss": 0.6329, "step": 2367 }, { "epoch": 0.25, "learning_rate": 0.0001764235439956992, "loss": 0.607, "step": 2368 }, { "epoch": 0.25, "learning_rate": 0.00017640179538915923, "loss": 0.6838, "step": 2369 }, { "epoch": 0.25, "learning_rate": 0.00017638003809785784, "loss": 0.7164, "step": 2370 }, { "epoch": 0.25, "learning_rate": 0.0001763582721242682, "loss": 0.6973, "step": 2371 }, { "epoch": 0.25, "learning_rate": 0.00017633649747086452, "loss": 0.6754, "step": 2372 }, { "epoch": 0.25, "learning_rate": 0.00017631471414012194, "loss": 0.6841, "step": 2373 }, { "epoch": 0.25, "learning_rate": 0.00017629292213451665, "loss": 0.7431, "step": 2374 }, { "epoch": 0.25, "learning_rate": 0.00017627112145652575, "loss": 0.7246, "step": 2375 }, { "epoch": 0.25, "learning_rate": 0.00017624931210862745, "loss": 0.7147, "step": 2376 }, { "epoch": 0.25, "learning_rate": 0.00017622749409330082, "loss": 0.6666, "step": 2377 }, { "epoch": 0.25, "learning_rate": 0.00017620566741302594, "loss": 0.6832, "step": 2378 }, { "epoch": 0.25, "learning_rate": 0.00017618383207028393, "loss": 0.6867, "step": 2379 }, { "epoch": 0.25, "learning_rate": 0.00017616198806755687, "loss": 0.7428, "step": 2380 }, { "epoch": 0.25, "learning_rate": 0.00017614013540732777, "loss": 0.6919, "step": 2381 }, { "epoch": 0.25, "learning_rate": 0.00017611827409208072, "loss": 0.7445, "step": 2382 }, { "epoch": 0.25, "learning_rate": 0.00017609640412430072, "loss": 0.7176, "step": 2383 }, { "epoch": 0.25, "learning_rate": 0.0001760745255064738, "loss": 0.6845, "step": 2384 }, { "epoch": 0.25, "learning_rate": 0.00017605263824108694, "loss": 0.7591, "step": 2385 }, { "epoch": 0.25, "learning_rate": 0.00017603074233062807, "loss": 0.7493, "step": 2386 }, { "epoch": 0.25, "learning_rate": 0.00017600883777758622, "loss": 0.7038, "step": 2387 }, { "epoch": 0.25, "learning_rate": 0.00017598692458445128, "loss": 0.6766, "step": 2388 }, { "epoch": 0.25, "learning_rate": 0.00017596500275371418, "loss": 0.7471, "step": 2389 }, { "epoch": 0.25, "learning_rate": 0.00017594307228786682, "loss": 0.6753, "step": 2390 }, { "epoch": 0.25, "learning_rate": 0.0001759211331894021, "loss": 0.7333, "step": 2391 }, { "epoch": 0.25, "learning_rate": 0.0001758991854608139, "loss": 0.6958, "step": 2392 }, { "epoch": 0.25, "learning_rate": 0.000175877229104597, "loss": 0.7354, "step": 2393 }, { "epoch": 0.25, "learning_rate": 0.00017585526412324732, "loss": 0.7276, "step": 2394 }, { "epoch": 0.25, "learning_rate": 0.00017583329051926158, "loss": 0.673, "step": 2395 }, { "epoch": 0.25, "learning_rate": 0.00017581130829513763, "loss": 0.6174, "step": 2396 }, { "epoch": 0.25, "learning_rate": 0.00017578931745337422, "loss": 0.6604, "step": 2397 }, { "epoch": 0.25, "learning_rate": 0.0001757673179964711, "loss": 0.7279, "step": 2398 }, { "epoch": 0.25, "learning_rate": 0.000175745309926929, "loss": 0.7003, "step": 2399 }, { "epoch": 0.25, "learning_rate": 0.0001757232932472496, "loss": 0.6665, "step": 2400 }, { "epoch": 0.25, "learning_rate": 0.0001757012679599356, "loss": 0.7514, "step": 2401 }, { "epoch": 0.25, "learning_rate": 0.00017567923406749066, "loss": 0.6579, "step": 2402 }, { "epoch": 0.25, "learning_rate": 0.00017565719157241946, "loss": 0.6677, "step": 2403 }, { "epoch": 0.25, "learning_rate": 0.00017563514047722758, "loss": 0.6392, "step": 2404 }, { "epoch": 0.25, "learning_rate": 0.00017561308078442158, "loss": 0.67, "step": 2405 }, { "epoch": 0.25, "learning_rate": 0.00017559101249650912, "loss": 0.5873, "step": 2406 }, { "epoch": 0.25, "learning_rate": 0.0001755689356159987, "loss": 0.7489, "step": 2407 }, { "epoch": 0.25, "learning_rate": 0.00017554685014539985, "loss": 0.682, "step": 2408 }, { "epoch": 0.25, "learning_rate": 0.0001755247560872231, "loss": 0.7178, "step": 2409 }, { "epoch": 0.25, "learning_rate": 0.0001755026534439799, "loss": 0.7462, "step": 2410 }, { "epoch": 0.25, "learning_rate": 0.0001754805422181827, "loss": 0.6302, "step": 2411 }, { "epoch": 0.25, "learning_rate": 0.000175458422412345, "loss": 0.6695, "step": 2412 }, { "epoch": 0.25, "learning_rate": 0.00017543629402898113, "loss": 0.667, "step": 2413 }, { "epoch": 0.25, "learning_rate": 0.00017541415707060648, "loss": 0.699, "step": 2414 }, { "epoch": 0.25, "learning_rate": 0.00017539201153973744, "loss": 0.7057, "step": 2415 }, { "epoch": 0.25, "learning_rate": 0.00017536985743889133, "loss": 0.6767, "step": 2416 }, { "epoch": 0.25, "learning_rate": 0.00017534769477058648, "loss": 0.7312, "step": 2417 }, { "epoch": 0.25, "learning_rate": 0.00017532552353734213, "loss": 0.6644, "step": 2418 }, { "epoch": 0.25, "learning_rate": 0.00017530334374167854, "loss": 0.7027, "step": 2419 }, { "epoch": 0.25, "learning_rate": 0.00017528115538611693, "loss": 0.6578, "step": 2420 }, { "epoch": 0.25, "learning_rate": 0.00017525895847317954, "loss": 0.6943, "step": 2421 }, { "epoch": 0.25, "learning_rate": 0.00017523675300538952, "loss": 0.7613, "step": 2422 }, { "epoch": 0.25, "learning_rate": 0.00017521453898527097, "loss": 0.6809, "step": 2423 }, { "epoch": 0.25, "learning_rate": 0.0001751923164153491, "loss": 0.6823, "step": 2424 }, { "epoch": 0.25, "learning_rate": 0.00017517008529814994, "loss": 0.7342, "step": 2425 }, { "epoch": 0.25, "learning_rate": 0.00017514784563620053, "loss": 0.6747, "step": 2426 }, { "epoch": 0.25, "learning_rate": 0.0001751255974320289, "loss": 0.6723, "step": 2427 }, { "epoch": 0.25, "learning_rate": 0.00017510334068816414, "loss": 0.7143, "step": 2428 }, { "epoch": 0.25, "learning_rate": 0.00017508107540713613, "loss": 0.6993, "step": 2429 }, { "epoch": 0.25, "learning_rate": 0.00017505880159147588, "loss": 0.7213, "step": 2430 }, { "epoch": 0.25, "learning_rate": 0.00017503651924371524, "loss": 0.6584, "step": 2431 }, { "epoch": 0.25, "learning_rate": 0.00017501422836638714, "loss": 0.7178, "step": 2432 }, { "epoch": 0.25, "learning_rate": 0.00017499192896202543, "loss": 0.6925, "step": 2433 }, { "epoch": 0.25, "learning_rate": 0.00017496962103316491, "loss": 0.6901, "step": 2434 }, { "epoch": 0.25, "learning_rate": 0.00017494730458234142, "loss": 0.6437, "step": 2435 }, { "epoch": 0.25, "learning_rate": 0.00017492497961209163, "loss": 0.7232, "step": 2436 }, { "epoch": 0.25, "learning_rate": 0.00017490264612495335, "loss": 0.7285, "step": 2437 }, { "epoch": 0.25, "learning_rate": 0.00017488030412346527, "loss": 0.66, "step": 2438 }, { "epoch": 0.25, "learning_rate": 0.00017485795361016698, "loss": 0.7461, "step": 2439 }, { "epoch": 0.25, "learning_rate": 0.0001748355945875992, "loss": 0.7099, "step": 2440 }, { "epoch": 0.25, "learning_rate": 0.0001748132270583035, "loss": 0.6576, "step": 2441 }, { "epoch": 0.25, "learning_rate": 0.00017479085102482244, "loss": 0.7177, "step": 2442 }, { "epoch": 0.25, "learning_rate": 0.00017476846648969958, "loss": 0.676, "step": 2443 }, { "epoch": 0.25, "learning_rate": 0.00017474607345547937, "loss": 0.7351, "step": 2444 }, { "epoch": 0.25, "learning_rate": 0.0001747236719247073, "loss": 0.678, "step": 2445 }, { "epoch": 0.25, "learning_rate": 0.00017470126189992984, "loss": 0.7255, "step": 2446 }, { "epoch": 0.25, "learning_rate": 0.00017467884338369434, "loss": 0.6824, "step": 2447 }, { "epoch": 0.25, "learning_rate": 0.00017465641637854913, "loss": 0.6805, "step": 2448 }, { "epoch": 0.25, "learning_rate": 0.00017463398088704365, "loss": 0.684, "step": 2449 }, { "epoch": 0.26, "learning_rate": 0.00017461153691172805, "loss": 0.6692, "step": 2450 }, { "epoch": 0.26, "learning_rate": 0.0001745890844551537, "loss": 0.6585, "step": 2451 }, { "epoch": 0.26, "learning_rate": 0.00017456662351987277, "loss": 0.7187, "step": 2452 }, { "epoch": 0.26, "learning_rate": 0.00017454415410843847, "loss": 0.6695, "step": 2453 }, { "epoch": 0.26, "learning_rate": 0.00017452167622340493, "loss": 0.7838, "step": 2454 }, { "epoch": 0.26, "learning_rate": 0.00017449918986732726, "loss": 0.6815, "step": 2455 }, { "epoch": 0.26, "learning_rate": 0.0001744766950427615, "loss": 0.6779, "step": 2456 }, { "epoch": 0.26, "learning_rate": 0.0001744541917522648, "loss": 0.7532, "step": 2457 }, { "epoch": 0.26, "learning_rate": 0.00017443167999839506, "loss": 0.7182, "step": 2458 }, { "epoch": 0.26, "learning_rate": 0.00017440915978371124, "loss": 0.729, "step": 2459 }, { "epoch": 0.26, "learning_rate": 0.0001743866311107733, "loss": 0.6668, "step": 2460 }, { "epoch": 0.26, "learning_rate": 0.0001743640939821421, "loss": 0.7396, "step": 2461 }, { "epoch": 0.26, "learning_rate": 0.0001743415484003795, "loss": 0.7013, "step": 2462 }, { "epoch": 0.26, "learning_rate": 0.00017431899436804832, "loss": 0.7115, "step": 2463 }, { "epoch": 0.26, "learning_rate": 0.00017429643188771228, "loss": 0.6523, "step": 2464 }, { "epoch": 0.26, "learning_rate": 0.00017427386096193615, "loss": 0.6556, "step": 2465 }, { "epoch": 0.26, "learning_rate": 0.0001742512815932856, "loss": 0.743, "step": 2466 }, { "epoch": 0.26, "learning_rate": 0.00017422869378432728, "loss": 0.7178, "step": 2467 }, { "epoch": 0.26, "learning_rate": 0.00017420609753762882, "loss": 0.7185, "step": 2468 }, { "epoch": 0.26, "learning_rate": 0.00017418349285575876, "loss": 0.6869, "step": 2469 }, { "epoch": 0.26, "learning_rate": 0.0001741608797412866, "loss": 0.6514, "step": 2470 }, { "epoch": 0.26, "learning_rate": 0.00017413825819678286, "loss": 0.7501, "step": 2471 }, { "epoch": 0.26, "learning_rate": 0.000174115628224819, "loss": 0.6572, "step": 2472 }, { "epoch": 0.26, "learning_rate": 0.00017409298982796735, "loss": 0.7061, "step": 2473 }, { "epoch": 0.26, "learning_rate": 0.0001740703430088013, "loss": 0.6914, "step": 2474 }, { "epoch": 0.26, "learning_rate": 0.00017404768776989522, "loss": 0.6754, "step": 2475 }, { "epoch": 0.26, "learning_rate": 0.0001740250241138243, "loss": 0.6339, "step": 2476 }, { "epoch": 0.26, "learning_rate": 0.0001740023520431648, "loss": 0.7452, "step": 2477 }, { "epoch": 0.26, "learning_rate": 0.0001739796715604939, "loss": 0.7299, "step": 2478 }, { "epoch": 0.26, "learning_rate": 0.0001739569826683898, "loss": 0.7131, "step": 2479 }, { "epoch": 0.26, "learning_rate": 0.00017393428536943147, "loss": 0.7711, "step": 2480 }, { "epoch": 0.26, "learning_rate": 0.00017391157966619906, "loss": 0.7077, "step": 2481 }, { "epoch": 0.26, "learning_rate": 0.00017388886556127356, "loss": 0.687, "step": 2482 }, { "epoch": 0.26, "learning_rate": 0.0001738661430572369, "loss": 0.6997, "step": 2483 }, { "epoch": 0.26, "learning_rate": 0.00017384341215667207, "loss": 0.6789, "step": 2484 }, { "epoch": 0.26, "learning_rate": 0.00017382067286216284, "loss": 0.6708, "step": 2485 }, { "epoch": 0.26, "learning_rate": 0.00017379792517629409, "loss": 0.7144, "step": 2486 }, { "epoch": 0.26, "learning_rate": 0.00017377516910165164, "loss": 0.6578, "step": 2487 }, { "epoch": 0.26, "learning_rate": 0.00017375240464082215, "loss": 0.6956, "step": 2488 }, { "epoch": 0.26, "learning_rate": 0.00017372963179639338, "loss": 0.6564, "step": 2489 }, { "epoch": 0.26, "learning_rate": 0.0001737068505709539, "loss": 0.674, "step": 2490 }, { "epoch": 0.26, "learning_rate": 0.00017368406096709334, "loss": 0.6734, "step": 2491 }, { "epoch": 0.26, "learning_rate": 0.00017366126298740223, "loss": 0.6763, "step": 2492 }, { "epoch": 0.26, "learning_rate": 0.00017363845663447206, "loss": 0.6307, "step": 2493 }, { "epoch": 0.26, "learning_rate": 0.00017361564191089533, "loss": 0.6925, "step": 2494 }, { "epoch": 0.26, "learning_rate": 0.00017359281881926538, "loss": 0.6725, "step": 2495 }, { "epoch": 0.26, "learning_rate": 0.00017356998736217655, "loss": 0.6901, "step": 2496 }, { "epoch": 0.26, "learning_rate": 0.00017354714754222423, "loss": 0.7558, "step": 2497 }, { "epoch": 0.26, "learning_rate": 0.0001735242993620046, "loss": 0.6281, "step": 2498 }, { "epoch": 0.26, "learning_rate": 0.0001735014428241149, "loss": 0.7328, "step": 2499 }, { "epoch": 0.26, "learning_rate": 0.00017347857793115323, "loss": 0.7141, "step": 2500 }, { "epoch": 0.26, "learning_rate": 0.00017345570468571878, "loss": 0.7237, "step": 2501 }, { "epoch": 0.26, "learning_rate": 0.0001734328230904115, "loss": 0.643, "step": 2502 }, { "epoch": 0.26, "learning_rate": 0.00017340993314783246, "loss": 0.657, "step": 2503 }, { "epoch": 0.26, "learning_rate": 0.00017338703486058358, "loss": 0.7546, "step": 2504 }, { "epoch": 0.26, "learning_rate": 0.00017336412823126782, "loss": 0.6871, "step": 2505 }, { "epoch": 0.26, "learning_rate": 0.00017334121326248895, "loss": 0.6905, "step": 2506 }, { "epoch": 0.26, "learning_rate": 0.00017331828995685177, "loss": 0.6045, "step": 2507 }, { "epoch": 0.26, "learning_rate": 0.00017329535831696208, "loss": 0.6756, "step": 2508 }, { "epoch": 0.26, "learning_rate": 0.00017327241834542653, "loss": 0.6715, "step": 2509 }, { "epoch": 0.26, "learning_rate": 0.00017324947004485278, "loss": 0.6135, "step": 2510 }, { "epoch": 0.26, "learning_rate": 0.00017322651341784937, "loss": 0.7184, "step": 2511 }, { "epoch": 0.26, "learning_rate": 0.0001732035484670259, "loss": 0.645, "step": 2512 }, { "epoch": 0.26, "learning_rate": 0.00017318057519499278, "loss": 0.7108, "step": 2513 }, { "epoch": 0.26, "learning_rate": 0.00017315759360436145, "loss": 0.673, "step": 2514 }, { "epoch": 0.26, "learning_rate": 0.00017313460369774433, "loss": 0.6717, "step": 2515 }, { "epoch": 0.26, "learning_rate": 0.00017311160547775465, "loss": 0.6856, "step": 2516 }, { "epoch": 0.26, "learning_rate": 0.00017308859894700672, "loss": 0.7124, "step": 2517 }, { "epoch": 0.26, "learning_rate": 0.00017306558410811574, "loss": 0.6878, "step": 2518 }, { "epoch": 0.26, "learning_rate": 0.00017304256096369787, "loss": 0.7329, "step": 2519 }, { "epoch": 0.26, "learning_rate": 0.00017301952951637018, "loss": 0.6713, "step": 2520 }, { "epoch": 0.26, "learning_rate": 0.0001729964897687507, "loss": 0.7173, "step": 2521 }, { "epoch": 0.26, "learning_rate": 0.0001729734417234584, "loss": 0.6788, "step": 2522 }, { "epoch": 0.26, "learning_rate": 0.00017295038538311323, "loss": 0.7384, "step": 2523 }, { "epoch": 0.26, "learning_rate": 0.0001729273207503361, "loss": 0.723, "step": 2524 }, { "epoch": 0.26, "learning_rate": 0.0001729042478277487, "loss": 0.7006, "step": 2525 }, { "epoch": 0.26, "learning_rate": 0.00017288116661797384, "loss": 0.7212, "step": 2526 }, { "epoch": 0.26, "learning_rate": 0.00017285807712363527, "loss": 0.6789, "step": 2527 }, { "epoch": 0.26, "learning_rate": 0.00017283497934735754, "loss": 0.6818, "step": 2528 }, { "epoch": 0.26, "learning_rate": 0.00017281187329176628, "loss": 0.6699, "step": 2529 }, { "epoch": 0.26, "learning_rate": 0.00017278875895948795, "loss": 0.6967, "step": 2530 }, { "epoch": 0.26, "learning_rate": 0.00017276563635315007, "loss": 0.6781, "step": 2531 }, { "epoch": 0.26, "learning_rate": 0.000172742505475381, "loss": 0.6678, "step": 2532 }, { "epoch": 0.26, "learning_rate": 0.00017271936632881006, "loss": 0.6544, "step": 2533 }, { "epoch": 0.26, "learning_rate": 0.00017269621891606758, "loss": 0.6433, "step": 2534 }, { "epoch": 0.26, "learning_rate": 0.00017267306323978472, "loss": 0.6617, "step": 2535 }, { "epoch": 0.26, "learning_rate": 0.0001726498993025937, "loss": 0.6789, "step": 2536 }, { "epoch": 0.26, "learning_rate": 0.0001726267271071276, "loss": 0.644, "step": 2537 }, { "epoch": 0.26, "learning_rate": 0.0001726035466560204, "loss": 0.656, "step": 2538 }, { "epoch": 0.26, "learning_rate": 0.00017258035795190713, "loss": 0.7046, "step": 2539 }, { "epoch": 0.26, "learning_rate": 0.00017255716099742372, "loss": 0.7628, "step": 2540 }, { "epoch": 0.26, "learning_rate": 0.00017253395579520695, "loss": 0.7352, "step": 2541 }, { "epoch": 0.26, "learning_rate": 0.00017251074234789465, "loss": 0.707, "step": 2542 }, { "epoch": 0.26, "learning_rate": 0.00017248752065812553, "loss": 0.7075, "step": 2543 }, { "epoch": 0.26, "learning_rate": 0.00017246429072853925, "loss": 0.6746, "step": 2544 }, { "epoch": 0.26, "learning_rate": 0.00017244105256177642, "loss": 0.6491, "step": 2545 }, { "epoch": 0.27, "learning_rate": 0.00017241780616047855, "loss": 0.7067, "step": 2546 }, { "epoch": 0.27, "learning_rate": 0.00017239455152728817, "loss": 0.7128, "step": 2547 }, { "epoch": 0.27, "learning_rate": 0.0001723712886648486, "loss": 0.7178, "step": 2548 }, { "epoch": 0.27, "learning_rate": 0.00017234801757580427, "loss": 0.7618, "step": 2549 }, { "epoch": 0.27, "learning_rate": 0.00017232473826280038, "loss": 0.6639, "step": 2550 }, { "epoch": 0.27, "learning_rate": 0.00017230145072848316, "loss": 0.7332, "step": 2551 }, { "epoch": 0.27, "learning_rate": 0.0001722781549754998, "loss": 0.7315, "step": 2552 }, { "epoch": 0.27, "learning_rate": 0.0001722548510064983, "loss": 0.718, "step": 2553 }, { "epoch": 0.27, "learning_rate": 0.00017223153882412777, "loss": 0.672, "step": 2554 }, { "epoch": 0.27, "learning_rate": 0.0001722082184310381, "loss": 0.7072, "step": 2555 }, { "epoch": 0.27, "learning_rate": 0.00017218488982988017, "loss": 0.7238, "step": 2556 }, { "epoch": 0.27, "learning_rate": 0.0001721615530233058, "loss": 0.6389, "step": 2557 }, { "epoch": 0.27, "learning_rate": 0.00017213820801396774, "loss": 0.7116, "step": 2558 }, { "epoch": 0.27, "learning_rate": 0.0001721148548045197, "loss": 0.7194, "step": 2559 }, { "epoch": 0.27, "learning_rate": 0.0001720914933976162, "loss": 0.6603, "step": 2560 }, { "epoch": 0.27, "learning_rate": 0.00017206812379591286, "loss": 0.692, "step": 2561 }, { "epoch": 0.27, "learning_rate": 0.00017204474600206616, "loss": 0.7126, "step": 2562 }, { "epoch": 0.27, "learning_rate": 0.00017202136001873348, "loss": 0.7304, "step": 2563 }, { "epoch": 0.27, "learning_rate": 0.00017199796584857312, "loss": 0.6857, "step": 2564 }, { "epoch": 0.27, "learning_rate": 0.00017197456349424443, "loss": 0.7015, "step": 2565 }, { "epoch": 0.27, "learning_rate": 0.00017195115295840754, "loss": 0.7454, "step": 2566 }, { "epoch": 0.27, "learning_rate": 0.00017192773424372362, "loss": 0.6978, "step": 2567 }, { "epoch": 0.27, "learning_rate": 0.0001719043073528547, "loss": 0.6741, "step": 2568 }, { "epoch": 0.27, "learning_rate": 0.00017188087228846378, "loss": 0.7117, "step": 2569 }, { "epoch": 0.27, "learning_rate": 0.00017185742905321476, "loss": 0.6861, "step": 2570 }, { "epoch": 0.27, "learning_rate": 0.0001718339776497725, "loss": 0.6593, "step": 2571 }, { "epoch": 0.27, "learning_rate": 0.00017181051808080278, "loss": 0.7045, "step": 2572 }, { "epoch": 0.27, "learning_rate": 0.0001717870503489723, "loss": 0.6559, "step": 2573 }, { "epoch": 0.27, "learning_rate": 0.00017176357445694866, "loss": 0.792, "step": 2574 }, { "epoch": 0.27, "learning_rate": 0.00017174009040740043, "loss": 0.6343, "step": 2575 }, { "epoch": 0.27, "learning_rate": 0.00017171659820299707, "loss": 0.6938, "step": 2576 }, { "epoch": 0.27, "learning_rate": 0.0001716930978464091, "loss": 0.6782, "step": 2577 }, { "epoch": 0.27, "learning_rate": 0.0001716695893403077, "loss": 0.6903, "step": 2578 }, { "epoch": 0.27, "learning_rate": 0.00017164607268736526, "loss": 0.6636, "step": 2579 }, { "epoch": 0.27, "learning_rate": 0.00017162254789025488, "loss": 0.6823, "step": 2580 }, { "epoch": 0.27, "learning_rate": 0.00017159901495165077, "loss": 0.6762, "step": 2581 }, { "epoch": 0.27, "learning_rate": 0.0001715754738742279, "loss": 0.7317, "step": 2582 }, { "epoch": 0.27, "learning_rate": 0.00017155192466066223, "loss": 0.723, "step": 2583 }, { "epoch": 0.27, "learning_rate": 0.0001715283673136307, "loss": 0.6667, "step": 2584 }, { "epoch": 0.27, "learning_rate": 0.0001715048018358111, "loss": 0.7359, "step": 2585 }, { "epoch": 0.27, "learning_rate": 0.00017148122822988217, "loss": 0.6999, "step": 2586 }, { "epoch": 0.27, "learning_rate": 0.00017145764649852357, "loss": 0.6697, "step": 2587 }, { "epoch": 0.27, "learning_rate": 0.00017143405664441592, "loss": 0.6913, "step": 2588 }, { "epoch": 0.27, "learning_rate": 0.0001714104586702407, "loss": 0.6495, "step": 2589 }, { "epoch": 0.27, "learning_rate": 0.00017138685257868033, "loss": 0.6457, "step": 2590 }, { "epoch": 0.27, "learning_rate": 0.0001713632383724182, "loss": 0.6893, "step": 2591 }, { "epoch": 0.27, "learning_rate": 0.00017133961605413856, "loss": 0.6853, "step": 2592 }, { "epoch": 0.27, "learning_rate": 0.00017131598562652664, "loss": 0.6557, "step": 2593 }, { "epoch": 0.27, "learning_rate": 0.00017129234709226853, "loss": 0.7377, "step": 2594 }, { "epoch": 0.27, "learning_rate": 0.00017126870045405132, "loss": 0.6764, "step": 2595 }, { "epoch": 0.27, "learning_rate": 0.00017124504571456296, "loss": 0.7213, "step": 2596 }, { "epoch": 0.27, "learning_rate": 0.0001712213828764923, "loss": 0.6827, "step": 2597 }, { "epoch": 0.27, "learning_rate": 0.00017119771194252918, "loss": 0.699, "step": 2598 }, { "epoch": 0.27, "learning_rate": 0.00017117403291536435, "loss": 0.698, "step": 2599 }, { "epoch": 0.27, "learning_rate": 0.00017115034579768938, "loss": 0.6788, "step": 2600 }, { "epoch": 0.27, "learning_rate": 0.0001711266505921969, "loss": 0.6584, "step": 2601 }, { "epoch": 0.27, "learning_rate": 0.0001711029473015804, "loss": 0.7023, "step": 2602 }, { "epoch": 0.27, "learning_rate": 0.00017107923592853426, "loss": 0.7078, "step": 2603 }, { "epoch": 0.27, "learning_rate": 0.00017105551647575383, "loss": 0.7167, "step": 2604 }, { "epoch": 0.27, "learning_rate": 0.0001710317889459353, "loss": 0.7172, "step": 2605 }, { "epoch": 0.27, "learning_rate": 0.0001710080533417759, "loss": 0.6677, "step": 2606 }, { "epoch": 0.27, "learning_rate": 0.00017098430966597366, "loss": 0.6534, "step": 2607 }, { "epoch": 0.27, "learning_rate": 0.0001709605579212276, "loss": 0.6796, "step": 2608 }, { "epoch": 0.27, "learning_rate": 0.00017093679811023763, "loss": 0.6888, "step": 2609 }, { "epoch": 0.27, "learning_rate": 0.00017091303023570456, "loss": 0.7282, "step": 2610 }, { "epoch": 0.27, "learning_rate": 0.00017088925430033017, "loss": 0.7287, "step": 2611 }, { "epoch": 0.27, "learning_rate": 0.0001708654703068171, "loss": 0.6573, "step": 2612 }, { "epoch": 0.27, "learning_rate": 0.0001708416782578689, "loss": 0.668, "step": 2613 }, { "epoch": 0.27, "learning_rate": 0.00017081787815619013, "loss": 0.698, "step": 2614 }, { "epoch": 0.27, "learning_rate": 0.00017079407000448617, "loss": 0.667, "step": 2615 }, { "epoch": 0.27, "learning_rate": 0.00017077025380546335, "loss": 0.7261, "step": 2616 }, { "epoch": 0.27, "learning_rate": 0.0001707464295618289, "loss": 0.6071, "step": 2617 }, { "epoch": 0.27, "learning_rate": 0.00017072259727629098, "loss": 0.6809, "step": 2618 }, { "epoch": 0.27, "learning_rate": 0.00017069875695155867, "loss": 0.7058, "step": 2619 }, { "epoch": 0.27, "learning_rate": 0.0001706749085903419, "loss": 0.6502, "step": 2620 }, { "epoch": 0.27, "learning_rate": 0.00017065105219535168, "loss": 0.6678, "step": 2621 }, { "epoch": 0.27, "learning_rate": 0.00017062718776929967, "loss": 0.7152, "step": 2622 }, { "epoch": 0.27, "learning_rate": 0.0001706033153148987, "loss": 0.6558, "step": 2623 }, { "epoch": 0.27, "learning_rate": 0.0001705794348348624, "loss": 0.6538, "step": 2624 }, { "epoch": 0.27, "learning_rate": 0.00017055554633190528, "loss": 0.7098, "step": 2625 }, { "epoch": 0.27, "learning_rate": 0.00017053164980874275, "loss": 0.7387, "step": 2626 }, { "epoch": 0.27, "learning_rate": 0.00017050774526809133, "loss": 0.6668, "step": 2627 }, { "epoch": 0.27, "learning_rate": 0.00017048383271266816, "loss": 0.6604, "step": 2628 }, { "epoch": 0.27, "learning_rate": 0.0001704599121451915, "loss": 0.7468, "step": 2629 }, { "epoch": 0.27, "learning_rate": 0.00017043598356838047, "loss": 0.6805, "step": 2630 }, { "epoch": 0.27, "learning_rate": 0.000170412046984955, "loss": 0.6958, "step": 2631 }, { "epoch": 0.27, "learning_rate": 0.0001703881023976361, "loss": 0.682, "step": 2632 }, { "epoch": 0.27, "learning_rate": 0.00017036414980914555, "loss": 0.6586, "step": 2633 }, { "epoch": 0.27, "learning_rate": 0.00017034018922220615, "loss": 0.7062, "step": 2634 }, { "epoch": 0.27, "learning_rate": 0.0001703162206395415, "loss": 0.6714, "step": 2635 }, { "epoch": 0.27, "learning_rate": 0.00017029224406387618, "loss": 0.7739, "step": 2636 }, { "epoch": 0.27, "learning_rate": 0.00017026825949793568, "loss": 0.5845, "step": 2637 }, { "epoch": 0.27, "learning_rate": 0.00017024426694444634, "loss": 0.7501, "step": 2638 }, { "epoch": 0.27, "learning_rate": 0.0001702202664061355, "loss": 0.6859, "step": 2639 }, { "epoch": 0.27, "learning_rate": 0.00017019625788573128, "loss": 0.6975, "step": 2640 }, { "epoch": 0.27, "learning_rate": 0.00017017224138596285, "loss": 0.7134, "step": 2641 }, { "epoch": 0.28, "learning_rate": 0.0001701482169095602, "loss": 0.6872, "step": 2642 }, { "epoch": 0.28, "learning_rate": 0.00017012418445925423, "loss": 0.6707, "step": 2643 }, { "epoch": 0.28, "learning_rate": 0.00017010014403777676, "loss": 0.7173, "step": 2644 }, { "epoch": 0.28, "learning_rate": 0.00017007609564786055, "loss": 0.6848, "step": 2645 }, { "epoch": 0.28, "learning_rate": 0.00017005203929223918, "loss": 0.6974, "step": 2646 }, { "epoch": 0.28, "learning_rate": 0.00017002797497364723, "loss": 0.716, "step": 2647 }, { "epoch": 0.28, "learning_rate": 0.00017000390269482016, "loss": 0.678, "step": 2648 }, { "epoch": 0.28, "learning_rate": 0.00016997982245849427, "loss": 0.6313, "step": 2649 }, { "epoch": 0.28, "learning_rate": 0.00016995573426740687, "loss": 0.7245, "step": 2650 }, { "epoch": 0.28, "learning_rate": 0.00016993163812429606, "loss": 0.7285, "step": 2651 }, { "epoch": 0.28, "learning_rate": 0.0001699075340319009, "loss": 0.7304, "step": 2652 }, { "epoch": 0.28, "learning_rate": 0.00016988342199296145, "loss": 0.7202, "step": 2653 }, { "epoch": 0.28, "learning_rate": 0.0001698593020102185, "loss": 0.7547, "step": 2654 }, { "epoch": 0.28, "learning_rate": 0.00016983517408641384, "loss": 0.6624, "step": 2655 }, { "epoch": 0.28, "learning_rate": 0.0001698110382242901, "loss": 0.6828, "step": 2656 }, { "epoch": 0.28, "learning_rate": 0.00016978689442659093, "loss": 0.6832, "step": 2657 }, { "epoch": 0.28, "learning_rate": 0.00016976274269606077, "loss": 0.7397, "step": 2658 }, { "epoch": 0.28, "learning_rate": 0.000169738583035445, "loss": 0.701, "step": 2659 }, { "epoch": 0.28, "learning_rate": 0.0001697144154474899, "loss": 0.6909, "step": 2660 }, { "epoch": 0.28, "learning_rate": 0.00016969023993494267, "loss": 0.6882, "step": 2661 }, { "epoch": 0.28, "learning_rate": 0.00016966605650055137, "loss": 0.6622, "step": 2662 }, { "epoch": 0.28, "learning_rate": 0.00016964186514706504, "loss": 0.7179, "step": 2663 }, { "epoch": 0.28, "learning_rate": 0.00016961766587723348, "loss": 0.6808, "step": 2664 }, { "epoch": 0.28, "learning_rate": 0.00016959345869380757, "loss": 0.6411, "step": 2665 }, { "epoch": 0.28, "learning_rate": 0.0001695692435995389, "loss": 0.738, "step": 2666 }, { "epoch": 0.28, "learning_rate": 0.0001695450205971801, "loss": 0.6471, "step": 2667 }, { "epoch": 0.28, "learning_rate": 0.0001695207896894847, "loss": 0.6826, "step": 2668 }, { "epoch": 0.28, "learning_rate": 0.000169496550879207, "loss": 0.6339, "step": 2669 }, { "epoch": 0.28, "learning_rate": 0.0001694723041691023, "loss": 0.7421, "step": 2670 }, { "epoch": 0.28, "learning_rate": 0.00016944804956192682, "loss": 0.6755, "step": 2671 }, { "epoch": 0.28, "learning_rate": 0.00016942378706043756, "loss": 0.7104, "step": 2672 }, { "epoch": 0.28, "learning_rate": 0.00016939951666739255, "loss": 0.7552, "step": 2673 }, { "epoch": 0.28, "learning_rate": 0.00016937523838555068, "loss": 0.7019, "step": 2674 }, { "epoch": 0.28, "learning_rate": 0.00016935095221767163, "loss": 0.6766, "step": 2675 }, { "epoch": 0.28, "learning_rate": 0.00016932665816651613, "loss": 0.6622, "step": 2676 }, { "epoch": 0.28, "learning_rate": 0.00016930235623484574, "loss": 0.7049, "step": 2677 }, { "epoch": 0.28, "learning_rate": 0.0001692780464254229, "loss": 0.7182, "step": 2678 }, { "epoch": 0.28, "learning_rate": 0.00016925372874101094, "loss": 0.7352, "step": 2679 }, { "epoch": 0.28, "learning_rate": 0.0001692294031843741, "loss": 0.7162, "step": 2680 }, { "epoch": 0.28, "learning_rate": 0.0001692050697582776, "loss": 0.7122, "step": 2681 }, { "epoch": 0.28, "learning_rate": 0.00016918072846548737, "loss": 0.6734, "step": 2682 }, { "epoch": 0.28, "learning_rate": 0.0001691563793087704, "loss": 0.7376, "step": 2683 }, { "epoch": 0.28, "learning_rate": 0.00016913202229089448, "loss": 0.685, "step": 2684 }, { "epoch": 0.28, "learning_rate": 0.00016910765741462837, "loss": 0.6838, "step": 2685 }, { "epoch": 0.28, "learning_rate": 0.00016908328468274162, "loss": 0.6813, "step": 2686 }, { "epoch": 0.28, "learning_rate": 0.0001690589040980048, "loss": 0.6804, "step": 2687 }, { "epoch": 0.28, "learning_rate": 0.00016903451566318927, "loss": 0.6958, "step": 2688 }, { "epoch": 0.28, "learning_rate": 0.00016901011938106727, "loss": 0.6648, "step": 2689 }, { "epoch": 0.28, "learning_rate": 0.00016898571525441204, "loss": 0.7169, "step": 2690 }, { "epoch": 0.28, "learning_rate": 0.00016896130328599769, "loss": 0.6658, "step": 2691 }, { "epoch": 0.28, "learning_rate": 0.00016893688347859907, "loss": 0.7167, "step": 2692 }, { "epoch": 0.28, "learning_rate": 0.00016891245583499216, "loss": 0.6769, "step": 2693 }, { "epoch": 0.28, "learning_rate": 0.0001688880203579536, "loss": 0.697, "step": 2694 }, { "epoch": 0.28, "learning_rate": 0.0001688635770502611, "loss": 0.7217, "step": 2695 }, { "epoch": 0.28, "learning_rate": 0.00016883912591469306, "loss": 0.6949, "step": 2696 }, { "epoch": 0.28, "learning_rate": 0.00016881466695402905, "loss": 0.6504, "step": 2697 }, { "epoch": 0.28, "learning_rate": 0.0001687902001710493, "loss": 0.6578, "step": 2698 }, { "epoch": 0.28, "learning_rate": 0.000168765725568535, "loss": 0.7322, "step": 2699 }, { "epoch": 0.28, "learning_rate": 0.00016874124314926827, "loss": 0.7146, "step": 2700 }, { "epoch": 0.28, "learning_rate": 0.00016871675291603203, "loss": 0.6924, "step": 2701 }, { "epoch": 0.28, "learning_rate": 0.00016869225487161016, "loss": 0.7367, "step": 2702 }, { "epoch": 0.28, "learning_rate": 0.00016866774901878743, "loss": 0.7051, "step": 2703 }, { "epoch": 0.28, "learning_rate": 0.00016864323536034946, "loss": 0.6269, "step": 2704 }, { "epoch": 0.28, "learning_rate": 0.00016861871389908277, "loss": 0.6892, "step": 2705 }, { "epoch": 0.28, "learning_rate": 0.00016859418463777473, "loss": 0.7386, "step": 2706 }, { "epoch": 0.28, "learning_rate": 0.0001685696475792137, "loss": 0.6728, "step": 2707 }, { "epoch": 0.28, "learning_rate": 0.00016854510272618884, "loss": 0.7537, "step": 2708 }, { "epoch": 0.28, "learning_rate": 0.00016852055008149017, "loss": 0.6302, "step": 2709 }, { "epoch": 0.28, "learning_rate": 0.0001684959896479087, "loss": 0.6744, "step": 2710 }, { "epoch": 0.28, "learning_rate": 0.00016847142142823628, "loss": 0.6689, "step": 2711 }, { "epoch": 0.28, "learning_rate": 0.0001684468454252656, "loss": 0.7237, "step": 2712 }, { "epoch": 0.28, "learning_rate": 0.00016842226164179026, "loss": 0.7077, "step": 2713 }, { "epoch": 0.28, "learning_rate": 0.00016839767008060478, "loss": 0.6532, "step": 2714 }, { "epoch": 0.28, "learning_rate": 0.00016837307074450456, "loss": 0.6552, "step": 2715 }, { "epoch": 0.28, "learning_rate": 0.00016834846363628577, "loss": 0.6469, "step": 2716 }, { "epoch": 0.28, "learning_rate": 0.00016832384875874564, "loss": 0.7678, "step": 2717 }, { "epoch": 0.28, "learning_rate": 0.00016829922611468216, "loss": 0.6692, "step": 2718 }, { "epoch": 0.28, "learning_rate": 0.00016827459570689426, "loss": 0.6949, "step": 2719 }, { "epoch": 0.28, "learning_rate": 0.00016824995753818173, "loss": 0.7438, "step": 2720 }, { "epoch": 0.28, "learning_rate": 0.00016822531161134524, "loss": 0.7064, "step": 2721 }, { "epoch": 0.28, "learning_rate": 0.00016820065792918633, "loss": 0.7236, "step": 2722 }, { "epoch": 0.28, "learning_rate": 0.00016817599649450747, "loss": 0.7156, "step": 2723 }, { "epoch": 0.28, "learning_rate": 0.00016815132731011197, "loss": 0.6765, "step": 2724 }, { "epoch": 0.28, "learning_rate": 0.00016812665037880403, "loss": 0.6398, "step": 2725 }, { "epoch": 0.28, "learning_rate": 0.00016810196570338868, "loss": 0.7085, "step": 2726 }, { "epoch": 0.28, "learning_rate": 0.00016807727328667195, "loss": 0.6773, "step": 2727 }, { "epoch": 0.28, "learning_rate": 0.0001680525731314607, "loss": 0.5975, "step": 2728 }, { "epoch": 0.28, "learning_rate": 0.00016802786524056256, "loss": 0.7284, "step": 2729 }, { "epoch": 0.28, "learning_rate": 0.0001680031496167862, "loss": 0.7577, "step": 2730 }, { "epoch": 0.28, "learning_rate": 0.0001679784262629411, "loss": 0.7575, "step": 2731 }, { "epoch": 0.28, "learning_rate": 0.0001679536951818376, "loss": 0.6914, "step": 2732 }, { "epoch": 0.28, "learning_rate": 0.00016792895637628692, "loss": 0.7314, "step": 2733 }, { "epoch": 0.28, "learning_rate": 0.0001679042098491012, "loss": 0.7425, "step": 2734 }, { "epoch": 0.28, "learning_rate": 0.00016787945560309343, "loss": 0.7319, "step": 2735 }, { "epoch": 0.28, "learning_rate": 0.00016785469364107746, "loss": 0.7554, "step": 2736 }, { "epoch": 0.28, "learning_rate": 0.00016782992396586804, "loss": 0.7699, "step": 2737 }, { "epoch": 0.29, "learning_rate": 0.00016780514658028086, "loss": 0.7033, "step": 2738 }, { "epoch": 0.29, "learning_rate": 0.00016778036148713232, "loss": 0.7193, "step": 2739 }, { "epoch": 0.29, "learning_rate": 0.00016775556868923986, "loss": 0.6956, "step": 2740 }, { "epoch": 0.29, "learning_rate": 0.00016773076818942174, "loss": 0.6818, "step": 2741 }, { "epoch": 0.29, "learning_rate": 0.00016770595999049702, "loss": 0.7075, "step": 2742 }, { "epoch": 0.29, "learning_rate": 0.00016768114409528576, "loss": 0.6676, "step": 2743 }, { "epoch": 0.29, "learning_rate": 0.00016765632050660885, "loss": 0.6302, "step": 2744 }, { "epoch": 0.29, "learning_rate": 0.00016763148922728798, "loss": 0.6698, "step": 2745 }, { "epoch": 0.29, "learning_rate": 0.00016760665026014583, "loss": 0.6412, "step": 2746 }, { "epoch": 0.29, "learning_rate": 0.00016758180360800588, "loss": 0.6518, "step": 2747 }, { "epoch": 0.29, "learning_rate": 0.0001675569492736925, "loss": 0.6655, "step": 2748 }, { "epoch": 0.29, "learning_rate": 0.00016753208726003096, "loss": 0.7103, "step": 2749 }, { "epoch": 0.29, "learning_rate": 0.00016750721756984737, "loss": 0.7253, "step": 2750 }, { "epoch": 0.29, "learning_rate": 0.0001674823402059687, "loss": 0.7248, "step": 2751 }, { "epoch": 0.29, "learning_rate": 0.00016745745517122282, "loss": 0.6781, "step": 2752 }, { "epoch": 0.29, "learning_rate": 0.00016743256246843852, "loss": 0.6712, "step": 2753 }, { "epoch": 0.29, "learning_rate": 0.00016740766210044533, "loss": 0.7547, "step": 2754 }, { "epoch": 0.29, "learning_rate": 0.0001673827540700738, "loss": 0.6989, "step": 2755 }, { "epoch": 0.29, "learning_rate": 0.00016735783838015523, "loss": 0.6793, "step": 2756 }, { "epoch": 0.29, "learning_rate": 0.0001673329150335219, "loss": 0.7234, "step": 2757 }, { "epoch": 0.29, "learning_rate": 0.0001673079840330068, "loss": 0.6876, "step": 2758 }, { "epoch": 0.29, "learning_rate": 0.00016728304538144397, "loss": 0.7066, "step": 2759 }, { "epoch": 0.29, "learning_rate": 0.00016725809908166826, "loss": 0.7131, "step": 2760 }, { "epoch": 0.29, "learning_rate": 0.0001672331451365153, "loss": 0.6924, "step": 2761 }, { "epoch": 0.29, "learning_rate": 0.00016720818354882172, "loss": 0.6646, "step": 2762 }, { "epoch": 0.29, "learning_rate": 0.00016718321432142498, "loss": 0.7192, "step": 2763 }, { "epoch": 0.29, "learning_rate": 0.00016715823745716327, "loss": 0.6839, "step": 2764 }, { "epoch": 0.29, "learning_rate": 0.00016713325295887588, "loss": 0.6966, "step": 2765 }, { "epoch": 0.29, "learning_rate": 0.0001671082608294028, "loss": 0.6962, "step": 2766 }, { "epoch": 0.29, "learning_rate": 0.00016708326107158498, "loss": 0.6535, "step": 2767 }, { "epoch": 0.29, "learning_rate": 0.00016705825368826415, "loss": 0.6764, "step": 2768 }, { "epoch": 0.29, "learning_rate": 0.00016703323868228297, "loss": 0.7087, "step": 2769 }, { "epoch": 0.29, "learning_rate": 0.00016700821605648497, "loss": 0.6967, "step": 2770 }, { "epoch": 0.29, "learning_rate": 0.00016698318581371454, "loss": 0.7272, "step": 2771 }, { "epoch": 0.29, "learning_rate": 0.00016695814795681687, "loss": 0.6777, "step": 2772 }, { "epoch": 0.29, "learning_rate": 0.0001669331024886381, "loss": 0.6873, "step": 2773 }, { "epoch": 0.29, "learning_rate": 0.0001669080494120252, "loss": 0.7561, "step": 2774 }, { "epoch": 0.29, "learning_rate": 0.00016688298872982605, "loss": 0.7162, "step": 2775 }, { "epoch": 0.29, "learning_rate": 0.00016685792044488924, "loss": 0.6671, "step": 2776 }, { "epoch": 0.29, "learning_rate": 0.00016683284456006447, "loss": 0.6846, "step": 2777 }, { "epoch": 0.29, "learning_rate": 0.00016680776107820208, "loss": 0.6485, "step": 2778 }, { "epoch": 0.29, "learning_rate": 0.0001667826700021534, "loss": 0.7161, "step": 2779 }, { "epoch": 0.29, "learning_rate": 0.0001667575713347706, "loss": 0.6673, "step": 2780 }, { "epoch": 0.29, "learning_rate": 0.0001667324650789067, "loss": 0.6939, "step": 2781 }, { "epoch": 0.29, "learning_rate": 0.00016670735123741555, "loss": 0.6679, "step": 2782 }, { "epoch": 0.29, "learning_rate": 0.0001666822298131519, "loss": 0.688, "step": 2783 }, { "epoch": 0.29, "learning_rate": 0.0001666571008089714, "loss": 0.7774, "step": 2784 }, { "epoch": 0.29, "learning_rate": 0.00016663196422773052, "loss": 0.656, "step": 2785 }, { "epoch": 0.29, "learning_rate": 0.00016660682007228652, "loss": 0.7292, "step": 2786 }, { "epoch": 0.29, "learning_rate": 0.00016658166834549766, "loss": 0.6525, "step": 2787 }, { "epoch": 0.29, "learning_rate": 0.00016655650905022298, "loss": 0.6618, "step": 2788 }, { "epoch": 0.29, "learning_rate": 0.00016653134218932232, "loss": 0.6708, "step": 2789 }, { "epoch": 0.29, "learning_rate": 0.00016650616776565659, "loss": 0.7152, "step": 2790 }, { "epoch": 0.29, "learning_rate": 0.0001664809857820873, "loss": 0.6981, "step": 2791 }, { "epoch": 0.29, "learning_rate": 0.000166455796241477, "loss": 0.674, "step": 2792 }, { "epoch": 0.29, "learning_rate": 0.00016643059914668907, "loss": 0.7368, "step": 2793 }, { "epoch": 0.29, "learning_rate": 0.00016640539450058764, "loss": 0.6306, "step": 2794 }, { "epoch": 0.29, "learning_rate": 0.00016638018230603782, "loss": 0.65, "step": 2795 }, { "epoch": 0.29, "learning_rate": 0.00016635496256590555, "loss": 0.7147, "step": 2796 }, { "epoch": 0.29, "learning_rate": 0.00016632973528305758, "loss": 0.679, "step": 2797 }, { "epoch": 0.29, "learning_rate": 0.0001663045004603616, "loss": 0.67, "step": 2798 }, { "epoch": 0.29, "learning_rate": 0.00016627925810068603, "loss": 0.67, "step": 2799 }, { "epoch": 0.29, "learning_rate": 0.0001662540082069003, "loss": 0.6918, "step": 2800 }, { "epoch": 0.29, "learning_rate": 0.0001662287507818746, "loss": 0.6433, "step": 2801 }, { "epoch": 0.29, "learning_rate": 0.00016620348582847998, "loss": 0.689, "step": 2802 }, { "epoch": 0.29, "learning_rate": 0.00016617821334958838, "loss": 0.6818, "step": 2803 }, { "epoch": 0.29, "learning_rate": 0.00016615293334807258, "loss": 0.7236, "step": 2804 }, { "epoch": 0.29, "learning_rate": 0.0001661276458268062, "loss": 0.6887, "step": 2805 }, { "epoch": 0.29, "learning_rate": 0.00016610235078866374, "loss": 0.6718, "step": 2806 }, { "epoch": 0.29, "learning_rate": 0.00016607704823652053, "loss": 0.6661, "step": 2807 }, { "epoch": 0.29, "learning_rate": 0.0001660517381732528, "loss": 0.6775, "step": 2808 }, { "epoch": 0.29, "learning_rate": 0.00016602642060173755, "loss": 0.6938, "step": 2809 }, { "epoch": 0.29, "learning_rate": 0.00016600109552485272, "loss": 0.755, "step": 2810 }, { "epoch": 0.29, "learning_rate": 0.00016597576294547704, "loss": 0.6653, "step": 2811 }, { "epoch": 0.29, "learning_rate": 0.00016595042286649016, "loss": 0.7048, "step": 2812 }, { "epoch": 0.29, "learning_rate": 0.0001659250752907725, "loss": 0.7124, "step": 2813 }, { "epoch": 0.29, "learning_rate": 0.00016589972022120546, "loss": 0.6067, "step": 2814 }, { "epoch": 0.29, "learning_rate": 0.00016587435766067106, "loss": 0.6713, "step": 2815 }, { "epoch": 0.29, "learning_rate": 0.00016584898761205248, "loss": 0.6591, "step": 2816 }, { "epoch": 0.29, "learning_rate": 0.00016582361007823346, "loss": 0.6564, "step": 2817 }, { "epoch": 0.29, "learning_rate": 0.0001657982250620988, "loss": 0.6609, "step": 2818 }, { "epoch": 0.29, "learning_rate": 0.000165772832566534, "loss": 0.6407, "step": 2819 }, { "epoch": 0.29, "learning_rate": 0.0001657474325944256, "loss": 0.7189, "step": 2820 }, { "epoch": 0.29, "learning_rate": 0.00016572202514866078, "loss": 0.6737, "step": 2821 }, { "epoch": 0.29, "learning_rate": 0.00016569661023212764, "loss": 0.6789, "step": 2822 }, { "epoch": 0.29, "learning_rate": 0.0001656711878477152, "loss": 0.7166, "step": 2823 }, { "epoch": 0.29, "learning_rate": 0.00016564575799831328, "loss": 0.728, "step": 2824 }, { "epoch": 0.29, "learning_rate": 0.0001656203206868125, "loss": 0.6838, "step": 2825 }, { "epoch": 0.29, "learning_rate": 0.00016559487591610443, "loss": 0.7218, "step": 2826 }, { "epoch": 0.29, "learning_rate": 0.00016556942368908142, "loss": 0.7229, "step": 2827 }, { "epoch": 0.29, "learning_rate": 0.00016554396400863668, "loss": 0.6834, "step": 2828 }, { "epoch": 0.29, "learning_rate": 0.00016551849687766423, "loss": 0.6707, "step": 2829 }, { "epoch": 0.29, "learning_rate": 0.00016549302229905904, "loss": 0.6747, "step": 2830 }, { "epoch": 0.29, "learning_rate": 0.00016546754027571683, "loss": 0.6213, "step": 2831 }, { "epoch": 0.29, "learning_rate": 0.00016544205081053416, "loss": 0.7364, "step": 2832 }, { "epoch": 0.29, "learning_rate": 0.00016541655390640852, "loss": 0.7018, "step": 2833 }, { "epoch": 0.29, "learning_rate": 0.00016539104956623824, "loss": 0.6564, "step": 2834 }, { "epoch": 0.3, "learning_rate": 0.00016536553779292236, "loss": 0.7324, "step": 2835 }, { "epoch": 0.3, "learning_rate": 0.0001653400185893609, "loss": 0.7038, "step": 2836 }, { "epoch": 0.3, "learning_rate": 0.00016531449195845472, "loss": 0.6762, "step": 2837 }, { "epoch": 0.3, "learning_rate": 0.00016528895790310542, "loss": 0.6952, "step": 2838 }, { "epoch": 0.3, "learning_rate": 0.00016526341642621558, "loss": 0.7335, "step": 2839 }, { "epoch": 0.3, "learning_rate": 0.00016523786753068853, "loss": 0.6573, "step": 2840 }, { "epoch": 0.3, "learning_rate": 0.00016521231121942846, "loss": 0.6355, "step": 2841 }, { "epoch": 0.3, "learning_rate": 0.00016518674749534042, "loss": 0.7326, "step": 2842 }, { "epoch": 0.3, "learning_rate": 0.0001651611763613303, "loss": 0.7602, "step": 2843 }, { "epoch": 0.3, "learning_rate": 0.0001651355978203048, "loss": 0.6037, "step": 2844 }, { "epoch": 0.3, "learning_rate": 0.00016511001187517158, "loss": 0.7273, "step": 2845 }, { "epoch": 0.3, "learning_rate": 0.00016508441852883889, "loss": 0.7434, "step": 2846 }, { "epoch": 0.3, "learning_rate": 0.00016505881778421612, "loss": 0.6931, "step": 2847 }, { "epoch": 0.3, "learning_rate": 0.00016503320964421332, "loss": 0.7179, "step": 2848 }, { "epoch": 0.3, "learning_rate": 0.0001650075941117414, "loss": 0.7224, "step": 2849 }, { "epoch": 0.3, "learning_rate": 0.0001649819711897122, "loss": 0.6889, "step": 2850 }, { "epoch": 0.3, "learning_rate": 0.00016495634088103825, "loss": 0.6804, "step": 2851 }, { "epoch": 0.3, "learning_rate": 0.00016493070318863306, "loss": 0.716, "step": 2852 }, { "epoch": 0.3, "learning_rate": 0.00016490505811541092, "loss": 0.7124, "step": 2853 }, { "epoch": 0.3, "learning_rate": 0.00016487940566428696, "loss": 0.7238, "step": 2854 }, { "epoch": 0.3, "learning_rate": 0.0001648537458381771, "loss": 0.7093, "step": 2855 }, { "epoch": 0.3, "learning_rate": 0.00016482807863999824, "loss": 0.6648, "step": 2856 }, { "epoch": 0.3, "learning_rate": 0.00016480240407266793, "loss": 0.6684, "step": 2857 }, { "epoch": 0.3, "learning_rate": 0.00016477672213910472, "loss": 0.7021, "step": 2858 }, { "epoch": 0.3, "learning_rate": 0.00016475103284222792, "loss": 0.6952, "step": 2859 }, { "epoch": 0.3, "learning_rate": 0.0001647253361849577, "loss": 0.6711, "step": 2860 }, { "epoch": 0.3, "learning_rate": 0.00016469963217021502, "loss": 0.6922, "step": 2861 }, { "epoch": 0.3, "learning_rate": 0.00016467392080092173, "loss": 0.6725, "step": 2862 }, { "epoch": 0.3, "learning_rate": 0.00016464820208000053, "loss": 0.6696, "step": 2863 }, { "epoch": 0.3, "learning_rate": 0.00016462247601037487, "loss": 0.6975, "step": 2864 }, { "epoch": 0.3, "learning_rate": 0.00016459674259496914, "loss": 0.6595, "step": 2865 }, { "epoch": 0.3, "learning_rate": 0.00016457100183670846, "loss": 0.7314, "step": 2866 }, { "epoch": 0.3, "learning_rate": 0.0001645452537385189, "loss": 0.6973, "step": 2867 }, { "epoch": 0.3, "learning_rate": 0.00016451949830332727, "loss": 0.6019, "step": 2868 }, { "epoch": 0.3, "learning_rate": 0.00016449373553406121, "loss": 0.6919, "step": 2869 }, { "epoch": 0.3, "learning_rate": 0.0001644679654336493, "loss": 0.7091, "step": 2870 }, { "epoch": 0.3, "learning_rate": 0.00016444218800502086, "loss": 0.72, "step": 2871 }, { "epoch": 0.3, "learning_rate": 0.00016441640325110606, "loss": 0.62, "step": 2872 }, { "epoch": 0.3, "learning_rate": 0.00016439061117483588, "loss": 0.682, "step": 2873 }, { "epoch": 0.3, "learning_rate": 0.00016436481177914224, "loss": 0.7271, "step": 2874 }, { "epoch": 0.3, "learning_rate": 0.00016433900506695776, "loss": 0.7332, "step": 2875 }, { "epoch": 0.3, "learning_rate": 0.00016431319104121594, "loss": 0.661, "step": 2876 }, { "epoch": 0.3, "learning_rate": 0.00016428736970485115, "loss": 0.7125, "step": 2877 }, { "epoch": 0.3, "learning_rate": 0.0001642615410607985, "loss": 0.6681, "step": 2878 }, { "epoch": 0.3, "learning_rate": 0.0001642357051119941, "loss": 0.6503, "step": 2879 }, { "epoch": 0.3, "learning_rate": 0.00016420986186137465, "loss": 0.7098, "step": 2880 }, { "epoch": 0.3, "learning_rate": 0.0001641840113118779, "loss": 0.6525, "step": 2881 }, { "epoch": 0.3, "learning_rate": 0.0001641581534664423, "loss": 0.6894, "step": 2882 }, { "epoch": 0.3, "learning_rate": 0.0001641322883280072, "loss": 0.6594, "step": 2883 }, { "epoch": 0.3, "learning_rate": 0.0001641064158995127, "loss": 0.6859, "step": 2884 }, { "epoch": 0.3, "learning_rate": 0.0001640805361838998, "loss": 0.6764, "step": 2885 }, { "epoch": 0.3, "learning_rate": 0.00016405464918411032, "loss": 0.7544, "step": 2886 }, { "epoch": 0.3, "learning_rate": 0.00016402875490308686, "loss": 0.6888, "step": 2887 }, { "epoch": 0.3, "learning_rate": 0.00016400285334377293, "loss": 0.6512, "step": 2888 }, { "epoch": 0.3, "learning_rate": 0.00016397694450911277, "loss": 0.6968, "step": 2889 }, { "epoch": 0.3, "learning_rate": 0.00016395102840205153, "loss": 0.681, "step": 2890 }, { "epoch": 0.3, "learning_rate": 0.0001639251050255351, "loss": 0.6427, "step": 2891 }, { "epoch": 0.3, "learning_rate": 0.00016389917438251031, "loss": 0.7063, "step": 2892 }, { "epoch": 0.3, "learning_rate": 0.0001638732364759247, "loss": 0.6825, "step": 2893 }, { "epoch": 0.3, "learning_rate": 0.00016384729130872674, "loss": 0.618, "step": 2894 }, { "epoch": 0.3, "learning_rate": 0.00016382133888386563, "loss": 0.7498, "step": 2895 }, { "epoch": 0.3, "learning_rate": 0.00016379537920429148, "loss": 0.6944, "step": 2896 }, { "epoch": 0.3, "learning_rate": 0.00016376941227295514, "loss": 0.6394, "step": 2897 }, { "epoch": 0.3, "learning_rate": 0.00016374343809280836, "loss": 0.7059, "step": 2898 }, { "epoch": 0.3, "learning_rate": 0.00016371745666680365, "loss": 0.6507, "step": 2899 }, { "epoch": 0.3, "learning_rate": 0.00016369146799789444, "loss": 0.6868, "step": 2900 }, { "epoch": 0.3, "learning_rate": 0.00016366547208903487, "loss": 0.6031, "step": 2901 }, { "epoch": 0.3, "learning_rate": 0.00016363946894317995, "loss": 0.657, "step": 2902 }, { "epoch": 0.3, "learning_rate": 0.00016361345856328555, "loss": 0.7385, "step": 2903 }, { "epoch": 0.3, "learning_rate": 0.00016358744095230828, "loss": 0.6751, "step": 2904 }, { "epoch": 0.3, "learning_rate": 0.00016356141611320563, "loss": 0.6607, "step": 2905 }, { "epoch": 0.3, "learning_rate": 0.00016353538404893594, "loss": 0.681, "step": 2906 }, { "epoch": 0.3, "learning_rate": 0.00016350934476245832, "loss": 0.6927, "step": 2907 }, { "epoch": 0.3, "learning_rate": 0.00016348329825673267, "loss": 0.656, "step": 2908 }, { "epoch": 0.3, "learning_rate": 0.00016345724453471983, "loss": 0.7467, "step": 2909 }, { "epoch": 0.3, "learning_rate": 0.0001634311835993813, "loss": 0.6572, "step": 2910 }, { "epoch": 0.3, "learning_rate": 0.00016340511545367953, "loss": 0.7581, "step": 2911 }, { "epoch": 0.3, "learning_rate": 0.00016337904010057773, "loss": 0.7415, "step": 2912 }, { "epoch": 0.3, "learning_rate": 0.00016335295754304, "loss": 0.7472, "step": 2913 }, { "epoch": 0.3, "learning_rate": 0.00016332686778403112, "loss": 0.7583, "step": 2914 }, { "epoch": 0.3, "learning_rate": 0.0001633007708265168, "loss": 0.6917, "step": 2915 }, { "epoch": 0.3, "learning_rate": 0.00016327466667346354, "loss": 0.681, "step": 2916 }, { "epoch": 0.3, "learning_rate": 0.00016324855532783868, "loss": 0.6834, "step": 2917 }, { "epoch": 0.3, "learning_rate": 0.00016322243679261033, "loss": 0.6955, "step": 2918 }, { "epoch": 0.3, "learning_rate": 0.00016319631107074742, "loss": 0.6942, "step": 2919 }, { "epoch": 0.3, "learning_rate": 0.00016317017816521977, "loss": 0.7281, "step": 2920 }, { "epoch": 0.3, "learning_rate": 0.00016314403807899793, "loss": 0.6562, "step": 2921 }, { "epoch": 0.3, "learning_rate": 0.00016311789081505332, "loss": 0.6403, "step": 2922 }, { "epoch": 0.3, "learning_rate": 0.00016309173637635814, "loss": 0.6861, "step": 2923 }, { "epoch": 0.3, "learning_rate": 0.00016306557476588544, "loss": 0.7416, "step": 2924 }, { "epoch": 0.3, "learning_rate": 0.00016303940598660907, "loss": 0.796, "step": 2925 }, { "epoch": 0.3, "learning_rate": 0.0001630132300415037, "loss": 0.6583, "step": 2926 }, { "epoch": 0.3, "learning_rate": 0.00016298704693354474, "loss": 0.7096, "step": 2927 }, { "epoch": 0.3, "learning_rate": 0.00016296085666570858, "loss": 0.6998, "step": 2928 }, { "epoch": 0.3, "learning_rate": 0.00016293465924097225, "loss": 0.7329, "step": 2929 }, { "epoch": 0.3, "learning_rate": 0.00016290845466231373, "loss": 0.6493, "step": 2930 }, { "epoch": 0.31, "learning_rate": 0.00016288224293271167, "loss": 0.6392, "step": 2931 }, { "epoch": 0.31, "learning_rate": 0.0001628560240551457, "loss": 0.666, "step": 2932 }, { "epoch": 0.31, "learning_rate": 0.00016282979803259614, "loss": 0.6879, "step": 2933 }, { "epoch": 0.31, "learning_rate": 0.00016280356486804418, "loss": 0.6692, "step": 2934 }, { "epoch": 0.31, "learning_rate": 0.00016277732456447178, "loss": 0.6674, "step": 2935 }, { "epoch": 0.31, "learning_rate": 0.00016275107712486174, "loss": 0.697, "step": 2936 }, { "epoch": 0.31, "learning_rate": 0.00016272482255219766, "loss": 0.6921, "step": 2937 }, { "epoch": 0.31, "learning_rate": 0.00016269856084946395, "loss": 0.7212, "step": 2938 }, { "epoch": 0.31, "learning_rate": 0.00016267229201964584, "loss": 0.7538, "step": 2939 }, { "epoch": 0.31, "learning_rate": 0.0001626460160657294, "loss": 0.7316, "step": 2940 }, { "epoch": 0.31, "learning_rate": 0.00016261973299070144, "loss": 0.7022, "step": 2941 }, { "epoch": 0.31, "learning_rate": 0.0001625934427975496, "loss": 0.6926, "step": 2942 }, { "epoch": 0.31, "learning_rate": 0.0001625671454892624, "loss": 0.7583, "step": 2943 }, { "epoch": 0.31, "learning_rate": 0.00016254084106882908, "loss": 0.6845, "step": 2944 }, { "epoch": 0.31, "learning_rate": 0.0001625145295392397, "loss": 0.6848, "step": 2945 }, { "epoch": 0.31, "learning_rate": 0.00016248821090348518, "loss": 0.6928, "step": 2946 }, { "epoch": 0.31, "learning_rate": 0.0001624618851645572, "loss": 0.6642, "step": 2947 }, { "epoch": 0.31, "learning_rate": 0.00016243555232544834, "loss": 0.6784, "step": 2948 }, { "epoch": 0.31, "learning_rate": 0.00016240921238915175, "loss": 0.6502, "step": 2949 }, { "epoch": 0.31, "learning_rate": 0.00016238286535866174, "loss": 0.6685, "step": 2950 }, { "epoch": 0.31, "learning_rate": 0.0001623565112369731, "loss": 0.6596, "step": 2951 }, { "epoch": 0.31, "learning_rate": 0.0001623301500270816, "loss": 0.69, "step": 2952 }, { "epoch": 0.31, "learning_rate": 0.00016230378173198376, "loss": 0.6601, "step": 2953 }, { "epoch": 0.31, "learning_rate": 0.00016227740635467702, "loss": 0.7499, "step": 2954 }, { "epoch": 0.31, "learning_rate": 0.0001622510238981594, "loss": 0.6038, "step": 2955 }, { "epoch": 0.31, "learning_rate": 0.0001622246343654299, "loss": 0.7365, "step": 2956 }, { "epoch": 0.31, "learning_rate": 0.00016219823775948827, "loss": 0.719, "step": 2957 }, { "epoch": 0.31, "learning_rate": 0.0001621718340833351, "loss": 0.6906, "step": 2958 }, { "epoch": 0.31, "learning_rate": 0.00016214542333997173, "loss": 0.6835, "step": 2959 }, { "epoch": 0.31, "learning_rate": 0.00016211900553240034, "loss": 0.689, "step": 2960 }, { "epoch": 0.31, "learning_rate": 0.0001620925806636239, "loss": 0.7023, "step": 2961 }, { "epoch": 0.31, "learning_rate": 0.00016206614873664617, "loss": 0.6569, "step": 2962 }, { "epoch": 0.31, "learning_rate": 0.00016203970975447172, "loss": 0.6096, "step": 2963 }, { "epoch": 0.31, "learning_rate": 0.00016201326372010594, "loss": 0.7117, "step": 2964 }, { "epoch": 0.31, "learning_rate": 0.00016198681063655504, "loss": 0.7065, "step": 2965 }, { "epoch": 0.31, "learning_rate": 0.00016196035050682593, "loss": 0.6685, "step": 2966 }, { "epoch": 0.31, "learning_rate": 0.00016193388333392647, "loss": 0.7105, "step": 2967 }, { "epoch": 0.31, "learning_rate": 0.00016190740912086518, "loss": 0.7283, "step": 2968 }, { "epoch": 0.31, "learning_rate": 0.00016188092787065145, "loss": 0.6305, "step": 2969 }, { "epoch": 0.31, "learning_rate": 0.00016185443958629555, "loss": 0.6532, "step": 2970 }, { "epoch": 0.31, "learning_rate": 0.00016182794427080835, "loss": 0.6933, "step": 2971 }, { "epoch": 0.31, "learning_rate": 0.00016180144192720164, "loss": 0.6699, "step": 2972 }, { "epoch": 0.31, "learning_rate": 0.0001617749325584881, "loss": 0.6697, "step": 2973 }, { "epoch": 0.31, "learning_rate": 0.00016174841616768096, "loss": 0.6503, "step": 2974 }, { "epoch": 0.31, "learning_rate": 0.00016172189275779454, "loss": 0.7356, "step": 2975 }, { "epoch": 0.31, "learning_rate": 0.00016169536233184373, "loss": 0.6647, "step": 2976 }, { "epoch": 0.31, "learning_rate": 0.0001616688248928443, "loss": 0.7256, "step": 2977 }, { "epoch": 0.31, "learning_rate": 0.0001616422804438129, "loss": 0.6734, "step": 2978 }, { "epoch": 0.31, "learning_rate": 0.0001616157289877668, "loss": 0.7266, "step": 2979 }, { "epoch": 0.31, "learning_rate": 0.00016158917052772425, "loss": 0.6664, "step": 2980 }, { "epoch": 0.31, "learning_rate": 0.00016156260506670412, "loss": 0.6932, "step": 2981 }, { "epoch": 0.31, "learning_rate": 0.00016153603260772622, "loss": 0.7247, "step": 2982 }, { "epoch": 0.31, "learning_rate": 0.0001615094531538111, "loss": 0.7059, "step": 2983 }, { "epoch": 0.31, "learning_rate": 0.0001614828667079801, "loss": 0.6548, "step": 2984 }, { "epoch": 0.31, "learning_rate": 0.00016145627327325532, "loss": 0.6577, "step": 2985 }, { "epoch": 0.31, "learning_rate": 0.00016142967285265973, "loss": 0.6629, "step": 2986 }, { "epoch": 0.31, "learning_rate": 0.00016140306544921708, "loss": 0.6642, "step": 2987 }, { "epoch": 0.31, "learning_rate": 0.0001613764510659519, "loss": 0.6786, "step": 2988 }, { "epoch": 0.31, "learning_rate": 0.00016134982970588942, "loss": 0.7135, "step": 2989 }, { "epoch": 0.31, "learning_rate": 0.0001613232013720558, "loss": 0.647, "step": 2990 }, { "epoch": 0.31, "learning_rate": 0.000161296566067478, "loss": 0.6758, "step": 2991 }, { "epoch": 0.31, "learning_rate": 0.00016126992379518365, "loss": 0.6727, "step": 2992 }, { "epoch": 0.31, "learning_rate": 0.00016124327455820122, "loss": 0.6508, "step": 2993 }, { "epoch": 0.31, "learning_rate": 0.00016121661835956003, "loss": 0.7521, "step": 2994 }, { "epoch": 0.31, "learning_rate": 0.00016118995520229013, "loss": 0.6209, "step": 2995 }, { "epoch": 0.31, "learning_rate": 0.00016116328508942237, "loss": 0.6623, "step": 2996 }, { "epoch": 0.31, "learning_rate": 0.00016113660802398845, "loss": 0.6774, "step": 2997 }, { "epoch": 0.31, "learning_rate": 0.00016110992400902076, "loss": 0.7061, "step": 2998 }, { "epoch": 0.31, "learning_rate": 0.00016108323304755252, "loss": 0.7621, "step": 2999 }, { "epoch": 0.31, "learning_rate": 0.00016105653514261783, "loss": 0.6638, "step": 3000 }, { "epoch": 0.31, "learning_rate": 0.0001610298302972514, "loss": 0.7018, "step": 3001 }, { "epoch": 0.31, "learning_rate": 0.00016100311851448892, "loss": 0.6023, "step": 3002 }, { "epoch": 0.31, "learning_rate": 0.0001609763997973667, "loss": 0.7383, "step": 3003 }, { "epoch": 0.31, "learning_rate": 0.00016094967414892196, "loss": 0.6451, "step": 3004 }, { "epoch": 0.31, "learning_rate": 0.00016092294157219267, "loss": 0.6913, "step": 3005 }, { "epoch": 0.31, "learning_rate": 0.00016089620207021752, "loss": 0.674, "step": 3006 }, { "epoch": 0.31, "learning_rate": 0.00016086945564603613, "loss": 0.6597, "step": 3007 }, { "epoch": 0.31, "learning_rate": 0.00016084270230268879, "loss": 0.6393, "step": 3008 }, { "epoch": 0.31, "learning_rate": 0.00016081594204321663, "loss": 0.7359, "step": 3009 }, { "epoch": 0.31, "learning_rate": 0.00016078917487066148, "loss": 0.7137, "step": 3010 }, { "epoch": 0.31, "learning_rate": 0.0001607624007880661, "loss": 0.7092, "step": 3011 }, { "epoch": 0.31, "learning_rate": 0.00016073561979847395, "loss": 0.6276, "step": 3012 }, { "epoch": 0.31, "learning_rate": 0.00016070883190492924, "loss": 0.6629, "step": 3013 }, { "epoch": 0.31, "learning_rate": 0.00016068203711047704, "loss": 0.6902, "step": 3014 }, { "epoch": 0.31, "learning_rate": 0.00016065523541816318, "loss": 0.689, "step": 3015 }, { "epoch": 0.31, "learning_rate": 0.00016062842683103426, "loss": 0.7245, "step": 3016 }, { "epoch": 0.31, "learning_rate": 0.00016060161135213766, "loss": 0.7526, "step": 3017 }, { "epoch": 0.31, "learning_rate": 0.00016057478898452157, "loss": 0.6368, "step": 3018 }, { "epoch": 0.31, "learning_rate": 0.00016054795973123492, "loss": 0.7049, "step": 3019 }, { "epoch": 0.31, "learning_rate": 0.0001605211235953275, "loss": 0.6464, "step": 3020 }, { "epoch": 0.31, "learning_rate": 0.00016049428057984978, "loss": 0.6827, "step": 3021 }, { "epoch": 0.31, "learning_rate": 0.00016046743068785313, "loss": 0.6974, "step": 3022 }, { "epoch": 0.31, "learning_rate": 0.00016044057392238954, "loss": 0.7294, "step": 3023 }, { "epoch": 0.31, "learning_rate": 0.00016041371028651196, "loss": 0.6564, "step": 3024 }, { "epoch": 0.31, "learning_rate": 0.00016038683978327405, "loss": 0.6768, "step": 3025 }, { "epoch": 0.31, "learning_rate": 0.00016035996241573017, "loss": 0.765, "step": 3026 }, { "epoch": 0.32, "learning_rate": 0.00016033307818693558, "loss": 0.7406, "step": 3027 }, { "epoch": 0.32, "learning_rate": 0.00016030618709994625, "loss": 0.7261, "step": 3028 }, { "epoch": 0.32, "learning_rate": 0.00016027928915781893, "loss": 0.7207, "step": 3029 }, { "epoch": 0.32, "learning_rate": 0.00016025238436361122, "loss": 0.6911, "step": 3030 }, { "epoch": 0.32, "learning_rate": 0.0001602254727203814, "loss": 0.6319, "step": 3031 }, { "epoch": 0.32, "learning_rate": 0.00016019855423118863, "loss": 0.6917, "step": 3032 }, { "epoch": 0.32, "learning_rate": 0.0001601716288990927, "loss": 0.6977, "step": 3033 }, { "epoch": 0.32, "learning_rate": 0.0001601446967271544, "loss": 0.6566, "step": 3034 }, { "epoch": 0.32, "learning_rate": 0.0001601177577184351, "loss": 0.7359, "step": 3035 }, { "epoch": 0.32, "learning_rate": 0.00016009081187599695, "loss": 0.6818, "step": 3036 }, { "epoch": 0.32, "learning_rate": 0.00016006385920290308, "loss": 0.637, "step": 3037 }, { "epoch": 0.32, "learning_rate": 0.00016003689970221717, "loss": 0.6351, "step": 3038 }, { "epoch": 0.32, "learning_rate": 0.00016000993337700377, "loss": 0.7112, "step": 3039 }, { "epoch": 0.32, "learning_rate": 0.00015998296023032822, "loss": 0.6973, "step": 3040 }, { "epoch": 0.32, "learning_rate": 0.00015995598026525664, "loss": 0.7058, "step": 3041 }, { "epoch": 0.32, "learning_rate": 0.00015992899348485587, "loss": 0.6721, "step": 3042 }, { "epoch": 0.32, "learning_rate": 0.00015990199989219356, "loss": 0.7145, "step": 3043 }, { "epoch": 0.32, "learning_rate": 0.00015987499949033819, "loss": 0.6668, "step": 3044 }, { "epoch": 0.32, "learning_rate": 0.00015984799228235884, "loss": 0.7185, "step": 3045 }, { "epoch": 0.32, "learning_rate": 0.00015982097827132557, "loss": 0.7165, "step": 3046 }, { "epoch": 0.32, "learning_rate": 0.00015979395746030912, "loss": 0.7031, "step": 3047 }, { "epoch": 0.32, "learning_rate": 0.00015976692985238095, "loss": 0.7166, "step": 3048 }, { "epoch": 0.32, "learning_rate": 0.0001597398954506134, "loss": 0.6657, "step": 3049 }, { "epoch": 0.32, "learning_rate": 0.0001597128542580795, "loss": 0.6963, "step": 3050 }, { "epoch": 0.32, "learning_rate": 0.0001596858062778531, "loss": 0.7005, "step": 3051 }, { "epoch": 0.32, "learning_rate": 0.0001596587515130088, "loss": 0.6674, "step": 3052 }, { "epoch": 0.32, "learning_rate": 0.00015963168996662195, "loss": 0.6863, "step": 3053 }, { "epoch": 0.32, "learning_rate": 0.00015960462164176873, "loss": 0.7292, "step": 3054 }, { "epoch": 0.32, "learning_rate": 0.00015957754654152603, "loss": 0.6792, "step": 3055 }, { "epoch": 0.32, "learning_rate": 0.00015955046466897157, "loss": 0.6826, "step": 3056 }, { "epoch": 0.32, "learning_rate": 0.0001595233760271838, "loss": 0.6796, "step": 3057 }, { "epoch": 0.32, "learning_rate": 0.00015949628061924192, "loss": 0.6942, "step": 3058 }, { "epoch": 0.32, "learning_rate": 0.0001594691784482259, "loss": 0.7075, "step": 3059 }, { "epoch": 0.32, "learning_rate": 0.00015944206951721662, "loss": 0.7154, "step": 3060 }, { "epoch": 0.32, "learning_rate": 0.00015941495382929547, "loss": 0.7154, "step": 3061 }, { "epoch": 0.32, "learning_rate": 0.00015938783138754484, "loss": 0.7036, "step": 3062 }, { "epoch": 0.32, "learning_rate": 0.00015936070219504776, "loss": 0.6938, "step": 3063 }, { "epoch": 0.32, "learning_rate": 0.00015933356625488809, "loss": 0.684, "step": 3064 }, { "epoch": 0.32, "learning_rate": 0.00015930642357015043, "loss": 0.6766, "step": 3065 }, { "epoch": 0.32, "learning_rate": 0.00015927927414392012, "loss": 0.6922, "step": 3066 }, { "epoch": 0.32, "learning_rate": 0.00015925211797928332, "loss": 0.7033, "step": 3067 }, { "epoch": 0.32, "learning_rate": 0.00015922495507932695, "loss": 0.6961, "step": 3068 }, { "epoch": 0.32, "learning_rate": 0.00015919778544713862, "loss": 0.6902, "step": 3069 }, { "epoch": 0.32, "learning_rate": 0.0001591706090858068, "loss": 0.6937, "step": 3070 }, { "epoch": 0.32, "learning_rate": 0.00015914342599842072, "loss": 0.7125, "step": 3071 }, { "epoch": 0.32, "learning_rate": 0.00015911623618807027, "loss": 0.661, "step": 3072 }, { "epoch": 0.32, "learning_rate": 0.00015908903965784622, "loss": 0.6907, "step": 3073 }, { "epoch": 0.32, "learning_rate": 0.00015906183641084006, "loss": 0.7674, "step": 3074 }, { "epoch": 0.32, "learning_rate": 0.00015903462645014402, "loss": 0.693, "step": 3075 }, { "epoch": 0.32, "learning_rate": 0.00015900740977885117, "loss": 0.713, "step": 3076 }, { "epoch": 0.32, "learning_rate": 0.00015898018640005522, "loss": 0.6979, "step": 3077 }, { "epoch": 0.32, "learning_rate": 0.00015895295631685073, "loss": 0.722, "step": 3078 }, { "epoch": 0.32, "learning_rate": 0.00015892571953233302, "loss": 0.6504, "step": 3079 }, { "epoch": 0.32, "learning_rate": 0.0001588984760495982, "loss": 0.7504, "step": 3080 }, { "epoch": 0.32, "learning_rate": 0.00015887122587174298, "loss": 0.709, "step": 3081 }, { "epoch": 0.32, "learning_rate": 0.00015884396900186503, "loss": 0.7359, "step": 3082 }, { "epoch": 0.32, "learning_rate": 0.0001588167054430627, "loss": 0.6752, "step": 3083 }, { "epoch": 0.32, "learning_rate": 0.0001587894351984351, "loss": 0.7715, "step": 3084 }, { "epoch": 0.32, "learning_rate": 0.0001587621582710821, "loss": 0.7533, "step": 3085 }, { "epoch": 0.32, "learning_rate": 0.00015873487466410425, "loss": 0.7447, "step": 3086 }, { "epoch": 0.32, "learning_rate": 0.00015870758438060305, "loss": 0.6385, "step": 3087 }, { "epoch": 0.32, "learning_rate": 0.00015868028742368058, "loss": 0.7375, "step": 3088 }, { "epoch": 0.32, "learning_rate": 0.00015865298379643975, "loss": 0.711, "step": 3089 }, { "epoch": 0.32, "learning_rate": 0.00015862567350198427, "loss": 0.6851, "step": 3090 }, { "epoch": 0.32, "learning_rate": 0.00015859835654341852, "loss": 0.6991, "step": 3091 }, { "epoch": 0.32, "learning_rate": 0.00015857103292384769, "loss": 0.7284, "step": 3092 }, { "epoch": 0.32, "learning_rate": 0.00015854370264637772, "loss": 0.6253, "step": 3093 }, { "epoch": 0.32, "learning_rate": 0.00015851636571411528, "loss": 0.6594, "step": 3094 }, { "epoch": 0.32, "learning_rate": 0.00015848902213016786, "loss": 0.7309, "step": 3095 }, { "epoch": 0.32, "learning_rate": 0.0001584616718976436, "loss": 0.6929, "step": 3096 }, { "epoch": 0.32, "learning_rate": 0.00015843431501965153, "loss": 0.7155, "step": 3097 }, { "epoch": 0.32, "learning_rate": 0.00015840695149930135, "loss": 0.6632, "step": 3098 }, { "epoch": 0.32, "learning_rate": 0.00015837958133970353, "loss": 0.7059, "step": 3099 }, { "epoch": 0.32, "learning_rate": 0.00015835220454396928, "loss": 0.6679, "step": 3100 }, { "epoch": 0.32, "learning_rate": 0.0001583248211152106, "loss": 0.807, "step": 3101 }, { "epoch": 0.32, "learning_rate": 0.0001582974310565402, "loss": 0.7282, "step": 3102 }, { "epoch": 0.32, "learning_rate": 0.0001582700343710716, "loss": 0.7236, "step": 3103 }, { "epoch": 0.32, "learning_rate": 0.00015824263106191904, "loss": 0.7008, "step": 3104 }, { "epoch": 0.32, "learning_rate": 0.00015821522113219748, "loss": 0.6782, "step": 3105 }, { "epoch": 0.32, "learning_rate": 0.0001581878045850227, "loss": 0.7059, "step": 3106 }, { "epoch": 0.32, "learning_rate": 0.00015816038142351117, "loss": 0.7171, "step": 3107 }, { "epoch": 0.32, "learning_rate": 0.0001581329516507802, "loss": 0.705, "step": 3108 }, { "epoch": 0.32, "learning_rate": 0.0001581055152699477, "loss": 0.72, "step": 3109 }, { "epoch": 0.32, "learning_rate": 0.00015807807228413254, "loss": 0.7308, "step": 3110 }, { "epoch": 0.32, "learning_rate": 0.00015805062269645413, "loss": 0.7393, "step": 3111 }, { "epoch": 0.32, "learning_rate": 0.00015802316651003276, "loss": 0.713, "step": 3112 }, { "epoch": 0.32, "learning_rate": 0.00015799570372798945, "loss": 0.6887, "step": 3113 }, { "epoch": 0.32, "learning_rate": 0.0001579682343534459, "loss": 0.6739, "step": 3114 }, { "epoch": 0.32, "learning_rate": 0.0001579407583895247, "loss": 0.7598, "step": 3115 }, { "epoch": 0.32, "learning_rate": 0.00015791327583934903, "loss": 0.7093, "step": 3116 }, { "epoch": 0.32, "learning_rate": 0.00015788578670604294, "loss": 0.6248, "step": 3117 }, { "epoch": 0.32, "learning_rate": 0.00015785829099273116, "loss": 0.6884, "step": 3118 }, { "epoch": 0.32, "learning_rate": 0.00015783078870253918, "loss": 0.7448, "step": 3119 }, { "epoch": 0.32, "learning_rate": 0.00015780327983859328, "loss": 0.719, "step": 3120 }, { "epoch": 0.32, "learning_rate": 0.0001577757644040204, "loss": 0.7145, "step": 3121 }, { "epoch": 0.32, "learning_rate": 0.00015774824240194835, "loss": 0.7147, "step": 3122 }, { "epoch": 0.33, "learning_rate": 0.00015772071383550552, "loss": 0.7562, "step": 3123 }, { "epoch": 0.33, "learning_rate": 0.00015769317870782123, "loss": 0.6428, "step": 3124 }, { "epoch": 0.33, "learning_rate": 0.00015766563702202544, "loss": 0.7354, "step": 3125 }, { "epoch": 0.33, "learning_rate": 0.00015763808878124883, "loss": 0.6623, "step": 3126 }, { "epoch": 0.33, "learning_rate": 0.00015761053398862294, "loss": 0.6838, "step": 3127 }, { "epoch": 0.33, "learning_rate": 0.00015758297264727993, "loss": 0.7094, "step": 3128 }, { "epoch": 0.33, "learning_rate": 0.00015755540476035276, "loss": 0.7132, "step": 3129 }, { "epoch": 0.33, "learning_rate": 0.0001575278303309752, "loss": 0.6654, "step": 3130 }, { "epoch": 0.33, "learning_rate": 0.00015750024936228162, "loss": 0.7102, "step": 3131 }, { "epoch": 0.33, "learning_rate": 0.00015747266185740723, "loss": 0.7493, "step": 3132 }, { "epoch": 0.33, "learning_rate": 0.00015744506781948796, "loss": 0.7483, "step": 3133 }, { "epoch": 0.33, "learning_rate": 0.00015741746725166054, "loss": 0.6443, "step": 3134 }, { "epoch": 0.33, "learning_rate": 0.0001573898601570623, "loss": 0.6713, "step": 3135 }, { "epoch": 0.33, "learning_rate": 0.00015736224653883143, "loss": 0.6518, "step": 3136 }, { "epoch": 0.33, "learning_rate": 0.00015733462640010686, "loss": 0.7029, "step": 3137 }, { "epoch": 0.33, "learning_rate": 0.00015730699974402822, "loss": 0.7233, "step": 3138 }, { "epoch": 0.33, "learning_rate": 0.00015727936657373588, "loss": 0.6822, "step": 3139 }, { "epoch": 0.33, "learning_rate": 0.000157251726892371, "loss": 0.7477, "step": 3140 }, { "epoch": 0.33, "learning_rate": 0.00015722408070307538, "loss": 0.7174, "step": 3141 }, { "epoch": 0.33, "learning_rate": 0.00015719642800899168, "loss": 0.669, "step": 3142 }, { "epoch": 0.33, "learning_rate": 0.00015716876881326323, "loss": 0.6614, "step": 3143 }, { "epoch": 0.33, "learning_rate": 0.00015714110311903408, "loss": 0.6947, "step": 3144 }, { "epoch": 0.33, "learning_rate": 0.0001571134309294491, "loss": 0.7556, "step": 3145 }, { "epoch": 0.33, "learning_rate": 0.0001570857522476538, "loss": 0.6751, "step": 3146 }, { "epoch": 0.33, "learning_rate": 0.00015705806707679452, "loss": 0.7247, "step": 3147 }, { "epoch": 0.33, "learning_rate": 0.0001570303754200183, "loss": 0.7446, "step": 3148 }, { "epoch": 0.33, "learning_rate": 0.00015700267728047283, "loss": 0.7199, "step": 3149 }, { "epoch": 0.33, "learning_rate": 0.00015697497266130669, "loss": 0.6787, "step": 3150 }, { "epoch": 0.33, "learning_rate": 0.00015694726156566914, "loss": 0.7068, "step": 3151 }, { "epoch": 0.33, "learning_rate": 0.0001569195439967101, "loss": 0.702, "step": 3152 }, { "epoch": 0.33, "learning_rate": 0.00015689181995758036, "loss": 0.7006, "step": 3153 }, { "epoch": 0.33, "learning_rate": 0.0001568640894514313, "loss": 0.6819, "step": 3154 }, { "epoch": 0.33, "learning_rate": 0.0001568363524814152, "loss": 0.75, "step": 3155 }, { "epoch": 0.33, "learning_rate": 0.0001568086090506849, "loss": 0.6834, "step": 3156 }, { "epoch": 0.33, "learning_rate": 0.00015678085916239406, "loss": 0.6971, "step": 3157 }, { "epoch": 0.33, "learning_rate": 0.00015675310281969713, "loss": 0.7351, "step": 3158 }, { "epoch": 0.33, "learning_rate": 0.00015672534002574918, "loss": 0.6504, "step": 3159 }, { "epoch": 0.33, "learning_rate": 0.00015669757078370605, "loss": 0.7078, "step": 3160 }, { "epoch": 0.33, "learning_rate": 0.00015666979509672442, "loss": 0.7118, "step": 3161 }, { "epoch": 0.33, "learning_rate": 0.00015664201296796155, "loss": 0.6513, "step": 3162 }, { "epoch": 0.33, "learning_rate": 0.0001566142244005755, "loss": 0.6679, "step": 3163 }, { "epoch": 0.33, "learning_rate": 0.0001565864293977251, "loss": 0.695, "step": 3164 }, { "epoch": 0.33, "learning_rate": 0.0001565586279625698, "loss": 0.651, "step": 3165 }, { "epoch": 0.33, "learning_rate": 0.00015653082009826989, "loss": 0.6854, "step": 3166 }, { "epoch": 0.33, "learning_rate": 0.0001565030058079864, "loss": 0.6811, "step": 3167 }, { "epoch": 0.33, "learning_rate": 0.00015647518509488093, "loss": 0.6739, "step": 3168 }, { "epoch": 0.33, "learning_rate": 0.000156447357962116, "loss": 0.7046, "step": 3169 }, { "epoch": 0.33, "learning_rate": 0.00015641952441285476, "loss": 0.6758, "step": 3170 }, { "epoch": 0.33, "learning_rate": 0.00015639168445026114, "loss": 0.6545, "step": 3171 }, { "epoch": 0.33, "learning_rate": 0.00015636383807749973, "loss": 0.7578, "step": 3172 }, { "epoch": 0.33, "learning_rate": 0.0001563359852977359, "loss": 0.6573, "step": 3173 }, { "epoch": 0.33, "learning_rate": 0.00015630812611413573, "loss": 0.719, "step": 3174 }, { "epoch": 0.33, "learning_rate": 0.00015628026052986611, "loss": 0.6654, "step": 3175 }, { "epoch": 0.33, "learning_rate": 0.00015625238854809448, "loss": 0.713, "step": 3176 }, { "epoch": 0.33, "learning_rate": 0.00015622451017198913, "loss": 0.6411, "step": 3177 }, { "epoch": 0.33, "learning_rate": 0.0001561966254047191, "loss": 0.6476, "step": 3178 }, { "epoch": 0.33, "learning_rate": 0.00015616873424945408, "loss": 0.6998, "step": 3179 }, { "epoch": 0.33, "learning_rate": 0.00015614083670936456, "loss": 0.7089, "step": 3180 }, { "epoch": 0.33, "learning_rate": 0.00015611293278762166, "loss": 0.7264, "step": 3181 }, { "epoch": 0.33, "learning_rate": 0.00015608502248739731, "loss": 0.69, "step": 3182 }, { "epoch": 0.33, "learning_rate": 0.00015605710581186415, "loss": 0.6509, "step": 3183 }, { "epoch": 0.33, "learning_rate": 0.00015602918276419548, "loss": 0.7166, "step": 3184 }, { "epoch": 0.33, "learning_rate": 0.00015600125334756543, "loss": 0.7575, "step": 3185 }, { "epoch": 0.33, "learning_rate": 0.00015597331756514877, "loss": 0.7007, "step": 3186 }, { "epoch": 0.33, "learning_rate": 0.00015594537542012104, "loss": 0.669, "step": 3187 }, { "epoch": 0.33, "learning_rate": 0.00015591742691565847, "loss": 0.7102, "step": 3188 }, { "epoch": 0.33, "learning_rate": 0.000155889472054938, "loss": 0.667, "step": 3189 }, { "epoch": 0.33, "learning_rate": 0.00015586151084113738, "loss": 0.6994, "step": 3190 }, { "epoch": 0.33, "learning_rate": 0.00015583354327743503, "loss": 0.7079, "step": 3191 }, { "epoch": 0.33, "learning_rate": 0.00015580556936701002, "loss": 0.7223, "step": 3192 }, { "epoch": 0.33, "learning_rate": 0.00015577758911304219, "loss": 0.705, "step": 3193 }, { "epoch": 0.33, "learning_rate": 0.00015574960251871223, "loss": 0.7435, "step": 3194 }, { "epoch": 0.33, "learning_rate": 0.00015572160958720135, "loss": 0.7062, "step": 3195 }, { "epoch": 0.33, "learning_rate": 0.00015569361032169158, "loss": 0.7109, "step": 3196 }, { "epoch": 0.33, "learning_rate": 0.00015566560472536568, "loss": 0.7497, "step": 3197 }, { "epoch": 0.33, "learning_rate": 0.0001556375928014071, "loss": 0.6307, "step": 3198 }, { "epoch": 0.33, "learning_rate": 0.00015560957455300003, "loss": 0.669, "step": 3199 }, { "epoch": 0.33, "learning_rate": 0.00015558154998332935, "loss": 0.6368, "step": 3200 }, { "epoch": 0.33, "learning_rate": 0.00015555351909558068, "loss": 0.6995, "step": 3201 }, { "epoch": 0.33, "learning_rate": 0.00015552548189294032, "loss": 0.6768, "step": 3202 }, { "epoch": 0.33, "learning_rate": 0.00015549743837859535, "loss": 0.6775, "step": 3203 }, { "epoch": 0.33, "learning_rate": 0.00015546938855573358, "loss": 0.6342, "step": 3204 }, { "epoch": 0.33, "learning_rate": 0.00015544133242754345, "loss": 0.7031, "step": 3205 }, { "epoch": 0.33, "learning_rate": 0.00015541326999721412, "loss": 0.6914, "step": 3206 }, { "epoch": 0.33, "learning_rate": 0.0001553852012679356, "loss": 0.7002, "step": 3207 }, { "epoch": 0.33, "learning_rate": 0.0001553571262428985, "loss": 0.6807, "step": 3208 }, { "epoch": 0.33, "learning_rate": 0.0001553290449252941, "loss": 0.6371, "step": 3209 }, { "epoch": 0.33, "learning_rate": 0.00015530095731831453, "loss": 0.6903, "step": 3210 }, { "epoch": 0.33, "learning_rate": 0.00015527286342515258, "loss": 0.7056, "step": 3211 }, { "epoch": 0.33, "learning_rate": 0.00015524476324900173, "loss": 0.6964, "step": 3212 }, { "epoch": 0.33, "learning_rate": 0.00015521665679305615, "loss": 0.6276, "step": 3213 }, { "epoch": 0.33, "learning_rate": 0.0001551885440605108, "loss": 0.7073, "step": 3214 }, { "epoch": 0.33, "learning_rate": 0.00015516042505456134, "loss": 0.7085, "step": 3215 }, { "epoch": 0.33, "learning_rate": 0.00015513229977840408, "loss": 0.725, "step": 3216 }, { "epoch": 0.33, "learning_rate": 0.00015510416823523606, "loss": 0.6831, "step": 3217 }, { "epoch": 0.33, "learning_rate": 0.0001550760304282551, "loss": 0.6831, "step": 3218 }, { "epoch": 0.34, "learning_rate": 0.0001550478863606597, "loss": 0.7133, "step": 3219 }, { "epoch": 0.34, "learning_rate": 0.00015501973603564904, "loss": 0.6588, "step": 3220 }, { "epoch": 0.34, "learning_rate": 0.000154991579456423, "loss": 0.6426, "step": 3221 }, { "epoch": 0.34, "learning_rate": 0.00015496341662618224, "loss": 0.6182, "step": 3222 }, { "epoch": 0.34, "learning_rate": 0.00015493524754812808, "loss": 0.6373, "step": 3223 }, { "epoch": 0.34, "learning_rate": 0.00015490707222546253, "loss": 0.6626, "step": 3224 }, { "epoch": 0.34, "learning_rate": 0.00015487889066138842, "loss": 0.7256, "step": 3225 }, { "epoch": 0.34, "learning_rate": 0.0001548507028591091, "loss": 0.7055, "step": 3226 }, { "epoch": 0.34, "learning_rate": 0.00015482250882182884, "loss": 0.7221, "step": 3227 }, { "epoch": 0.34, "learning_rate": 0.00015479430855275248, "loss": 0.654, "step": 3228 }, { "epoch": 0.34, "learning_rate": 0.00015476610205508558, "loss": 0.7216, "step": 3229 }, { "epoch": 0.34, "learning_rate": 0.00015473788933203448, "loss": 0.6159, "step": 3230 }, { "epoch": 0.34, "learning_rate": 0.00015470967038680615, "loss": 0.7225, "step": 3231 }, { "epoch": 0.34, "learning_rate": 0.0001546814452226083, "loss": 0.66, "step": 3232 }, { "epoch": 0.34, "learning_rate": 0.0001546532138426494, "loss": 0.6558, "step": 3233 }, { "epoch": 0.34, "learning_rate": 0.00015462497625013855, "loss": 0.6763, "step": 3234 }, { "epoch": 0.34, "learning_rate": 0.00015459673244828552, "loss": 0.6665, "step": 3235 }, { "epoch": 0.34, "learning_rate": 0.0001545684824403009, "loss": 0.7086, "step": 3236 }, { "epoch": 0.34, "learning_rate": 0.00015454022622939591, "loss": 0.6605, "step": 3237 }, { "epoch": 0.34, "learning_rate": 0.00015451196381878254, "loss": 0.7203, "step": 3238 }, { "epoch": 0.34, "learning_rate": 0.00015448369521167335, "loss": 0.6639, "step": 3239 }, { "epoch": 0.34, "learning_rate": 0.00015445542041128183, "loss": 0.6921, "step": 3240 }, { "epoch": 0.34, "learning_rate": 0.00015442713942082192, "loss": 0.7071, "step": 3241 }, { "epoch": 0.34, "learning_rate": 0.00015439885224350844, "loss": 0.6957, "step": 3242 }, { "epoch": 0.34, "learning_rate": 0.0001543705588825568, "loss": 0.7062, "step": 3243 }, { "epoch": 0.34, "learning_rate": 0.00015434225934118326, "loss": 0.6859, "step": 3244 }, { "epoch": 0.34, "learning_rate": 0.0001543139536226046, "loss": 0.6595, "step": 3245 }, { "epoch": 0.34, "learning_rate": 0.00015428564173003846, "loss": 0.6454, "step": 3246 }, { "epoch": 0.34, "learning_rate": 0.0001542573236667031, "loss": 0.7206, "step": 3247 }, { "epoch": 0.34, "learning_rate": 0.0001542289994358175, "loss": 0.7249, "step": 3248 }, { "epoch": 0.34, "learning_rate": 0.00015420066904060128, "loss": 0.6592, "step": 3249 }, { "epoch": 0.34, "learning_rate": 0.0001541723324842749, "loss": 0.6932, "step": 3250 }, { "epoch": 0.34, "learning_rate": 0.0001541439897700594, "loss": 0.738, "step": 3251 }, { "epoch": 0.34, "learning_rate": 0.00015411564090117653, "loss": 0.6589, "step": 3252 }, { "epoch": 0.34, "learning_rate": 0.00015408728588084882, "loss": 0.6612, "step": 3253 }, { "epoch": 0.34, "learning_rate": 0.00015405892471229946, "loss": 0.6883, "step": 3254 }, { "epoch": 0.34, "learning_rate": 0.00015403055739875228, "loss": 0.7562, "step": 3255 }, { "epoch": 0.34, "learning_rate": 0.00015400218394343184, "loss": 0.7251, "step": 3256 }, { "epoch": 0.34, "learning_rate": 0.0001539738043495635, "loss": 0.6497, "step": 3257 }, { "epoch": 0.34, "learning_rate": 0.00015394541862037318, "loss": 0.7175, "step": 3258 }, { "epoch": 0.34, "learning_rate": 0.00015391702675908748, "loss": 0.698, "step": 3259 }, { "epoch": 0.34, "learning_rate": 0.0001538886287689339, "loss": 0.7139, "step": 3260 }, { "epoch": 0.34, "learning_rate": 0.00015386022465314038, "loss": 0.6619, "step": 3261 }, { "epoch": 0.34, "learning_rate": 0.00015383181441493577, "loss": 0.6636, "step": 3262 }, { "epoch": 0.34, "learning_rate": 0.00015380339805754945, "loss": 0.721, "step": 3263 }, { "epoch": 0.34, "learning_rate": 0.0001537749755842117, "loss": 0.7238, "step": 3264 }, { "epoch": 0.34, "learning_rate": 0.0001537465469981532, "loss": 0.7219, "step": 3265 }, { "epoch": 0.34, "learning_rate": 0.00015371811230260556, "loss": 0.6992, "step": 3266 }, { "epoch": 0.34, "learning_rate": 0.00015368967150080102, "loss": 0.6372, "step": 3267 }, { "epoch": 0.34, "learning_rate": 0.00015366122459597252, "loss": 0.7116, "step": 3268 }, { "epoch": 0.34, "learning_rate": 0.00015363277159135364, "loss": 0.715, "step": 3269 }, { "epoch": 0.34, "learning_rate": 0.00015360431249017878, "loss": 0.676, "step": 3270 }, { "epoch": 0.34, "learning_rate": 0.0001535758472956829, "loss": 0.6798, "step": 3271 }, { "epoch": 0.34, "learning_rate": 0.00015354737601110168, "loss": 0.702, "step": 3272 }, { "epoch": 0.34, "learning_rate": 0.0001535188986396715, "loss": 0.7292, "step": 3273 }, { "epoch": 0.34, "learning_rate": 0.0001534904151846295, "loss": 0.6782, "step": 3274 }, { "epoch": 0.34, "learning_rate": 0.00015346192564921345, "loss": 0.6364, "step": 3275 }, { "epoch": 0.34, "learning_rate": 0.00015343343003666182, "loss": 0.679, "step": 3276 }, { "epoch": 0.34, "learning_rate": 0.00015340492835021373, "loss": 0.6798, "step": 3277 }, { "epoch": 0.34, "learning_rate": 0.00015337642059310905, "loss": 0.6748, "step": 3278 }, { "epoch": 0.34, "learning_rate": 0.0001533479067685883, "loss": 0.7404, "step": 3279 }, { "epoch": 0.34, "learning_rate": 0.00015331938687989275, "loss": 0.722, "step": 3280 }, { "epoch": 0.34, "learning_rate": 0.0001532908609302643, "loss": 0.6897, "step": 3281 }, { "epoch": 0.34, "learning_rate": 0.00015326232892294559, "loss": 0.6379, "step": 3282 }, { "epoch": 0.34, "learning_rate": 0.0001532337908611799, "loss": 0.7392, "step": 3283 }, { "epoch": 0.34, "learning_rate": 0.00015320524674821115, "loss": 0.6994, "step": 3284 }, { "epoch": 0.34, "learning_rate": 0.00015317669658728407, "loss": 0.7201, "step": 3285 }, { "epoch": 0.34, "learning_rate": 0.00015314814038164403, "loss": 0.6795, "step": 3286 }, { "epoch": 0.34, "learning_rate": 0.00015311957813453702, "loss": 0.741, "step": 3287 }, { "epoch": 0.34, "learning_rate": 0.00015309100984920986, "loss": 0.6974, "step": 3288 }, { "epoch": 0.34, "learning_rate": 0.00015306243552890993, "loss": 0.6673, "step": 3289 }, { "epoch": 0.34, "learning_rate": 0.00015303385517688534, "loss": 0.5874, "step": 3290 }, { "epoch": 0.34, "learning_rate": 0.0001530052687963848, "loss": 0.7529, "step": 3291 }, { "epoch": 0.34, "learning_rate": 0.00015297667639065793, "loss": 0.7201, "step": 3292 }, { "epoch": 0.34, "learning_rate": 0.0001529480779629548, "loss": 0.624, "step": 3293 }, { "epoch": 0.34, "learning_rate": 0.00015291947351652629, "loss": 0.7134, "step": 3294 }, { "epoch": 0.34, "learning_rate": 0.00015289086305462392, "loss": 0.6514, "step": 3295 }, { "epoch": 0.34, "learning_rate": 0.0001528622465804999, "loss": 0.6377, "step": 3296 }, { "epoch": 0.34, "learning_rate": 0.00015283362409740714, "loss": 0.6917, "step": 3297 }, { "epoch": 0.34, "learning_rate": 0.0001528049956085992, "loss": 0.6657, "step": 3298 }, { "epoch": 0.34, "learning_rate": 0.00015277636111733035, "loss": 0.6466, "step": 3299 }, { "epoch": 0.34, "learning_rate": 0.00015274772062685556, "loss": 0.6064, "step": 3300 }, { "epoch": 0.34, "learning_rate": 0.00015271907414043045, "loss": 0.7168, "step": 3301 }, { "epoch": 0.34, "learning_rate": 0.0001526904216613113, "loss": 0.7179, "step": 3302 }, { "epoch": 0.34, "learning_rate": 0.00015266176319275515, "loss": 0.6885, "step": 3303 }, { "epoch": 0.34, "learning_rate": 0.00015263309873801963, "loss": 0.6794, "step": 3304 }, { "epoch": 0.34, "learning_rate": 0.0001526044283003631, "loss": 0.7195, "step": 3305 }, { "epoch": 0.34, "learning_rate": 0.0001525757518830446, "loss": 0.6561, "step": 3306 }, { "epoch": 0.34, "learning_rate": 0.00015254706948932386, "loss": 0.6228, "step": 3307 }, { "epoch": 0.34, "learning_rate": 0.0001525183811224612, "loss": 0.734, "step": 3308 }, { "epoch": 0.34, "learning_rate": 0.00015248968678571782, "loss": 0.6385, "step": 3309 }, { "epoch": 0.34, "learning_rate": 0.00015246098648235534, "loss": 0.6768, "step": 3310 }, { "epoch": 0.34, "learning_rate": 0.00015243228021563624, "loss": 0.7193, "step": 3311 }, { "epoch": 0.34, "learning_rate": 0.00015240356798882366, "loss": 0.6835, "step": 3312 }, { "epoch": 0.34, "learning_rate": 0.0001523748498051813, "loss": 0.6915, "step": 3313 }, { "epoch": 0.34, "learning_rate": 0.00015234612566797368, "loss": 0.6586, "step": 3314 }, { "epoch": 0.35, "learning_rate": 0.0001523173955804659, "loss": 0.7085, "step": 3315 }, { "epoch": 0.35, "learning_rate": 0.0001522886595459238, "loss": 0.7258, "step": 3316 }, { "epoch": 0.35, "learning_rate": 0.0001522599175676139, "loss": 0.6636, "step": 3317 }, { "epoch": 0.35, "learning_rate": 0.00015223116964880332, "loss": 0.6723, "step": 3318 }, { "epoch": 0.35, "learning_rate": 0.00015220241579275986, "loss": 0.6783, "step": 3319 }, { "epoch": 0.35, "learning_rate": 0.00015217365600275214, "loss": 0.6976, "step": 3320 }, { "epoch": 0.35, "learning_rate": 0.00015214489028204925, "loss": 0.705, "step": 3321 }, { "epoch": 0.35, "learning_rate": 0.00015211611863392115, "loss": 0.6316, "step": 3322 }, { "epoch": 0.35, "learning_rate": 0.00015208734106163826, "loss": 0.7253, "step": 3323 }, { "epoch": 0.35, "learning_rate": 0.00015205855756847186, "loss": 0.6539, "step": 3324 }, { "epoch": 0.35, "learning_rate": 0.00015202976815769384, "loss": 0.6725, "step": 3325 }, { "epoch": 0.35, "learning_rate": 0.00015200097283257674, "loss": 0.6536, "step": 3326 }, { "epoch": 0.35, "learning_rate": 0.00015197217159639375, "loss": 0.6879, "step": 3327 }, { "epoch": 0.35, "learning_rate": 0.0001519433644524189, "loss": 0.672, "step": 3328 }, { "epoch": 0.35, "learning_rate": 0.0001519145514039266, "loss": 0.7177, "step": 3329 }, { "epoch": 0.35, "learning_rate": 0.00015188573245419217, "loss": 0.6687, "step": 3330 }, { "epoch": 0.35, "learning_rate": 0.00015185690760649153, "loss": 0.7184, "step": 3331 }, { "epoch": 0.35, "learning_rate": 0.00015182807686410125, "loss": 0.6835, "step": 3332 }, { "epoch": 0.35, "learning_rate": 0.00015179924023029856, "loss": 0.6696, "step": 3333 }, { "epoch": 0.35, "learning_rate": 0.00015177039770836146, "loss": 0.6857, "step": 3334 }, { "epoch": 0.35, "learning_rate": 0.0001517415493015685, "loss": 0.7014, "step": 3335 }, { "epoch": 0.35, "learning_rate": 0.0001517126950131989, "loss": 0.6361, "step": 3336 }, { "epoch": 0.35, "learning_rate": 0.00015168383484653265, "loss": 0.7219, "step": 3337 }, { "epoch": 0.35, "learning_rate": 0.00015165496880485032, "loss": 0.7241, "step": 3338 }, { "epoch": 0.35, "learning_rate": 0.00015162609689143314, "loss": 0.7241, "step": 3339 }, { "epoch": 0.35, "learning_rate": 0.00015159721910956315, "loss": 0.6723, "step": 3340 }, { "epoch": 0.35, "learning_rate": 0.0001515683354625229, "loss": 0.7273, "step": 3341 }, { "epoch": 0.35, "learning_rate": 0.00015153944595359563, "loss": 0.7127, "step": 3342 }, { "epoch": 0.35, "learning_rate": 0.00015151055058606523, "loss": 0.6839, "step": 3343 }, { "epoch": 0.35, "learning_rate": 0.00015148164936321643, "loss": 0.6567, "step": 3344 }, { "epoch": 0.35, "learning_rate": 0.00015145274228833442, "loss": 0.6713, "step": 3345 }, { "epoch": 0.35, "learning_rate": 0.0001514238293647051, "loss": 0.6188, "step": 3346 }, { "epoch": 0.35, "learning_rate": 0.00015139491059561517, "loss": 0.7108, "step": 3347 }, { "epoch": 0.35, "learning_rate": 0.0001513659859843518, "loss": 0.7453, "step": 3348 }, { "epoch": 0.35, "learning_rate": 0.00015133705553420292, "loss": 0.6718, "step": 3349 }, { "epoch": 0.35, "learning_rate": 0.00015130811924845715, "loss": 0.6245, "step": 3350 }, { "epoch": 0.35, "learning_rate": 0.00015127917713040375, "loss": 0.7187, "step": 3351 }, { "epoch": 0.35, "learning_rate": 0.0001512502291833326, "loss": 0.7469, "step": 3352 }, { "epoch": 0.35, "learning_rate": 0.0001512212754105343, "loss": 0.7198, "step": 3353 }, { "epoch": 0.35, "learning_rate": 0.0001511923158153001, "loss": 0.7436, "step": 3354 }, { "epoch": 0.35, "learning_rate": 0.00015116335040092188, "loss": 0.7124, "step": 3355 }, { "epoch": 0.35, "learning_rate": 0.00015113437917069217, "loss": 0.7424, "step": 3356 }, { "epoch": 0.35, "learning_rate": 0.00015110540212790428, "loss": 0.6745, "step": 3357 }, { "epoch": 0.35, "learning_rate": 0.000151076419275852, "loss": 0.68, "step": 3358 }, { "epoch": 0.35, "learning_rate": 0.00015104743061782996, "loss": 0.6638, "step": 3359 }, { "epoch": 0.35, "learning_rate": 0.0001510184361571333, "loss": 0.6576, "step": 3360 }, { "epoch": 0.35, "learning_rate": 0.00015098943589705795, "loss": 0.6957, "step": 3361 }, { "epoch": 0.35, "learning_rate": 0.00015096042984090037, "loss": 0.6112, "step": 3362 }, { "epoch": 0.35, "learning_rate": 0.00015093141799195773, "loss": 0.6847, "step": 3363 }, { "epoch": 0.35, "learning_rate": 0.00015090240035352796, "loss": 0.7107, "step": 3364 }, { "epoch": 0.35, "learning_rate": 0.00015087337692890952, "loss": 0.659, "step": 3365 }, { "epoch": 0.35, "learning_rate": 0.0001508443477214015, "loss": 0.7053, "step": 3366 }, { "epoch": 0.35, "learning_rate": 0.0001508153127343038, "loss": 0.7071, "step": 3367 }, { "epoch": 0.35, "learning_rate": 0.00015078627197091685, "loss": 0.716, "step": 3368 }, { "epoch": 0.35, "learning_rate": 0.0001507572254345418, "loss": 0.742, "step": 3369 }, { "epoch": 0.35, "learning_rate": 0.00015072817312848042, "loss": 0.6936, "step": 3370 }, { "epoch": 0.35, "learning_rate": 0.00015069911505603516, "loss": 0.7001, "step": 3371 }, { "epoch": 0.35, "learning_rate": 0.0001506700512205091, "loss": 0.678, "step": 3372 }, { "epoch": 0.35, "learning_rate": 0.000150640981625206, "loss": 0.6822, "step": 3373 }, { "epoch": 0.35, "learning_rate": 0.00015061190627343028, "loss": 0.6549, "step": 3374 }, { "epoch": 0.35, "learning_rate": 0.00015058282516848697, "loss": 0.6798, "step": 3375 }, { "epoch": 0.35, "learning_rate": 0.00015055373831368178, "loss": 0.6798, "step": 3376 }, { "epoch": 0.35, "learning_rate": 0.0001505246457123211, "loss": 0.7203, "step": 3377 }, { "epoch": 0.35, "learning_rate": 0.00015049554736771198, "loss": 0.726, "step": 3378 }, { "epoch": 0.35, "learning_rate": 0.00015046644328316203, "loss": 0.6677, "step": 3379 }, { "epoch": 0.35, "learning_rate": 0.0001504373334619796, "loss": 0.7127, "step": 3380 }, { "epoch": 0.35, "learning_rate": 0.0001504082179074737, "loss": 0.6976, "step": 3381 }, { "epoch": 0.35, "learning_rate": 0.0001503790966229539, "loss": 0.6834, "step": 3382 }, { "epoch": 0.35, "learning_rate": 0.00015034996961173054, "loss": 0.6613, "step": 3383 }, { "epoch": 0.35, "learning_rate": 0.00015032083687711452, "loss": 0.7233, "step": 3384 }, { "epoch": 0.35, "learning_rate": 0.0001502916984224174, "loss": 0.714, "step": 3385 }, { "epoch": 0.35, "learning_rate": 0.00015026255425095147, "loss": 0.7006, "step": 3386 }, { "epoch": 0.35, "learning_rate": 0.00015023340436602956, "loss": 0.6985, "step": 3387 }, { "epoch": 0.35, "learning_rate": 0.00015020424877096525, "loss": 0.7325, "step": 3388 }, { "epoch": 0.35, "learning_rate": 0.0001501750874690727, "loss": 0.664, "step": 3389 }, { "epoch": 0.35, "learning_rate": 0.00015014592046366668, "loss": 0.7518, "step": 3390 }, { "epoch": 0.35, "learning_rate": 0.0001501167477580628, "loss": 0.7198, "step": 3391 }, { "epoch": 0.35, "learning_rate": 0.0001500875693555771, "loss": 0.5972, "step": 3392 }, { "epoch": 0.35, "learning_rate": 0.0001500583852595263, "loss": 0.703, "step": 3393 }, { "epoch": 0.35, "learning_rate": 0.00015002919547322795, "loss": 0.68, "step": 3394 }, { "epoch": 0.35, "learning_rate": 0.00015000000000000001, "loss": 0.6838, "step": 3395 }, { "epoch": 0.35, "learning_rate": 0.00014997079884316125, "loss": 0.6978, "step": 3396 }, { "epoch": 0.35, "learning_rate": 0.000149941592006031, "loss": 0.7021, "step": 3397 }, { "epoch": 0.35, "learning_rate": 0.00014991237949192932, "loss": 0.7419, "step": 3398 }, { "epoch": 0.35, "learning_rate": 0.00014988316130417682, "loss": 0.6936, "step": 3399 }, { "epoch": 0.35, "learning_rate": 0.00014985393744609477, "loss": 0.7208, "step": 3400 }, { "epoch": 0.35, "learning_rate": 0.00014982470792100516, "loss": 0.6803, "step": 3401 }, { "epoch": 0.35, "learning_rate": 0.00014979547273223057, "loss": 0.6067, "step": 3402 }, { "epoch": 0.35, "learning_rate": 0.00014976623188309418, "loss": 0.6981, "step": 3403 }, { "epoch": 0.35, "learning_rate": 0.0001497369853769199, "loss": 0.654, "step": 3404 }, { "epoch": 0.35, "learning_rate": 0.00014970773321703226, "loss": 0.7168, "step": 3405 }, { "epoch": 0.35, "learning_rate": 0.0001496784754067564, "loss": 0.6413, "step": 3406 }, { "epoch": 0.35, "learning_rate": 0.00014964921194941813, "loss": 0.7225, "step": 3407 }, { "epoch": 0.35, "learning_rate": 0.00014961994284834386, "loss": 0.7342, "step": 3408 }, { "epoch": 0.35, "learning_rate": 0.0001495906681068607, "loss": 0.7091, "step": 3409 }, { "epoch": 0.35, "learning_rate": 0.00014956138772829637, "loss": 0.754, "step": 3410 }, { "epoch": 0.36, "learning_rate": 0.00014953210171597924, "loss": 0.7081, "step": 3411 }, { "epoch": 0.36, "learning_rate": 0.00014950281007323834, "loss": 0.7607, "step": 3412 }, { "epoch": 0.36, "learning_rate": 0.0001494735128034032, "loss": 0.6859, "step": 3413 }, { "epoch": 0.36, "learning_rate": 0.0001494442099098043, "loss": 0.6722, "step": 3414 }, { "epoch": 0.36, "learning_rate": 0.0001494149013957724, "loss": 0.6875, "step": 3415 }, { "epoch": 0.36, "learning_rate": 0.0001493855872646391, "loss": 0.7181, "step": 3416 }, { "epoch": 0.36, "learning_rate": 0.00014935626751973668, "loss": 0.6531, "step": 3417 }, { "epoch": 0.36, "learning_rate": 0.0001493269421643979, "loss": 0.7182, "step": 3418 }, { "epoch": 0.36, "learning_rate": 0.00014929761120195627, "loss": 0.7275, "step": 3419 }, { "epoch": 0.36, "learning_rate": 0.00014926827463574588, "loss": 0.656, "step": 3420 }, { "epoch": 0.36, "learning_rate": 0.00014923893246910152, "loss": 0.6533, "step": 3421 }, { "epoch": 0.36, "learning_rate": 0.00014920958470535854, "loss": 0.6947, "step": 3422 }, { "epoch": 0.36, "learning_rate": 0.000149180231347853, "loss": 0.7024, "step": 3423 }, { "epoch": 0.36, "learning_rate": 0.00014915087239992156, "loss": 0.6732, "step": 3424 }, { "epoch": 0.36, "learning_rate": 0.0001491215078649015, "loss": 0.67, "step": 3425 }, { "epoch": 0.36, "learning_rate": 0.00014909213774613072, "loss": 0.6936, "step": 3426 }, { "epoch": 0.36, "learning_rate": 0.00014906276204694783, "loss": 0.7064, "step": 3427 }, { "epoch": 0.36, "learning_rate": 0.00014903338077069204, "loss": 0.704, "step": 3428 }, { "epoch": 0.36, "learning_rate": 0.00014900399392070316, "loss": 0.6768, "step": 3429 }, { "epoch": 0.36, "learning_rate": 0.00014897460150032165, "loss": 0.6987, "step": 3430 }, { "epoch": 0.36, "learning_rate": 0.0001489452035128887, "loss": 0.6577, "step": 3431 }, { "epoch": 0.36, "learning_rate": 0.00014891579996174589, "loss": 0.7083, "step": 3432 }, { "epoch": 0.36, "learning_rate": 0.00014888639085023568, "loss": 0.7347, "step": 3433 }, { "epoch": 0.36, "learning_rate": 0.00014885697618170107, "loss": 0.7187, "step": 3434 }, { "epoch": 0.36, "learning_rate": 0.00014882755595948567, "loss": 0.6151, "step": 3435 }, { "epoch": 0.36, "learning_rate": 0.00014879813018693375, "loss": 0.6716, "step": 3436 }, { "epoch": 0.36, "learning_rate": 0.00014876869886739025, "loss": 0.742, "step": 3437 }, { "epoch": 0.36, "learning_rate": 0.00014873926200420062, "loss": 0.6781, "step": 3438 }, { "epoch": 0.36, "learning_rate": 0.00014870981960071096, "loss": 0.656, "step": 3439 }, { "epoch": 0.36, "learning_rate": 0.00014868037166026823, "loss": 0.7143, "step": 3440 }, { "epoch": 0.36, "learning_rate": 0.00014865091818621972, "loss": 0.7335, "step": 3441 }, { "epoch": 0.36, "learning_rate": 0.00014862145918191348, "loss": 0.7109, "step": 3442 }, { "epoch": 0.36, "learning_rate": 0.00014859199465069823, "loss": 0.6737, "step": 3443 }, { "epoch": 0.36, "learning_rate": 0.00014856252459592318, "loss": 0.7564, "step": 3444 }, { "epoch": 0.36, "learning_rate": 0.00014853304902093836, "loss": 0.751, "step": 3445 }, { "epoch": 0.36, "learning_rate": 0.00014850356792909427, "loss": 0.7327, "step": 3446 }, { "epoch": 0.36, "learning_rate": 0.00014847408132374207, "loss": 0.713, "step": 3447 }, { "epoch": 0.36, "learning_rate": 0.0001484445892082336, "loss": 0.6966, "step": 3448 }, { "epoch": 0.36, "learning_rate": 0.00014841509158592132, "loss": 0.6132, "step": 3449 }, { "epoch": 0.36, "learning_rate": 0.00014838558846015824, "loss": 0.6958, "step": 3450 }, { "epoch": 0.36, "learning_rate": 0.0001483560798342981, "loss": 0.6934, "step": 3451 }, { "epoch": 0.36, "learning_rate": 0.00014832656571169513, "loss": 0.6986, "step": 3452 }, { "epoch": 0.36, "learning_rate": 0.0001482970460957043, "loss": 0.6923, "step": 3453 }, { "epoch": 0.36, "learning_rate": 0.0001482675209896812, "loss": 0.6662, "step": 3454 }, { "epoch": 0.36, "learning_rate": 0.00014823799039698202, "loss": 0.7145, "step": 3455 }, { "epoch": 0.36, "learning_rate": 0.00014820845432096351, "loss": 0.7511, "step": 3456 }, { "epoch": 0.36, "learning_rate": 0.00014817891276498317, "loss": 0.6737, "step": 3457 }, { "epoch": 0.36, "learning_rate": 0.000148149365732399, "loss": 0.7284, "step": 3458 }, { "epoch": 0.36, "learning_rate": 0.00014811981322656966, "loss": 0.6836, "step": 3459 }, { "epoch": 0.36, "learning_rate": 0.00014809025525085452, "loss": 0.678, "step": 3460 }, { "epoch": 0.36, "learning_rate": 0.00014806069180861348, "loss": 0.7031, "step": 3461 }, { "epoch": 0.36, "learning_rate": 0.00014803112290320705, "loss": 0.6856, "step": 3462 }, { "epoch": 0.36, "learning_rate": 0.00014800154853799645, "loss": 0.6395, "step": 3463 }, { "epoch": 0.36, "learning_rate": 0.00014797196871634338, "loss": 0.743, "step": 3464 }, { "epoch": 0.36, "learning_rate": 0.00014794238344161028, "loss": 0.7118, "step": 3465 }, { "epoch": 0.36, "learning_rate": 0.0001479127927171602, "loss": 0.686, "step": 3466 }, { "epoch": 0.36, "learning_rate": 0.00014788319654635677, "loss": 0.6884, "step": 3467 }, { "epoch": 0.36, "learning_rate": 0.00014785359493256424, "loss": 0.6839, "step": 3468 }, { "epoch": 0.36, "learning_rate": 0.00014782398787914751, "loss": 0.6375, "step": 3469 }, { "epoch": 0.36, "learning_rate": 0.00014779437538947206, "loss": 0.6729, "step": 3470 }, { "epoch": 0.36, "learning_rate": 0.00014776475746690402, "loss": 0.6961, "step": 3471 }, { "epoch": 0.36, "learning_rate": 0.0001477351341148101, "loss": 0.7211, "step": 3472 }, { "epoch": 0.36, "learning_rate": 0.00014770550533655768, "loss": 0.6644, "step": 3473 }, { "epoch": 0.36, "learning_rate": 0.00014767587113551471, "loss": 0.6728, "step": 3474 }, { "epoch": 0.36, "learning_rate": 0.0001476462315150498, "loss": 0.6821, "step": 3475 }, { "epoch": 0.36, "learning_rate": 0.00014761658647853215, "loss": 0.6618, "step": 3476 }, { "epoch": 0.36, "learning_rate": 0.00014758693602933155, "loss": 0.6747, "step": 3477 }, { "epoch": 0.36, "learning_rate": 0.00014755728017081847, "loss": 0.7392, "step": 3478 }, { "epoch": 0.36, "learning_rate": 0.00014752761890636387, "loss": 0.7522, "step": 3479 }, { "epoch": 0.36, "learning_rate": 0.00014749795223933956, "loss": 0.7209, "step": 3480 }, { "epoch": 0.36, "learning_rate": 0.0001474682801731177, "loss": 0.7273, "step": 3481 }, { "epoch": 0.36, "learning_rate": 0.0001474386027110712, "loss": 0.7049, "step": 3482 }, { "epoch": 0.36, "learning_rate": 0.00014740891985657356, "loss": 0.7237, "step": 3483 }, { "epoch": 0.36, "learning_rate": 0.00014737923161299893, "loss": 0.6679, "step": 3484 }, { "epoch": 0.36, "learning_rate": 0.00014734953798372204, "loss": 0.7184, "step": 3485 }, { "epoch": 0.36, "learning_rate": 0.00014731983897211815, "loss": 0.6846, "step": 3486 }, { "epoch": 0.36, "learning_rate": 0.00014729013458156332, "loss": 0.6675, "step": 3487 }, { "epoch": 0.36, "learning_rate": 0.00014726042481543407, "loss": 0.6295, "step": 3488 }, { "epoch": 0.36, "learning_rate": 0.00014723070967710754, "loss": 0.6688, "step": 3489 }, { "epoch": 0.36, "learning_rate": 0.00014720098916996157, "loss": 0.6993, "step": 3490 }, { "epoch": 0.36, "learning_rate": 0.00014717126329737452, "loss": 0.6813, "step": 3491 }, { "epoch": 0.36, "learning_rate": 0.00014714153206272544, "loss": 0.6844, "step": 3492 }, { "epoch": 0.36, "learning_rate": 0.00014711179546939387, "loss": 0.6903, "step": 3493 }, { "epoch": 0.36, "learning_rate": 0.00014708205352076007, "loss": 0.6115, "step": 3494 }, { "epoch": 0.36, "learning_rate": 0.00014705230622020493, "loss": 0.6898, "step": 3495 }, { "epoch": 0.36, "learning_rate": 0.00014702255357110978, "loss": 0.6858, "step": 3496 }, { "epoch": 0.36, "learning_rate": 0.00014699279557685679, "loss": 0.6768, "step": 3497 }, { "epoch": 0.36, "learning_rate": 0.00014696303224082856, "loss": 0.6578, "step": 3498 }, { "epoch": 0.36, "learning_rate": 0.00014693326356640828, "loss": 0.72, "step": 3499 }, { "epoch": 0.36, "learning_rate": 0.00014690348955697996, "loss": 0.6463, "step": 3500 }, { "epoch": 0.36, "learning_rate": 0.000146873710215928, "loss": 0.7057, "step": 3501 }, { "epoch": 0.36, "learning_rate": 0.00014684392554663753, "loss": 0.6808, "step": 3502 }, { "epoch": 0.36, "learning_rate": 0.00014681413555249414, "loss": 0.7625, "step": 3503 }, { "epoch": 0.36, "learning_rate": 0.00014678434023688422, "loss": 0.7085, "step": 3504 }, { "epoch": 0.36, "learning_rate": 0.00014675453960319464, "loss": 0.7336, "step": 3505 }, { "epoch": 0.36, "learning_rate": 0.00014672473365481289, "loss": 0.6429, "step": 3506 }, { "epoch": 0.37, "learning_rate": 0.00014669492239512713, "loss": 0.7345, "step": 3507 }, { "epoch": 0.37, "learning_rate": 0.00014666510582752603, "loss": 0.6571, "step": 3508 }, { "epoch": 0.37, "learning_rate": 0.00014663528395539888, "loss": 0.617, "step": 3509 }, { "epoch": 0.37, "learning_rate": 0.00014660545678213562, "loss": 0.6638, "step": 3510 }, { "epoch": 0.37, "learning_rate": 0.0001465756243111268, "loss": 0.6845, "step": 3511 }, { "epoch": 0.37, "learning_rate": 0.0001465457865457635, "loss": 0.7538, "step": 3512 }, { "epoch": 0.37, "learning_rate": 0.00014651594348943749, "loss": 0.6764, "step": 3513 }, { "epoch": 0.37, "learning_rate": 0.0001464860951455411, "loss": 0.6719, "step": 3514 }, { "epoch": 0.37, "learning_rate": 0.0001464562415174672, "loss": 0.7146, "step": 3515 }, { "epoch": 0.37, "learning_rate": 0.00014642638260860933, "loss": 0.6506, "step": 3516 }, { "epoch": 0.37, "learning_rate": 0.00014639651842236165, "loss": 0.6684, "step": 3517 }, { "epoch": 0.37, "learning_rate": 0.0001463666489621189, "loss": 0.6957, "step": 3518 }, { "epoch": 0.37, "learning_rate": 0.00014633677423127634, "loss": 0.7728, "step": 3519 }, { "epoch": 0.37, "learning_rate": 0.00014630689423323, "loss": 0.7054, "step": 3520 }, { "epoch": 0.37, "learning_rate": 0.0001462770089713763, "loss": 0.7451, "step": 3521 }, { "epoch": 0.37, "learning_rate": 0.0001462471184491124, "loss": 0.6495, "step": 3522 }, { "epoch": 0.37, "learning_rate": 0.00014621722266983605, "loss": 0.6551, "step": 3523 }, { "epoch": 0.37, "learning_rate": 0.00014618732163694555, "loss": 0.7019, "step": 3524 }, { "epoch": 0.37, "learning_rate": 0.0001461574153538398, "loss": 0.6936, "step": 3525 }, { "epoch": 0.37, "learning_rate": 0.00014612750382391837, "loss": 0.6805, "step": 3526 }, { "epoch": 0.37, "learning_rate": 0.00014609758705058133, "loss": 0.687, "step": 3527 }, { "epoch": 0.37, "learning_rate": 0.00014606766503722936, "loss": 0.6628, "step": 3528 }, { "epoch": 0.37, "learning_rate": 0.00014603773778726378, "loss": 0.7305, "step": 3529 }, { "epoch": 0.37, "learning_rate": 0.0001460078053040865, "loss": 0.6882, "step": 3530 }, { "epoch": 0.37, "learning_rate": 0.00014597786759110002, "loss": 0.6682, "step": 3531 }, { "epoch": 0.37, "learning_rate": 0.00014594792465170742, "loss": 0.5951, "step": 3532 }, { "epoch": 0.37, "learning_rate": 0.00014591797648931236, "loss": 0.6996, "step": 3533 }, { "epoch": 0.37, "learning_rate": 0.00014588802310731911, "loss": 0.6967, "step": 3534 }, { "epoch": 0.37, "learning_rate": 0.00014585806450913259, "loss": 0.7037, "step": 3535 }, { "epoch": 0.37, "learning_rate": 0.0001458281006981582, "loss": 0.6547, "step": 3536 }, { "epoch": 0.37, "learning_rate": 0.00014579813167780206, "loss": 0.69, "step": 3537 }, { "epoch": 0.37, "learning_rate": 0.00014576815745147073, "loss": 0.6338, "step": 3538 }, { "epoch": 0.37, "learning_rate": 0.0001457381780225715, "loss": 0.7207, "step": 3539 }, { "epoch": 0.37, "learning_rate": 0.0001457081933945122, "loss": 0.7162, "step": 3540 }, { "epoch": 0.37, "learning_rate": 0.0001456782035707012, "loss": 0.7117, "step": 3541 }, { "epoch": 0.37, "learning_rate": 0.00014564820855454759, "loss": 0.6405, "step": 3542 }, { "epoch": 0.37, "learning_rate": 0.0001456182083494609, "loss": 0.7506, "step": 3543 }, { "epoch": 0.37, "learning_rate": 0.00014558820295885135, "loss": 0.6618, "step": 3544 }, { "epoch": 0.37, "learning_rate": 0.00014555819238612974, "loss": 0.6544, "step": 3545 }, { "epoch": 0.37, "learning_rate": 0.0001455281766347074, "loss": 0.7324, "step": 3546 }, { "epoch": 0.37, "learning_rate": 0.0001454981557079963, "loss": 0.6368, "step": 3547 }, { "epoch": 0.37, "learning_rate": 0.00014546812960940898, "loss": 0.703, "step": 3548 }, { "epoch": 0.37, "learning_rate": 0.00014543809834235857, "loss": 0.6972, "step": 3549 }, { "epoch": 0.37, "learning_rate": 0.00014540806191025882, "loss": 0.6845, "step": 3550 }, { "epoch": 0.37, "learning_rate": 0.000145378020316524, "loss": 0.6761, "step": 3551 }, { "epoch": 0.37, "learning_rate": 0.00014534797356456904, "loss": 0.641, "step": 3552 }, { "epoch": 0.37, "learning_rate": 0.0001453179216578094, "loss": 0.7146, "step": 3553 }, { "epoch": 0.37, "learning_rate": 0.00014528786459966115, "loss": 0.6786, "step": 3554 }, { "epoch": 0.37, "learning_rate": 0.00014525780239354094, "loss": 0.6652, "step": 3555 }, { "epoch": 0.37, "learning_rate": 0.000145227735042866, "loss": 0.6811, "step": 3556 }, { "epoch": 0.37, "learning_rate": 0.00014519766255105418, "loss": 0.6418, "step": 3557 }, { "epoch": 0.37, "learning_rate": 0.00014516758492152387, "loss": 0.6824, "step": 3558 }, { "epoch": 0.37, "learning_rate": 0.00014513750215769405, "loss": 0.661, "step": 3559 }, { "epoch": 0.37, "learning_rate": 0.0001451074142629843, "loss": 0.6716, "step": 3560 }, { "epoch": 0.37, "learning_rate": 0.0001450773212408148, "loss": 0.7085, "step": 3561 }, { "epoch": 0.37, "learning_rate": 0.00014504722309460627, "loss": 0.6548, "step": 3562 }, { "epoch": 0.37, "learning_rate": 0.00014501711982778002, "loss": 0.703, "step": 3563 }, { "epoch": 0.37, "learning_rate": 0.00014498701144375798, "loss": 0.73, "step": 3564 }, { "epoch": 0.37, "learning_rate": 0.00014495689794596263, "loss": 0.7202, "step": 3565 }, { "epoch": 0.37, "learning_rate": 0.00014492677933781705, "loss": 0.6944, "step": 3566 }, { "epoch": 0.37, "learning_rate": 0.00014489665562274486, "loss": 0.6637, "step": 3567 }, { "epoch": 0.37, "learning_rate": 0.0001448665268041703, "loss": 0.698, "step": 3568 }, { "epoch": 0.37, "learning_rate": 0.00014483639288551817, "loss": 0.6948, "step": 3569 }, { "epoch": 0.37, "learning_rate": 0.0001448062538702139, "loss": 0.7217, "step": 3570 }, { "epoch": 0.37, "learning_rate": 0.00014477610976168344, "loss": 0.7253, "step": 3571 }, { "epoch": 0.37, "learning_rate": 0.0001447459605633533, "loss": 0.6161, "step": 3572 }, { "epoch": 0.37, "learning_rate": 0.00014471580627865066, "loss": 0.7242, "step": 3573 }, { "epoch": 0.37, "learning_rate": 0.0001446856469110032, "loss": 0.6976, "step": 3574 }, { "epoch": 0.37, "learning_rate": 0.0001446554824638392, "loss": 0.7115, "step": 3575 }, { "epoch": 0.37, "learning_rate": 0.00014462531294058748, "loss": 0.7146, "step": 3576 }, { "epoch": 0.37, "learning_rate": 0.00014459513834467756, "loss": 0.649, "step": 3577 }, { "epoch": 0.37, "learning_rate": 0.00014456495867953942, "loss": 0.7047, "step": 3578 }, { "epoch": 0.37, "learning_rate": 0.0001445347739486036, "loss": 0.7105, "step": 3579 }, { "epoch": 0.37, "learning_rate": 0.00014450458415530136, "loss": 0.6496, "step": 3580 }, { "epoch": 0.37, "learning_rate": 0.00014447438930306433, "loss": 0.7554, "step": 3581 }, { "epoch": 0.37, "learning_rate": 0.00014444418939532492, "loss": 0.7438, "step": 3582 }, { "epoch": 0.37, "learning_rate": 0.00014441398443551596, "loss": 0.6493, "step": 3583 }, { "epoch": 0.37, "learning_rate": 0.00014438377442707096, "loss": 0.7595, "step": 3584 }, { "epoch": 0.37, "learning_rate": 0.00014435355937342394, "loss": 0.6935, "step": 3585 }, { "epoch": 0.37, "learning_rate": 0.0001443233392780095, "loss": 0.7093, "step": 3586 }, { "epoch": 0.37, "learning_rate": 0.00014429311414426284, "loss": 0.7348, "step": 3587 }, { "epoch": 0.37, "learning_rate": 0.00014426288397561968, "loss": 0.7111, "step": 3588 }, { "epoch": 0.37, "learning_rate": 0.0001442326487755164, "loss": 0.6737, "step": 3589 }, { "epoch": 0.37, "learning_rate": 0.00014420240854738991, "loss": 0.7944, "step": 3590 }, { "epoch": 0.37, "learning_rate": 0.00014417216329467767, "loss": 0.6331, "step": 3591 }, { "epoch": 0.37, "learning_rate": 0.00014414191302081767, "loss": 0.6913, "step": 3592 }, { "epoch": 0.37, "learning_rate": 0.00014411165772924858, "loss": 0.6534, "step": 3593 }, { "epoch": 0.37, "learning_rate": 0.00014408139742340956, "loss": 0.6678, "step": 3594 }, { "epoch": 0.37, "learning_rate": 0.00014405113210674042, "loss": 0.7091, "step": 3595 }, { "epoch": 0.37, "learning_rate": 0.0001440208617826814, "loss": 0.6886, "step": 3596 }, { "epoch": 0.37, "learning_rate": 0.00014399058645467346, "loss": 0.7433, "step": 3597 }, { "epoch": 0.37, "learning_rate": 0.00014396030612615808, "loss": 0.7171, "step": 3598 }, { "epoch": 0.37, "learning_rate": 0.0001439300208005772, "loss": 0.696, "step": 3599 }, { "epoch": 0.37, "learning_rate": 0.00014389973048137354, "loss": 0.6565, "step": 3600 }, { "epoch": 0.37, "learning_rate": 0.00014386943517199016, "loss": 0.6964, "step": 3601 }, { "epoch": 0.37, "learning_rate": 0.00014383913487587085, "loss": 0.6997, "step": 3602 }, { "epoch": 0.38, "learning_rate": 0.00014380882959645988, "loss": 0.6287, "step": 3603 }, { "epoch": 0.38, "learning_rate": 0.00014377851933720218, "loss": 0.7072, "step": 3604 }, { "epoch": 0.38, "learning_rate": 0.00014374820410154314, "loss": 0.7129, "step": 3605 }, { "epoch": 0.38, "learning_rate": 0.00014371788389292873, "loss": 0.6789, "step": 3606 }, { "epoch": 0.38, "learning_rate": 0.00014368755871480558, "loss": 0.708, "step": 3607 }, { "epoch": 0.38, "learning_rate": 0.0001436572285706208, "loss": 0.643, "step": 3608 }, { "epoch": 0.38, "learning_rate": 0.00014362689346382202, "loss": 0.6314, "step": 3609 }, { "epoch": 0.38, "learning_rate": 0.00014359655339785763, "loss": 0.6788, "step": 3610 }, { "epoch": 0.38, "learning_rate": 0.00014356620837617634, "loss": 0.6774, "step": 3611 }, { "epoch": 0.38, "learning_rate": 0.00014353585840222755, "loss": 0.6608, "step": 3612 }, { "epoch": 0.38, "learning_rate": 0.00014350550347946124, "loss": 0.7018, "step": 3613 }, { "epoch": 0.38, "learning_rate": 0.0001434751436113279, "loss": 0.683, "step": 3614 }, { "epoch": 0.38, "learning_rate": 0.00014344477880127868, "loss": 0.6725, "step": 3615 }, { "epoch": 0.38, "learning_rate": 0.0001434144090527651, "loss": 0.7055, "step": 3616 }, { "epoch": 0.38, "learning_rate": 0.00014338403436923942, "loss": 0.757, "step": 3617 }, { "epoch": 0.38, "learning_rate": 0.00014335365475415439, "loss": 0.641, "step": 3618 }, { "epoch": 0.38, "learning_rate": 0.0001433232702109633, "loss": 0.6667, "step": 3619 }, { "epoch": 0.38, "learning_rate": 0.00014329288074312006, "loss": 0.6866, "step": 3620 }, { "epoch": 0.38, "learning_rate": 0.00014326248635407912, "loss": 0.6167, "step": 3621 }, { "epoch": 0.38, "learning_rate": 0.00014323208704729542, "loss": 0.6431, "step": 3622 }, { "epoch": 0.38, "learning_rate": 0.0001432016828262246, "loss": 0.6852, "step": 3623 }, { "epoch": 0.38, "learning_rate": 0.0001431712736943227, "loss": 0.7118, "step": 3624 }, { "epoch": 0.38, "learning_rate": 0.00014314085965504644, "loss": 0.7287, "step": 3625 }, { "epoch": 0.38, "learning_rate": 0.000143110440711853, "loss": 0.64, "step": 3626 }, { "epoch": 0.38, "learning_rate": 0.00014308001686820022, "loss": 0.7439, "step": 3627 }, { "epoch": 0.38, "learning_rate": 0.00014304958812754647, "loss": 0.7192, "step": 3628 }, { "epoch": 0.38, "learning_rate": 0.00014301915449335057, "loss": 0.6598, "step": 3629 }, { "epoch": 0.38, "learning_rate": 0.00014298871596907201, "loss": 0.7047, "step": 3630 }, { "epoch": 0.38, "learning_rate": 0.00014295827255817085, "loss": 0.699, "step": 3631 }, { "epoch": 0.38, "learning_rate": 0.0001429278242641076, "loss": 0.5892, "step": 3632 }, { "epoch": 0.38, "learning_rate": 0.00014289737109034342, "loss": 0.7021, "step": 3633 }, { "epoch": 0.38, "learning_rate": 0.00014286691304033993, "loss": 0.6707, "step": 3634 }, { "epoch": 0.38, "learning_rate": 0.0001428364501175595, "loss": 0.7295, "step": 3635 }, { "epoch": 0.38, "learning_rate": 0.00014280598232546479, "loss": 0.7324, "step": 3636 }, { "epoch": 0.38, "learning_rate": 0.00014277550966751917, "loss": 0.6097, "step": 3637 }, { "epoch": 0.38, "learning_rate": 0.00014274503214718655, "loss": 0.6761, "step": 3638 }, { "epoch": 0.38, "learning_rate": 0.00014271454976793138, "loss": 0.6973, "step": 3639 }, { "epoch": 0.38, "learning_rate": 0.00014268406253321864, "loss": 0.7145, "step": 3640 }, { "epoch": 0.38, "learning_rate": 0.0001426535704465139, "loss": 0.6957, "step": 3641 }, { "epoch": 0.38, "learning_rate": 0.00014262307351128328, "loss": 0.6681, "step": 3642 }, { "epoch": 0.38, "learning_rate": 0.00014259257173099342, "loss": 0.7203, "step": 3643 }, { "epoch": 0.38, "learning_rate": 0.00014256206510911148, "loss": 0.6679, "step": 3644 }, { "epoch": 0.38, "learning_rate": 0.0001425315536491053, "loss": 0.6482, "step": 3645 }, { "epoch": 0.38, "learning_rate": 0.00014250103735444306, "loss": 0.7029, "step": 3646 }, { "epoch": 0.38, "learning_rate": 0.00014247051622859376, "loss": 0.6873, "step": 3647 }, { "epoch": 0.38, "learning_rate": 0.00014243999027502673, "loss": 0.6583, "step": 3648 }, { "epoch": 0.38, "learning_rate": 0.00014240945949721193, "loss": 0.7373, "step": 3649 }, { "epoch": 0.38, "learning_rate": 0.00014237892389861982, "loss": 0.7018, "step": 3650 }, { "epoch": 0.38, "learning_rate": 0.00014234838348272156, "loss": 0.754, "step": 3651 }, { "epoch": 0.38, "learning_rate": 0.0001423178382529886, "loss": 0.7043, "step": 3652 }, { "epoch": 0.38, "learning_rate": 0.00014228728821289322, "loss": 0.6105, "step": 3653 }, { "epoch": 0.38, "learning_rate": 0.00014225673336590801, "loss": 0.7435, "step": 3654 }, { "epoch": 0.38, "learning_rate": 0.00014222617371550627, "loss": 0.6645, "step": 3655 }, { "epoch": 0.38, "learning_rate": 0.00014219560926516178, "loss": 0.6763, "step": 3656 }, { "epoch": 0.38, "learning_rate": 0.00014216504001834883, "loss": 0.7075, "step": 3657 }, { "epoch": 0.38, "learning_rate": 0.00014213446597854232, "loss": 0.7163, "step": 3658 }, { "epoch": 0.38, "learning_rate": 0.00014210388714921767, "loss": 0.6642, "step": 3659 }, { "epoch": 0.38, "learning_rate": 0.00014207330353385082, "loss": 0.7406, "step": 3660 }, { "epoch": 0.38, "learning_rate": 0.0001420427151359183, "loss": 0.6938, "step": 3661 }, { "epoch": 0.38, "learning_rate": 0.0001420121219588972, "loss": 0.6785, "step": 3662 }, { "epoch": 0.38, "learning_rate": 0.000141981524006265, "loss": 0.6889, "step": 3663 }, { "epoch": 0.38, "learning_rate": 0.00014195092128149994, "loss": 0.721, "step": 3664 }, { "epoch": 0.38, "learning_rate": 0.0001419203137880807, "loss": 0.6992, "step": 3665 }, { "epoch": 0.38, "learning_rate": 0.0001418897015294864, "loss": 0.6519, "step": 3666 }, { "epoch": 0.38, "learning_rate": 0.0001418590845091969, "loss": 0.6723, "step": 3667 }, { "epoch": 0.38, "learning_rate": 0.00014182846273069248, "loss": 0.5978, "step": 3668 }, { "epoch": 0.38, "learning_rate": 0.00014179783619745398, "loss": 0.7118, "step": 3669 }, { "epoch": 0.38, "learning_rate": 0.0001417672049129628, "loss": 0.6897, "step": 3670 }, { "epoch": 0.38, "learning_rate": 0.00014173656888070085, "loss": 0.6896, "step": 3671 }, { "epoch": 0.38, "learning_rate": 0.0001417059281041506, "loss": 0.708, "step": 3672 }, { "epoch": 0.38, "learning_rate": 0.00014167528258679504, "loss": 0.6761, "step": 3673 }, { "epoch": 0.38, "learning_rate": 0.0001416446323321177, "loss": 0.6741, "step": 3674 }, { "epoch": 0.38, "learning_rate": 0.00014161397734360276, "loss": 0.721, "step": 3675 }, { "epoch": 0.38, "learning_rate": 0.00014158331762473473, "loss": 0.6631, "step": 3676 }, { "epoch": 0.38, "learning_rate": 0.00014155265317899882, "loss": 0.7501, "step": 3677 }, { "epoch": 0.38, "learning_rate": 0.00014152198400988071, "loss": 0.7045, "step": 3678 }, { "epoch": 0.38, "learning_rate": 0.00014149131012086664, "loss": 0.7019, "step": 3679 }, { "epoch": 0.38, "learning_rate": 0.00014146063151544336, "loss": 0.6108, "step": 3680 }, { "epoch": 0.38, "learning_rate": 0.00014142994819709822, "loss": 0.6347, "step": 3681 }, { "epoch": 0.38, "learning_rate": 0.00014139926016931904, "loss": 0.6511, "step": 3682 }, { "epoch": 0.38, "learning_rate": 0.00014136856743559412, "loss": 0.6851, "step": 3683 }, { "epoch": 0.38, "learning_rate": 0.0001413378699994125, "loss": 0.7069, "step": 3684 }, { "epoch": 0.38, "learning_rate": 0.00014130716786426355, "loss": 0.7149, "step": 3685 }, { "epoch": 0.38, "learning_rate": 0.00014127646103363726, "loss": 0.7082, "step": 3686 }, { "epoch": 0.38, "learning_rate": 0.00014124574951102415, "loss": 0.7119, "step": 3687 }, { "epoch": 0.38, "learning_rate": 0.00014121503329991527, "loss": 0.6293, "step": 3688 }, { "epoch": 0.38, "learning_rate": 0.00014118431240380222, "loss": 0.6647, "step": 3689 }, { "epoch": 0.38, "learning_rate": 0.00014115358682617704, "loss": 0.6845, "step": 3690 }, { "epoch": 0.38, "learning_rate": 0.00014112285657053245, "loss": 0.7149, "step": 3691 }, { "epoch": 0.38, "learning_rate": 0.00014109212164036157, "loss": 0.6959, "step": 3692 }, { "epoch": 0.38, "learning_rate": 0.00014106138203915815, "loss": 0.6003, "step": 3693 }, { "epoch": 0.38, "learning_rate": 0.00014103063777041642, "loss": 0.6959, "step": 3694 }, { "epoch": 0.38, "learning_rate": 0.00014099988883763115, "loss": 0.702, "step": 3695 }, { "epoch": 0.38, "learning_rate": 0.0001409691352442976, "loss": 0.7849, "step": 3696 }, { "epoch": 0.38, "learning_rate": 0.00014093837699391166, "loss": 0.7066, "step": 3697 }, { "epoch": 0.38, "learning_rate": 0.00014090761408996967, "loss": 0.6916, "step": 3698 }, { "epoch": 0.39, "learning_rate": 0.00014087684653596848, "loss": 0.6921, "step": 3699 }, { "epoch": 0.39, "learning_rate": 0.00014084607433540556, "loss": 0.6769, "step": 3700 }, { "epoch": 0.39, "learning_rate": 0.00014081529749177882, "loss": 0.7024, "step": 3701 }, { "epoch": 0.39, "learning_rate": 0.00014078451600858674, "loss": 0.7027, "step": 3702 }, { "epoch": 0.39, "learning_rate": 0.00014075372988932828, "loss": 0.7413, "step": 3703 }, { "epoch": 0.39, "learning_rate": 0.00014072293913750306, "loss": 0.6152, "step": 3704 }, { "epoch": 0.39, "learning_rate": 0.00014069214375661107, "loss": 0.7155, "step": 3705 }, { "epoch": 0.39, "learning_rate": 0.00014066134375015287, "loss": 0.711, "step": 3706 }, { "epoch": 0.39, "learning_rate": 0.00014063053912162962, "loss": 0.625, "step": 3707 }, { "epoch": 0.39, "learning_rate": 0.0001405997298745429, "loss": 0.7091, "step": 3708 }, { "epoch": 0.39, "learning_rate": 0.00014056891601239494, "loss": 0.7168, "step": 3709 }, { "epoch": 0.39, "learning_rate": 0.00014053809753868828, "loss": 0.772, "step": 3710 }, { "epoch": 0.39, "learning_rate": 0.0001405072744569263, "loss": 0.6913, "step": 3711 }, { "epoch": 0.39, "learning_rate": 0.0001404764467706126, "loss": 0.7217, "step": 3712 }, { "epoch": 0.39, "learning_rate": 0.00014044561448325147, "loss": 0.6374, "step": 3713 }, { "epoch": 0.39, "learning_rate": 0.00014041477759834772, "loss": 0.676, "step": 3714 }, { "epoch": 0.39, "learning_rate": 0.0001403839361194066, "loss": 0.6574, "step": 3715 }, { "epoch": 0.39, "learning_rate": 0.00014035309004993392, "loss": 0.6122, "step": 3716 }, { "epoch": 0.39, "learning_rate": 0.00014032223939343605, "loss": 0.6625, "step": 3717 }, { "epoch": 0.39, "learning_rate": 0.00014029138415341987, "loss": 0.6933, "step": 3718 }, { "epoch": 0.39, "learning_rate": 0.00014026052433339272, "loss": 0.721, "step": 3719 }, { "epoch": 0.39, "learning_rate": 0.00014022965993686252, "loss": 0.7797, "step": 3720 }, { "epoch": 0.39, "learning_rate": 0.00014019879096733773, "loss": 0.6725, "step": 3721 }, { "epoch": 0.39, "learning_rate": 0.00014016791742832725, "loss": 0.6546, "step": 3722 }, { "epoch": 0.39, "learning_rate": 0.0001401370393233405, "loss": 0.6969, "step": 3723 }, { "epoch": 0.39, "learning_rate": 0.0001401061566558876, "loss": 0.6938, "step": 3724 }, { "epoch": 0.39, "learning_rate": 0.00014007526942947895, "loss": 0.6873, "step": 3725 }, { "epoch": 0.39, "learning_rate": 0.0001400443776476256, "loss": 0.6905, "step": 3726 }, { "epoch": 0.39, "learning_rate": 0.00014001348131383905, "loss": 0.6315, "step": 3727 }, { "epoch": 0.39, "learning_rate": 0.0001399825804316314, "loss": 0.6857, "step": 3728 }, { "epoch": 0.39, "learning_rate": 0.0001399516750045152, "loss": 0.7334, "step": 3729 }, { "epoch": 0.39, "learning_rate": 0.00013992076503600352, "loss": 0.7169, "step": 3730 }, { "epoch": 0.39, "learning_rate": 0.00013988985052961001, "loss": 0.6623, "step": 3731 }, { "epoch": 0.39, "learning_rate": 0.00013985893148884876, "loss": 0.6903, "step": 3732 }, { "epoch": 0.39, "learning_rate": 0.00013982800791723443, "loss": 0.6772, "step": 3733 }, { "epoch": 0.39, "learning_rate": 0.00013979707981828213, "loss": 0.6896, "step": 3734 }, { "epoch": 0.39, "learning_rate": 0.0001397661471955076, "loss": 0.6696, "step": 3735 }, { "epoch": 0.39, "learning_rate": 0.00013973521005242688, "loss": 0.6445, "step": 3736 }, { "epoch": 0.39, "learning_rate": 0.0001397042683925568, "loss": 0.7103, "step": 3737 }, { "epoch": 0.39, "learning_rate": 0.00013967332221941455, "loss": 0.6338, "step": 3738 }, { "epoch": 0.39, "learning_rate": 0.00013964237153651782, "loss": 0.7158, "step": 3739 }, { "epoch": 0.39, "learning_rate": 0.0001396114163473848, "loss": 0.6441, "step": 3740 }, { "epoch": 0.39, "learning_rate": 0.00013958045665553428, "loss": 0.6573, "step": 3741 }, { "epoch": 0.39, "learning_rate": 0.00013954949246448557, "loss": 0.725, "step": 3742 }, { "epoch": 0.39, "learning_rate": 0.00013951852377775832, "loss": 0.7111, "step": 3743 }, { "epoch": 0.39, "learning_rate": 0.0001394875505988729, "loss": 0.7457, "step": 3744 }, { "epoch": 0.39, "learning_rate": 0.00013945657293135008, "loss": 0.6756, "step": 3745 }, { "epoch": 0.39, "learning_rate": 0.00013942559077871115, "loss": 0.6796, "step": 3746 }, { "epoch": 0.39, "learning_rate": 0.00013939460414447795, "loss": 0.6862, "step": 3747 }, { "epoch": 0.39, "learning_rate": 0.0001393636130321727, "loss": 0.7493, "step": 3748 }, { "epoch": 0.39, "learning_rate": 0.00013933261744531836, "loss": 0.7387, "step": 3749 }, { "epoch": 0.39, "learning_rate": 0.00013930161738743817, "loss": 0.7644, "step": 3750 }, { "epoch": 0.39, "learning_rate": 0.00013927061286205604, "loss": 0.608, "step": 3751 }, { "epoch": 0.39, "learning_rate": 0.00013923960387269633, "loss": 0.6633, "step": 3752 }, { "epoch": 0.39, "learning_rate": 0.0001392085904228838, "loss": 0.6359, "step": 3753 }, { "epoch": 0.39, "learning_rate": 0.0001391775725161439, "loss": 0.7069, "step": 3754 }, { "epoch": 0.39, "learning_rate": 0.0001391465501560025, "loss": 0.6815, "step": 3755 }, { "epoch": 0.39, "learning_rate": 0.00013911552334598594, "loss": 0.698, "step": 3756 }, { "epoch": 0.39, "learning_rate": 0.00013908449208962118, "loss": 0.671, "step": 3757 }, { "epoch": 0.39, "learning_rate": 0.00013905345639043557, "loss": 0.6611, "step": 3758 }, { "epoch": 0.39, "learning_rate": 0.000139022416251957, "loss": 0.7399, "step": 3759 }, { "epoch": 0.39, "learning_rate": 0.00013899137167771382, "loss": 0.6672, "step": 3760 }, { "epoch": 0.39, "learning_rate": 0.000138960322671235, "loss": 0.6772, "step": 3761 }, { "epoch": 0.39, "learning_rate": 0.00013892926923605, "loss": 0.7286, "step": 3762 }, { "epoch": 0.39, "learning_rate": 0.0001388982113756886, "loss": 0.6696, "step": 3763 }, { "epoch": 0.39, "learning_rate": 0.00013886714909368137, "loss": 0.6682, "step": 3764 }, { "epoch": 0.39, "learning_rate": 0.0001388360823935591, "loss": 0.6324, "step": 3765 }, { "epoch": 0.39, "learning_rate": 0.00013880501127885327, "loss": 0.6865, "step": 3766 }, { "epoch": 0.39, "learning_rate": 0.00013877393575309577, "loss": 0.6755, "step": 3767 }, { "epoch": 0.39, "learning_rate": 0.00013874285581981906, "loss": 0.6384, "step": 3768 }, { "epoch": 0.39, "learning_rate": 0.00013871177148255606, "loss": 0.6811, "step": 3769 }, { "epoch": 0.39, "learning_rate": 0.00013868068274484015, "loss": 0.7223, "step": 3770 }, { "epoch": 0.39, "learning_rate": 0.0001386495896102053, "loss": 0.7175, "step": 3771 }, { "epoch": 0.39, "learning_rate": 0.00013861849208218595, "loss": 0.7316, "step": 3772 }, { "epoch": 0.39, "learning_rate": 0.00013858739016431697, "loss": 0.7099, "step": 3773 }, { "epoch": 0.39, "learning_rate": 0.00013855628386013385, "loss": 0.7514, "step": 3774 }, { "epoch": 0.39, "learning_rate": 0.00013852517317317244, "loss": 0.7304, "step": 3775 }, { "epoch": 0.39, "learning_rate": 0.0001384940581069692, "loss": 0.6548, "step": 3776 }, { "epoch": 0.39, "learning_rate": 0.0001384629386650611, "loss": 0.6279, "step": 3777 }, { "epoch": 0.39, "learning_rate": 0.00013843181485098546, "loss": 0.7344, "step": 3778 }, { "epoch": 0.39, "learning_rate": 0.00013840068666828026, "loss": 0.6831, "step": 3779 }, { "epoch": 0.39, "learning_rate": 0.00013836955412048382, "loss": 0.733, "step": 3780 }, { "epoch": 0.39, "learning_rate": 0.0001383384172111352, "loss": 0.6958, "step": 3781 }, { "epoch": 0.39, "learning_rate": 0.00013830727594377364, "loss": 0.7207, "step": 3782 }, { "epoch": 0.39, "learning_rate": 0.00013827613032193914, "loss": 0.6792, "step": 3783 }, { "epoch": 0.39, "learning_rate": 0.00013824498034917205, "loss": 0.6454, "step": 3784 }, { "epoch": 0.39, "learning_rate": 0.0001382138260290133, "loss": 0.7588, "step": 3785 }, { "epoch": 0.39, "learning_rate": 0.00013818266736500417, "loss": 0.7282, "step": 3786 }, { "epoch": 0.39, "learning_rate": 0.00013815150436068666, "loss": 0.6383, "step": 3787 }, { "epoch": 0.39, "learning_rate": 0.00013812033701960307, "loss": 0.7372, "step": 3788 }, { "epoch": 0.39, "learning_rate": 0.00013808916534529625, "loss": 0.6694, "step": 3789 }, { "epoch": 0.39, "learning_rate": 0.0001380579893413096, "loss": 0.6391, "step": 3790 }, { "epoch": 0.39, "learning_rate": 0.00013802680901118695, "loss": 0.7443, "step": 3791 }, { "epoch": 0.39, "learning_rate": 0.0001379956243584726, "loss": 0.6626, "step": 3792 }, { "epoch": 0.39, "learning_rate": 0.0001379644353867114, "loss": 0.681, "step": 3793 }, { "epoch": 0.39, "learning_rate": 0.0001379332420994487, "loss": 0.6862, "step": 3794 }, { "epoch": 0.4, "learning_rate": 0.00013790204450023026, "loss": 0.6422, "step": 3795 }, { "epoch": 0.4, "learning_rate": 0.0001378708425926024, "loss": 0.6562, "step": 3796 }, { "epoch": 0.4, "learning_rate": 0.00013783963638011194, "loss": 0.6577, "step": 3797 }, { "epoch": 0.4, "learning_rate": 0.00013780842586630615, "loss": 0.6704, "step": 3798 }, { "epoch": 0.4, "learning_rate": 0.00013777721105473275, "loss": 0.6435, "step": 3799 }, { "epoch": 0.4, "learning_rate": 0.00013774599194894002, "loss": 0.695, "step": 3800 }, { "epoch": 0.4, "learning_rate": 0.00013771476855247675, "loss": 0.7002, "step": 3801 }, { "epoch": 0.4, "learning_rate": 0.00013768354086889212, "loss": 0.6225, "step": 3802 }, { "epoch": 0.4, "learning_rate": 0.00013765230890173589, "loss": 0.6991, "step": 3803 }, { "epoch": 0.4, "learning_rate": 0.00013762107265455822, "loss": 0.7022, "step": 3804 }, { "epoch": 0.4, "learning_rate": 0.00013758983213090983, "loss": 0.6808, "step": 3805 }, { "epoch": 0.4, "learning_rate": 0.0001375585873343419, "loss": 0.7075, "step": 3806 }, { "epoch": 0.4, "learning_rate": 0.00013752733826840607, "loss": 0.7199, "step": 3807 }, { "epoch": 0.4, "learning_rate": 0.00013749608493665452, "loss": 0.6944, "step": 3808 }, { "epoch": 0.4, "learning_rate": 0.0001374648273426399, "loss": 0.648, "step": 3809 }, { "epoch": 0.4, "learning_rate": 0.00013743356548991532, "loss": 0.6889, "step": 3810 }, { "epoch": 0.4, "learning_rate": 0.00013740229938203436, "loss": 0.6679, "step": 3811 }, { "epoch": 0.4, "learning_rate": 0.00013737102902255114, "loss": 0.7111, "step": 3812 }, { "epoch": 0.4, "learning_rate": 0.00013733975441502017, "loss": 0.6625, "step": 3813 }, { "epoch": 0.4, "learning_rate": 0.00013730847556299656, "loss": 0.7012, "step": 3814 }, { "epoch": 0.4, "learning_rate": 0.00013727719247003583, "loss": 0.7057, "step": 3815 }, { "epoch": 0.4, "learning_rate": 0.00013724590513969402, "loss": 0.7523, "step": 3816 }, { "epoch": 0.4, "learning_rate": 0.0001372146135755276, "loss": 0.7232, "step": 3817 }, { "epoch": 0.4, "learning_rate": 0.00013718331778109357, "loss": 0.6621, "step": 3818 }, { "epoch": 0.4, "learning_rate": 0.00013715201775994936, "loss": 0.6909, "step": 3819 }, { "epoch": 0.4, "learning_rate": 0.00013712071351565294, "loss": 0.696, "step": 3820 }, { "epoch": 0.4, "learning_rate": 0.00013708940505176276, "loss": 0.7268, "step": 3821 }, { "epoch": 0.4, "learning_rate": 0.00013705809237183768, "loss": 0.6047, "step": 3822 }, { "epoch": 0.4, "learning_rate": 0.0001370267754794371, "loss": 0.6963, "step": 3823 }, { "epoch": 0.4, "learning_rate": 0.00013699545437812085, "loss": 0.6995, "step": 3824 }, { "epoch": 0.4, "learning_rate": 0.0001369641290714493, "loss": 0.6697, "step": 3825 }, { "epoch": 0.4, "learning_rate": 0.00013693279956298327, "loss": 0.6834, "step": 3826 }, { "epoch": 0.4, "learning_rate": 0.00013690146585628406, "loss": 0.64, "step": 3827 }, { "epoch": 0.4, "learning_rate": 0.00013687012795491344, "loss": 0.6671, "step": 3828 }, { "epoch": 0.4, "learning_rate": 0.0001368387858624336, "loss": 0.7281, "step": 3829 }, { "epoch": 0.4, "learning_rate": 0.00013680743958240733, "loss": 0.7458, "step": 3830 }, { "epoch": 0.4, "learning_rate": 0.00013677608911839782, "loss": 0.7181, "step": 3831 }, { "epoch": 0.4, "learning_rate": 0.00013674473447396874, "loss": 0.6774, "step": 3832 }, { "epoch": 0.4, "learning_rate": 0.00013671337565268423, "loss": 0.7329, "step": 3833 }, { "epoch": 0.4, "learning_rate": 0.00013668201265810894, "loss": 0.6791, "step": 3834 }, { "epoch": 0.4, "learning_rate": 0.00013665064549380797, "loss": 0.6567, "step": 3835 }, { "epoch": 0.4, "learning_rate": 0.00013661927416334685, "loss": 0.678, "step": 3836 }, { "epoch": 0.4, "learning_rate": 0.0001365878986702917, "loss": 0.7425, "step": 3837 }, { "epoch": 0.4, "learning_rate": 0.00013655651901820897, "loss": 0.6371, "step": 3838 }, { "epoch": 0.4, "learning_rate": 0.00013652513521066571, "loss": 0.7388, "step": 3839 }, { "epoch": 0.4, "learning_rate": 0.00013649374725122935, "loss": 0.6576, "step": 3840 }, { "epoch": 0.4, "learning_rate": 0.0001364623551434679, "loss": 0.6724, "step": 3841 }, { "epoch": 0.4, "learning_rate": 0.00013643095889094968, "loss": 0.6482, "step": 3842 }, { "epoch": 0.4, "learning_rate": 0.00013639955849724356, "loss": 0.6853, "step": 3843 }, { "epoch": 0.4, "learning_rate": 0.000136368153965919, "loss": 0.7028, "step": 3844 }, { "epoch": 0.4, "learning_rate": 0.00013633674530054573, "loss": 0.6903, "step": 3845 }, { "epoch": 0.4, "learning_rate": 0.00013630533250469408, "loss": 0.6949, "step": 3846 }, { "epoch": 0.4, "learning_rate": 0.00013627391558193483, "loss": 0.6316, "step": 3847 }, { "epoch": 0.4, "learning_rate": 0.0001362424945358392, "loss": 0.6583, "step": 3848 }, { "epoch": 0.4, "learning_rate": 0.00013621106936997885, "loss": 0.6315, "step": 3849 }, { "epoch": 0.4, "learning_rate": 0.00013617964008792597, "loss": 0.671, "step": 3850 }, { "epoch": 0.4, "learning_rate": 0.00013614820669325322, "loss": 0.6383, "step": 3851 }, { "epoch": 0.4, "learning_rate": 0.00013611676918953366, "loss": 0.7081, "step": 3852 }, { "epoch": 0.4, "learning_rate": 0.00013608532758034093, "loss": 0.706, "step": 3853 }, { "epoch": 0.4, "learning_rate": 0.00013605388186924898, "loss": 0.6596, "step": 3854 }, { "epoch": 0.4, "learning_rate": 0.0001360224320598324, "loss": 0.6423, "step": 3855 }, { "epoch": 0.4, "learning_rate": 0.0001359909781556661, "loss": 0.6813, "step": 3856 }, { "epoch": 0.4, "learning_rate": 0.00013595952016032551, "loss": 0.626, "step": 3857 }, { "epoch": 0.4, "learning_rate": 0.0001359280580773866, "loss": 0.666, "step": 3858 }, { "epoch": 0.4, "learning_rate": 0.00013589659191042566, "loss": 0.7364, "step": 3859 }, { "epoch": 0.4, "learning_rate": 0.00013586512166301954, "loss": 0.7063, "step": 3860 }, { "epoch": 0.4, "learning_rate": 0.00013583364733874554, "loss": 0.6917, "step": 3861 }, { "epoch": 0.4, "learning_rate": 0.00013580216894118146, "loss": 0.6552, "step": 3862 }, { "epoch": 0.4, "learning_rate": 0.0001357706864739054, "loss": 0.6702, "step": 3863 }, { "epoch": 0.4, "learning_rate": 0.00013573919994049616, "loss": 0.6825, "step": 3864 }, { "epoch": 0.4, "learning_rate": 0.00013570770934453284, "loss": 0.7408, "step": 3865 }, { "epoch": 0.4, "learning_rate": 0.00013567621468959503, "loss": 0.7247, "step": 3866 }, { "epoch": 0.4, "learning_rate": 0.00013564471597926286, "loss": 0.6965, "step": 3867 }, { "epoch": 0.4, "learning_rate": 0.00013561321321711676, "loss": 0.6791, "step": 3868 }, { "epoch": 0.4, "learning_rate": 0.0001355817064067378, "loss": 0.6854, "step": 3869 }, { "epoch": 0.4, "learning_rate": 0.00013555019555170738, "loss": 0.7808, "step": 3870 }, { "epoch": 0.4, "learning_rate": 0.00013551868065560745, "loss": 0.7157, "step": 3871 }, { "epoch": 0.4, "learning_rate": 0.00013548716172202035, "loss": 0.6933, "step": 3872 }, { "epoch": 0.4, "learning_rate": 0.00013545563875452888, "loss": 0.6646, "step": 3873 }, { "epoch": 0.4, "learning_rate": 0.0001354241117567164, "loss": 0.7043, "step": 3874 }, { "epoch": 0.4, "learning_rate": 0.00013539258073216664, "loss": 0.6647, "step": 3875 }, { "epoch": 0.4, "learning_rate": 0.0001353610456844637, "loss": 0.7139, "step": 3876 }, { "epoch": 0.4, "learning_rate": 0.00013532950661719235, "loss": 0.825, "step": 3877 }, { "epoch": 0.4, "learning_rate": 0.00013529796353393766, "loss": 0.6977, "step": 3878 }, { "epoch": 0.4, "learning_rate": 0.00013526641643828524, "loss": 0.6877, "step": 3879 }, { "epoch": 0.4, "learning_rate": 0.0001352348653338211, "loss": 0.5959, "step": 3880 }, { "epoch": 0.4, "learning_rate": 0.00013520331022413167, "loss": 0.611, "step": 3881 }, { "epoch": 0.4, "learning_rate": 0.00013517175111280394, "loss": 0.694, "step": 3882 }, { "epoch": 0.4, "learning_rate": 0.00013514018800342528, "loss": 0.6698, "step": 3883 }, { "epoch": 0.4, "learning_rate": 0.0001351086208995836, "loss": 0.7039, "step": 3884 }, { "epoch": 0.4, "learning_rate": 0.0001350770498048671, "loss": 0.6211, "step": 3885 }, { "epoch": 0.4, "learning_rate": 0.00013504547472286468, "loss": 0.6933, "step": 3886 }, { "epoch": 0.4, "learning_rate": 0.00013501389565716537, "loss": 0.7479, "step": 3887 }, { "epoch": 0.4, "learning_rate": 0.00013498231261135902, "loss": 0.6869, "step": 3888 }, { "epoch": 0.4, "learning_rate": 0.00013495072558903558, "loss": 0.6419, "step": 3889 }, { "epoch": 0.4, "learning_rate": 0.0001349191345937857, "loss": 0.6739, "step": 3890 }, { "epoch": 0.41, "learning_rate": 0.00013488753962920039, "loss": 0.7444, "step": 3891 }, { "epoch": 0.41, "learning_rate": 0.00013485594069887114, "loss": 0.709, "step": 3892 }, { "epoch": 0.41, "learning_rate": 0.00013482433780638984, "loss": 0.6486, "step": 3893 }, { "epoch": 0.41, "learning_rate": 0.00013479273095534885, "loss": 0.6863, "step": 3894 }, { "epoch": 0.41, "learning_rate": 0.000134761120149341, "loss": 0.6016, "step": 3895 }, { "epoch": 0.41, "learning_rate": 0.00013472950539195958, "loss": 0.7471, "step": 3896 }, { "epoch": 0.41, "learning_rate": 0.0001346978866867983, "loss": 0.6588, "step": 3897 }, { "epoch": 0.41, "learning_rate": 0.00013466626403745133, "loss": 0.6832, "step": 3898 }, { "epoch": 0.41, "learning_rate": 0.0001346346374475133, "loss": 0.7398, "step": 3899 }, { "epoch": 0.41, "learning_rate": 0.00013460300692057922, "loss": 0.6901, "step": 3900 }, { "epoch": 0.41, "learning_rate": 0.0001345713724602447, "loss": 0.7461, "step": 3901 }, { "epoch": 0.41, "learning_rate": 0.00013453973407010557, "loss": 0.6489, "step": 3902 }, { "epoch": 0.41, "learning_rate": 0.00013450809175375833, "loss": 0.6941, "step": 3903 }, { "epoch": 0.41, "learning_rate": 0.00013447644551479982, "loss": 0.7128, "step": 3904 }, { "epoch": 0.41, "learning_rate": 0.00013444479535682733, "loss": 0.7248, "step": 3905 }, { "epoch": 0.41, "learning_rate": 0.0001344131412834386, "loss": 0.7001, "step": 3906 }, { "epoch": 0.41, "learning_rate": 0.0001343814832982318, "loss": 0.7158, "step": 3907 }, { "epoch": 0.41, "learning_rate": 0.00013434982140480558, "loss": 0.6538, "step": 3908 }, { "epoch": 0.41, "learning_rate": 0.00013431815560675903, "loss": 0.6885, "step": 3909 }, { "epoch": 0.41, "learning_rate": 0.00013428648590769164, "loss": 0.698, "step": 3910 }, { "epoch": 0.41, "learning_rate": 0.0001342548123112034, "loss": 0.6774, "step": 3911 }, { "epoch": 0.41, "learning_rate": 0.00013422313482089476, "loss": 0.7143, "step": 3912 }, { "epoch": 0.41, "learning_rate": 0.00013419145344036645, "loss": 0.6716, "step": 3913 }, { "epoch": 0.41, "learning_rate": 0.0001341597681732199, "loss": 0.6781, "step": 3914 }, { "epoch": 0.41, "learning_rate": 0.00013412807902305675, "loss": 0.6391, "step": 3915 }, { "epoch": 0.41, "learning_rate": 0.00013409638599347918, "loss": 0.6678, "step": 3916 }, { "epoch": 0.41, "learning_rate": 0.00013406468908808988, "loss": 0.7132, "step": 3917 }, { "epoch": 0.41, "learning_rate": 0.00013403298831049184, "loss": 0.6218, "step": 3918 }, { "epoch": 0.41, "learning_rate": 0.0001340012836642886, "loss": 0.7089, "step": 3919 }, { "epoch": 0.41, "learning_rate": 0.00013396957515308407, "loss": 0.7051, "step": 3920 }, { "epoch": 0.41, "learning_rate": 0.00013393786278048263, "loss": 0.6579, "step": 3921 }, { "epoch": 0.41, "learning_rate": 0.00013390614655008908, "loss": 0.661, "step": 3922 }, { "epoch": 0.41, "learning_rate": 0.00013387442646550869, "loss": 0.7225, "step": 3923 }, { "epoch": 0.41, "learning_rate": 0.00013384270253034717, "loss": 0.6405, "step": 3924 }, { "epoch": 0.41, "learning_rate": 0.00013381097474821066, "loss": 0.6956, "step": 3925 }, { "epoch": 0.41, "learning_rate": 0.00013377924312270566, "loss": 0.7512, "step": 3926 }, { "epoch": 0.41, "learning_rate": 0.00013374750765743923, "loss": 0.642, "step": 3927 }, { "epoch": 0.41, "learning_rate": 0.00013371576835601883, "loss": 0.7337, "step": 3928 }, { "epoch": 0.41, "learning_rate": 0.00013368402522205227, "loss": 0.7669, "step": 3929 }, { "epoch": 0.41, "learning_rate": 0.00013365227825914787, "loss": 0.7201, "step": 3930 }, { "epoch": 0.41, "learning_rate": 0.00013362052747091448, "loss": 0.6215, "step": 3931 }, { "epoch": 0.41, "learning_rate": 0.00013358877286096115, "loss": 0.6999, "step": 3932 }, { "epoch": 0.41, "learning_rate": 0.00013355701443289755, "loss": 0.6731, "step": 3933 }, { "epoch": 0.41, "learning_rate": 0.00013352525219033375, "loss": 0.6751, "step": 3934 }, { "epoch": 0.41, "learning_rate": 0.00013349348613688025, "loss": 0.6431, "step": 3935 }, { "epoch": 0.41, "learning_rate": 0.0001334617162761479, "loss": 0.7185, "step": 3936 }, { "epoch": 0.41, "learning_rate": 0.00013342994261174808, "loss": 0.6755, "step": 3937 }, { "epoch": 0.41, "learning_rate": 0.00013339816514729264, "loss": 0.647, "step": 3938 }, { "epoch": 0.41, "learning_rate": 0.0001333663838863937, "loss": 0.7521, "step": 3939 }, { "epoch": 0.41, "learning_rate": 0.0001333345988326639, "loss": 0.6743, "step": 3940 }, { "epoch": 0.41, "learning_rate": 0.0001333028099897164, "loss": 0.6765, "step": 3941 }, { "epoch": 0.41, "learning_rate": 0.00013327101736116466, "loss": 0.6776, "step": 3942 }, { "epoch": 0.41, "learning_rate": 0.0001332392209506226, "loss": 0.6977, "step": 3943 }, { "epoch": 0.41, "learning_rate": 0.00013320742076170468, "loss": 0.6348, "step": 3944 }, { "epoch": 0.41, "learning_rate": 0.0001331756167980256, "loss": 0.6964, "step": 3945 }, { "epoch": 0.41, "learning_rate": 0.00013314380906320059, "loss": 0.7008, "step": 3946 }, { "epoch": 0.41, "learning_rate": 0.00013311199756084536, "loss": 0.6901, "step": 3947 }, { "epoch": 0.41, "learning_rate": 0.00013308018229457594, "loss": 0.7287, "step": 3948 }, { "epoch": 0.41, "learning_rate": 0.0001330483632680089, "loss": 0.6443, "step": 3949 }, { "epoch": 0.41, "learning_rate": 0.00013301654048476116, "loss": 0.646, "step": 3950 }, { "epoch": 0.41, "learning_rate": 0.00013298471394845006, "loss": 0.6252, "step": 3951 }, { "epoch": 0.41, "learning_rate": 0.00013295288366269343, "loss": 0.7535, "step": 3952 }, { "epoch": 0.41, "learning_rate": 0.00013292104963110943, "loss": 0.6709, "step": 3953 }, { "epoch": 0.41, "learning_rate": 0.00013288921185731676, "loss": 0.6711, "step": 3954 }, { "epoch": 0.41, "learning_rate": 0.0001328573703449345, "loss": 0.6199, "step": 3955 }, { "epoch": 0.41, "learning_rate": 0.00013282552509758208, "loss": 0.7184, "step": 3956 }, { "epoch": 0.41, "learning_rate": 0.0001327936761188795, "loss": 0.7204, "step": 3957 }, { "epoch": 0.41, "learning_rate": 0.00013276182341244702, "loss": 0.707, "step": 3958 }, { "epoch": 0.41, "learning_rate": 0.0001327299669819055, "loss": 0.6769, "step": 3959 }, { "epoch": 0.41, "learning_rate": 0.000132698106830876, "loss": 0.7155, "step": 3960 }, { "epoch": 0.41, "learning_rate": 0.00013266624296298028, "loss": 0.6624, "step": 3961 }, { "epoch": 0.41, "learning_rate": 0.0001326343753818403, "loss": 0.6661, "step": 3962 }, { "epoch": 0.41, "learning_rate": 0.00013260250409107853, "loss": 0.6544, "step": 3963 }, { "epoch": 0.41, "learning_rate": 0.00013257062909431786, "loss": 0.7191, "step": 3964 }, { "epoch": 0.41, "learning_rate": 0.00013253875039518156, "loss": 0.621, "step": 3965 }, { "epoch": 0.41, "learning_rate": 0.00013250686799729338, "loss": 0.6503, "step": 3966 }, { "epoch": 0.41, "learning_rate": 0.00013247498190427747, "loss": 0.6531, "step": 3967 }, { "epoch": 0.41, "learning_rate": 0.00013244309211975837, "loss": 0.6249, "step": 3968 }, { "epoch": 0.41, "learning_rate": 0.0001324111986473611, "loss": 0.7086, "step": 3969 }, { "epoch": 0.41, "learning_rate": 0.000132379301490711, "loss": 0.7415, "step": 3970 }, { "epoch": 0.41, "learning_rate": 0.00013234740065343393, "loss": 0.74, "step": 3971 }, { "epoch": 0.41, "learning_rate": 0.00013231549613915614, "loss": 0.7178, "step": 3972 }, { "epoch": 0.41, "learning_rate": 0.00013228358795150426, "loss": 0.6941, "step": 3973 }, { "epoch": 0.41, "learning_rate": 0.00013225167609410537, "loss": 0.6816, "step": 3974 }, { "epoch": 0.41, "learning_rate": 0.000132219760570587, "loss": 0.6653, "step": 3975 }, { "epoch": 0.41, "learning_rate": 0.000132187841384577, "loss": 0.6934, "step": 3976 }, { "epoch": 0.41, "learning_rate": 0.00013215591853970373, "loss": 0.7123, "step": 3977 }, { "epoch": 0.41, "learning_rate": 0.00013212399203959592, "loss": 0.7034, "step": 3978 }, { "epoch": 0.41, "learning_rate": 0.0001320920618878827, "loss": 0.6998, "step": 3979 }, { "epoch": 0.41, "learning_rate": 0.00013206012808819368, "loss": 0.6679, "step": 3980 }, { "epoch": 0.41, "learning_rate": 0.00013202819064415884, "loss": 0.7031, "step": 3981 }, { "epoch": 0.41, "learning_rate": 0.0001319962495594086, "loss": 0.704, "step": 3982 }, { "epoch": 0.41, "learning_rate": 0.0001319643048375737, "loss": 0.7209, "step": 3983 }, { "epoch": 0.41, "learning_rate": 0.00013193235648228545, "loss": 0.7602, "step": 3984 }, { "epoch": 0.41, "learning_rate": 0.00013190040449717545, "loss": 0.6529, "step": 3985 }, { "epoch": 0.41, "learning_rate": 0.00013186844888587573, "loss": 0.6668, "step": 3986 }, { "epoch": 0.42, "learning_rate": 0.0001318364896520188, "loss": 0.6856, "step": 3987 }, { "epoch": 0.42, "learning_rate": 0.00013180452679923755, "loss": 0.7425, "step": 3988 }, { "epoch": 0.42, "learning_rate": 0.0001317725603311652, "loss": 0.7424, "step": 3989 }, { "epoch": 0.42, "learning_rate": 0.0001317405902514355, "loss": 0.6931, "step": 3990 }, { "epoch": 0.42, "learning_rate": 0.00013170861656368254, "loss": 0.6487, "step": 3991 }, { "epoch": 0.42, "learning_rate": 0.00013167663927154085, "loss": 0.6739, "step": 3992 }, { "epoch": 0.42, "learning_rate": 0.00013164465837864537, "loss": 0.7425, "step": 3993 }, { "epoch": 0.42, "learning_rate": 0.00013161267388863142, "loss": 0.7132, "step": 3994 }, { "epoch": 0.42, "learning_rate": 0.00013158068580513475, "loss": 0.6614, "step": 3995 }, { "epoch": 0.42, "learning_rate": 0.00013154869413179154, "loss": 0.7247, "step": 3996 }, { "epoch": 0.42, "learning_rate": 0.00013151669887223833, "loss": 0.6582, "step": 3997 }, { "epoch": 0.42, "learning_rate": 0.00013148470003011207, "loss": 0.7455, "step": 3998 }, { "epoch": 0.42, "learning_rate": 0.0001314526976090502, "loss": 0.6658, "step": 3999 }, { "epoch": 0.42, "learning_rate": 0.00013142069161269044, "loss": 0.7282, "step": 4000 }, { "epoch": 0.42, "learning_rate": 0.00013138868204467104, "loss": 0.7055, "step": 4001 }, { "epoch": 0.42, "learning_rate": 0.00013135666890863056, "loss": 0.6847, "step": 4002 }, { "epoch": 0.42, "learning_rate": 0.00013132465220820803, "loss": 0.6731, "step": 4003 }, { "epoch": 0.42, "learning_rate": 0.00013129263194704285, "loss": 0.6707, "step": 4004 }, { "epoch": 0.42, "learning_rate": 0.0001312606081287748, "loss": 0.711, "step": 4005 }, { "epoch": 0.42, "learning_rate": 0.00013122858075704415, "loss": 0.6801, "step": 4006 }, { "epoch": 0.42, "learning_rate": 0.0001311965498354915, "loss": 0.7019, "step": 4007 }, { "epoch": 0.42, "learning_rate": 0.00013116451536775788, "loss": 0.6829, "step": 4008 }, { "epoch": 0.42, "learning_rate": 0.00013113247735748474, "loss": 0.684, "step": 4009 }, { "epoch": 0.42, "learning_rate": 0.00013110043580831385, "loss": 0.6718, "step": 4010 }, { "epoch": 0.42, "learning_rate": 0.0001310683907238875, "loss": 0.7065, "step": 4011 }, { "epoch": 0.42, "learning_rate": 0.0001310363421078483, "loss": 0.68, "step": 4012 }, { "epoch": 0.42, "learning_rate": 0.00013100428996383928, "loss": 0.6765, "step": 4013 }, { "epoch": 0.42, "learning_rate": 0.00013097223429550393, "loss": 0.7077, "step": 4014 }, { "epoch": 0.42, "learning_rate": 0.00013094017510648605, "loss": 0.6916, "step": 4015 }, { "epoch": 0.42, "learning_rate": 0.00013090811240042987, "loss": 0.7343, "step": 4016 }, { "epoch": 0.42, "learning_rate": 0.00013087604618098, "loss": 0.7011, "step": 4017 }, { "epoch": 0.42, "learning_rate": 0.00013084397645178158, "loss": 0.6704, "step": 4018 }, { "epoch": 0.42, "learning_rate": 0.00013081190321647998, "loss": 0.6479, "step": 4019 }, { "epoch": 0.42, "learning_rate": 0.000130779826478721, "loss": 0.681, "step": 4020 }, { "epoch": 0.42, "learning_rate": 0.00013074774624215096, "loss": 0.6781, "step": 4021 }, { "epoch": 0.42, "learning_rate": 0.00013071566251041645, "loss": 0.7167, "step": 4022 }, { "epoch": 0.42, "learning_rate": 0.00013068357528716443, "loss": 0.6556, "step": 4023 }, { "epoch": 0.42, "learning_rate": 0.00013065148457604245, "loss": 0.7239, "step": 4024 }, { "epoch": 0.42, "learning_rate": 0.00013061939038069826, "loss": 0.6854, "step": 4025 }, { "epoch": 0.42, "learning_rate": 0.00013058729270478008, "loss": 0.6799, "step": 4026 }, { "epoch": 0.42, "learning_rate": 0.00013055519155193656, "loss": 0.6998, "step": 4027 }, { "epoch": 0.42, "learning_rate": 0.0001305230869258167, "loss": 0.6812, "step": 4028 }, { "epoch": 0.42, "learning_rate": 0.00013049097883006987, "loss": 0.7124, "step": 4029 }, { "epoch": 0.42, "learning_rate": 0.00013045886726834586, "loss": 0.6727, "step": 4030 }, { "epoch": 0.42, "learning_rate": 0.0001304267522442949, "loss": 0.659, "step": 4031 }, { "epoch": 0.42, "learning_rate": 0.00013039463376156757, "loss": 0.6759, "step": 4032 }, { "epoch": 0.42, "learning_rate": 0.00013036251182381485, "loss": 0.6877, "step": 4033 }, { "epoch": 0.42, "learning_rate": 0.00013033038643468813, "loss": 0.6573, "step": 4034 }, { "epoch": 0.42, "learning_rate": 0.00013029825759783913, "loss": 0.6617, "step": 4035 }, { "epoch": 0.42, "learning_rate": 0.00013026612531692004, "loss": 0.6768, "step": 4036 }, { "epoch": 0.42, "learning_rate": 0.00013023398959558337, "loss": 0.7262, "step": 4037 }, { "epoch": 0.42, "learning_rate": 0.0001302018504374821, "loss": 0.6347, "step": 4038 }, { "epoch": 0.42, "learning_rate": 0.00013016970784626957, "loss": 0.615, "step": 4039 }, { "epoch": 0.42, "learning_rate": 0.00013013756182559942, "loss": 0.6073, "step": 4040 }, { "epoch": 0.42, "learning_rate": 0.00013010541237912584, "loss": 0.7275, "step": 4041 }, { "epoch": 0.42, "learning_rate": 0.0001300732595105033, "loss": 0.7282, "step": 4042 }, { "epoch": 0.42, "learning_rate": 0.00013004110322338666, "loss": 0.6801, "step": 4043 }, { "epoch": 0.42, "learning_rate": 0.0001300089435214313, "loss": 0.7388, "step": 4044 }, { "epoch": 0.42, "learning_rate": 0.00012997678040829275, "loss": 0.657, "step": 4045 }, { "epoch": 0.42, "learning_rate": 0.00012994461388762712, "loss": 0.727, "step": 4046 }, { "epoch": 0.42, "learning_rate": 0.0001299124439630909, "loss": 0.6708, "step": 4047 }, { "epoch": 0.42, "learning_rate": 0.00012988027063834084, "loss": 0.7348, "step": 4048 }, { "epoch": 0.42, "learning_rate": 0.00012984809391703415, "loss": 0.7194, "step": 4049 }, { "epoch": 0.42, "learning_rate": 0.0001298159138028285, "loss": 0.6106, "step": 4050 }, { "epoch": 0.42, "learning_rate": 0.00012978373029938183, "loss": 0.7109, "step": 4051 }, { "epoch": 0.42, "learning_rate": 0.0001297515434103525, "loss": 0.6893, "step": 4052 }, { "epoch": 0.42, "learning_rate": 0.0001297193531393993, "loss": 0.731, "step": 4053 }, { "epoch": 0.42, "learning_rate": 0.00012968715949018136, "loss": 0.6803, "step": 4054 }, { "epoch": 0.42, "learning_rate": 0.00012965496246635817, "loss": 0.6132, "step": 4055 }, { "epoch": 0.42, "learning_rate": 0.00012962276207158964, "loss": 0.6945, "step": 4056 }, { "epoch": 0.42, "learning_rate": 0.00012959055830953612, "loss": 0.6638, "step": 4057 }, { "epoch": 0.42, "learning_rate": 0.00012955835118385825, "loss": 0.6973, "step": 4058 }, { "epoch": 0.42, "learning_rate": 0.00012952614069821708, "loss": 0.661, "step": 4059 }, { "epoch": 0.42, "learning_rate": 0.00012949392685627402, "loss": 0.7457, "step": 4060 }, { "epoch": 0.42, "learning_rate": 0.00012946170966169094, "loss": 0.7083, "step": 4061 }, { "epoch": 0.42, "learning_rate": 0.00012942948911813, "loss": 0.6989, "step": 4062 }, { "epoch": 0.42, "learning_rate": 0.0001293972652292538, "loss": 0.6584, "step": 4063 }, { "epoch": 0.42, "learning_rate": 0.00012936503799872528, "loss": 0.7628, "step": 4064 }, { "epoch": 0.42, "learning_rate": 0.0001293328074302078, "loss": 0.69, "step": 4065 }, { "epoch": 0.42, "learning_rate": 0.00012930057352736514, "loss": 0.723, "step": 4066 }, { "epoch": 0.42, "learning_rate": 0.00012926833629386128, "loss": 0.719, "step": 4067 }, { "epoch": 0.42, "learning_rate": 0.00012923609573336077, "loss": 0.6826, "step": 4068 }, { "epoch": 0.42, "learning_rate": 0.00012920385184952843, "loss": 0.6882, "step": 4069 }, { "epoch": 0.42, "learning_rate": 0.00012917160464602953, "loss": 0.6406, "step": 4070 }, { "epoch": 0.42, "learning_rate": 0.00012913935412652968, "loss": 0.7088, "step": 4071 }, { "epoch": 0.42, "learning_rate": 0.00012910710029469483, "loss": 0.6689, "step": 4072 }, { "epoch": 0.42, "learning_rate": 0.0001290748431541914, "loss": 0.7345, "step": 4073 }, { "epoch": 0.42, "learning_rate": 0.00012904258270868607, "loss": 0.6657, "step": 4074 }, { "epoch": 0.42, "learning_rate": 0.00012901031896184602, "loss": 0.7246, "step": 4075 }, { "epoch": 0.42, "learning_rate": 0.00012897805191733864, "loss": 0.7251, "step": 4076 }, { "epoch": 0.42, "learning_rate": 0.00012894578157883192, "loss": 0.6622, "step": 4077 }, { "epoch": 0.42, "learning_rate": 0.00012891350794999403, "loss": 0.6469, "step": 4078 }, { "epoch": 0.42, "learning_rate": 0.00012888123103449363, "loss": 0.6797, "step": 4079 }, { "epoch": 0.42, "learning_rate": 0.00012884895083599965, "loss": 0.6676, "step": 4080 }, { "epoch": 0.42, "learning_rate": 0.0001288166673581815, "loss": 0.7049, "step": 4081 }, { "epoch": 0.42, "learning_rate": 0.0001287843806047089, "loss": 0.7068, "step": 4082 }, { "epoch": 0.43, "learning_rate": 0.00012875209057925185, "loss": 0.6989, "step": 4083 }, { "epoch": 0.43, "learning_rate": 0.00012871979728548106, "loss": 0.6567, "step": 4084 }, { "epoch": 0.43, "learning_rate": 0.00012868750072706717, "loss": 0.6645, "step": 4085 }, { "epoch": 0.43, "learning_rate": 0.00012865520090768153, "loss": 0.7017, "step": 4086 }, { "epoch": 0.43, "learning_rate": 0.00012862289783099567, "loss": 0.6963, "step": 4087 }, { "epoch": 0.43, "learning_rate": 0.00012859059150068154, "loss": 0.686, "step": 4088 }, { "epoch": 0.43, "learning_rate": 0.00012855828192041152, "loss": 0.6499, "step": 4089 }, { "epoch": 0.43, "learning_rate": 0.00012852596909385827, "loss": 0.6546, "step": 4090 }, { "epoch": 0.43, "learning_rate": 0.00012849365302469492, "loss": 0.7027, "step": 4091 }, { "epoch": 0.43, "learning_rate": 0.00012846133371659485, "loss": 0.6969, "step": 4092 }, { "epoch": 0.43, "learning_rate": 0.00012842901117323188, "loss": 0.678, "step": 4093 }, { "epoch": 0.43, "learning_rate": 0.00012839668539828017, "loss": 0.6942, "step": 4094 }, { "epoch": 0.43, "learning_rate": 0.00012836435639541433, "loss": 0.7575, "step": 4095 }, { "epoch": 0.43, "learning_rate": 0.00012833202416830922, "loss": 0.6988, "step": 4096 }, { "epoch": 0.43, "learning_rate": 0.00012829968872064007, "loss": 0.679, "step": 4097 }, { "epoch": 0.43, "learning_rate": 0.00012826735005608264, "loss": 0.6908, "step": 4098 }, { "epoch": 0.43, "learning_rate": 0.00012823500817831285, "loss": 0.7576, "step": 4099 }, { "epoch": 0.43, "learning_rate": 0.00012820266309100705, "loss": 0.7155, "step": 4100 }, { "epoch": 0.43, "learning_rate": 0.00012817031479784205, "loss": 0.6564, "step": 4101 }, { "epoch": 0.43, "learning_rate": 0.0001281379633024949, "loss": 0.7168, "step": 4102 }, { "epoch": 0.43, "learning_rate": 0.00012810560860864313, "loss": 0.6642, "step": 4103 }, { "epoch": 0.43, "learning_rate": 0.0001280732507199645, "loss": 0.7221, "step": 4104 }, { "epoch": 0.43, "learning_rate": 0.00012804088964013727, "loss": 0.6922, "step": 4105 }, { "epoch": 0.43, "learning_rate": 0.00012800852537283992, "loss": 0.6797, "step": 4106 }, { "epoch": 0.43, "learning_rate": 0.0001279761579217514, "loss": 0.681, "step": 4107 }, { "epoch": 0.43, "learning_rate": 0.00012794378729055102, "loss": 0.6381, "step": 4108 }, { "epoch": 0.43, "learning_rate": 0.0001279114134829184, "loss": 0.6999, "step": 4109 }, { "epoch": 0.43, "learning_rate": 0.0001278790365025335, "loss": 0.7012, "step": 4110 }, { "epoch": 0.43, "learning_rate": 0.00012784665635307677, "loss": 0.7397, "step": 4111 }, { "epoch": 0.43, "learning_rate": 0.00012781427303822887, "loss": 0.6772, "step": 4112 }, { "epoch": 0.43, "learning_rate": 0.0001277818865616709, "loss": 0.7, "step": 4113 }, { "epoch": 0.43, "learning_rate": 0.00012774949692708428, "loss": 0.6761, "step": 4114 }, { "epoch": 0.43, "learning_rate": 0.00012771710413815086, "loss": 0.715, "step": 4115 }, { "epoch": 0.43, "learning_rate": 0.00012768470819855273, "loss": 0.731, "step": 4116 }, { "epoch": 0.43, "learning_rate": 0.0001276523091119725, "loss": 0.7572, "step": 4117 }, { "epoch": 0.43, "learning_rate": 0.00012761990688209298, "loss": 0.7484, "step": 4118 }, { "epoch": 0.43, "learning_rate": 0.00012758750151259742, "loss": 0.6829, "step": 4119 }, { "epoch": 0.43, "learning_rate": 0.00012755509300716938, "loss": 0.6951, "step": 4120 }, { "epoch": 0.43, "learning_rate": 0.00012752268136949287, "loss": 0.6864, "step": 4121 }, { "epoch": 0.43, "learning_rate": 0.00012749026660325216, "loss": 0.7424, "step": 4122 }, { "epoch": 0.43, "learning_rate": 0.00012745784871213194, "loss": 0.7338, "step": 4123 }, { "epoch": 0.43, "learning_rate": 0.00012742542769981713, "loss": 0.688, "step": 4124 }, { "epoch": 0.43, "learning_rate": 0.0001273930035699932, "loss": 0.6567, "step": 4125 }, { "epoch": 0.43, "learning_rate": 0.0001273605763263458, "loss": 0.655, "step": 4126 }, { "epoch": 0.43, "learning_rate": 0.00012732814597256106, "loss": 0.722, "step": 4127 }, { "epoch": 0.43, "learning_rate": 0.0001272957125123254, "loss": 0.6976, "step": 4128 }, { "epoch": 0.43, "learning_rate": 0.00012726327594932558, "loss": 0.6585, "step": 4129 }, { "epoch": 0.43, "learning_rate": 0.00012723083628724877, "loss": 0.6138, "step": 4130 }, { "epoch": 0.43, "learning_rate": 0.00012719839352978243, "loss": 0.6335, "step": 4131 }, { "epoch": 0.43, "learning_rate": 0.0001271659476806144, "loss": 0.675, "step": 4132 }, { "epoch": 0.43, "learning_rate": 0.00012713349874343284, "loss": 0.7176, "step": 4133 }, { "epoch": 0.43, "learning_rate": 0.00012710104672192636, "loss": 0.6769, "step": 4134 }, { "epoch": 0.43, "learning_rate": 0.00012706859161978383, "loss": 0.6963, "step": 4135 }, { "epoch": 0.43, "learning_rate": 0.00012703613344069452, "loss": 0.6745, "step": 4136 }, { "epoch": 0.43, "learning_rate": 0.00012700367218834797, "loss": 0.6824, "step": 4137 }, { "epoch": 0.43, "learning_rate": 0.00012697120786643414, "loss": 0.7081, "step": 4138 }, { "epoch": 0.43, "learning_rate": 0.00012693874047864332, "loss": 0.6689, "step": 4139 }, { "epoch": 0.43, "learning_rate": 0.00012690627002866613, "loss": 0.6602, "step": 4140 }, { "epoch": 0.43, "learning_rate": 0.0001268737965201936, "loss": 0.7081, "step": 4141 }, { "epoch": 0.43, "learning_rate": 0.0001268413199569171, "loss": 0.6723, "step": 4142 }, { "epoch": 0.43, "learning_rate": 0.0001268088403425282, "loss": 0.6839, "step": 4143 }, { "epoch": 0.43, "learning_rate": 0.00012677635768071902, "loss": 0.6909, "step": 4144 }, { "epoch": 0.43, "learning_rate": 0.0001267438719751819, "loss": 0.707, "step": 4145 }, { "epoch": 0.43, "learning_rate": 0.00012671138322960959, "loss": 0.7188, "step": 4146 }, { "epoch": 0.43, "learning_rate": 0.00012667889144769512, "loss": 0.7106, "step": 4147 }, { "epoch": 0.43, "learning_rate": 0.00012664639663313192, "loss": 0.704, "step": 4148 }, { "epoch": 0.43, "learning_rate": 0.00012661389878961375, "loss": 0.7029, "step": 4149 }, { "epoch": 0.43, "learning_rate": 0.00012658139792083472, "loss": 0.6902, "step": 4150 }, { "epoch": 0.43, "learning_rate": 0.00012654889403048927, "loss": 0.6745, "step": 4151 }, { "epoch": 0.43, "learning_rate": 0.00012651638712227217, "loss": 0.6828, "step": 4152 }, { "epoch": 0.43, "learning_rate": 0.00012648387719987856, "loss": 0.664, "step": 4153 }, { "epoch": 0.43, "learning_rate": 0.00012645136426700393, "loss": 0.7095, "step": 4154 }, { "epoch": 0.43, "learning_rate": 0.00012641884832734408, "loss": 0.715, "step": 4155 }, { "epoch": 0.43, "learning_rate": 0.0001263863293845952, "loss": 0.6747, "step": 4156 }, { "epoch": 0.43, "learning_rate": 0.00012635380744245377, "loss": 0.6594, "step": 4157 }, { "epoch": 0.43, "learning_rate": 0.00012632128250461664, "loss": 0.6082, "step": 4158 }, { "epoch": 0.43, "learning_rate": 0.00012628875457478095, "loss": 0.6696, "step": 4159 }, { "epoch": 0.43, "learning_rate": 0.00012625622365664425, "loss": 0.689, "step": 4160 }, { "epoch": 0.43, "learning_rate": 0.00012622368975390442, "loss": 0.656, "step": 4161 }, { "epoch": 0.43, "learning_rate": 0.00012619115287025966, "loss": 0.71, "step": 4162 }, { "epoch": 0.43, "learning_rate": 0.00012615861300940847, "loss": 0.6151, "step": 4163 }, { "epoch": 0.43, "learning_rate": 0.00012612607017504978, "loss": 0.6842, "step": 4164 }, { "epoch": 0.43, "learning_rate": 0.0001260935243708828, "loss": 0.625, "step": 4165 }, { "epoch": 0.43, "learning_rate": 0.00012606097560060702, "loss": 0.6275, "step": 4166 }, { "epoch": 0.43, "learning_rate": 0.00012602842386792238, "loss": 0.705, "step": 4167 }, { "epoch": 0.43, "learning_rate": 0.0001259958691765291, "loss": 0.7498, "step": 4168 }, { "epoch": 0.43, "learning_rate": 0.0001259633115301278, "loss": 0.6522, "step": 4169 }, { "epoch": 0.43, "learning_rate": 0.00012593075093241926, "loss": 0.6864, "step": 4170 }, { "epoch": 0.43, "learning_rate": 0.00012589818738710482, "loss": 0.6755, "step": 4171 }, { "epoch": 0.43, "learning_rate": 0.00012586562089788602, "loss": 0.6785, "step": 4172 }, { "epoch": 0.43, "learning_rate": 0.0001258330514684647, "loss": 0.6763, "step": 4173 }, { "epoch": 0.43, "learning_rate": 0.0001258004791025432, "loss": 0.6905, "step": 4174 }, { "epoch": 0.43, "learning_rate": 0.00012576790380382404, "loss": 0.6944, "step": 4175 }, { "epoch": 0.43, "learning_rate": 0.00012573532557601014, "loss": 0.6212, "step": 4176 }, { "epoch": 0.43, "learning_rate": 0.00012570274442280473, "loss": 0.6186, "step": 4177 }, { "epoch": 0.43, "learning_rate": 0.0001256701603479114, "loss": 0.6713, "step": 4178 }, { "epoch": 0.43, "learning_rate": 0.00012563757335503403, "loss": 0.6215, "step": 4179 }, { "epoch": 0.44, "learning_rate": 0.00012560498344787684, "loss": 0.7676, "step": 4180 }, { "epoch": 0.44, "learning_rate": 0.00012557239063014445, "loss": 0.6966, "step": 4181 }, { "epoch": 0.44, "learning_rate": 0.00012553979490554179, "loss": 0.6735, "step": 4182 }, { "epoch": 0.44, "learning_rate": 0.00012550719627777394, "loss": 0.6296, "step": 4183 }, { "epoch": 0.44, "learning_rate": 0.00012547459475054657, "loss": 0.71, "step": 4184 }, { "epoch": 0.44, "learning_rate": 0.00012544199032756557, "loss": 0.6834, "step": 4185 }, { "epoch": 0.44, "learning_rate": 0.0001254093830125371, "loss": 0.7043, "step": 4186 }, { "epoch": 0.44, "learning_rate": 0.00012537677280916775, "loss": 0.711, "step": 4187 }, { "epoch": 0.44, "learning_rate": 0.00012534415972116443, "loss": 0.5861, "step": 4188 }, { "epoch": 0.44, "learning_rate": 0.00012531154375223426, "loss": 0.7064, "step": 4189 }, { "epoch": 0.44, "learning_rate": 0.00012527892490608476, "loss": 0.6259, "step": 4190 }, { "epoch": 0.44, "learning_rate": 0.00012524630318642388, "loss": 0.7519, "step": 4191 }, { "epoch": 0.44, "learning_rate": 0.00012521367859695976, "loss": 0.7067, "step": 4192 }, { "epoch": 0.44, "learning_rate": 0.00012518105114140085, "loss": 0.6876, "step": 4193 }, { "epoch": 0.44, "learning_rate": 0.00012514842082345613, "loss": 0.6927, "step": 4194 }, { "epoch": 0.44, "learning_rate": 0.0001251157876468346, "loss": 0.7247, "step": 4195 }, { "epoch": 0.44, "learning_rate": 0.0001250831516152458, "loss": 0.6793, "step": 4196 }, { "epoch": 0.44, "learning_rate": 0.0001250505127323996, "loss": 0.724, "step": 4197 }, { "epoch": 0.44, "learning_rate": 0.0001250178710020061, "loss": 0.7705, "step": 4198 }, { "epoch": 0.44, "learning_rate": 0.00012498522642777574, "loss": 0.616, "step": 4199 }, { "epoch": 0.44, "learning_rate": 0.00012495257901341925, "loss": 0.7069, "step": 4200 }, { "epoch": 0.44, "learning_rate": 0.00012491992876264787, "loss": 0.7069, "step": 4201 }, { "epoch": 0.44, "learning_rate": 0.0001248872756791729, "loss": 0.7637, "step": 4202 }, { "epoch": 0.44, "learning_rate": 0.00012485461976670612, "loss": 0.7235, "step": 4203 }, { "epoch": 0.44, "learning_rate": 0.00012482196102895965, "loss": 0.6827, "step": 4204 }, { "epoch": 0.44, "learning_rate": 0.00012478929946964585, "loss": 0.6718, "step": 4205 }, { "epoch": 0.44, "learning_rate": 0.0001247566350924774, "loss": 0.6985, "step": 4206 }, { "epoch": 0.44, "learning_rate": 0.0001247239679011674, "loss": 0.7175, "step": 4207 }, { "epoch": 0.44, "learning_rate": 0.00012469129789942915, "loss": 0.6924, "step": 4208 }, { "epoch": 0.44, "learning_rate": 0.00012465862509097633, "loss": 0.6295, "step": 4209 }, { "epoch": 0.44, "learning_rate": 0.00012462594947952293, "loss": 0.7015, "step": 4210 }, { "epoch": 0.44, "learning_rate": 0.0001245932710687833, "loss": 0.6544, "step": 4211 }, { "epoch": 0.44, "learning_rate": 0.00012456058986247198, "loss": 0.6473, "step": 4212 }, { "epoch": 0.44, "learning_rate": 0.00012452790586430401, "loss": 0.6761, "step": 4213 }, { "epoch": 0.44, "learning_rate": 0.0001244952190779946, "loss": 0.6383, "step": 4214 }, { "epoch": 0.44, "learning_rate": 0.00012446252950725932, "loss": 0.723, "step": 4215 }, { "epoch": 0.44, "learning_rate": 0.00012442983715581408, "loss": 0.6862, "step": 4216 }, { "epoch": 0.44, "learning_rate": 0.00012439714202737513, "loss": 0.7252, "step": 4217 }, { "epoch": 0.44, "learning_rate": 0.00012436444412565896, "loss": 0.6422, "step": 4218 }, { "epoch": 0.44, "learning_rate": 0.0001243317434543824, "loss": 0.7135, "step": 4219 }, { "epoch": 0.44, "learning_rate": 0.00012429904001726264, "loss": 0.6601, "step": 4220 }, { "epoch": 0.44, "learning_rate": 0.00012426633381801717, "loss": 0.6785, "step": 4221 }, { "epoch": 0.44, "learning_rate": 0.0001242336248603637, "loss": 0.6666, "step": 4222 }, { "epoch": 0.44, "learning_rate": 0.00012420091314802037, "loss": 0.7156, "step": 4223 }, { "epoch": 0.44, "learning_rate": 0.0001241681986847056, "loss": 0.6193, "step": 4224 }, { "epoch": 0.44, "learning_rate": 0.0001241354814741381, "loss": 0.7127, "step": 4225 }, { "epoch": 0.44, "learning_rate": 0.00012410276152003698, "loss": 0.598, "step": 4226 }, { "epoch": 0.44, "learning_rate": 0.00012407003882612149, "loss": 0.6619, "step": 4227 }, { "epoch": 0.44, "learning_rate": 0.00012403731339611133, "loss": 0.6826, "step": 4228 }, { "epoch": 0.44, "learning_rate": 0.00012400458523372648, "loss": 0.7093, "step": 4229 }, { "epoch": 0.44, "learning_rate": 0.0001239718543426872, "loss": 0.7428, "step": 4230 }, { "epoch": 0.44, "learning_rate": 0.00012393912072671413, "loss": 0.6664, "step": 4231 }, { "epoch": 0.44, "learning_rate": 0.00012390638438952812, "loss": 0.7636, "step": 4232 }, { "epoch": 0.44, "learning_rate": 0.00012387364533485043, "loss": 0.6586, "step": 4233 }, { "epoch": 0.44, "learning_rate": 0.00012384090356640253, "loss": 0.6452, "step": 4234 }, { "epoch": 0.44, "learning_rate": 0.00012380815908790628, "loss": 0.7383, "step": 4235 }, { "epoch": 0.44, "learning_rate": 0.00012377541190308378, "loss": 0.7025, "step": 4236 }, { "epoch": 0.44, "learning_rate": 0.00012374266201565755, "loss": 0.75, "step": 4237 }, { "epoch": 0.44, "learning_rate": 0.00012370990942935027, "loss": 0.6936, "step": 4238 }, { "epoch": 0.44, "learning_rate": 0.00012367715414788506, "loss": 0.7057, "step": 4239 }, { "epoch": 0.44, "learning_rate": 0.00012364439617498524, "loss": 0.7436, "step": 4240 }, { "epoch": 0.44, "learning_rate": 0.0001236116355143745, "loss": 0.6754, "step": 4241 }, { "epoch": 0.44, "learning_rate": 0.0001235788721697768, "loss": 0.6797, "step": 4242 }, { "epoch": 0.44, "learning_rate": 0.00012354610614491644, "loss": 0.7162, "step": 4243 }, { "epoch": 0.44, "learning_rate": 0.000123513337443518, "loss": 0.6568, "step": 4244 }, { "epoch": 0.44, "learning_rate": 0.00012348056606930637, "loss": 0.6802, "step": 4245 }, { "epoch": 0.44, "learning_rate": 0.00012344779202600674, "loss": 0.64, "step": 4246 }, { "epoch": 0.44, "learning_rate": 0.00012341501531734463, "loss": 0.6193, "step": 4247 }, { "epoch": 0.44, "learning_rate": 0.00012338223594704584, "loss": 0.6258, "step": 4248 }, { "epoch": 0.44, "learning_rate": 0.00012334945391883644, "loss": 0.7459, "step": 4249 }, { "epoch": 0.44, "learning_rate": 0.00012331666923644282, "loss": 0.6683, "step": 4250 }, { "epoch": 0.44, "learning_rate": 0.00012328388190359176, "loss": 0.731, "step": 4251 }, { "epoch": 0.44, "learning_rate": 0.00012325109192401024, "loss": 0.7351, "step": 4252 }, { "epoch": 0.44, "learning_rate": 0.00012321829930142552, "loss": 0.6315, "step": 4253 }, { "epoch": 0.44, "learning_rate": 0.00012318550403956531, "loss": 0.728, "step": 4254 }, { "epoch": 0.44, "learning_rate": 0.0001231527061421574, "loss": 0.6469, "step": 4255 }, { "epoch": 0.44, "learning_rate": 0.0001231199056129301, "loss": 0.6971, "step": 4256 }, { "epoch": 0.44, "learning_rate": 0.00012308710245561186, "loss": 0.6227, "step": 4257 }, { "epoch": 0.44, "learning_rate": 0.0001230542966739315, "loss": 0.6598, "step": 4258 }, { "epoch": 0.44, "learning_rate": 0.0001230214882716182, "loss": 0.73, "step": 4259 }, { "epoch": 0.44, "learning_rate": 0.00012298867725240122, "loss": 0.7014, "step": 4260 }, { "epoch": 0.44, "learning_rate": 0.00012295586362001036, "loss": 0.7011, "step": 4261 }, { "epoch": 0.44, "learning_rate": 0.00012292304737817562, "loss": 0.7246, "step": 4262 }, { "epoch": 0.44, "learning_rate": 0.00012289022853062724, "loss": 0.7206, "step": 4263 }, { "epoch": 0.44, "learning_rate": 0.00012285740708109586, "loss": 0.6702, "step": 4264 }, { "epoch": 0.44, "learning_rate": 0.00012282458303331236, "loss": 0.6786, "step": 4265 }, { "epoch": 0.44, "learning_rate": 0.00012279175639100788, "loss": 0.7125, "step": 4266 }, { "epoch": 0.44, "learning_rate": 0.00012275892715791397, "loss": 0.6651, "step": 4267 }, { "epoch": 0.44, "learning_rate": 0.00012272609533776235, "loss": 0.7162, "step": 4268 }, { "epoch": 0.44, "learning_rate": 0.00012269326093428508, "loss": 0.7244, "step": 4269 }, { "epoch": 0.44, "learning_rate": 0.00012266042395121454, "loss": 0.6103, "step": 4270 }, { "epoch": 0.44, "learning_rate": 0.0001226275843922834, "loss": 0.6489, "step": 4271 }, { "epoch": 0.44, "learning_rate": 0.00012259474226122456, "loss": 0.6012, "step": 4272 }, { "epoch": 0.44, "learning_rate": 0.00012256189756177125, "loss": 0.6747, "step": 4273 }, { "epoch": 0.44, "learning_rate": 0.0001225290502976571, "loss": 0.6677, "step": 4274 }, { "epoch": 0.44, "learning_rate": 0.00012249620047261582, "loss": 0.7306, "step": 4275 }, { "epoch": 0.45, "learning_rate": 0.00012246334809038156, "loss": 0.7655, "step": 4276 }, { "epoch": 0.45, "learning_rate": 0.00012243049315468875, "loss": 0.6666, "step": 4277 }, { "epoch": 0.45, "learning_rate": 0.0001223976356692721, "loss": 0.6984, "step": 4278 }, { "epoch": 0.45, "learning_rate": 0.0001223647756378665, "loss": 0.698, "step": 4279 }, { "epoch": 0.45, "learning_rate": 0.0001223319130642073, "loss": 0.6912, "step": 4280 }, { "epoch": 0.45, "learning_rate": 0.00012229904795203002, "loss": 0.7014, "step": 4281 }, { "epoch": 0.45, "learning_rate": 0.00012226618030507054, "loss": 0.6669, "step": 4282 }, { "epoch": 0.45, "learning_rate": 0.00012223331012706497, "loss": 0.6569, "step": 4283 }, { "epoch": 0.45, "learning_rate": 0.0001222004374217498, "loss": 0.6631, "step": 4284 }, { "epoch": 0.45, "learning_rate": 0.00012216756219286167, "loss": 0.7014, "step": 4285 }, { "epoch": 0.45, "learning_rate": 0.00012213468444413763, "loss": 0.6331, "step": 4286 }, { "epoch": 0.45, "learning_rate": 0.00012210180417931488, "loss": 0.6764, "step": 4287 }, { "epoch": 0.45, "learning_rate": 0.0001220689214021311, "loss": 0.6848, "step": 4288 }, { "epoch": 0.45, "learning_rate": 0.00012203603611632413, "loss": 0.6549, "step": 4289 }, { "epoch": 0.45, "learning_rate": 0.00012200314832563204, "loss": 0.6656, "step": 4290 }, { "epoch": 0.45, "learning_rate": 0.00012197025803379333, "loss": 0.7284, "step": 4291 }, { "epoch": 0.45, "learning_rate": 0.0001219373652445467, "loss": 0.753, "step": 4292 }, { "epoch": 0.45, "learning_rate": 0.00012190446996163112, "loss": 0.7122, "step": 4293 }, { "epoch": 0.45, "learning_rate": 0.0001218715721887859, "loss": 0.6163, "step": 4294 }, { "epoch": 0.45, "learning_rate": 0.00012183867192975056, "loss": 0.661, "step": 4295 }, { "epoch": 0.45, "learning_rate": 0.00012180576918826498, "loss": 0.6699, "step": 4296 }, { "epoch": 0.45, "learning_rate": 0.00012177286396806929, "loss": 0.7287, "step": 4297 }, { "epoch": 0.45, "learning_rate": 0.00012173995627290389, "loss": 0.59, "step": 4298 }, { "epoch": 0.45, "learning_rate": 0.00012170704610650947, "loss": 0.718, "step": 4299 }, { "epoch": 0.45, "learning_rate": 0.00012167413347262697, "loss": 0.6607, "step": 4300 }, { "epoch": 0.45, "learning_rate": 0.00012164121837499771, "loss": 0.6832, "step": 4301 }, { "epoch": 0.45, "learning_rate": 0.00012160830081736318, "loss": 0.752, "step": 4302 }, { "epoch": 0.45, "learning_rate": 0.0001215753808034652, "loss": 0.6661, "step": 4303 }, { "epoch": 0.45, "learning_rate": 0.00012154245833704584, "loss": 0.6943, "step": 4304 }, { "epoch": 0.45, "learning_rate": 0.00012150953342184752, "loss": 0.7214, "step": 4305 }, { "epoch": 0.45, "learning_rate": 0.00012147660606161284, "loss": 0.6623, "step": 4306 }, { "epoch": 0.45, "learning_rate": 0.00012144367626008472, "loss": 0.6797, "step": 4307 }, { "epoch": 0.45, "learning_rate": 0.00012141074402100643, "loss": 0.6148, "step": 4308 }, { "epoch": 0.45, "learning_rate": 0.00012137780934812137, "loss": 0.7092, "step": 4309 }, { "epoch": 0.45, "learning_rate": 0.00012134487224517334, "loss": 0.6801, "step": 4310 }, { "epoch": 0.45, "learning_rate": 0.0001213119327159064, "loss": 0.722, "step": 4311 }, { "epoch": 0.45, "learning_rate": 0.0001212789907640648, "loss": 0.7456, "step": 4312 }, { "epoch": 0.45, "learning_rate": 0.00012124604639339314, "loss": 0.697, "step": 4313 }, { "epoch": 0.45, "learning_rate": 0.00012121309960763629, "loss": 0.65, "step": 4314 }, { "epoch": 0.45, "learning_rate": 0.0001211801504105394, "loss": 0.6714, "step": 4315 }, { "epoch": 0.45, "learning_rate": 0.00012114719880584788, "loss": 0.6221, "step": 4316 }, { "epoch": 0.45, "learning_rate": 0.00012111424479730738, "loss": 0.7118, "step": 4317 }, { "epoch": 0.45, "learning_rate": 0.00012108128838866386, "loss": 0.6573, "step": 4318 }, { "epoch": 0.45, "learning_rate": 0.00012104832958366357, "loss": 0.6083, "step": 4319 }, { "epoch": 0.45, "learning_rate": 0.00012101536838605299, "loss": 0.7602, "step": 4320 }, { "epoch": 0.45, "learning_rate": 0.0001209824047995789, "loss": 0.6096, "step": 4321 }, { "epoch": 0.45, "learning_rate": 0.00012094943882798838, "loss": 0.7447, "step": 4322 }, { "epoch": 0.45, "learning_rate": 0.00012091647047502868, "loss": 0.705, "step": 4323 }, { "epoch": 0.45, "learning_rate": 0.00012088349974444742, "loss": 0.6729, "step": 4324 }, { "epoch": 0.45, "learning_rate": 0.00012085052663999246, "loss": 0.7034, "step": 4325 }, { "epoch": 0.45, "learning_rate": 0.00012081755116541189, "loss": 0.6973, "step": 4326 }, { "epoch": 0.45, "learning_rate": 0.00012078457332445414, "loss": 0.6117, "step": 4327 }, { "epoch": 0.45, "learning_rate": 0.0001207515931208679, "loss": 0.6526, "step": 4328 }, { "epoch": 0.45, "learning_rate": 0.00012071861055840203, "loss": 0.5986, "step": 4329 }, { "epoch": 0.45, "learning_rate": 0.0001206856256408058, "loss": 0.7226, "step": 4330 }, { "epoch": 0.45, "learning_rate": 0.00012065263837182865, "loss": 0.6714, "step": 4331 }, { "epoch": 0.45, "learning_rate": 0.00012061964875522031, "loss": 0.6796, "step": 4332 }, { "epoch": 0.45, "learning_rate": 0.00012058665679473079, "loss": 0.7304, "step": 4333 }, { "epoch": 0.45, "learning_rate": 0.00012055366249411035, "loss": 0.6622, "step": 4334 }, { "epoch": 0.45, "learning_rate": 0.00012052066585710955, "loss": 0.7258, "step": 4335 }, { "epoch": 0.45, "learning_rate": 0.00012048766688747919, "loss": 0.6919, "step": 4336 }, { "epoch": 0.45, "learning_rate": 0.00012045466558897027, "loss": 0.6903, "step": 4337 }, { "epoch": 0.45, "learning_rate": 0.0001204216619653342, "loss": 0.6961, "step": 4338 }, { "epoch": 0.45, "learning_rate": 0.00012038865602032254, "loss": 0.6693, "step": 4339 }, { "epoch": 0.45, "learning_rate": 0.00012035564775768715, "loss": 0.7304, "step": 4340 }, { "epoch": 0.45, "learning_rate": 0.00012032263718118018, "loss": 0.7155, "step": 4341 }, { "epoch": 0.45, "learning_rate": 0.000120289624294554, "loss": 0.6821, "step": 4342 }, { "epoch": 0.45, "learning_rate": 0.0001202566091015612, "loss": 0.6901, "step": 4343 }, { "epoch": 0.45, "learning_rate": 0.00012022359160595478, "loss": 0.6621, "step": 4344 }, { "epoch": 0.45, "learning_rate": 0.00012019057181148788, "loss": 0.6759, "step": 4345 }, { "epoch": 0.45, "learning_rate": 0.00012015754972191391, "loss": 0.7109, "step": 4346 }, { "epoch": 0.45, "learning_rate": 0.00012012452534098655, "loss": 0.6672, "step": 4347 }, { "epoch": 0.45, "learning_rate": 0.00012009149867245981, "loss": 0.684, "step": 4348 }, { "epoch": 0.45, "learning_rate": 0.00012005846972008792, "loss": 0.7025, "step": 4349 }, { "epoch": 0.45, "learning_rate": 0.00012002543848762527, "loss": 0.6753, "step": 4350 }, { "epoch": 0.45, "learning_rate": 0.00011999240497882665, "loss": 0.6998, "step": 4351 }, { "epoch": 0.45, "learning_rate": 0.00011995936919744704, "loss": 0.6814, "step": 4352 }, { "epoch": 0.45, "learning_rate": 0.00011992633114724166, "loss": 0.6776, "step": 4353 }, { "epoch": 0.45, "learning_rate": 0.00011989329083196608, "loss": 0.6246, "step": 4354 }, { "epoch": 0.45, "learning_rate": 0.00011986024825537608, "loss": 0.6524, "step": 4355 }, { "epoch": 0.45, "learning_rate": 0.00011982720342122758, "loss": 0.6138, "step": 4356 }, { "epoch": 0.45, "learning_rate": 0.0001197941563332769, "loss": 0.6513, "step": 4357 }, { "epoch": 0.45, "learning_rate": 0.00011976110699528063, "loss": 0.6958, "step": 4358 }, { "epoch": 0.45, "learning_rate": 0.0001197280554109955, "loss": 0.648, "step": 4359 }, { "epoch": 0.45, "learning_rate": 0.00011969500158417857, "loss": 0.7157, "step": 4360 }, { "epoch": 0.45, "learning_rate": 0.0001196619455185872, "loss": 0.6767, "step": 4361 }, { "epoch": 0.45, "learning_rate": 0.00011962888721797887, "loss": 0.671, "step": 4362 }, { "epoch": 0.45, "learning_rate": 0.00011959582668611142, "loss": 0.6491, "step": 4363 }, { "epoch": 0.45, "learning_rate": 0.0001195627639267429, "loss": 0.7189, "step": 4364 }, { "epoch": 0.45, "learning_rate": 0.00011952969894363166, "loss": 0.6945, "step": 4365 }, { "epoch": 0.45, "learning_rate": 0.00011949663174053625, "loss": 0.7345, "step": 4366 }, { "epoch": 0.45, "learning_rate": 0.00011946356232121549, "loss": 0.7275, "step": 4367 }, { "epoch": 0.45, "learning_rate": 0.00011943049068942846, "loss": 0.6635, "step": 4368 }, { "epoch": 0.45, "learning_rate": 0.00011939741684893449, "loss": 0.7044, "step": 4369 }, { "epoch": 0.45, "learning_rate": 0.00011936434080349312, "loss": 0.7059, "step": 4370 }, { "epoch": 0.45, "learning_rate": 0.00011933126255686422, "loss": 0.6404, "step": 4371 }, { "epoch": 0.46, "learning_rate": 0.00011929818211280786, "loss": 0.6579, "step": 4372 }, { "epoch": 0.46, "learning_rate": 0.00011926509947508436, "loss": 0.6869, "step": 4373 }, { "epoch": 0.46, "learning_rate": 0.00011923201464745431, "loss": 0.6626, "step": 4374 }, { "epoch": 0.46, "learning_rate": 0.00011919892763367851, "loss": 0.6724, "step": 4375 }, { "epoch": 0.46, "learning_rate": 0.00011916583843751805, "loss": 0.7086, "step": 4376 }, { "epoch": 0.46, "learning_rate": 0.00011913274706273424, "loss": 0.7315, "step": 4377 }, { "epoch": 0.46, "learning_rate": 0.00011909965351308868, "loss": 0.6241, "step": 4378 }, { "epoch": 0.46, "learning_rate": 0.00011906655779234315, "loss": 0.7312, "step": 4379 }, { "epoch": 0.46, "learning_rate": 0.00011903345990425973, "loss": 0.6586, "step": 4380 }, { "epoch": 0.46, "learning_rate": 0.00011900035985260077, "loss": 0.6727, "step": 4381 }, { "epoch": 0.46, "learning_rate": 0.00011896725764112874, "loss": 0.6855, "step": 4382 }, { "epoch": 0.46, "learning_rate": 0.00011893415327360649, "loss": 0.7376, "step": 4383 }, { "epoch": 0.46, "learning_rate": 0.0001189010467537971, "loss": 0.653, "step": 4384 }, { "epoch": 0.46, "learning_rate": 0.00011886793808546381, "loss": 0.6935, "step": 4385 }, { "epoch": 0.46, "learning_rate": 0.00011883482727237019, "loss": 0.6954, "step": 4386 }, { "epoch": 0.46, "learning_rate": 0.00011880171431827997, "loss": 0.7516, "step": 4387 }, { "epoch": 0.46, "learning_rate": 0.00011876859922695725, "loss": 0.6414, "step": 4388 }, { "epoch": 0.46, "learning_rate": 0.00011873548200216621, "loss": 0.6536, "step": 4389 }, { "epoch": 0.46, "learning_rate": 0.00011870236264767143, "loss": 0.6818, "step": 4390 }, { "epoch": 0.46, "learning_rate": 0.00011866924116723761, "loss": 0.6878, "step": 4391 }, { "epoch": 0.46, "learning_rate": 0.00011863611756462978, "loss": 0.7053, "step": 4392 }, { "epoch": 0.46, "learning_rate": 0.00011860299184361317, "loss": 0.6449, "step": 4393 }, { "epoch": 0.46, "learning_rate": 0.0001185698640079532, "loss": 0.6956, "step": 4394 }, { "epoch": 0.46, "learning_rate": 0.00011853673406141566, "loss": 0.7584, "step": 4395 }, { "epoch": 0.46, "learning_rate": 0.00011850360200776647, "loss": 0.6982, "step": 4396 }, { "epoch": 0.46, "learning_rate": 0.00011847046785077178, "loss": 0.6906, "step": 4397 }, { "epoch": 0.46, "learning_rate": 0.0001184373315941981, "loss": 0.6684, "step": 4398 }, { "epoch": 0.46, "learning_rate": 0.00011840419324181206, "loss": 0.6542, "step": 4399 }, { "epoch": 0.46, "learning_rate": 0.00011837105279738059, "loss": 0.7049, "step": 4400 }, { "epoch": 0.46, "learning_rate": 0.0001183379102646708, "loss": 0.6314, "step": 4401 }, { "epoch": 0.46, "learning_rate": 0.00011830476564745014, "loss": 0.6909, "step": 4402 }, { "epoch": 0.46, "learning_rate": 0.00011827161894948615, "loss": 0.6471, "step": 4403 }, { "epoch": 0.46, "learning_rate": 0.00011823847017454677, "loss": 0.7273, "step": 4404 }, { "epoch": 0.46, "learning_rate": 0.00011820531932640002, "loss": 0.6843, "step": 4405 }, { "epoch": 0.46, "learning_rate": 0.0001181721664088143, "loss": 0.7053, "step": 4406 }, { "epoch": 0.46, "learning_rate": 0.00011813901142555815, "loss": 0.6732, "step": 4407 }, { "epoch": 0.46, "learning_rate": 0.00011810585438040034, "loss": 0.6305, "step": 4408 }, { "epoch": 0.46, "learning_rate": 0.00011807269527710994, "loss": 0.6413, "step": 4409 }, { "epoch": 0.46, "learning_rate": 0.00011803953411945617, "loss": 0.6819, "step": 4410 }, { "epoch": 0.46, "learning_rate": 0.00011800637091120859, "loss": 0.7299, "step": 4411 }, { "epoch": 0.46, "learning_rate": 0.00011797320565613693, "loss": 0.7208, "step": 4412 }, { "epoch": 0.46, "learning_rate": 0.00011794003835801113, "loss": 0.7389, "step": 4413 }, { "epoch": 0.46, "learning_rate": 0.00011790686902060142, "loss": 0.6769, "step": 4414 }, { "epoch": 0.46, "learning_rate": 0.0001178736976476782, "loss": 0.7328, "step": 4415 }, { "epoch": 0.46, "learning_rate": 0.00011784052424301216, "loss": 0.6085, "step": 4416 }, { "epoch": 0.46, "learning_rate": 0.00011780734881037414, "loss": 0.6792, "step": 4417 }, { "epoch": 0.46, "learning_rate": 0.00011777417135353534, "loss": 0.7009, "step": 4418 }, { "epoch": 0.46, "learning_rate": 0.00011774099187626708, "loss": 0.7045, "step": 4419 }, { "epoch": 0.46, "learning_rate": 0.00011770781038234097, "loss": 0.6926, "step": 4420 }, { "epoch": 0.46, "learning_rate": 0.00011767462687552877, "loss": 0.6361, "step": 4421 }, { "epoch": 0.46, "learning_rate": 0.00011764144135960257, "loss": 0.7396, "step": 4422 }, { "epoch": 0.46, "learning_rate": 0.0001176082538383346, "loss": 0.7147, "step": 4423 }, { "epoch": 0.46, "learning_rate": 0.00011757506431549742, "loss": 0.6737, "step": 4424 }, { "epoch": 0.46, "learning_rate": 0.0001175418727948637, "loss": 0.688, "step": 4425 }, { "epoch": 0.46, "learning_rate": 0.00011750867928020645, "loss": 0.6776, "step": 4426 }, { "epoch": 0.46, "learning_rate": 0.00011747548377529877, "loss": 0.7121, "step": 4427 }, { "epoch": 0.46, "learning_rate": 0.00011744228628391414, "loss": 0.6648, "step": 4428 }, { "epoch": 0.46, "learning_rate": 0.00011740908680982616, "loss": 0.6683, "step": 4429 }, { "epoch": 0.46, "learning_rate": 0.00011737588535680865, "loss": 0.6923, "step": 4430 }, { "epoch": 0.46, "learning_rate": 0.00011734268192863578, "loss": 0.6762, "step": 4431 }, { "epoch": 0.46, "learning_rate": 0.00011730947652908184, "loss": 0.6258, "step": 4432 }, { "epoch": 0.46, "learning_rate": 0.00011727626916192127, "loss": 0.6786, "step": 4433 }, { "epoch": 0.46, "learning_rate": 0.00011724305983092891, "loss": 0.6859, "step": 4434 }, { "epoch": 0.46, "learning_rate": 0.00011720984853987973, "loss": 0.6725, "step": 4435 }, { "epoch": 0.46, "learning_rate": 0.00011717663529254892, "loss": 0.6643, "step": 4436 }, { "epoch": 0.46, "learning_rate": 0.00011714342009271186, "loss": 0.6651, "step": 4437 }, { "epoch": 0.46, "learning_rate": 0.0001171102029441443, "loss": 0.7024, "step": 4438 }, { "epoch": 0.46, "learning_rate": 0.00011707698385062203, "loss": 0.6685, "step": 4439 }, { "epoch": 0.46, "learning_rate": 0.0001170437628159211, "loss": 0.7328, "step": 4440 }, { "epoch": 0.46, "learning_rate": 0.00011701053984381792, "loss": 0.7132, "step": 4441 }, { "epoch": 0.46, "learning_rate": 0.00011697731493808894, "loss": 0.667, "step": 4442 }, { "epoch": 0.46, "learning_rate": 0.00011694408810251093, "loss": 0.6001, "step": 4443 }, { "epoch": 0.46, "learning_rate": 0.0001169108593408609, "loss": 0.6916, "step": 4444 }, { "epoch": 0.46, "learning_rate": 0.000116877628656916, "loss": 0.6444, "step": 4445 }, { "epoch": 0.46, "learning_rate": 0.00011684439605445363, "loss": 0.739, "step": 4446 }, { "epoch": 0.46, "learning_rate": 0.0001168111615372514, "loss": 0.6276, "step": 4447 }, { "epoch": 0.46, "learning_rate": 0.0001167779251090872, "loss": 0.636, "step": 4448 }, { "epoch": 0.46, "learning_rate": 0.00011674468677373907, "loss": 0.7082, "step": 4449 }, { "epoch": 0.46, "learning_rate": 0.00011671144653498524, "loss": 0.7503, "step": 4450 }, { "epoch": 0.46, "learning_rate": 0.00011667820439660428, "loss": 0.6187, "step": 4451 }, { "epoch": 0.46, "learning_rate": 0.00011664496036237485, "loss": 0.7214, "step": 4452 }, { "epoch": 0.46, "learning_rate": 0.00011661171443607584, "loss": 0.7456, "step": 4453 }, { "epoch": 0.46, "learning_rate": 0.00011657846662148645, "loss": 0.693, "step": 4454 }, { "epoch": 0.46, "learning_rate": 0.00011654521692238602, "loss": 0.6812, "step": 4455 }, { "epoch": 0.46, "learning_rate": 0.00011651196534255411, "loss": 0.6606, "step": 4456 }, { "epoch": 0.46, "learning_rate": 0.00011647871188577048, "loss": 0.662, "step": 4457 }, { "epoch": 0.46, "learning_rate": 0.00011644545655581515, "loss": 0.6736, "step": 4458 }, { "epoch": 0.46, "learning_rate": 0.00011641219935646834, "loss": 0.7019, "step": 4459 }, { "epoch": 0.46, "learning_rate": 0.00011637894029151041, "loss": 0.7648, "step": 4460 }, { "epoch": 0.46, "learning_rate": 0.00011634567936472206, "loss": 0.7048, "step": 4461 }, { "epoch": 0.46, "learning_rate": 0.0001163124165798841, "loss": 0.6412, "step": 4462 }, { "epoch": 0.46, "learning_rate": 0.00011627915194077759, "loss": 0.6702, "step": 4463 }, { "epoch": 0.46, "learning_rate": 0.00011624588545118378, "loss": 0.6853, "step": 4464 }, { "epoch": 0.46, "learning_rate": 0.00011621261711488416, "loss": 0.6564, "step": 4465 }, { "epoch": 0.46, "learning_rate": 0.00011617934693566042, "loss": 0.6611, "step": 4466 }, { "epoch": 0.46, "learning_rate": 0.00011614607491729444, "loss": 0.6673, "step": 4467 }, { "epoch": 0.47, "learning_rate": 0.00011611280106356832, "loss": 0.7602, "step": 4468 }, { "epoch": 0.47, "learning_rate": 0.00011607952537826444, "loss": 0.7052, "step": 4469 }, { "epoch": 0.47, "learning_rate": 0.00011604624786516522, "loss": 0.7204, "step": 4470 }, { "epoch": 0.47, "learning_rate": 0.00011601296852805345, "loss": 0.6873, "step": 4471 }, { "epoch": 0.47, "learning_rate": 0.00011597968737071205, "loss": 0.707, "step": 4472 }, { "epoch": 0.47, "learning_rate": 0.00011594640439692417, "loss": 0.6856, "step": 4473 }, { "epoch": 0.47, "learning_rate": 0.00011591311961047315, "loss": 0.6925, "step": 4474 }, { "epoch": 0.47, "learning_rate": 0.00011587983301514256, "loss": 0.6626, "step": 4475 }, { "epoch": 0.47, "learning_rate": 0.00011584654461471613, "loss": 0.6872, "step": 4476 }, { "epoch": 0.47, "learning_rate": 0.00011581325441297788, "loss": 0.693, "step": 4477 }, { "epoch": 0.47, "learning_rate": 0.00011577996241371192, "loss": 0.5917, "step": 4478 }, { "epoch": 0.47, "learning_rate": 0.00011574666862070267, "loss": 0.6486, "step": 4479 }, { "epoch": 0.47, "learning_rate": 0.00011571337303773466, "loss": 0.7156, "step": 4480 }, { "epoch": 0.47, "learning_rate": 0.00011568007566859273, "loss": 0.6877, "step": 4481 }, { "epoch": 0.47, "learning_rate": 0.00011564677651706186, "loss": 0.6095, "step": 4482 }, { "epoch": 0.47, "learning_rate": 0.00011561347558692719, "loss": 0.6753, "step": 4483 }, { "epoch": 0.47, "learning_rate": 0.00011558017288197416, "loss": 0.6838, "step": 4484 }, { "epoch": 0.47, "learning_rate": 0.00011554686840598834, "loss": 0.6908, "step": 4485 }, { "epoch": 0.47, "learning_rate": 0.0001155135621627555, "loss": 0.6556, "step": 4486 }, { "epoch": 0.47, "learning_rate": 0.00011548025415606167, "loss": 0.6545, "step": 4487 }, { "epoch": 0.47, "learning_rate": 0.00011544694438969305, "loss": 0.7332, "step": 4488 }, { "epoch": 0.47, "learning_rate": 0.00011541363286743603, "loss": 0.6617, "step": 4489 }, { "epoch": 0.47, "learning_rate": 0.00011538031959307718, "loss": 0.6782, "step": 4490 }, { "epoch": 0.47, "learning_rate": 0.0001153470045704033, "loss": 0.6423, "step": 4491 }, { "epoch": 0.47, "learning_rate": 0.00011531368780320142, "loss": 0.6963, "step": 4492 }, { "epoch": 0.47, "learning_rate": 0.00011528036929525865, "loss": 0.7254, "step": 4493 }, { "epoch": 0.47, "learning_rate": 0.00011524704905036248, "loss": 0.6847, "step": 4494 }, { "epoch": 0.47, "learning_rate": 0.00011521372707230042, "loss": 0.655, "step": 4495 }, { "epoch": 0.47, "learning_rate": 0.00011518040336486029, "loss": 0.6517, "step": 4496 }, { "epoch": 0.47, "learning_rate": 0.00011514707793183008, "loss": 0.6761, "step": 4497 }, { "epoch": 0.47, "learning_rate": 0.00011511375077699792, "loss": 0.7086, "step": 4498 }, { "epoch": 0.47, "learning_rate": 0.00011508042190415223, "loss": 0.7383, "step": 4499 }, { "epoch": 0.47, "learning_rate": 0.00011504709131708151, "loss": 0.6286, "step": 4500 }, { "epoch": 0.47, "learning_rate": 0.00011501375901957459, "loss": 0.7303, "step": 4501 }, { "epoch": 0.47, "learning_rate": 0.00011498042501542041, "loss": 0.7099, "step": 4502 }, { "epoch": 0.47, "learning_rate": 0.00011494708930840809, "loss": 0.6114, "step": 4503 }, { "epoch": 0.47, "learning_rate": 0.00011491375190232702, "loss": 0.7373, "step": 4504 }, { "epoch": 0.47, "learning_rate": 0.0001148804128009667, "loss": 0.6928, "step": 4505 }, { "epoch": 0.47, "learning_rate": 0.00011484707200811688, "loss": 0.6602, "step": 4506 }, { "epoch": 0.47, "learning_rate": 0.00011481372952756747, "loss": 0.6521, "step": 4507 }, { "epoch": 0.47, "learning_rate": 0.00011478038536310858, "loss": 0.6503, "step": 4508 }, { "epoch": 0.47, "learning_rate": 0.00011474703951853057, "loss": 0.6648, "step": 4509 }, { "epoch": 0.47, "learning_rate": 0.0001147136919976238, "loss": 0.6781, "step": 4510 }, { "epoch": 0.47, "learning_rate": 0.00011468034280417912, "loss": 0.6718, "step": 4511 }, { "epoch": 0.47, "learning_rate": 0.00011464699194198729, "loss": 0.7009, "step": 4512 }, { "epoch": 0.47, "learning_rate": 0.00011461363941483943, "loss": 0.6293, "step": 4513 }, { "epoch": 0.47, "learning_rate": 0.00011458028522652677, "loss": 0.6717, "step": 4514 }, { "epoch": 0.47, "learning_rate": 0.0001145469293808408, "loss": 0.6431, "step": 4515 }, { "epoch": 0.47, "learning_rate": 0.00011451357188157312, "loss": 0.7123, "step": 4516 }, { "epoch": 0.47, "learning_rate": 0.00011448021273251552, "loss": 0.6621, "step": 4517 }, { "epoch": 0.47, "learning_rate": 0.00011444685193746008, "loss": 0.7037, "step": 4518 }, { "epoch": 0.47, "learning_rate": 0.00011441348950019895, "loss": 0.7346, "step": 4519 }, { "epoch": 0.47, "learning_rate": 0.00011438012542452447, "loss": 0.6061, "step": 4520 }, { "epoch": 0.47, "learning_rate": 0.0001143467597142293, "loss": 0.7064, "step": 4521 }, { "epoch": 0.47, "learning_rate": 0.00011431339237310616, "loss": 0.6682, "step": 4522 }, { "epoch": 0.47, "learning_rate": 0.00011428002340494797, "loss": 0.7012, "step": 4523 }, { "epoch": 0.47, "learning_rate": 0.00011424665281354785, "loss": 0.7202, "step": 4524 }, { "epoch": 0.47, "learning_rate": 0.00011421328060269913, "loss": 0.6786, "step": 4525 }, { "epoch": 0.47, "learning_rate": 0.00011417990677619533, "loss": 0.6538, "step": 4526 }, { "epoch": 0.47, "learning_rate": 0.00011414653133783005, "loss": 0.6905, "step": 4527 }, { "epoch": 0.47, "learning_rate": 0.00011411315429139721, "loss": 0.6837, "step": 4528 }, { "epoch": 0.47, "learning_rate": 0.00011407977564069085, "loss": 0.649, "step": 4529 }, { "epoch": 0.47, "learning_rate": 0.00011404639538950517, "loss": 0.7526, "step": 4530 }, { "epoch": 0.47, "learning_rate": 0.00011401301354163458, "loss": 0.6714, "step": 4531 }, { "epoch": 0.47, "learning_rate": 0.00011397963010087369, "loss": 0.6733, "step": 4532 }, { "epoch": 0.47, "learning_rate": 0.00011394624507101725, "loss": 0.7185, "step": 4533 }, { "epoch": 0.47, "learning_rate": 0.00011391285845586023, "loss": 0.5995, "step": 4534 }, { "epoch": 0.47, "learning_rate": 0.00011387947025919776, "loss": 0.7202, "step": 4535 }, { "epoch": 0.47, "learning_rate": 0.00011384608048482515, "loss": 0.6901, "step": 4536 }, { "epoch": 0.47, "learning_rate": 0.00011381268913653782, "loss": 0.6497, "step": 4537 }, { "epoch": 0.47, "learning_rate": 0.00011377929621813155, "loss": 0.7713, "step": 4538 }, { "epoch": 0.47, "learning_rate": 0.00011374590173340212, "loss": 0.7186, "step": 4539 }, { "epoch": 0.47, "learning_rate": 0.00011371250568614553, "loss": 0.7446, "step": 4540 }, { "epoch": 0.47, "learning_rate": 0.0001136791080801581, "loss": 0.7253, "step": 4541 }, { "epoch": 0.47, "learning_rate": 0.0001136457089192361, "loss": 0.7049, "step": 4542 }, { "epoch": 0.47, "learning_rate": 0.00011361230820717607, "loss": 0.7681, "step": 4543 }, { "epoch": 0.47, "learning_rate": 0.00011357890594777485, "loss": 0.6534, "step": 4544 }, { "epoch": 0.47, "learning_rate": 0.00011354550214482928, "loss": 0.7112, "step": 4545 }, { "epoch": 0.47, "learning_rate": 0.00011351209680213646, "loss": 0.6875, "step": 4546 }, { "epoch": 0.47, "learning_rate": 0.00011347868992349365, "loss": 0.6797, "step": 4547 }, { "epoch": 0.47, "learning_rate": 0.00011344528151269824, "loss": 0.6565, "step": 4548 }, { "epoch": 0.47, "learning_rate": 0.00011341187157354791, "loss": 0.6889, "step": 4549 }, { "epoch": 0.47, "learning_rate": 0.00011337846010984039, "loss": 0.6377, "step": 4550 }, { "epoch": 0.47, "learning_rate": 0.00011334504712537366, "loss": 0.697, "step": 4551 }, { "epoch": 0.47, "learning_rate": 0.00011331163262394584, "loss": 0.6611, "step": 4552 }, { "epoch": 0.47, "learning_rate": 0.00011327821660935524, "loss": 0.7033, "step": 4553 }, { "epoch": 0.47, "learning_rate": 0.00011324479908540034, "loss": 0.6753, "step": 4554 }, { "epoch": 0.47, "learning_rate": 0.00011321138005587975, "loss": 0.6684, "step": 4555 }, { "epoch": 0.47, "learning_rate": 0.00011317795952459229, "loss": 0.696, "step": 4556 }, { "epoch": 0.47, "learning_rate": 0.00011314453749533696, "loss": 0.6778, "step": 4557 }, { "epoch": 0.47, "learning_rate": 0.00011311111397191294, "loss": 0.6881, "step": 4558 }, { "epoch": 0.47, "learning_rate": 0.00011307768895811952, "loss": 0.7124, "step": 4559 }, { "epoch": 0.47, "learning_rate": 0.00011304426245775621, "loss": 0.6766, "step": 4560 }, { "epoch": 0.47, "learning_rate": 0.00011301083447462267, "loss": 0.6942, "step": 4561 }, { "epoch": 0.47, "learning_rate": 0.00011297740501251875, "loss": 0.6691, "step": 4562 }, { "epoch": 0.47, "learning_rate": 0.0001129439740752444, "loss": 0.768, "step": 4563 }, { "epoch": 0.48, "learning_rate": 0.00011291054166659984, "loss": 0.6744, "step": 4564 }, { "epoch": 0.48, "learning_rate": 0.0001128771077903854, "loss": 0.6842, "step": 4565 }, { "epoch": 0.48, "learning_rate": 0.00011284367245040157, "loss": 0.7023, "step": 4566 }, { "epoch": 0.48, "learning_rate": 0.00011281023565044901, "loss": 0.735, "step": 4567 }, { "epoch": 0.48, "learning_rate": 0.00011277679739432858, "loss": 0.7019, "step": 4568 }, { "epoch": 0.48, "learning_rate": 0.00011274335768584127, "loss": 0.6118, "step": 4569 }, { "epoch": 0.48, "learning_rate": 0.00011270991652878824, "loss": 0.6845, "step": 4570 }, { "epoch": 0.48, "learning_rate": 0.00011267647392697083, "loss": 0.662, "step": 4571 }, { "epoch": 0.48, "learning_rate": 0.00011264302988419051, "loss": 0.6963, "step": 4572 }, { "epoch": 0.48, "learning_rate": 0.00011260958440424898, "loss": 0.6781, "step": 4573 }, { "epoch": 0.48, "learning_rate": 0.00011257613749094802, "loss": 0.6597, "step": 4574 }, { "epoch": 0.48, "learning_rate": 0.00011254268914808965, "loss": 0.6764, "step": 4575 }, { "epoch": 0.48, "learning_rate": 0.00011250923937947602, "loss": 0.6822, "step": 4576 }, { "epoch": 0.48, "learning_rate": 0.00011247578818890936, "loss": 0.6459, "step": 4577 }, { "epoch": 0.48, "learning_rate": 0.00011244233558019226, "loss": 0.6169, "step": 4578 }, { "epoch": 0.48, "learning_rate": 0.00011240888155712728, "loss": 0.6822, "step": 4579 }, { "epoch": 0.48, "learning_rate": 0.00011237542612351722, "loss": 0.6343, "step": 4580 }, { "epoch": 0.48, "learning_rate": 0.00011234196928316503, "loss": 0.6907, "step": 4581 }, { "epoch": 0.48, "learning_rate": 0.00011230851103987385, "loss": 0.6596, "step": 4582 }, { "epoch": 0.48, "learning_rate": 0.00011227505139744692, "loss": 0.7362, "step": 4583 }, { "epoch": 0.48, "learning_rate": 0.00011224159035968769, "loss": 0.671, "step": 4584 }, { "epoch": 0.48, "learning_rate": 0.00011220812793039976, "loss": 0.6992, "step": 4585 }, { "epoch": 0.48, "learning_rate": 0.00011217466411338686, "loss": 0.6907, "step": 4586 }, { "epoch": 0.48, "learning_rate": 0.00011214119891245291, "loss": 0.7083, "step": 4587 }, { "epoch": 0.48, "learning_rate": 0.00011210773233140197, "loss": 0.7049, "step": 4588 }, { "epoch": 0.48, "learning_rate": 0.00011207426437403826, "loss": 0.622, "step": 4589 }, { "epoch": 0.48, "learning_rate": 0.00011204079504416614, "loss": 0.6507, "step": 4590 }, { "epoch": 0.48, "learning_rate": 0.00011200732434559015, "loss": 0.6715, "step": 4591 }, { "epoch": 0.48, "learning_rate": 0.00011197385228211499, "loss": 0.6622, "step": 4592 }, { "epoch": 0.48, "learning_rate": 0.00011194037885754552, "loss": 0.698, "step": 4593 }, { "epoch": 0.48, "learning_rate": 0.00011190690407568672, "loss": 0.6899, "step": 4594 }, { "epoch": 0.48, "learning_rate": 0.0001118734279403437, "loss": 0.65, "step": 4595 }, { "epoch": 0.48, "learning_rate": 0.00011183995045532185, "loss": 0.6151, "step": 4596 }, { "epoch": 0.48, "learning_rate": 0.00011180647162442654, "loss": 0.6758, "step": 4597 }, { "epoch": 0.48, "learning_rate": 0.00011177299145146345, "loss": 0.6987, "step": 4598 }, { "epoch": 0.48, "learning_rate": 0.00011173950994023836, "loss": 0.6951, "step": 4599 }, { "epoch": 0.48, "learning_rate": 0.00011170602709455711, "loss": 0.6302, "step": 4600 }, { "epoch": 0.48, "learning_rate": 0.00011167254291822582, "loss": 0.6824, "step": 4601 }, { "epoch": 0.48, "learning_rate": 0.00011163905741505072, "loss": 0.6706, "step": 4602 }, { "epoch": 0.48, "learning_rate": 0.00011160557058883814, "loss": 0.7343, "step": 4603 }, { "epoch": 0.48, "learning_rate": 0.00011157208244339464, "loss": 0.7106, "step": 4604 }, { "epoch": 0.48, "learning_rate": 0.0001115385929825269, "loss": 0.6844, "step": 4605 }, { "epoch": 0.48, "learning_rate": 0.00011150510221004168, "loss": 0.736, "step": 4606 }, { "epoch": 0.48, "learning_rate": 0.00011147161012974598, "loss": 0.7103, "step": 4607 }, { "epoch": 0.48, "learning_rate": 0.00011143811674544695, "loss": 0.6723, "step": 4608 }, { "epoch": 0.48, "learning_rate": 0.00011140462206095184, "loss": 0.7161, "step": 4609 }, { "epoch": 0.48, "learning_rate": 0.00011137112608006803, "loss": 0.7303, "step": 4610 }, { "epoch": 0.48, "learning_rate": 0.00011133762880660315, "loss": 0.663, "step": 4611 }, { "epoch": 0.48, "learning_rate": 0.00011130413024436488, "loss": 0.6746, "step": 4612 }, { "epoch": 0.48, "learning_rate": 0.00011127063039716101, "loss": 0.7059, "step": 4613 }, { "epoch": 0.48, "learning_rate": 0.00011123712926879965, "loss": 0.6342, "step": 4614 }, { "epoch": 0.48, "learning_rate": 0.00011120362686308889, "loss": 0.6155, "step": 4615 }, { "epoch": 0.48, "learning_rate": 0.00011117012318383701, "loss": 0.7407, "step": 4616 }, { "epoch": 0.48, "learning_rate": 0.00011113661823485246, "loss": 0.6531, "step": 4617 }, { "epoch": 0.48, "learning_rate": 0.00011110311201994388, "loss": 0.7021, "step": 4618 }, { "epoch": 0.48, "learning_rate": 0.00011106960454291992, "loss": 0.6533, "step": 4619 }, { "epoch": 0.48, "learning_rate": 0.00011103609580758944, "loss": 0.6901, "step": 4620 }, { "epoch": 0.48, "learning_rate": 0.00011100258581776153, "loss": 0.7182, "step": 4621 }, { "epoch": 0.48, "learning_rate": 0.00011096907457724529, "loss": 0.6967, "step": 4622 }, { "epoch": 0.48, "learning_rate": 0.00011093556208984999, "loss": 0.6227, "step": 4623 }, { "epoch": 0.48, "learning_rate": 0.00011090204835938516, "loss": 0.6722, "step": 4624 }, { "epoch": 0.48, "learning_rate": 0.00011086853338966032, "loss": 0.6275, "step": 4625 }, { "epoch": 0.48, "learning_rate": 0.00011083501718448516, "loss": 0.6657, "step": 4626 }, { "epoch": 0.48, "learning_rate": 0.0001108014997476696, "loss": 0.6909, "step": 4627 }, { "epoch": 0.48, "learning_rate": 0.00011076798108302362, "loss": 0.6979, "step": 4628 }, { "epoch": 0.48, "learning_rate": 0.00011073446119435738, "loss": 0.6477, "step": 4629 }, { "epoch": 0.48, "learning_rate": 0.00011070094008548113, "loss": 0.67, "step": 4630 }, { "epoch": 0.48, "learning_rate": 0.00011066741776020528, "loss": 0.6223, "step": 4631 }, { "epoch": 0.48, "learning_rate": 0.00011063389422234043, "loss": 0.7241, "step": 4632 }, { "epoch": 0.48, "learning_rate": 0.00011060036947569723, "loss": 0.6887, "step": 4633 }, { "epoch": 0.48, "learning_rate": 0.00011056684352408656, "loss": 0.6891, "step": 4634 }, { "epoch": 0.48, "learning_rate": 0.00011053331637131934, "loss": 0.7348, "step": 4635 }, { "epoch": 0.48, "learning_rate": 0.0001104997880212067, "loss": 0.7178, "step": 4636 }, { "epoch": 0.48, "learning_rate": 0.00011046625847755991, "loss": 0.7014, "step": 4637 }, { "epoch": 0.48, "learning_rate": 0.00011043272774419031, "loss": 0.7339, "step": 4638 }, { "epoch": 0.48, "learning_rate": 0.00011039919582490941, "loss": 0.584, "step": 4639 }, { "epoch": 0.48, "learning_rate": 0.00011036566272352886, "loss": 0.761, "step": 4640 }, { "epoch": 0.48, "learning_rate": 0.00011033212844386045, "loss": 0.6638, "step": 4641 }, { "epoch": 0.48, "learning_rate": 0.00011029859298971612, "loss": 0.6673, "step": 4642 }, { "epoch": 0.48, "learning_rate": 0.00011026505636490789, "loss": 0.7065, "step": 4643 }, { "epoch": 0.48, "learning_rate": 0.00011023151857324794, "loss": 0.661, "step": 4644 }, { "epoch": 0.48, "learning_rate": 0.00011019797961854861, "loss": 0.6988, "step": 4645 }, { "epoch": 0.48, "learning_rate": 0.00011016443950462232, "loss": 0.7584, "step": 4646 }, { "epoch": 0.48, "learning_rate": 0.00011013089823528164, "loss": 0.6605, "step": 4647 }, { "epoch": 0.48, "learning_rate": 0.00011009735581433931, "loss": 0.737, "step": 4648 }, { "epoch": 0.48, "learning_rate": 0.00011006381224560818, "loss": 0.7298, "step": 4649 }, { "epoch": 0.48, "learning_rate": 0.0001100302675329012, "loss": 0.7038, "step": 4650 }, { "epoch": 0.48, "learning_rate": 0.00010999672168003147, "loss": 0.6768, "step": 4651 }, { "epoch": 0.48, "learning_rate": 0.00010996317469081223, "loss": 0.6469, "step": 4652 }, { "epoch": 0.48, "learning_rate": 0.00010992962656905684, "loss": 0.6271, "step": 4653 }, { "epoch": 0.48, "learning_rate": 0.00010989607731857878, "loss": 0.6622, "step": 4654 }, { "epoch": 0.48, "learning_rate": 0.00010986252694319168, "loss": 0.6816, "step": 4655 }, { "epoch": 0.48, "learning_rate": 0.00010982897544670927, "loss": 0.6677, "step": 4656 }, { "epoch": 0.48, "learning_rate": 0.00010979542283294546, "loss": 0.6805, "step": 4657 }, { "epoch": 0.48, "learning_rate": 0.0001097618691057142, "loss": 0.6068, "step": 4658 }, { "epoch": 0.48, "learning_rate": 0.00010972831426882966, "loss": 0.684, "step": 4659 }, { "epoch": 0.49, "learning_rate": 0.00010969475832610604, "loss": 0.6605, "step": 4660 }, { "epoch": 0.49, "learning_rate": 0.00010966120128135777, "loss": 0.6878, "step": 4661 }, { "epoch": 0.49, "learning_rate": 0.00010962764313839933, "loss": 0.6533, "step": 4662 }, { "epoch": 0.49, "learning_rate": 0.00010959408390104535, "loss": 0.6447, "step": 4663 }, { "epoch": 0.49, "learning_rate": 0.00010956052357311062, "loss": 0.6552, "step": 4664 }, { "epoch": 0.49, "learning_rate": 0.00010952696215840995, "loss": 0.7244, "step": 4665 }, { "epoch": 0.49, "learning_rate": 0.00010949339966075838, "loss": 0.6623, "step": 4666 }, { "epoch": 0.49, "learning_rate": 0.00010945983608397101, "loss": 0.6856, "step": 4667 }, { "epoch": 0.49, "learning_rate": 0.00010942627143186313, "loss": 0.6104, "step": 4668 }, { "epoch": 0.49, "learning_rate": 0.00010939270570825007, "loss": 0.6225, "step": 4669 }, { "epoch": 0.49, "learning_rate": 0.00010935913891694733, "loss": 0.646, "step": 4670 }, { "epoch": 0.49, "learning_rate": 0.00010932557106177053, "loss": 0.6603, "step": 4671 }, { "epoch": 0.49, "learning_rate": 0.00010929200214653539, "loss": 0.6613, "step": 4672 }, { "epoch": 0.49, "learning_rate": 0.00010925843217505776, "loss": 0.5581, "step": 4673 }, { "epoch": 0.49, "learning_rate": 0.00010922486115115362, "loss": 0.7455, "step": 4674 }, { "epoch": 0.49, "learning_rate": 0.0001091912890786391, "loss": 0.583, "step": 4675 }, { "epoch": 0.49, "learning_rate": 0.00010915771596133038, "loss": 0.6859, "step": 4676 }, { "epoch": 0.49, "learning_rate": 0.00010912414180304373, "loss": 0.6615, "step": 4677 }, { "epoch": 0.49, "learning_rate": 0.0001090905666075957, "loss": 0.7103, "step": 4678 }, { "epoch": 0.49, "learning_rate": 0.00010905699037880279, "loss": 0.7036, "step": 4679 }, { "epoch": 0.49, "learning_rate": 0.0001090234131204817, "loss": 0.6334, "step": 4680 }, { "epoch": 0.49, "learning_rate": 0.00010898983483644926, "loss": 0.7166, "step": 4681 }, { "epoch": 0.49, "learning_rate": 0.00010895625553052235, "loss": 0.6366, "step": 4682 }, { "epoch": 0.49, "learning_rate": 0.00010892267520651804, "loss": 0.687, "step": 4683 }, { "epoch": 0.49, "learning_rate": 0.00010888909386825346, "loss": 0.7074, "step": 4684 }, { "epoch": 0.49, "learning_rate": 0.00010885551151954588, "loss": 0.7044, "step": 4685 }, { "epoch": 0.49, "learning_rate": 0.00010882192816421266, "loss": 0.6252, "step": 4686 }, { "epoch": 0.49, "learning_rate": 0.0001087883438060713, "loss": 0.6687, "step": 4687 }, { "epoch": 0.49, "learning_rate": 0.00010875475844893943, "loss": 0.6909, "step": 4688 }, { "epoch": 0.49, "learning_rate": 0.0001087211720966348, "loss": 0.6852, "step": 4689 }, { "epoch": 0.49, "learning_rate": 0.00010868758475297514, "loss": 0.6536, "step": 4690 }, { "epoch": 0.49, "learning_rate": 0.0001086539964217785, "loss": 0.6632, "step": 4691 }, { "epoch": 0.49, "learning_rate": 0.0001086204071068629, "loss": 0.6935, "step": 4692 }, { "epoch": 0.49, "learning_rate": 0.0001085868168120465, "loss": 0.6684, "step": 4693 }, { "epoch": 0.49, "learning_rate": 0.00010855322554114762, "loss": 0.6583, "step": 4694 }, { "epoch": 0.49, "learning_rate": 0.00010851963329798465, "loss": 0.6688, "step": 4695 }, { "epoch": 0.49, "learning_rate": 0.00010848604008637604, "loss": 0.7125, "step": 4696 }, { "epoch": 0.49, "learning_rate": 0.00010845244591014046, "loss": 0.7214, "step": 4697 }, { "epoch": 0.49, "learning_rate": 0.00010841885077309659, "loss": 0.6284, "step": 4698 }, { "epoch": 0.49, "learning_rate": 0.00010838525467906333, "loss": 0.6152, "step": 4699 }, { "epoch": 0.49, "learning_rate": 0.00010835165763185955, "loss": 0.7135, "step": 4700 }, { "epoch": 0.49, "learning_rate": 0.00010831805963530437, "loss": 0.6714, "step": 4701 }, { "epoch": 0.49, "learning_rate": 0.00010828446069321689, "loss": 0.6579, "step": 4702 }, { "epoch": 0.49, "learning_rate": 0.0001082508608094164, "loss": 0.6904, "step": 4703 }, { "epoch": 0.49, "learning_rate": 0.00010821725998772228, "loss": 0.6985, "step": 4704 }, { "epoch": 0.49, "learning_rate": 0.000108183658231954, "loss": 0.6691, "step": 4705 }, { "epoch": 0.49, "learning_rate": 0.00010815005554593114, "loss": 0.6898, "step": 4706 }, { "epoch": 0.49, "learning_rate": 0.00010811645193347341, "loss": 0.7033, "step": 4707 }, { "epoch": 0.49, "learning_rate": 0.0001080828473984006, "loss": 0.6652, "step": 4708 }, { "epoch": 0.49, "learning_rate": 0.00010804924194453261, "loss": 0.6927, "step": 4709 }, { "epoch": 0.49, "learning_rate": 0.00010801563557568941, "loss": 0.7174, "step": 4710 }, { "epoch": 0.49, "learning_rate": 0.00010798202829569117, "loss": 0.7456, "step": 4711 }, { "epoch": 0.49, "learning_rate": 0.00010794842010835809, "loss": 0.7269, "step": 4712 }, { "epoch": 0.49, "learning_rate": 0.00010791481101751047, "loss": 0.6532, "step": 4713 }, { "epoch": 0.49, "learning_rate": 0.00010788120102696875, "loss": 0.6587, "step": 4714 }, { "epoch": 0.49, "learning_rate": 0.00010784759014055344, "loss": 0.6845, "step": 4715 }, { "epoch": 0.49, "learning_rate": 0.00010781397836208516, "loss": 0.7846, "step": 4716 }, { "epoch": 0.49, "learning_rate": 0.00010778036569538459, "loss": 0.6903, "step": 4717 }, { "epoch": 0.49, "learning_rate": 0.00010774675214427265, "loss": 0.6914, "step": 4718 }, { "epoch": 0.49, "learning_rate": 0.00010771313771257023, "loss": 0.734, "step": 4719 }, { "epoch": 0.49, "learning_rate": 0.00010767952240409833, "loss": 0.6923, "step": 4720 }, { "epoch": 0.49, "learning_rate": 0.00010764590622267809, "loss": 0.5511, "step": 4721 }, { "epoch": 0.49, "learning_rate": 0.00010761228917213078, "loss": 0.6571, "step": 4722 }, { "epoch": 0.49, "learning_rate": 0.00010757867125627763, "loss": 0.7097, "step": 4723 }, { "epoch": 0.49, "learning_rate": 0.00010754505247894015, "loss": 0.6844, "step": 4724 }, { "epoch": 0.49, "learning_rate": 0.00010751143284393983, "loss": 0.6769, "step": 4725 }, { "epoch": 0.49, "learning_rate": 0.00010747781235509828, "loss": 0.6485, "step": 4726 }, { "epoch": 0.49, "learning_rate": 0.00010744419101623723, "loss": 0.7384, "step": 4727 }, { "epoch": 0.49, "learning_rate": 0.0001074105688311785, "loss": 0.6567, "step": 4728 }, { "epoch": 0.49, "learning_rate": 0.00010737694580374395, "loss": 0.7011, "step": 4729 }, { "epoch": 0.49, "learning_rate": 0.00010734332193775562, "loss": 0.6559, "step": 4730 }, { "epoch": 0.49, "learning_rate": 0.00010730969723703563, "loss": 0.7007, "step": 4731 }, { "epoch": 0.49, "learning_rate": 0.00010727607170540616, "loss": 0.6335, "step": 4732 }, { "epoch": 0.49, "learning_rate": 0.00010724244534668949, "loss": 0.6642, "step": 4733 }, { "epoch": 0.49, "learning_rate": 0.00010720881816470797, "loss": 0.6826, "step": 4734 }, { "epoch": 0.49, "learning_rate": 0.00010717519016328414, "loss": 0.6358, "step": 4735 }, { "epoch": 0.49, "learning_rate": 0.00010714156134624054, "loss": 0.6564, "step": 4736 }, { "epoch": 0.49, "learning_rate": 0.0001071079317173998, "loss": 0.6429, "step": 4737 }, { "epoch": 0.49, "learning_rate": 0.00010707430128058473, "loss": 0.6615, "step": 4738 }, { "epoch": 0.49, "learning_rate": 0.00010704067003961815, "loss": 0.6595, "step": 4739 }, { "epoch": 0.49, "learning_rate": 0.00010700703799832301, "loss": 0.6339, "step": 4740 }, { "epoch": 0.49, "learning_rate": 0.00010697340516052233, "loss": 0.7289, "step": 4741 }, { "epoch": 0.49, "learning_rate": 0.0001069397715300392, "loss": 0.6431, "step": 4742 }, { "epoch": 0.49, "learning_rate": 0.00010690613711069686, "loss": 0.6706, "step": 4743 }, { "epoch": 0.49, "learning_rate": 0.0001068725019063186, "loss": 0.7019, "step": 4744 }, { "epoch": 0.49, "learning_rate": 0.00010683886592072784, "loss": 0.6729, "step": 4745 }, { "epoch": 0.49, "learning_rate": 0.00010680522915774803, "loss": 0.6989, "step": 4746 }, { "epoch": 0.49, "learning_rate": 0.00010677159162120274, "loss": 0.7233, "step": 4747 }, { "epoch": 0.49, "learning_rate": 0.0001067379533149156, "loss": 0.6772, "step": 4748 }, { "epoch": 0.49, "learning_rate": 0.00010670431424271039, "loss": 0.6633, "step": 4749 }, { "epoch": 0.49, "learning_rate": 0.00010667067440841089, "loss": 0.6703, "step": 4750 }, { "epoch": 0.49, "learning_rate": 0.00010663703381584107, "loss": 0.62, "step": 4751 }, { "epoch": 0.49, "learning_rate": 0.00010660339246882489, "loss": 0.694, "step": 4752 }, { "epoch": 0.49, "learning_rate": 0.00010656975037118647, "loss": 0.7187, "step": 4753 }, { "epoch": 0.49, "learning_rate": 0.00010653610752674994, "loss": 0.6539, "step": 4754 }, { "epoch": 0.49, "learning_rate": 0.0001065024639393396, "loss": 0.674, "step": 4755 }, { "epoch": 0.5, "learning_rate": 0.00010646881961277974, "loss": 0.7144, "step": 4756 }, { "epoch": 0.5, "learning_rate": 0.00010643517455089482, "loss": 0.7051, "step": 4757 }, { "epoch": 0.5, "learning_rate": 0.00010640152875750938, "loss": 0.6629, "step": 4758 }, { "epoch": 0.5, "learning_rate": 0.00010636788223644795, "loss": 0.6934, "step": 4759 }, { "epoch": 0.5, "learning_rate": 0.00010633423499153523, "loss": 0.643, "step": 4760 }, { "epoch": 0.5, "learning_rate": 0.000106300587026596, "loss": 0.6515, "step": 4761 }, { "epoch": 0.5, "learning_rate": 0.00010626693834545505, "loss": 0.6573, "step": 4762 }, { "epoch": 0.5, "learning_rate": 0.00010623328895193731, "loss": 0.6892, "step": 4763 }, { "epoch": 0.5, "learning_rate": 0.00010619963884986783, "loss": 0.6779, "step": 4764 }, { "epoch": 0.5, "learning_rate": 0.00010616598804307167, "loss": 0.6805, "step": 4765 }, { "epoch": 0.5, "learning_rate": 0.00010613233653537398, "loss": 0.6827, "step": 4766 }, { "epoch": 0.5, "learning_rate": 0.00010609868433059997, "loss": 0.6671, "step": 4767 }, { "epoch": 0.5, "learning_rate": 0.000106065031432575, "loss": 0.7087, "step": 4768 }, { "epoch": 0.5, "learning_rate": 0.0001060313778451245, "loss": 0.7101, "step": 4769 }, { "epoch": 0.5, "learning_rate": 0.00010599772357207385, "loss": 0.6461, "step": 4770 }, { "epoch": 0.5, "learning_rate": 0.0001059640686172487, "loss": 0.6707, "step": 4771 }, { "epoch": 0.5, "learning_rate": 0.00010593041298447469, "loss": 0.678, "step": 4772 }, { "epoch": 0.5, "learning_rate": 0.00010589675667757741, "loss": 0.6747, "step": 4773 }, { "epoch": 0.5, "learning_rate": 0.00010586309970038277, "loss": 0.6474, "step": 4774 }, { "epoch": 0.5, "learning_rate": 0.00010582944205671661, "loss": 0.6909, "step": 4775 }, { "epoch": 0.5, "learning_rate": 0.00010579578375040483, "loss": 0.7454, "step": 4776 }, { "epoch": 0.5, "learning_rate": 0.00010576212478527343, "loss": 0.6756, "step": 4777 }, { "epoch": 0.5, "learning_rate": 0.0001057284651651486, "loss": 0.6538, "step": 4778 }, { "epoch": 0.5, "learning_rate": 0.0001056948048938564, "loss": 0.648, "step": 4779 }, { "epoch": 0.5, "learning_rate": 0.00010566114397522309, "loss": 0.6786, "step": 4780 }, { "epoch": 0.5, "learning_rate": 0.000105627482413075, "loss": 0.7235, "step": 4781 }, { "epoch": 0.5, "learning_rate": 0.00010559382021123853, "loss": 0.6635, "step": 4782 }, { "epoch": 0.5, "learning_rate": 0.00010556015737354007, "loss": 0.6996, "step": 4783 }, { "epoch": 0.5, "learning_rate": 0.00010552649390380625, "loss": 0.685, "step": 4784 }, { "epoch": 0.5, "learning_rate": 0.00010549282980586363, "loss": 0.6795, "step": 4785 }, { "epoch": 0.5, "learning_rate": 0.00010545916508353883, "loss": 0.7173, "step": 4786 }, { "epoch": 0.5, "learning_rate": 0.00010542549974065865, "loss": 0.7255, "step": 4787 }, { "epoch": 0.5, "learning_rate": 0.0001053918337810499, "loss": 0.6328, "step": 4788 }, { "epoch": 0.5, "learning_rate": 0.00010535816720853942, "loss": 0.6984, "step": 4789 }, { "epoch": 0.5, "learning_rate": 0.00010532450002695419, "loss": 0.7353, "step": 4790 }, { "epoch": 0.5, "learning_rate": 0.00010529083224012129, "loss": 0.6537, "step": 4791 }, { "epoch": 0.5, "learning_rate": 0.00010525716385186773, "loss": 0.6371, "step": 4792 }, { "epoch": 0.5, "learning_rate": 0.00010522349486602067, "loss": 0.653, "step": 4793 }, { "epoch": 0.5, "learning_rate": 0.00010518982528640742, "loss": 0.6901, "step": 4794 }, { "epoch": 0.5, "learning_rate": 0.00010515615511685521, "loss": 0.5709, "step": 4795 }, { "epoch": 0.5, "learning_rate": 0.00010512248436119143, "loss": 0.5995, "step": 4796 }, { "epoch": 0.5, "learning_rate": 0.00010508881302324348, "loss": 0.6695, "step": 4797 }, { "epoch": 0.5, "learning_rate": 0.00010505514110683888, "loss": 0.6883, "step": 4798 }, { "epoch": 0.5, "learning_rate": 0.0001050214686158052, "loss": 0.6469, "step": 4799 }, { "epoch": 0.5, "learning_rate": 0.00010498779555397001, "loss": 0.7124, "step": 4800 }, { "epoch": 0.5, "learning_rate": 0.00010495412192516107, "loss": 0.6248, "step": 4801 }, { "epoch": 0.5, "learning_rate": 0.0001049204477332061, "loss": 0.7161, "step": 4802 }, { "epoch": 0.5, "learning_rate": 0.00010488677298193295, "loss": 0.6817, "step": 4803 }, { "epoch": 0.5, "learning_rate": 0.00010485309767516946, "loss": 0.6403, "step": 4804 }, { "epoch": 0.5, "learning_rate": 0.00010481942181674362, "loss": 0.6429, "step": 4805 }, { "epoch": 0.5, "learning_rate": 0.0001047857454104834, "loss": 0.7031, "step": 4806 }, { "epoch": 0.5, "learning_rate": 0.00010475206846021688, "loss": 0.6821, "step": 4807 }, { "epoch": 0.5, "learning_rate": 0.00010471839096977223, "loss": 0.7396, "step": 4808 }, { "epoch": 0.5, "learning_rate": 0.00010468471294297762, "loss": 0.6803, "step": 4809 }, { "epoch": 0.5, "learning_rate": 0.00010465103438366131, "loss": 0.7167, "step": 4810 }, { "epoch": 0.5, "learning_rate": 0.0001046173552956516, "loss": 0.7059, "step": 4811 }, { "epoch": 0.5, "learning_rate": 0.00010458367568277687, "loss": 0.6949, "step": 4812 }, { "epoch": 0.5, "learning_rate": 0.00010454999554886556, "loss": 0.7362, "step": 4813 }, { "epoch": 0.5, "learning_rate": 0.00010451631489774618, "loss": 0.694, "step": 4814 }, { "epoch": 0.5, "learning_rate": 0.00010448263373324727, "loss": 0.6523, "step": 4815 }, { "epoch": 0.5, "learning_rate": 0.00010444895205919747, "loss": 0.6697, "step": 4816 }, { "epoch": 0.5, "learning_rate": 0.0001044152698794254, "loss": 0.6988, "step": 4817 }, { "epoch": 0.5, "learning_rate": 0.00010438158719775983, "loss": 0.7113, "step": 4818 }, { "epoch": 0.5, "learning_rate": 0.00010434790401802954, "loss": 0.6519, "step": 4819 }, { "epoch": 0.5, "learning_rate": 0.00010431422034406333, "loss": 0.6451, "step": 4820 }, { "epoch": 0.5, "learning_rate": 0.00010428053617969016, "loss": 0.6923, "step": 4821 }, { "epoch": 0.5, "learning_rate": 0.00010424685152873894, "loss": 0.6403, "step": 4822 }, { "epoch": 0.5, "learning_rate": 0.00010421316639503871, "loss": 0.738, "step": 4823 }, { "epoch": 0.5, "learning_rate": 0.00010417948078241851, "loss": 0.7062, "step": 4824 }, { "epoch": 0.5, "learning_rate": 0.00010414579469470745, "loss": 0.658, "step": 4825 }, { "epoch": 0.5, "learning_rate": 0.00010411210813573474, "loss": 0.6939, "step": 4826 }, { "epoch": 0.5, "learning_rate": 0.00010407842110932955, "loss": 0.7024, "step": 4827 }, { "epoch": 0.5, "learning_rate": 0.00010404473361932121, "loss": 0.6415, "step": 4828 }, { "epoch": 0.5, "learning_rate": 0.00010401104566953904, "loss": 0.6087, "step": 4829 }, { "epoch": 0.5, "learning_rate": 0.00010397735726381242, "loss": 0.6729, "step": 4830 }, { "epoch": 0.5, "learning_rate": 0.00010394366840597077, "loss": 0.7215, "step": 4831 }, { "epoch": 0.5, "learning_rate": 0.0001039099790998436, "loss": 0.7523, "step": 4832 }, { "epoch": 0.5, "learning_rate": 0.00010387628934926042, "loss": 0.6538, "step": 4833 }, { "epoch": 0.5, "learning_rate": 0.00010384259915805084, "loss": 0.6994, "step": 4834 }, { "epoch": 0.5, "learning_rate": 0.00010380890853004452, "loss": 0.7147, "step": 4835 }, { "epoch": 0.5, "learning_rate": 0.0001037752174690711, "loss": 0.719, "step": 4836 }, { "epoch": 0.5, "learning_rate": 0.00010374152597896036, "loss": 0.6908, "step": 4837 }, { "epoch": 0.5, "learning_rate": 0.00010370783406354207, "loss": 0.7049, "step": 4838 }, { "epoch": 0.5, "learning_rate": 0.00010367414172664607, "loss": 0.6976, "step": 4839 }, { "epoch": 0.5, "learning_rate": 0.00010364044897210219, "loss": 0.6956, "step": 4840 }, { "epoch": 0.5, "learning_rate": 0.00010360675580374045, "loss": 0.7437, "step": 4841 }, { "epoch": 0.5, "learning_rate": 0.00010357306222539077, "loss": 0.6682, "step": 4842 }, { "epoch": 0.5, "learning_rate": 0.00010353936824088317, "loss": 0.6075, "step": 4843 }, { "epoch": 0.5, "learning_rate": 0.00010350567385404776, "loss": 0.7289, "step": 4844 }, { "epoch": 0.5, "learning_rate": 0.00010347197906871464, "loss": 0.7149, "step": 4845 }, { "epoch": 0.5, "learning_rate": 0.00010343828388871395, "loss": 0.715, "step": 4846 }, { "epoch": 0.5, "learning_rate": 0.00010340458831787589, "loss": 0.6887, "step": 4847 }, { "epoch": 0.5, "learning_rate": 0.00010337089236003075, "loss": 0.624, "step": 4848 }, { "epoch": 0.5, "learning_rate": 0.00010333719601900882, "loss": 0.6682, "step": 4849 }, { "epoch": 0.5, "learning_rate": 0.00010330349929864038, "loss": 0.6781, "step": 4850 }, { "epoch": 0.5, "learning_rate": 0.00010326980220275586, "loss": 0.6385, "step": 4851 }, { "epoch": 0.51, "learning_rate": 0.0001032361047351857, "loss": 0.5948, "step": 4852 }, { "epoch": 0.51, "learning_rate": 0.00010320240689976031, "loss": 0.673, "step": 4853 }, { "epoch": 0.51, "learning_rate": 0.00010316870870031025, "loss": 0.6504, "step": 4854 }, { "epoch": 0.51, "learning_rate": 0.00010313501014066604, "loss": 0.7098, "step": 4855 }, { "epoch": 0.51, "learning_rate": 0.00010310131122465831, "loss": 0.7166, "step": 4856 }, { "epoch": 0.51, "learning_rate": 0.00010306761195611762, "loss": 0.6422, "step": 4857 }, { "epoch": 0.51, "learning_rate": 0.0001030339123388747, "loss": 0.7209, "step": 4858 }, { "epoch": 0.51, "learning_rate": 0.00010300021237676023, "loss": 0.7282, "step": 4859 }, { "epoch": 0.51, "learning_rate": 0.00010296651207360494, "loss": 0.6841, "step": 4860 }, { "epoch": 0.51, "learning_rate": 0.0001029328114332397, "loss": 0.6151, "step": 4861 }, { "epoch": 0.51, "learning_rate": 0.00010289911045949527, "loss": 0.6688, "step": 4862 }, { "epoch": 0.51, "learning_rate": 0.0001028654091562025, "loss": 0.669, "step": 4863 }, { "epoch": 0.51, "learning_rate": 0.00010283170752719233, "loss": 0.6191, "step": 4864 }, { "epoch": 0.51, "learning_rate": 0.0001027980055762957, "loss": 0.6467, "step": 4865 }, { "epoch": 0.51, "learning_rate": 0.00010276430330734359, "loss": 0.6744, "step": 4866 }, { "epoch": 0.51, "learning_rate": 0.00010273060072416693, "loss": 0.6681, "step": 4867 }, { "epoch": 0.51, "learning_rate": 0.00010269689783059693, "loss": 0.6973, "step": 4868 }, { "epoch": 0.51, "learning_rate": 0.00010266319463046453, "loss": 0.6169, "step": 4869 }, { "epoch": 0.51, "learning_rate": 0.00010262949112760085, "loss": 0.6805, "step": 4870 }, { "epoch": 0.51, "learning_rate": 0.00010259578732583712, "loss": 0.6044, "step": 4871 }, { "epoch": 0.51, "learning_rate": 0.0001025620832290045, "loss": 0.6562, "step": 4872 }, { "epoch": 0.51, "learning_rate": 0.00010252837884093419, "loss": 0.618, "step": 4873 }, { "epoch": 0.51, "learning_rate": 0.00010249467416545747, "loss": 0.6581, "step": 4874 }, { "epoch": 0.51, "learning_rate": 0.00010246096920640558, "loss": 0.6876, "step": 4875 }, { "epoch": 0.51, "learning_rate": 0.00010242726396760988, "loss": 0.7042, "step": 4876 }, { "epoch": 0.51, "learning_rate": 0.00010239355845290169, "loss": 0.6419, "step": 4877 }, { "epoch": 0.51, "learning_rate": 0.00010235985266611241, "loss": 0.667, "step": 4878 }, { "epoch": 0.51, "learning_rate": 0.00010232614661107344, "loss": 0.5926, "step": 4879 }, { "epoch": 0.51, "learning_rate": 0.00010229244029161624, "loss": 0.6891, "step": 4880 }, { "epoch": 0.51, "learning_rate": 0.0001022587337115723, "loss": 0.7102, "step": 4881 }, { "epoch": 0.51, "learning_rate": 0.00010222502687477307, "loss": 0.7008, "step": 4882 }, { "epoch": 0.51, "learning_rate": 0.00010219131978505008, "loss": 0.6576, "step": 4883 }, { "epoch": 0.51, "learning_rate": 0.00010215761244623491, "loss": 0.6556, "step": 4884 }, { "epoch": 0.51, "learning_rate": 0.0001021239048621592, "loss": 0.6099, "step": 4885 }, { "epoch": 0.51, "learning_rate": 0.00010209019703665448, "loss": 0.6592, "step": 4886 }, { "epoch": 0.51, "learning_rate": 0.00010205648897355242, "loss": 0.5627, "step": 4887 }, { "epoch": 0.51, "learning_rate": 0.00010202278067668474, "loss": 0.6691, "step": 4888 }, { "epoch": 0.51, "learning_rate": 0.00010198907214988308, "loss": 0.6353, "step": 4889 }, { "epoch": 0.51, "learning_rate": 0.00010195536339697913, "loss": 0.6756, "step": 4890 }, { "epoch": 0.51, "learning_rate": 0.00010192165442180474, "loss": 0.68, "step": 4891 }, { "epoch": 0.51, "learning_rate": 0.00010188794522819163, "loss": 0.7287, "step": 4892 }, { "epoch": 0.51, "learning_rate": 0.0001018542358199716, "loss": 0.7165, "step": 4893 }, { "epoch": 0.51, "learning_rate": 0.00010182052620097647, "loss": 0.651, "step": 4894 }, { "epoch": 0.51, "learning_rate": 0.00010178681637503809, "loss": 0.659, "step": 4895 }, { "epoch": 0.51, "learning_rate": 0.00010175310634598833, "loss": 0.6187, "step": 4896 }, { "epoch": 0.51, "learning_rate": 0.00010171939611765907, "loss": 0.7047, "step": 4897 }, { "epoch": 0.51, "learning_rate": 0.00010168568569388226, "loss": 0.6483, "step": 4898 }, { "epoch": 0.51, "learning_rate": 0.00010165197507848983, "loss": 0.6626, "step": 4899 }, { "epoch": 0.51, "learning_rate": 0.00010161826427531371, "loss": 0.7257, "step": 4900 }, { "epoch": 0.51, "learning_rate": 0.0001015845532881859, "loss": 0.6411, "step": 4901 }, { "epoch": 0.51, "learning_rate": 0.00010155084212093844, "loss": 0.6941, "step": 4902 }, { "epoch": 0.51, "learning_rate": 0.00010151713077740328, "loss": 0.6734, "step": 4903 }, { "epoch": 0.51, "learning_rate": 0.00010148341926141251, "loss": 0.6806, "step": 4904 }, { "epoch": 0.51, "learning_rate": 0.00010144970757679819, "loss": 0.7126, "step": 4905 }, { "epoch": 0.51, "learning_rate": 0.0001014159957273924, "loss": 0.6973, "step": 4906 }, { "epoch": 0.51, "learning_rate": 0.00010138228371702725, "loss": 0.7063, "step": 4907 }, { "epoch": 0.51, "learning_rate": 0.00010134857154953484, "loss": 0.6698, "step": 4908 }, { "epoch": 0.51, "learning_rate": 0.00010131485922874729, "loss": 0.6928, "step": 4909 }, { "epoch": 0.51, "learning_rate": 0.00010128114675849678, "loss": 0.7053, "step": 4910 }, { "epoch": 0.51, "learning_rate": 0.00010124743414261548, "loss": 0.6419, "step": 4911 }, { "epoch": 0.51, "learning_rate": 0.00010121372138493559, "loss": 0.6869, "step": 4912 }, { "epoch": 0.51, "learning_rate": 0.0001011800084892893, "loss": 0.7043, "step": 4913 }, { "epoch": 0.51, "learning_rate": 0.00010114629545950883, "loss": 0.6356, "step": 4914 }, { "epoch": 0.51, "learning_rate": 0.0001011125822994264, "loss": 0.735, "step": 4915 }, { "epoch": 0.51, "learning_rate": 0.00010107886901287428, "loss": 0.6958, "step": 4916 }, { "epoch": 0.51, "learning_rate": 0.00010104515560368473, "loss": 0.6964, "step": 4917 }, { "epoch": 0.51, "learning_rate": 0.00010101144207569002, "loss": 0.6681, "step": 4918 }, { "epoch": 0.51, "learning_rate": 0.00010097772843272244, "loss": 0.6533, "step": 4919 }, { "epoch": 0.51, "learning_rate": 0.00010094401467861432, "loss": 0.7194, "step": 4920 }, { "epoch": 0.51, "learning_rate": 0.00010091030081719797, "loss": 0.6536, "step": 4921 }, { "epoch": 0.51, "learning_rate": 0.00010087658685230567, "loss": 0.6891, "step": 4922 }, { "epoch": 0.51, "learning_rate": 0.0001008428727877698, "loss": 0.6337, "step": 4923 }, { "epoch": 0.51, "learning_rate": 0.00010080915862742275, "loss": 0.6471, "step": 4924 }, { "epoch": 0.51, "learning_rate": 0.00010077544437509683, "loss": 0.7135, "step": 4925 }, { "epoch": 0.51, "learning_rate": 0.00010074173003462444, "loss": 0.6998, "step": 4926 }, { "epoch": 0.51, "learning_rate": 0.00010070801560983794, "loss": 0.6371, "step": 4927 }, { "epoch": 0.51, "learning_rate": 0.00010067430110456972, "loss": 0.6335, "step": 4928 }, { "epoch": 0.51, "learning_rate": 0.00010064058652265222, "loss": 0.675, "step": 4929 }, { "epoch": 0.51, "learning_rate": 0.00010060687186791782, "loss": 0.6507, "step": 4930 }, { "epoch": 0.51, "learning_rate": 0.00010057315714419895, "loss": 0.6926, "step": 4931 }, { "epoch": 0.51, "learning_rate": 0.00010053944235532803, "loss": 0.6784, "step": 4932 }, { "epoch": 0.51, "learning_rate": 0.00010050572750513751, "loss": 0.6566, "step": 4933 }, { "epoch": 0.51, "learning_rate": 0.00010047201259745984, "loss": 0.7164, "step": 4934 }, { "epoch": 0.51, "learning_rate": 0.00010043829763612744, "loss": 0.5821, "step": 4935 }, { "epoch": 0.51, "learning_rate": 0.00010040458262497279, "loss": 0.6302, "step": 4936 }, { "epoch": 0.51, "learning_rate": 0.0001003708675678283, "loss": 0.7155, "step": 4937 }, { "epoch": 0.51, "learning_rate": 0.00010033715246852649, "loss": 0.6752, "step": 4938 }, { "epoch": 0.51, "learning_rate": 0.00010030343733089984, "loss": 0.6654, "step": 4939 }, { "epoch": 0.51, "learning_rate": 0.00010026972215878074, "loss": 0.6487, "step": 4940 }, { "epoch": 0.51, "learning_rate": 0.00010023600695600175, "loss": 0.6712, "step": 4941 }, { "epoch": 0.51, "learning_rate": 0.00010020229172639535, "loss": 0.6606, "step": 4942 }, { "epoch": 0.51, "learning_rate": 0.00010016857647379395, "loss": 0.7029, "step": 4943 }, { "epoch": 0.51, "learning_rate": 0.00010013486120203013, "loss": 0.7017, "step": 4944 }, { "epoch": 0.51, "learning_rate": 0.00010010114591493634, "loss": 0.7003, "step": 4945 }, { "epoch": 0.51, "learning_rate": 0.00010006743061634507, "loss": 0.6877, "step": 4946 }, { "epoch": 0.51, "learning_rate": 0.00010003371531008879, "loss": 0.7305, "step": 4947 }, { "epoch": 0.52, "learning_rate": 0.0001, "loss": 0.6832, "step": 4948 }, { "epoch": 0.52, "learning_rate": 9.996628468991122e-05, "loss": 0.6393, "step": 4949 }, { "epoch": 0.52, "learning_rate": 9.993256938365499e-05, "loss": 0.6592, "step": 4950 }, { "epoch": 0.52, "learning_rate": 9.989885408506367e-05, "loss": 0.7151, "step": 4951 }, { "epoch": 0.52, "learning_rate": 9.986513879796988e-05, "loss": 0.6874, "step": 4952 }, { "epoch": 0.52, "learning_rate": 9.983142352620606e-05, "loss": 0.7057, "step": 4953 }, { "epoch": 0.52, "learning_rate": 9.979770827360469e-05, "loss": 0.6885, "step": 4954 }, { "epoch": 0.52, "learning_rate": 9.976399304399824e-05, "loss": 0.6817, "step": 4955 }, { "epoch": 0.52, "learning_rate": 9.973027784121928e-05, "loss": 0.7555, "step": 4956 }, { "epoch": 0.52, "learning_rate": 9.969656266910018e-05, "loss": 0.6972, "step": 4957 }, { "epoch": 0.52, "learning_rate": 9.966284753147353e-05, "loss": 0.6937, "step": 4958 }, { "epoch": 0.52, "learning_rate": 9.962913243217173e-05, "loss": 0.68, "step": 4959 }, { "epoch": 0.52, "learning_rate": 9.959541737502725e-05, "loss": 0.68, "step": 4960 }, { "epoch": 0.52, "learning_rate": 9.95617023638726e-05, "loss": 0.7378, "step": 4961 }, { "epoch": 0.52, "learning_rate": 9.952798740254018e-05, "loss": 0.6911, "step": 4962 }, { "epoch": 0.52, "learning_rate": 9.949427249486247e-05, "loss": 0.6831, "step": 4963 }, { "epoch": 0.52, "learning_rate": 9.946055764467198e-05, "loss": 0.7289, "step": 4964 }, { "epoch": 0.52, "learning_rate": 9.942684285580107e-05, "loss": 0.7139, "step": 4965 }, { "epoch": 0.52, "learning_rate": 9.939312813208219e-05, "loss": 0.6343, "step": 4966 }, { "epoch": 0.52, "learning_rate": 9.935941347734781e-05, "loss": 0.6509, "step": 4967 }, { "epoch": 0.52, "learning_rate": 9.93256988954303e-05, "loss": 0.6744, "step": 4968 }, { "epoch": 0.52, "learning_rate": 9.929198439016207e-05, "loss": 0.6474, "step": 4969 }, { "epoch": 0.52, "learning_rate": 9.925826996537559e-05, "loss": 0.6731, "step": 4970 }, { "epoch": 0.52, "learning_rate": 9.92245556249032e-05, "loss": 0.6556, "step": 4971 }, { "epoch": 0.52, "learning_rate": 9.919084137257724e-05, "loss": 0.6067, "step": 4972 }, { "epoch": 0.52, "learning_rate": 9.915712721223021e-05, "loss": 0.6491, "step": 4973 }, { "epoch": 0.52, "learning_rate": 9.912341314769434e-05, "loss": 0.644, "step": 4974 }, { "epoch": 0.52, "learning_rate": 9.908969918280204e-05, "loss": 0.6729, "step": 4975 }, { "epoch": 0.52, "learning_rate": 9.905598532138569e-05, "loss": 0.666, "step": 4976 }, { "epoch": 0.52, "learning_rate": 9.902227156727756e-05, "loss": 0.671, "step": 4977 }, { "epoch": 0.52, "learning_rate": 9.898855792431e-05, "loss": 0.6773, "step": 4978 }, { "epoch": 0.52, "learning_rate": 9.895484439631531e-05, "loss": 0.6159, "step": 4979 }, { "epoch": 0.52, "learning_rate": 9.892113098712574e-05, "loss": 0.6992, "step": 4980 }, { "epoch": 0.52, "learning_rate": 9.888741770057364e-05, "loss": 0.6515, "step": 4981 }, { "epoch": 0.52, "learning_rate": 9.88537045404912e-05, "loss": 0.6878, "step": 4982 }, { "epoch": 0.52, "learning_rate": 9.881999151071072e-05, "loss": 0.6213, "step": 4983 }, { "epoch": 0.52, "learning_rate": 9.878627861506444e-05, "loss": 0.635, "step": 4984 }, { "epoch": 0.52, "learning_rate": 9.875256585738454e-05, "loss": 0.7196, "step": 4985 }, { "epoch": 0.52, "learning_rate": 9.871885324150323e-05, "loss": 0.6654, "step": 4986 }, { "epoch": 0.52, "learning_rate": 9.868514077125275e-05, "loss": 0.7093, "step": 4987 }, { "epoch": 0.52, "learning_rate": 9.86514284504652e-05, "loss": 0.6897, "step": 4988 }, { "epoch": 0.52, "learning_rate": 9.861771628297279e-05, "loss": 0.649, "step": 4989 }, { "epoch": 0.52, "learning_rate": 9.858400427260762e-05, "loss": 0.6422, "step": 4990 }, { "epoch": 0.52, "learning_rate": 9.855029242320183e-05, "loss": 0.6696, "step": 4991 }, { "epoch": 0.52, "learning_rate": 9.85165807385875e-05, "loss": 0.6829, "step": 4992 }, { "epoch": 0.52, "learning_rate": 9.848286922259676e-05, "loss": 0.6658, "step": 4993 }, { "epoch": 0.52, "learning_rate": 9.84491578790616e-05, "loss": 0.6166, "step": 4994 }, { "epoch": 0.52, "learning_rate": 9.84154467118141e-05, "loss": 0.5699, "step": 4995 }, { "epoch": 0.52, "learning_rate": 9.838173572468633e-05, "loss": 0.6716, "step": 4996 }, { "epoch": 0.52, "learning_rate": 9.834802492151021e-05, "loss": 0.7068, "step": 4997 }, { "epoch": 0.52, "learning_rate": 9.831431430611779e-05, "loss": 0.7209, "step": 4998 }, { "epoch": 0.52, "learning_rate": 9.828060388234096e-05, "loss": 0.693, "step": 4999 }, { "epoch": 0.52, "learning_rate": 9.824689365401169e-05, "loss": 0.694, "step": 5000 }, { "epoch": 0.52, "learning_rate": 9.821318362496196e-05, "loss": 0.662, "step": 5001 }, { "epoch": 0.52, "learning_rate": 9.817947379902356e-05, "loss": 0.6947, "step": 5002 }, { "epoch": 0.52, "learning_rate": 9.814576418002844e-05, "loss": 0.6508, "step": 5003 }, { "epoch": 0.52, "learning_rate": 9.811205477180841e-05, "loss": 0.7096, "step": 5004 }, { "epoch": 0.52, "learning_rate": 9.807834557819528e-05, "loss": 0.6914, "step": 5005 }, { "epoch": 0.52, "learning_rate": 9.804463660302085e-05, "loss": 0.6471, "step": 5006 }, { "epoch": 0.52, "learning_rate": 9.801092785011697e-05, "loss": 0.6724, "step": 5007 }, { "epoch": 0.52, "learning_rate": 9.79772193233153e-05, "loss": 0.674, "step": 5008 }, { "epoch": 0.52, "learning_rate": 9.794351102644759e-05, "loss": 0.6839, "step": 5009 }, { "epoch": 0.52, "learning_rate": 9.790980296334557e-05, "loss": 0.7509, "step": 5010 }, { "epoch": 0.52, "learning_rate": 9.787609513784084e-05, "loss": 0.6591, "step": 5011 }, { "epoch": 0.52, "learning_rate": 9.784238755376508e-05, "loss": 0.6321, "step": 5012 }, { "epoch": 0.52, "learning_rate": 9.780868021494995e-05, "loss": 0.6695, "step": 5013 }, { "epoch": 0.52, "learning_rate": 9.777497312522695e-05, "loss": 0.7017, "step": 5014 }, { "epoch": 0.52, "learning_rate": 9.774126628842772e-05, "loss": 0.6696, "step": 5015 }, { "epoch": 0.52, "learning_rate": 9.770755970838377e-05, "loss": 0.7071, "step": 5016 }, { "epoch": 0.52, "learning_rate": 9.767385338892657e-05, "loss": 0.6614, "step": 5017 }, { "epoch": 0.52, "learning_rate": 9.764014733388764e-05, "loss": 0.5755, "step": 5018 }, { "epoch": 0.52, "learning_rate": 9.760644154709834e-05, "loss": 0.7012, "step": 5019 }, { "epoch": 0.52, "learning_rate": 9.757273603239014e-05, "loss": 0.7013, "step": 5020 }, { "epoch": 0.52, "learning_rate": 9.753903079359447e-05, "loss": 0.7002, "step": 5021 }, { "epoch": 0.52, "learning_rate": 9.750532583454256e-05, "loss": 0.6717, "step": 5022 }, { "epoch": 0.52, "learning_rate": 9.747162115906582e-05, "loss": 0.6921, "step": 5023 }, { "epoch": 0.52, "learning_rate": 9.743791677099554e-05, "loss": 0.6899, "step": 5024 }, { "epoch": 0.52, "learning_rate": 9.74042126741629e-05, "loss": 0.6536, "step": 5025 }, { "epoch": 0.52, "learning_rate": 9.737050887239915e-05, "loss": 0.616, "step": 5026 }, { "epoch": 0.52, "learning_rate": 9.733680536953554e-05, "loss": 0.7144, "step": 5027 }, { "epoch": 0.52, "learning_rate": 9.73031021694031e-05, "loss": 0.6625, "step": 5028 }, { "epoch": 0.52, "learning_rate": 9.726939927583305e-05, "loss": 0.6497, "step": 5029 }, { "epoch": 0.52, "learning_rate": 9.723569669265646e-05, "loss": 0.688, "step": 5030 }, { "epoch": 0.52, "learning_rate": 9.720199442370432e-05, "loss": 0.6978, "step": 5031 }, { "epoch": 0.52, "learning_rate": 9.716829247280765e-05, "loss": 0.71, "step": 5032 }, { "epoch": 0.52, "learning_rate": 9.713459084379752e-05, "loss": 0.7048, "step": 5033 }, { "epoch": 0.52, "learning_rate": 9.710088954050475e-05, "loss": 0.6401, "step": 5034 }, { "epoch": 0.52, "learning_rate": 9.706718856676031e-05, "loss": 0.6304, "step": 5035 }, { "epoch": 0.52, "learning_rate": 9.703348792639508e-05, "loss": 0.636, "step": 5036 }, { "epoch": 0.52, "learning_rate": 9.699978762323979e-05, "loss": 0.6205, "step": 5037 }, { "epoch": 0.52, "learning_rate": 9.696608766112535e-05, "loss": 0.6489, "step": 5038 }, { "epoch": 0.52, "learning_rate": 9.69323880438824e-05, "loss": 0.6663, "step": 5039 }, { "epoch": 0.52, "learning_rate": 9.68986887753417e-05, "loss": 0.7187, "step": 5040 }, { "epoch": 0.52, "learning_rate": 9.686498985933397e-05, "loss": 0.6841, "step": 5041 }, { "epoch": 0.52, "learning_rate": 9.683129129968977e-05, "loss": 0.6173, "step": 5042 }, { "epoch": 0.52, "learning_rate": 9.679759310023969e-05, "loss": 0.639, "step": 5043 }, { "epoch": 0.53, "learning_rate": 9.676389526481434e-05, "loss": 0.7106, "step": 5044 }, { "epoch": 0.53, "learning_rate": 9.673019779724415e-05, "loss": 0.7223, "step": 5045 }, { "epoch": 0.53, "learning_rate": 9.669650070135963e-05, "loss": 0.6829, "step": 5046 }, { "epoch": 0.53, "learning_rate": 9.666280398099123e-05, "loss": 0.6258, "step": 5047 }, { "epoch": 0.53, "learning_rate": 9.662910763996928e-05, "loss": 0.6943, "step": 5048 }, { "epoch": 0.53, "learning_rate": 9.659541168212412e-05, "loss": 0.7077, "step": 5049 }, { "epoch": 0.53, "learning_rate": 9.65617161112861e-05, "loss": 0.6813, "step": 5050 }, { "epoch": 0.53, "learning_rate": 9.652802093128539e-05, "loss": 0.7176, "step": 5051 }, { "epoch": 0.53, "learning_rate": 9.649432614595223e-05, "loss": 0.6822, "step": 5052 }, { "epoch": 0.53, "learning_rate": 9.646063175911684e-05, "loss": 0.626, "step": 5053 }, { "epoch": 0.53, "learning_rate": 9.642693777460926e-05, "loss": 0.6573, "step": 5054 }, { "epoch": 0.53, "learning_rate": 9.639324419625956e-05, "loss": 0.6846, "step": 5055 }, { "epoch": 0.53, "learning_rate": 9.635955102789783e-05, "loss": 0.625, "step": 5056 }, { "epoch": 0.53, "learning_rate": 9.632585827335397e-05, "loss": 0.6848, "step": 5057 }, { "epoch": 0.53, "learning_rate": 9.629216593645797e-05, "loss": 0.6403, "step": 5058 }, { "epoch": 0.53, "learning_rate": 9.625847402103966e-05, "loss": 0.724, "step": 5059 }, { "epoch": 0.53, "learning_rate": 9.622478253092891e-05, "loss": 0.6809, "step": 5060 }, { "epoch": 0.53, "learning_rate": 9.619109146995551e-05, "loss": 0.7326, "step": 5061 }, { "epoch": 0.53, "learning_rate": 9.615740084194917e-05, "loss": 0.6495, "step": 5062 }, { "epoch": 0.53, "learning_rate": 9.612371065073959e-05, "loss": 0.6491, "step": 5063 }, { "epoch": 0.53, "learning_rate": 9.609002090015645e-05, "loss": 0.682, "step": 5064 }, { "epoch": 0.53, "learning_rate": 9.605633159402926e-05, "loss": 0.6753, "step": 5065 }, { "epoch": 0.53, "learning_rate": 9.602264273618762e-05, "loss": 0.6991, "step": 5066 }, { "epoch": 0.53, "learning_rate": 9.598895433046099e-05, "loss": 0.6849, "step": 5067 }, { "epoch": 0.53, "learning_rate": 9.595526638067883e-05, "loss": 0.7359, "step": 5068 }, { "epoch": 0.53, "learning_rate": 9.592157889067046e-05, "loss": 0.6498, "step": 5069 }, { "epoch": 0.53, "learning_rate": 9.588789186426531e-05, "loss": 0.6628, "step": 5070 }, { "epoch": 0.53, "learning_rate": 9.585420530529256e-05, "loss": 0.6553, "step": 5071 }, { "epoch": 0.53, "learning_rate": 9.58205192175815e-05, "loss": 0.6907, "step": 5072 }, { "epoch": 0.53, "learning_rate": 9.578683360496133e-05, "loss": 0.7037, "step": 5073 }, { "epoch": 0.53, "learning_rate": 9.575314847126107e-05, "loss": 0.6556, "step": 5074 }, { "epoch": 0.53, "learning_rate": 9.571946382030985e-05, "loss": 0.6268, "step": 5075 }, { "epoch": 0.53, "learning_rate": 9.56857796559367e-05, "loss": 0.5711, "step": 5076 }, { "epoch": 0.53, "learning_rate": 9.565209598197048e-05, "loss": 0.7014, "step": 5077 }, { "epoch": 0.53, "learning_rate": 9.56184128022402e-05, "loss": 0.7013, "step": 5078 }, { "epoch": 0.53, "learning_rate": 9.558473012057462e-05, "loss": 0.7214, "step": 5079 }, { "epoch": 0.53, "learning_rate": 9.555104794080255e-05, "loss": 0.6812, "step": 5080 }, { "epoch": 0.53, "learning_rate": 9.551736626675277e-05, "loss": 0.6421, "step": 5081 }, { "epoch": 0.53, "learning_rate": 9.548368510225384e-05, "loss": 0.6689, "step": 5082 }, { "epoch": 0.53, "learning_rate": 9.545000445113445e-05, "loss": 0.691, "step": 5083 }, { "epoch": 0.53, "learning_rate": 9.541632431722317e-05, "loss": 0.7403, "step": 5084 }, { "epoch": 0.53, "learning_rate": 9.538264470434844e-05, "loss": 0.7146, "step": 5085 }, { "epoch": 0.53, "learning_rate": 9.534896561633873e-05, "loss": 0.7175, "step": 5086 }, { "epoch": 0.53, "learning_rate": 9.531528705702243e-05, "loss": 0.7009, "step": 5087 }, { "epoch": 0.53, "learning_rate": 9.528160903022779e-05, "loss": 0.6654, "step": 5088 }, { "epoch": 0.53, "learning_rate": 9.524793153978311e-05, "loss": 0.6683, "step": 5089 }, { "epoch": 0.53, "learning_rate": 9.521425458951664e-05, "loss": 0.6094, "step": 5090 }, { "epoch": 0.53, "learning_rate": 9.51805781832564e-05, "loss": 0.6552, "step": 5091 }, { "epoch": 0.53, "learning_rate": 9.514690232483055e-05, "loss": 0.6948, "step": 5092 }, { "epoch": 0.53, "learning_rate": 9.511322701806707e-05, "loss": 0.6557, "step": 5093 }, { "epoch": 0.53, "learning_rate": 9.507955226679392e-05, "loss": 0.6437, "step": 5094 }, { "epoch": 0.53, "learning_rate": 9.504587807483894e-05, "loss": 0.7374, "step": 5095 }, { "epoch": 0.53, "learning_rate": 9.501220444603002e-05, "loss": 0.6452, "step": 5096 }, { "epoch": 0.53, "learning_rate": 9.497853138419484e-05, "loss": 0.6765, "step": 5097 }, { "epoch": 0.53, "learning_rate": 9.494485889316116e-05, "loss": 0.6896, "step": 5098 }, { "epoch": 0.53, "learning_rate": 9.491118697675653e-05, "loss": 0.6785, "step": 5099 }, { "epoch": 0.53, "learning_rate": 9.48775156388086e-05, "loss": 0.6482, "step": 5100 }, { "epoch": 0.53, "learning_rate": 9.484384488314482e-05, "loss": 0.6691, "step": 5101 }, { "epoch": 0.53, "learning_rate": 9.48101747135926e-05, "loss": 0.7502, "step": 5102 }, { "epoch": 0.53, "learning_rate": 9.477650513397932e-05, "loss": 0.7282, "step": 5103 }, { "epoch": 0.53, "learning_rate": 9.474283614813232e-05, "loss": 0.5957, "step": 5104 }, { "epoch": 0.53, "learning_rate": 9.470916775987873e-05, "loss": 0.6875, "step": 5105 }, { "epoch": 0.53, "learning_rate": 9.467549997304582e-05, "loss": 0.6561, "step": 5106 }, { "epoch": 0.53, "learning_rate": 9.464183279146063e-05, "loss": 0.7035, "step": 5107 }, { "epoch": 0.53, "learning_rate": 9.460816621895014e-05, "loss": 0.6097, "step": 5108 }, { "epoch": 0.53, "learning_rate": 9.457450025934136e-05, "loss": 0.6613, "step": 5109 }, { "epoch": 0.53, "learning_rate": 9.454083491646119e-05, "loss": 0.612, "step": 5110 }, { "epoch": 0.53, "learning_rate": 9.450717019413638e-05, "loss": 0.6532, "step": 5111 }, { "epoch": 0.53, "learning_rate": 9.447350609619374e-05, "loss": 0.665, "step": 5112 }, { "epoch": 0.53, "learning_rate": 9.443984262645993e-05, "loss": 0.6504, "step": 5113 }, { "epoch": 0.53, "learning_rate": 9.440617978876149e-05, "loss": 0.624, "step": 5114 }, { "epoch": 0.53, "learning_rate": 9.437251758692499e-05, "loss": 0.64, "step": 5115 }, { "epoch": 0.53, "learning_rate": 9.433885602477693e-05, "loss": 0.6816, "step": 5116 }, { "epoch": 0.53, "learning_rate": 9.430519510614362e-05, "loss": 0.6675, "step": 5117 }, { "epoch": 0.53, "learning_rate": 9.427153483485145e-05, "loss": 0.6985, "step": 5118 }, { "epoch": 0.53, "learning_rate": 9.423787521472659e-05, "loss": 0.6928, "step": 5119 }, { "epoch": 0.53, "learning_rate": 9.42042162495952e-05, "loss": 0.6812, "step": 5120 }, { "epoch": 0.53, "learning_rate": 9.417055794328344e-05, "loss": 0.6237, "step": 5121 }, { "epoch": 0.53, "learning_rate": 9.413690029961724e-05, "loss": 0.7109, "step": 5122 }, { "epoch": 0.53, "learning_rate": 9.410324332242257e-05, "loss": 0.6891, "step": 5123 }, { "epoch": 0.53, "learning_rate": 9.406958701552536e-05, "loss": 0.6526, "step": 5124 }, { "epoch": 0.53, "learning_rate": 9.403593138275132e-05, "loss": 0.701, "step": 5125 }, { "epoch": 0.53, "learning_rate": 9.400227642792615e-05, "loss": 0.7188, "step": 5126 }, { "epoch": 0.53, "learning_rate": 9.396862215487556e-05, "loss": 0.7195, "step": 5127 }, { "epoch": 0.53, "learning_rate": 9.3934968567425e-05, "loss": 0.6582, "step": 5128 }, { "epoch": 0.53, "learning_rate": 9.390131566940002e-05, "loss": 0.7308, "step": 5129 }, { "epoch": 0.53, "learning_rate": 9.386766346462607e-05, "loss": 0.6649, "step": 5130 }, { "epoch": 0.53, "learning_rate": 9.383401195692836e-05, "loss": 0.6848, "step": 5131 }, { "epoch": 0.53, "learning_rate": 9.380036115013217e-05, "loss": 0.6827, "step": 5132 }, { "epoch": 0.53, "learning_rate": 9.37667110480627e-05, "loss": 0.6555, "step": 5133 }, { "epoch": 0.53, "learning_rate": 9.373306165454496e-05, "loss": 0.7299, "step": 5134 }, { "epoch": 0.53, "learning_rate": 9.369941297340401e-05, "loss": 0.6305, "step": 5135 }, { "epoch": 0.53, "learning_rate": 9.366576500846478e-05, "loss": 0.6546, "step": 5136 }, { "epoch": 0.53, "learning_rate": 9.363211776355207e-05, "loss": 0.6577, "step": 5137 }, { "epoch": 0.53, "learning_rate": 9.359847124249065e-05, "loss": 0.6863, "step": 5138 }, { "epoch": 0.53, "learning_rate": 9.356482544910519e-05, "loss": 0.6609, "step": 5139 }, { "epoch": 0.54, "learning_rate": 9.353118038722027e-05, "loss": 0.7164, "step": 5140 }, { "epoch": 0.54, "learning_rate": 9.349753606066045e-05, "loss": 0.7228, "step": 5141 }, { "epoch": 0.54, "learning_rate": 9.346389247325008e-05, "loss": 0.6644, "step": 5142 }, { "epoch": 0.54, "learning_rate": 9.343024962881354e-05, "loss": 0.6794, "step": 5143 }, { "epoch": 0.54, "learning_rate": 9.339660753117513e-05, "loss": 0.71, "step": 5144 }, { "epoch": 0.54, "learning_rate": 9.336296618415896e-05, "loss": 0.662, "step": 5145 }, { "epoch": 0.54, "learning_rate": 9.332932559158912e-05, "loss": 0.6454, "step": 5146 }, { "epoch": 0.54, "learning_rate": 9.329568575728965e-05, "loss": 0.6354, "step": 5147 }, { "epoch": 0.54, "learning_rate": 9.326204668508442e-05, "loss": 0.666, "step": 5148 }, { "epoch": 0.54, "learning_rate": 9.322840837879727e-05, "loss": 0.5847, "step": 5149 }, { "epoch": 0.54, "learning_rate": 9.319477084225198e-05, "loss": 0.6488, "step": 5150 }, { "epoch": 0.54, "learning_rate": 9.316113407927218e-05, "loss": 0.6952, "step": 5151 }, { "epoch": 0.54, "learning_rate": 9.312749809368139e-05, "loss": 0.6895, "step": 5152 }, { "epoch": 0.54, "learning_rate": 9.309386288930318e-05, "loss": 0.7329, "step": 5153 }, { "epoch": 0.54, "learning_rate": 9.306022846996083e-05, "loss": 0.6903, "step": 5154 }, { "epoch": 0.54, "learning_rate": 9.302659483947768e-05, "loss": 0.6897, "step": 5155 }, { "epoch": 0.54, "learning_rate": 9.299296200167702e-05, "loss": 0.683, "step": 5156 }, { "epoch": 0.54, "learning_rate": 9.295932996038187e-05, "loss": 0.6827, "step": 5157 }, { "epoch": 0.54, "learning_rate": 9.292569871941532e-05, "loss": 0.7114, "step": 5158 }, { "epoch": 0.54, "learning_rate": 9.289206828260021e-05, "loss": 0.6502, "step": 5159 }, { "epoch": 0.54, "learning_rate": 9.285843865375949e-05, "loss": 0.6576, "step": 5160 }, { "epoch": 0.54, "learning_rate": 9.28248098367159e-05, "loss": 0.6697, "step": 5161 }, { "epoch": 0.54, "learning_rate": 9.279118183529204e-05, "loss": 0.6513, "step": 5162 }, { "epoch": 0.54, "learning_rate": 9.275755465331054e-05, "loss": 0.6756, "step": 5163 }, { "epoch": 0.54, "learning_rate": 9.272392829459386e-05, "loss": 0.6935, "step": 5164 }, { "epoch": 0.54, "learning_rate": 9.269030276296438e-05, "loss": 0.7012, "step": 5165 }, { "epoch": 0.54, "learning_rate": 9.265667806224436e-05, "loss": 0.6927, "step": 5166 }, { "epoch": 0.54, "learning_rate": 9.262305419625608e-05, "loss": 0.6722, "step": 5167 }, { "epoch": 0.54, "learning_rate": 9.258943116882153e-05, "loss": 0.7308, "step": 5168 }, { "epoch": 0.54, "learning_rate": 9.255580898376278e-05, "loss": 0.663, "step": 5169 }, { "epoch": 0.54, "learning_rate": 9.252218764490174e-05, "loss": 0.6448, "step": 5170 }, { "epoch": 0.54, "learning_rate": 9.24885671560602e-05, "loss": 0.6758, "step": 5171 }, { "epoch": 0.54, "learning_rate": 9.245494752105986e-05, "loss": 0.6587, "step": 5172 }, { "epoch": 0.54, "learning_rate": 9.242132874372239e-05, "loss": 0.6453, "step": 5173 }, { "epoch": 0.54, "learning_rate": 9.238771082786926e-05, "loss": 0.6603, "step": 5174 }, { "epoch": 0.54, "learning_rate": 9.235409377732192e-05, "loss": 0.6945, "step": 5175 }, { "epoch": 0.54, "learning_rate": 9.23204775959017e-05, "loss": 0.6899, "step": 5176 }, { "epoch": 0.54, "learning_rate": 9.22868622874298e-05, "loss": 0.7026, "step": 5177 }, { "epoch": 0.54, "learning_rate": 9.225324785572738e-05, "loss": 0.7426, "step": 5178 }, { "epoch": 0.54, "learning_rate": 9.221963430461542e-05, "loss": 0.6639, "step": 5179 }, { "epoch": 0.54, "learning_rate": 9.218602163791488e-05, "loss": 0.6906, "step": 5180 }, { "epoch": 0.54, "learning_rate": 9.215240985944662e-05, "loss": 0.7799, "step": 5181 }, { "epoch": 0.54, "learning_rate": 9.211879897303128e-05, "loss": 0.6546, "step": 5182 }, { "epoch": 0.54, "learning_rate": 9.208518898248954e-05, "loss": 0.6664, "step": 5183 }, { "epoch": 0.54, "learning_rate": 9.205157989164195e-05, "loss": 0.6634, "step": 5184 }, { "epoch": 0.54, "learning_rate": 9.201797170430885e-05, "loss": 0.6868, "step": 5185 }, { "epoch": 0.54, "learning_rate": 9.198436442431059e-05, "loss": 0.6837, "step": 5186 }, { "epoch": 0.54, "learning_rate": 9.195075805546745e-05, "loss": 0.7481, "step": 5187 }, { "epoch": 0.54, "learning_rate": 9.191715260159943e-05, "loss": 0.6796, "step": 5188 }, { "epoch": 0.54, "learning_rate": 9.188354806652661e-05, "loss": 0.6796, "step": 5189 }, { "epoch": 0.54, "learning_rate": 9.18499444540689e-05, "loss": 0.7317, "step": 5190 }, { "epoch": 0.54, "learning_rate": 9.181634176804604e-05, "loss": 0.6737, "step": 5191 }, { "epoch": 0.54, "learning_rate": 9.178274001227773e-05, "loss": 0.5913, "step": 5192 }, { "epoch": 0.54, "learning_rate": 9.174913919058364e-05, "loss": 0.6685, "step": 5193 }, { "epoch": 0.54, "learning_rate": 9.171553930678312e-05, "loss": 0.646, "step": 5194 }, { "epoch": 0.54, "learning_rate": 9.168194036469565e-05, "loss": 0.635, "step": 5195 }, { "epoch": 0.54, "learning_rate": 9.164834236814048e-05, "loss": 0.6398, "step": 5196 }, { "epoch": 0.54, "learning_rate": 9.161474532093669e-05, "loss": 0.613, "step": 5197 }, { "epoch": 0.54, "learning_rate": 9.158114922690343e-05, "loss": 0.7029, "step": 5198 }, { "epoch": 0.54, "learning_rate": 9.154755408985958e-05, "loss": 0.6846, "step": 5199 }, { "epoch": 0.54, "learning_rate": 9.151395991362397e-05, "loss": 0.7379, "step": 5200 }, { "epoch": 0.54, "learning_rate": 9.14803667020154e-05, "loss": 0.6981, "step": 5201 }, { "epoch": 0.54, "learning_rate": 9.144677445885241e-05, "loss": 0.6781, "step": 5202 }, { "epoch": 0.54, "learning_rate": 9.14131831879535e-05, "loss": 0.6972, "step": 5203 }, { "epoch": 0.54, "learning_rate": 9.137959289313714e-05, "loss": 0.6607, "step": 5204 }, { "epoch": 0.54, "learning_rate": 9.134600357822152e-05, "loss": 0.6771, "step": 5205 }, { "epoch": 0.54, "learning_rate": 9.131241524702486e-05, "loss": 0.5998, "step": 5206 }, { "epoch": 0.54, "learning_rate": 9.127882790336525e-05, "loss": 0.6154, "step": 5207 }, { "epoch": 0.54, "learning_rate": 9.124524155106059e-05, "loss": 0.6848, "step": 5208 }, { "epoch": 0.54, "learning_rate": 9.121165619392871e-05, "loss": 0.7275, "step": 5209 }, { "epoch": 0.54, "learning_rate": 9.117807183578739e-05, "loss": 0.7264, "step": 5210 }, { "epoch": 0.54, "learning_rate": 9.114448848045415e-05, "loss": 0.7029, "step": 5211 }, { "epoch": 0.54, "learning_rate": 9.111090613174653e-05, "loss": 0.6819, "step": 5212 }, { "epoch": 0.54, "learning_rate": 9.107732479348198e-05, "loss": 0.6812, "step": 5213 }, { "epoch": 0.54, "learning_rate": 9.104374446947767e-05, "loss": 0.6713, "step": 5214 }, { "epoch": 0.54, "learning_rate": 9.101016516355075e-05, "loss": 0.7466, "step": 5215 }, { "epoch": 0.54, "learning_rate": 9.097658687951832e-05, "loss": 0.6656, "step": 5216 }, { "epoch": 0.54, "learning_rate": 9.094300962119723e-05, "loss": 0.695, "step": 5217 }, { "epoch": 0.54, "learning_rate": 9.090943339240435e-05, "loss": 0.6782, "step": 5218 }, { "epoch": 0.54, "learning_rate": 9.08758581969563e-05, "loss": 0.7453, "step": 5219 }, { "epoch": 0.54, "learning_rate": 9.084228403866965e-05, "loss": 0.7306, "step": 5220 }, { "epoch": 0.54, "learning_rate": 9.080871092136093e-05, "loss": 0.703, "step": 5221 }, { "epoch": 0.54, "learning_rate": 9.077513884884639e-05, "loss": 0.6549, "step": 5222 }, { "epoch": 0.54, "learning_rate": 9.074156782494225e-05, "loss": 0.6455, "step": 5223 }, { "epoch": 0.54, "learning_rate": 9.070799785346465e-05, "loss": 0.6314, "step": 5224 }, { "epoch": 0.54, "learning_rate": 9.067442893822949e-05, "loss": 0.6374, "step": 5225 }, { "epoch": 0.54, "learning_rate": 9.064086108305267e-05, "loss": 0.6757, "step": 5226 }, { "epoch": 0.54, "learning_rate": 9.060729429174995e-05, "loss": 0.6892, "step": 5227 }, { "epoch": 0.54, "learning_rate": 9.057372856813691e-05, "loss": 0.6239, "step": 5228 }, { "epoch": 0.54, "learning_rate": 9.054016391602898e-05, "loss": 0.6771, "step": 5229 }, { "epoch": 0.54, "learning_rate": 9.050660033924166e-05, "loss": 0.6828, "step": 5230 }, { "epoch": 0.54, "learning_rate": 9.047303784159006e-05, "loss": 0.6542, "step": 5231 }, { "epoch": 0.54, "learning_rate": 9.043947642688939e-05, "loss": 0.6566, "step": 5232 }, { "epoch": 0.54, "learning_rate": 9.040591609895466e-05, "loss": 0.6843, "step": 5233 }, { "epoch": 0.54, "learning_rate": 9.037235686160069e-05, "loss": 0.6587, "step": 5234 }, { "epoch": 0.54, "learning_rate": 9.033879871864224e-05, "loss": 0.6676, "step": 5235 }, { "epoch": 0.55, "learning_rate": 9.030524167389399e-05, "loss": 0.62, "step": 5236 }, { "epoch": 0.55, "learning_rate": 9.027168573117038e-05, "loss": 0.6746, "step": 5237 }, { "epoch": 0.55, "learning_rate": 9.023813089428585e-05, "loss": 0.6658, "step": 5238 }, { "epoch": 0.55, "learning_rate": 9.020457716705457e-05, "loss": 0.652, "step": 5239 }, { "epoch": 0.55, "learning_rate": 9.017102455329074e-05, "loss": 0.6732, "step": 5240 }, { "epoch": 0.55, "learning_rate": 9.013747305680835e-05, "loss": 0.6947, "step": 5241 }, { "epoch": 0.55, "learning_rate": 9.010392268142124e-05, "loss": 0.6695, "step": 5242 }, { "epoch": 0.55, "learning_rate": 9.007037343094317e-05, "loss": 0.6997, "step": 5243 }, { "epoch": 0.55, "learning_rate": 9.00368253091878e-05, "loss": 0.6968, "step": 5244 }, { "epoch": 0.55, "learning_rate": 9.000327831996854e-05, "loss": 0.6783, "step": 5245 }, { "epoch": 0.55, "learning_rate": 8.996973246709882e-05, "loss": 0.6979, "step": 5246 }, { "epoch": 0.55, "learning_rate": 8.993618775439183e-05, "loss": 0.684, "step": 5247 }, { "epoch": 0.55, "learning_rate": 8.99026441856607e-05, "loss": 0.6649, "step": 5248 }, { "epoch": 0.55, "learning_rate": 8.986910176471837e-05, "loss": 0.6272, "step": 5249 }, { "epoch": 0.55, "learning_rate": 8.983556049537773e-05, "loss": 0.707, "step": 5250 }, { "epoch": 0.55, "learning_rate": 8.980202038145141e-05, "loss": 0.6793, "step": 5251 }, { "epoch": 0.55, "learning_rate": 8.976848142675209e-05, "loss": 0.6727, "step": 5252 }, { "epoch": 0.55, "learning_rate": 8.973494363509214e-05, "loss": 0.6515, "step": 5253 }, { "epoch": 0.55, "learning_rate": 8.97014070102839e-05, "loss": 0.6717, "step": 5254 }, { "epoch": 0.55, "learning_rate": 8.966787155613954e-05, "loss": 0.701, "step": 5255 }, { "epoch": 0.55, "learning_rate": 8.963433727647117e-05, "loss": 0.6619, "step": 5256 }, { "epoch": 0.55, "learning_rate": 8.960080417509061e-05, "loss": 0.7005, "step": 5257 }, { "epoch": 0.55, "learning_rate": 8.956727225580974e-05, "loss": 0.6648, "step": 5258 }, { "epoch": 0.55, "learning_rate": 8.95337415224401e-05, "loss": 0.6735, "step": 5259 }, { "epoch": 0.55, "learning_rate": 8.95002119787933e-05, "loss": 0.66, "step": 5260 }, { "epoch": 0.55, "learning_rate": 8.94666836286807e-05, "loss": 0.7259, "step": 5261 }, { "epoch": 0.55, "learning_rate": 8.943315647591347e-05, "loss": 0.6193, "step": 5262 }, { "epoch": 0.55, "learning_rate": 8.939963052430278e-05, "loss": 0.6727, "step": 5263 }, { "epoch": 0.55, "learning_rate": 8.936610577765962e-05, "loss": 0.6168, "step": 5264 }, { "epoch": 0.55, "learning_rate": 8.933258223979474e-05, "loss": 0.6591, "step": 5265 }, { "epoch": 0.55, "learning_rate": 8.92990599145189e-05, "loss": 0.6093, "step": 5266 }, { "epoch": 0.55, "learning_rate": 8.926553880564267e-05, "loss": 0.7057, "step": 5267 }, { "epoch": 0.55, "learning_rate": 8.923201891697639e-05, "loss": 0.6687, "step": 5268 }, { "epoch": 0.55, "learning_rate": 8.91985002523304e-05, "loss": 0.6812, "step": 5269 }, { "epoch": 0.55, "learning_rate": 8.916498281551486e-05, "loss": 0.653, "step": 5270 }, { "epoch": 0.55, "learning_rate": 8.91314666103397e-05, "loss": 0.6125, "step": 5271 }, { "epoch": 0.55, "learning_rate": 8.909795164061487e-05, "loss": 0.6399, "step": 5272 }, { "epoch": 0.55, "learning_rate": 8.906443791015004e-05, "loss": 0.6935, "step": 5273 }, { "epoch": 0.55, "learning_rate": 8.903092542275474e-05, "loss": 0.6154, "step": 5274 }, { "epoch": 0.55, "learning_rate": 8.899741418223848e-05, "loss": 0.7094, "step": 5275 }, { "epoch": 0.55, "learning_rate": 8.896390419241057e-05, "loss": 0.6136, "step": 5276 }, { "epoch": 0.55, "learning_rate": 8.89303954570801e-05, "loss": 0.7297, "step": 5277 }, { "epoch": 0.55, "learning_rate": 8.889688798005617e-05, "loss": 0.6347, "step": 5278 }, { "epoch": 0.55, "learning_rate": 8.886338176514756e-05, "loss": 0.7267, "step": 5279 }, { "epoch": 0.55, "learning_rate": 8.882987681616301e-05, "loss": 0.691, "step": 5280 }, { "epoch": 0.55, "learning_rate": 8.879637313691116e-05, "loss": 0.6716, "step": 5281 }, { "epoch": 0.55, "learning_rate": 8.876287073120037e-05, "loss": 0.7128, "step": 5282 }, { "epoch": 0.55, "learning_rate": 8.872936960283897e-05, "loss": 0.7029, "step": 5283 }, { "epoch": 0.55, "learning_rate": 8.869586975563518e-05, "loss": 0.6688, "step": 5284 }, { "epoch": 0.55, "learning_rate": 8.866237119339687e-05, "loss": 0.7232, "step": 5285 }, { "epoch": 0.55, "learning_rate": 8.862887391993196e-05, "loss": 0.6185, "step": 5286 }, { "epoch": 0.55, "learning_rate": 8.859537793904821e-05, "loss": 0.6593, "step": 5287 }, { "epoch": 0.55, "learning_rate": 8.856188325455307e-05, "loss": 0.6771, "step": 5288 }, { "epoch": 0.55, "learning_rate": 8.852838987025403e-05, "loss": 0.6852, "step": 5289 }, { "epoch": 0.55, "learning_rate": 8.849489778995837e-05, "loss": 0.6639, "step": 5290 }, { "epoch": 0.55, "learning_rate": 8.846140701747314e-05, "loss": 0.681, "step": 5291 }, { "epoch": 0.55, "learning_rate": 8.842791755660537e-05, "loss": 0.6593, "step": 5292 }, { "epoch": 0.55, "learning_rate": 8.83944294111619e-05, "loss": 0.6785, "step": 5293 }, { "epoch": 0.55, "learning_rate": 8.83609425849493e-05, "loss": 0.6657, "step": 5294 }, { "epoch": 0.55, "learning_rate": 8.832745708177417e-05, "loss": 0.684, "step": 5295 }, { "epoch": 0.55, "learning_rate": 8.829397290544291e-05, "loss": 0.6738, "step": 5296 }, { "epoch": 0.55, "learning_rate": 8.826049005976166e-05, "loss": 0.6823, "step": 5297 }, { "epoch": 0.55, "learning_rate": 8.822700854853656e-05, "loss": 0.6529, "step": 5298 }, { "epoch": 0.55, "learning_rate": 8.819352837557349e-05, "loss": 0.6893, "step": 5299 }, { "epoch": 0.55, "learning_rate": 8.816004954467818e-05, "loss": 0.6847, "step": 5300 }, { "epoch": 0.55, "learning_rate": 8.812657205965633e-05, "loss": 0.6976, "step": 5301 }, { "epoch": 0.55, "learning_rate": 8.809309592431332e-05, "loss": 0.6076, "step": 5302 }, { "epoch": 0.55, "learning_rate": 8.805962114245448e-05, "loss": 0.658, "step": 5303 }, { "epoch": 0.55, "learning_rate": 8.802614771788502e-05, "loss": 0.7218, "step": 5304 }, { "epoch": 0.55, "learning_rate": 8.799267565440987e-05, "loss": 0.6552, "step": 5305 }, { "epoch": 0.55, "learning_rate": 8.795920495583387e-05, "loss": 0.6872, "step": 5306 }, { "epoch": 0.55, "learning_rate": 8.792573562596178e-05, "loss": 0.6919, "step": 5307 }, { "epoch": 0.55, "learning_rate": 8.789226766859805e-05, "loss": 0.6449, "step": 5308 }, { "epoch": 0.55, "learning_rate": 8.785880108754709e-05, "loss": 0.7113, "step": 5309 }, { "epoch": 0.55, "learning_rate": 8.782533588661315e-05, "loss": 0.6477, "step": 5310 }, { "epoch": 0.55, "learning_rate": 8.779187206960026e-05, "loss": 0.6888, "step": 5311 }, { "epoch": 0.55, "learning_rate": 8.77584096403123e-05, "loss": 0.6827, "step": 5312 }, { "epoch": 0.55, "learning_rate": 8.772494860255312e-05, "loss": 0.7056, "step": 5313 }, { "epoch": 0.55, "learning_rate": 8.769148896012617e-05, "loss": 0.7329, "step": 5314 }, { "epoch": 0.55, "learning_rate": 8.765803071683497e-05, "loss": 0.6305, "step": 5315 }, { "epoch": 0.55, "learning_rate": 8.76245738764828e-05, "loss": 0.707, "step": 5316 }, { "epoch": 0.55, "learning_rate": 8.759111844287276e-05, "loss": 0.6942, "step": 5317 }, { "epoch": 0.55, "learning_rate": 8.755766441980778e-05, "loss": 0.6884, "step": 5318 }, { "epoch": 0.55, "learning_rate": 8.752421181109065e-05, "loss": 0.6747, "step": 5319 }, { "epoch": 0.55, "learning_rate": 8.749076062052402e-05, "loss": 0.6031, "step": 5320 }, { "epoch": 0.55, "learning_rate": 8.745731085191037e-05, "loss": 0.7063, "step": 5321 }, { "epoch": 0.55, "learning_rate": 8.742386250905199e-05, "loss": 0.6274, "step": 5322 }, { "epoch": 0.55, "learning_rate": 8.739041559575104e-05, "loss": 0.7206, "step": 5323 }, { "epoch": 0.55, "learning_rate": 8.735697011580951e-05, "loss": 0.6923, "step": 5324 }, { "epoch": 0.55, "learning_rate": 8.73235260730292e-05, "loss": 0.5656, "step": 5325 }, { "epoch": 0.55, "learning_rate": 8.729008347121177e-05, "loss": 0.6964, "step": 5326 }, { "epoch": 0.55, "learning_rate": 8.725664231415876e-05, "loss": 0.7222, "step": 5327 }, { "epoch": 0.55, "learning_rate": 8.722320260567143e-05, "loss": 0.7078, "step": 5328 }, { "epoch": 0.55, "learning_rate": 8.7189764349551e-05, "loss": 0.6159, "step": 5329 }, { "epoch": 0.55, "learning_rate": 8.715632754959846e-05, "loss": 0.7024, "step": 5330 }, { "epoch": 0.55, "learning_rate": 8.712289220961463e-05, "loss": 0.6142, "step": 5331 }, { "epoch": 0.56, "learning_rate": 8.708945833340017e-05, "loss": 0.7009, "step": 5332 }, { "epoch": 0.56, "learning_rate": 8.705602592475563e-05, "loss": 0.623, "step": 5333 }, { "epoch": 0.56, "learning_rate": 8.702259498748129e-05, "loss": 0.625, "step": 5334 }, { "epoch": 0.56, "learning_rate": 8.698916552537734e-05, "loss": 0.6511, "step": 5335 }, { "epoch": 0.56, "learning_rate": 8.695573754224381e-05, "loss": 0.6526, "step": 5336 }, { "epoch": 0.56, "learning_rate": 8.692231104188052e-05, "loss": 0.736, "step": 5337 }, { "epoch": 0.56, "learning_rate": 8.688888602808711e-05, "loss": 0.701, "step": 5338 }, { "epoch": 0.56, "learning_rate": 8.685546250466305e-05, "loss": 0.6867, "step": 5339 }, { "epoch": 0.56, "learning_rate": 8.682204047540772e-05, "loss": 0.6826, "step": 5340 }, { "epoch": 0.56, "learning_rate": 8.678861994412031e-05, "loss": 0.6944, "step": 5341 }, { "epoch": 0.56, "learning_rate": 8.67552009145997e-05, "loss": 0.6721, "step": 5342 }, { "epoch": 0.56, "learning_rate": 8.672178339064478e-05, "loss": 0.6415, "step": 5343 }, { "epoch": 0.56, "learning_rate": 8.66883673760542e-05, "loss": 0.6533, "step": 5344 }, { "epoch": 0.56, "learning_rate": 8.665495287462636e-05, "loss": 0.6952, "step": 5345 }, { "epoch": 0.56, "learning_rate": 8.662153989015962e-05, "loss": 0.6762, "step": 5346 }, { "epoch": 0.56, "learning_rate": 8.658812842645214e-05, "loss": 0.6338, "step": 5347 }, { "epoch": 0.56, "learning_rate": 8.655471848730177e-05, "loss": 0.6914, "step": 5348 }, { "epoch": 0.56, "learning_rate": 8.652131007650639e-05, "loss": 0.7174, "step": 5349 }, { "epoch": 0.56, "learning_rate": 8.64879031978636e-05, "loss": 0.6832, "step": 5350 }, { "epoch": 0.56, "learning_rate": 8.645449785517074e-05, "loss": 0.6806, "step": 5351 }, { "epoch": 0.56, "learning_rate": 8.642109405222515e-05, "loss": 0.7035, "step": 5352 }, { "epoch": 0.56, "learning_rate": 8.638769179282394e-05, "loss": 0.6517, "step": 5353 }, { "epoch": 0.56, "learning_rate": 8.635429108076392e-05, "loss": 0.7014, "step": 5354 }, { "epoch": 0.56, "learning_rate": 8.632089191984191e-05, "loss": 0.617, "step": 5355 }, { "epoch": 0.56, "learning_rate": 8.628749431385448e-05, "loss": 0.6535, "step": 5356 }, { "epoch": 0.56, "learning_rate": 8.625409826659791e-05, "loss": 0.6633, "step": 5357 }, { "epoch": 0.56, "learning_rate": 8.62207037818685e-05, "loss": 0.6308, "step": 5358 }, { "epoch": 0.56, "learning_rate": 8.618731086346219e-05, "loss": 0.6433, "step": 5359 }, { "epoch": 0.56, "learning_rate": 8.615391951517489e-05, "loss": 0.6859, "step": 5360 }, { "epoch": 0.56, "learning_rate": 8.612052974080227e-05, "loss": 0.6826, "step": 5361 }, { "epoch": 0.56, "learning_rate": 8.608714154413978e-05, "loss": 0.7146, "step": 5362 }, { "epoch": 0.56, "learning_rate": 8.605375492898275e-05, "loss": 0.6597, "step": 5363 }, { "epoch": 0.56, "learning_rate": 8.602036989912634e-05, "loss": 0.7146, "step": 5364 }, { "epoch": 0.56, "learning_rate": 8.598698645836543e-05, "loss": 0.7326, "step": 5365 }, { "epoch": 0.56, "learning_rate": 8.595360461049484e-05, "loss": 0.718, "step": 5366 }, { "epoch": 0.56, "learning_rate": 8.592022435930918e-05, "loss": 0.6969, "step": 5367 }, { "epoch": 0.56, "learning_rate": 8.588684570860281e-05, "loss": 0.618, "step": 5368 }, { "epoch": 0.56, "learning_rate": 8.585346866216996e-05, "loss": 0.6663, "step": 5369 }, { "epoch": 0.56, "learning_rate": 8.582009322380474e-05, "loss": 0.5742, "step": 5370 }, { "epoch": 0.56, "learning_rate": 8.578671939730088e-05, "loss": 0.6858, "step": 5371 }, { "epoch": 0.56, "learning_rate": 8.575334718645214e-05, "loss": 0.6996, "step": 5372 }, { "epoch": 0.56, "learning_rate": 8.571997659505207e-05, "loss": 0.7017, "step": 5373 }, { "epoch": 0.56, "learning_rate": 8.568660762689385e-05, "loss": 0.7869, "step": 5374 }, { "epoch": 0.56, "learning_rate": 8.565324028577069e-05, "loss": 0.6432, "step": 5375 }, { "epoch": 0.56, "learning_rate": 8.561987457547554e-05, "loss": 0.6628, "step": 5376 }, { "epoch": 0.56, "learning_rate": 8.558651049980109e-05, "loss": 0.6773, "step": 5377 }, { "epoch": 0.56, "learning_rate": 8.555314806253997e-05, "loss": 0.6845, "step": 5378 }, { "epoch": 0.56, "learning_rate": 8.551978726748449e-05, "loss": 0.6643, "step": 5379 }, { "epoch": 0.56, "learning_rate": 8.548642811842689e-05, "loss": 0.6576, "step": 5380 }, { "epoch": 0.56, "learning_rate": 8.545307061915921e-05, "loss": 0.6971, "step": 5381 }, { "epoch": 0.56, "learning_rate": 8.541971477347324e-05, "loss": 0.6479, "step": 5382 }, { "epoch": 0.56, "learning_rate": 8.538636058516058e-05, "loss": 0.7094, "step": 5383 }, { "epoch": 0.56, "learning_rate": 8.535300805801273e-05, "loss": 0.658, "step": 5384 }, { "epoch": 0.56, "learning_rate": 8.531965719582092e-05, "loss": 0.6485, "step": 5385 }, { "epoch": 0.56, "learning_rate": 8.528630800237618e-05, "loss": 0.6812, "step": 5386 }, { "epoch": 0.56, "learning_rate": 8.52529604814695e-05, "loss": 0.6766, "step": 5387 }, { "epoch": 0.56, "learning_rate": 8.521961463689144e-05, "loss": 0.5918, "step": 5388 }, { "epoch": 0.56, "learning_rate": 8.518627047243254e-05, "loss": 0.6859, "step": 5389 }, { "epoch": 0.56, "learning_rate": 8.515292799188315e-05, "loss": 0.7042, "step": 5390 }, { "epoch": 0.56, "learning_rate": 8.511958719903332e-05, "loss": 0.6476, "step": 5391 }, { "epoch": 0.56, "learning_rate": 8.508624809767297e-05, "loss": 0.6271, "step": 5392 }, { "epoch": 0.56, "learning_rate": 8.505291069159192e-05, "loss": 0.7048, "step": 5393 }, { "epoch": 0.56, "learning_rate": 8.501957498457962e-05, "loss": 0.6701, "step": 5394 }, { "epoch": 0.56, "learning_rate": 8.498624098042541e-05, "loss": 0.6675, "step": 5395 }, { "epoch": 0.56, "learning_rate": 8.495290868291852e-05, "loss": 0.695, "step": 5396 }, { "epoch": 0.56, "learning_rate": 8.491957809584781e-05, "loss": 0.6736, "step": 5397 }, { "epoch": 0.56, "learning_rate": 8.488624922300213e-05, "loss": 0.6667, "step": 5398 }, { "epoch": 0.56, "learning_rate": 8.485292206816995e-05, "loss": 0.7376, "step": 5399 }, { "epoch": 0.56, "learning_rate": 8.481959663513972e-05, "loss": 0.7108, "step": 5400 }, { "epoch": 0.56, "learning_rate": 8.478627292769959e-05, "loss": 0.6896, "step": 5401 }, { "epoch": 0.56, "learning_rate": 8.475295094963756e-05, "loss": 0.6258, "step": 5402 }, { "epoch": 0.56, "learning_rate": 8.471963070474134e-05, "loss": 0.6877, "step": 5403 }, { "epoch": 0.56, "learning_rate": 8.468631219679863e-05, "loss": 0.6998, "step": 5404 }, { "epoch": 0.56, "learning_rate": 8.465299542959672e-05, "loss": 0.7097, "step": 5405 }, { "epoch": 0.56, "learning_rate": 8.461968040692286e-05, "loss": 0.6931, "step": 5406 }, { "epoch": 0.56, "learning_rate": 8.458636713256401e-05, "loss": 0.6807, "step": 5407 }, { "epoch": 0.56, "learning_rate": 8.455305561030697e-05, "loss": 0.6332, "step": 5408 }, { "epoch": 0.56, "learning_rate": 8.451974584393832e-05, "loss": 0.7256, "step": 5409 }, { "epoch": 0.56, "learning_rate": 8.448643783724452e-05, "loss": 0.6231, "step": 5410 }, { "epoch": 0.56, "learning_rate": 8.445313159401169e-05, "loss": 0.6595, "step": 5411 }, { "epoch": 0.56, "learning_rate": 8.441982711802584e-05, "loss": 0.6743, "step": 5412 }, { "epoch": 0.56, "learning_rate": 8.438652441307284e-05, "loss": 0.6765, "step": 5413 }, { "epoch": 0.56, "learning_rate": 8.435322348293817e-05, "loss": 0.6575, "step": 5414 }, { "epoch": 0.56, "learning_rate": 8.431992433140726e-05, "loss": 0.6801, "step": 5415 }, { "epoch": 0.56, "learning_rate": 8.428662696226536e-05, "loss": 0.6245, "step": 5416 }, { "epoch": 0.56, "learning_rate": 8.425333137929736e-05, "loss": 0.6665, "step": 5417 }, { "epoch": 0.56, "learning_rate": 8.422003758628813e-05, "loss": 0.6693, "step": 5418 }, { "epoch": 0.56, "learning_rate": 8.418674558702216e-05, "loss": 0.643, "step": 5419 }, { "epoch": 0.56, "learning_rate": 8.415345538528389e-05, "loss": 0.669, "step": 5420 }, { "epoch": 0.56, "learning_rate": 8.41201669848575e-05, "loss": 0.6431, "step": 5421 }, { "epoch": 0.56, "learning_rate": 8.408688038952687e-05, "loss": 0.6962, "step": 5422 }, { "epoch": 0.56, "learning_rate": 8.405359560307584e-05, "loss": 0.6493, "step": 5423 }, { "epoch": 0.56, "learning_rate": 8.402031262928798e-05, "loss": 0.7135, "step": 5424 }, { "epoch": 0.56, "learning_rate": 8.398703147194657e-05, "loss": 0.701, "step": 5425 }, { "epoch": 0.56, "learning_rate": 8.39537521348348e-05, "loss": 0.6393, "step": 5426 }, { "epoch": 0.56, "learning_rate": 8.392047462173563e-05, "loss": 0.6989, "step": 5427 }, { "epoch": 0.57, "learning_rate": 8.388719893643169e-05, "loss": 0.6441, "step": 5428 }, { "epoch": 0.57, "learning_rate": 8.385392508270557e-05, "loss": 0.7128, "step": 5429 }, { "epoch": 0.57, "learning_rate": 8.382065306433963e-05, "loss": 0.67, "step": 5430 }, { "epoch": 0.57, "learning_rate": 8.378738288511587e-05, "loss": 0.7299, "step": 5431 }, { "epoch": 0.57, "learning_rate": 8.375411454881626e-05, "loss": 0.6731, "step": 5432 }, { "epoch": 0.57, "learning_rate": 8.372084805922245e-05, "loss": 0.6611, "step": 5433 }, { "epoch": 0.57, "learning_rate": 8.368758342011593e-05, "loss": 0.6795, "step": 5434 }, { "epoch": 0.57, "learning_rate": 8.365432063527795e-05, "loss": 0.687, "step": 5435 }, { "epoch": 0.57, "learning_rate": 8.362105970848961e-05, "loss": 0.6243, "step": 5436 }, { "epoch": 0.57, "learning_rate": 8.358780064353168e-05, "loss": 0.6864, "step": 5437 }, { "epoch": 0.57, "learning_rate": 8.355454344418487e-05, "loss": 0.6965, "step": 5438 }, { "epoch": 0.57, "learning_rate": 8.352128811422952e-05, "loss": 0.6622, "step": 5439 }, { "epoch": 0.57, "learning_rate": 8.348803465744591e-05, "loss": 0.6923, "step": 5440 }, { "epoch": 0.57, "learning_rate": 8.345478307761401e-05, "loss": 0.7019, "step": 5441 }, { "epoch": 0.57, "learning_rate": 8.342153337851356e-05, "loss": 0.6928, "step": 5442 }, { "epoch": 0.57, "learning_rate": 8.338828556392415e-05, "loss": 0.6441, "step": 5443 }, { "epoch": 0.57, "learning_rate": 8.33550396376252e-05, "loss": 0.5597, "step": 5444 }, { "epoch": 0.57, "learning_rate": 8.332179560339573e-05, "loss": 0.7165, "step": 5445 }, { "epoch": 0.57, "learning_rate": 8.328855346501476e-05, "loss": 0.6765, "step": 5446 }, { "epoch": 0.57, "learning_rate": 8.325531322626098e-05, "loss": 0.679, "step": 5447 }, { "epoch": 0.57, "learning_rate": 8.322207489091282e-05, "loss": 0.6884, "step": 5448 }, { "epoch": 0.57, "learning_rate": 8.318883846274859e-05, "loss": 0.672, "step": 5449 }, { "epoch": 0.57, "learning_rate": 8.31556039455464e-05, "loss": 0.7532, "step": 5450 }, { "epoch": 0.57, "learning_rate": 8.312237134308402e-05, "loss": 0.6395, "step": 5451 }, { "epoch": 0.57, "learning_rate": 8.308914065913911e-05, "loss": 0.7509, "step": 5452 }, { "epoch": 0.57, "learning_rate": 8.305591189748909e-05, "loss": 0.779, "step": 5453 }, { "epoch": 0.57, "learning_rate": 8.302268506191108e-05, "loss": 0.6435, "step": 5454 }, { "epoch": 0.57, "learning_rate": 8.29894601561821e-05, "loss": 0.7065, "step": 5455 }, { "epoch": 0.57, "learning_rate": 8.295623718407892e-05, "loss": 0.7111, "step": 5456 }, { "epoch": 0.57, "learning_rate": 8.292301614937801e-05, "loss": 0.6693, "step": 5457 }, { "epoch": 0.57, "learning_rate": 8.288979705585575e-05, "loss": 0.7385, "step": 5458 }, { "epoch": 0.57, "learning_rate": 8.285657990728816e-05, "loss": 0.6408, "step": 5459 }, { "epoch": 0.57, "learning_rate": 8.282336470745112e-05, "loss": 0.6305, "step": 5460 }, { "epoch": 0.57, "learning_rate": 8.279015146012031e-05, "loss": 0.7227, "step": 5461 }, { "epoch": 0.57, "learning_rate": 8.27569401690711e-05, "loss": 0.5966, "step": 5462 }, { "epoch": 0.57, "learning_rate": 8.272373083807872e-05, "loss": 0.6741, "step": 5463 }, { "epoch": 0.57, "learning_rate": 8.269052347091822e-05, "loss": 0.745, "step": 5464 }, { "epoch": 0.57, "learning_rate": 8.265731807136423e-05, "loss": 0.7217, "step": 5465 }, { "epoch": 0.57, "learning_rate": 8.262411464319134e-05, "loss": 0.6995, "step": 5466 }, { "epoch": 0.57, "learning_rate": 8.259091319017389e-05, "loss": 0.6738, "step": 5467 }, { "epoch": 0.57, "learning_rate": 8.255771371608588e-05, "loss": 0.5852, "step": 5468 }, { "epoch": 0.57, "learning_rate": 8.252451622470122e-05, "loss": 0.7145, "step": 5469 }, { "epoch": 0.57, "learning_rate": 8.249132071979358e-05, "loss": 0.7276, "step": 5470 }, { "epoch": 0.57, "learning_rate": 8.24581272051363e-05, "loss": 0.6636, "step": 5471 }, { "epoch": 0.57, "learning_rate": 8.242493568450258e-05, "loss": 0.726, "step": 5472 }, { "epoch": 0.57, "learning_rate": 8.23917461616654e-05, "loss": 0.6739, "step": 5473 }, { "epoch": 0.57, "learning_rate": 8.235855864039744e-05, "loss": 0.675, "step": 5474 }, { "epoch": 0.57, "learning_rate": 8.232537312447122e-05, "loss": 0.646, "step": 5475 }, { "epoch": 0.57, "learning_rate": 8.229218961765905e-05, "loss": 0.6703, "step": 5476 }, { "epoch": 0.57, "learning_rate": 8.225900812373293e-05, "loss": 0.6897, "step": 5477 }, { "epoch": 0.57, "learning_rate": 8.222582864646467e-05, "loss": 0.7341, "step": 5478 }, { "epoch": 0.57, "learning_rate": 8.219265118962588e-05, "loss": 0.6403, "step": 5479 }, { "epoch": 0.57, "learning_rate": 8.215947575698787e-05, "loss": 0.6333, "step": 5480 }, { "epoch": 0.57, "learning_rate": 8.212630235232184e-05, "loss": 0.6849, "step": 5481 }, { "epoch": 0.57, "learning_rate": 8.209313097939861e-05, "loss": 0.6885, "step": 5482 }, { "epoch": 0.57, "learning_rate": 8.205996164198887e-05, "loss": 0.6403, "step": 5483 }, { "epoch": 0.57, "learning_rate": 8.202679434386308e-05, "loss": 0.7095, "step": 5484 }, { "epoch": 0.57, "learning_rate": 8.199362908879142e-05, "loss": 0.6642, "step": 5485 }, { "epoch": 0.57, "learning_rate": 8.196046588054384e-05, "loss": 0.6937, "step": 5486 }, { "epoch": 0.57, "learning_rate": 8.192730472289011e-05, "loss": 0.708, "step": 5487 }, { "epoch": 0.57, "learning_rate": 8.18941456195997e-05, "loss": 0.6941, "step": 5488 }, { "epoch": 0.57, "learning_rate": 8.186098857444186e-05, "loss": 0.6792, "step": 5489 }, { "epoch": 0.57, "learning_rate": 8.182783359118572e-05, "loss": 0.6362, "step": 5490 }, { "epoch": 0.57, "learning_rate": 8.179468067359999e-05, "loss": 0.7191, "step": 5491 }, { "epoch": 0.57, "learning_rate": 8.176152982545324e-05, "loss": 0.656, "step": 5492 }, { "epoch": 0.57, "learning_rate": 8.172838105051387e-05, "loss": 0.6677, "step": 5493 }, { "epoch": 0.57, "learning_rate": 8.169523435254988e-05, "loss": 0.6654, "step": 5494 }, { "epoch": 0.57, "learning_rate": 8.166208973532919e-05, "loss": 0.7078, "step": 5495 }, { "epoch": 0.57, "learning_rate": 8.162894720261944e-05, "loss": 0.6585, "step": 5496 }, { "epoch": 0.57, "learning_rate": 8.159580675818796e-05, "loss": 0.705, "step": 5497 }, { "epoch": 0.57, "learning_rate": 8.156266840580194e-05, "loss": 0.6451, "step": 5498 }, { "epoch": 0.57, "learning_rate": 8.152953214922825e-05, "loss": 0.6972, "step": 5499 }, { "epoch": 0.57, "learning_rate": 8.149639799223356e-05, "loss": 0.7185, "step": 5500 }, { "epoch": 0.57, "learning_rate": 8.146326593858439e-05, "loss": 0.6536, "step": 5501 }, { "epoch": 0.57, "learning_rate": 8.14301359920468e-05, "loss": 0.6612, "step": 5502 }, { "epoch": 0.57, "learning_rate": 8.139700815638687e-05, "loss": 0.6574, "step": 5503 }, { "epoch": 0.57, "learning_rate": 8.136388243537025e-05, "loss": 0.639, "step": 5504 }, { "epoch": 0.57, "learning_rate": 8.13307588327624e-05, "loss": 0.7251, "step": 5505 }, { "epoch": 0.57, "learning_rate": 8.129763735232858e-05, "loss": 0.716, "step": 5506 }, { "epoch": 0.57, "learning_rate": 8.126451799783381e-05, "loss": 0.7004, "step": 5507 }, { "epoch": 0.57, "learning_rate": 8.123140077304277e-05, "loss": 0.7119, "step": 5508 }, { "epoch": 0.57, "learning_rate": 8.119828568172004e-05, "loss": 0.7469, "step": 5509 }, { "epoch": 0.57, "learning_rate": 8.116517272762983e-05, "loss": 0.6994, "step": 5510 }, { "epoch": 0.57, "learning_rate": 8.113206191453621e-05, "loss": 0.6783, "step": 5511 }, { "epoch": 0.57, "learning_rate": 8.109895324620291e-05, "loss": 0.779, "step": 5512 }, { "epoch": 0.57, "learning_rate": 8.106584672639352e-05, "loss": 0.6735, "step": 5513 }, { "epoch": 0.57, "learning_rate": 8.103274235887127e-05, "loss": 0.6789, "step": 5514 }, { "epoch": 0.57, "learning_rate": 8.099964014739927e-05, "loss": 0.6599, "step": 5515 }, { "epoch": 0.57, "learning_rate": 8.096654009574029e-05, "loss": 0.676, "step": 5516 }, { "epoch": 0.57, "learning_rate": 8.093344220765688e-05, "loss": 0.616, "step": 5517 }, { "epoch": 0.57, "learning_rate": 8.090034648691139e-05, "loss": 0.7085, "step": 5518 }, { "epoch": 0.57, "learning_rate": 8.086725293726579e-05, "loss": 0.6664, "step": 5519 }, { "epoch": 0.57, "learning_rate": 8.083416156248197e-05, "loss": 0.6514, "step": 5520 }, { "epoch": 0.57, "learning_rate": 8.080107236632153e-05, "loss": 0.6867, "step": 5521 }, { "epoch": 0.57, "learning_rate": 8.076798535254571e-05, "loss": 0.6399, "step": 5522 }, { "epoch": 0.57, "learning_rate": 8.073490052491565e-05, "loss": 0.7065, "step": 5523 }, { "epoch": 0.57, "learning_rate": 8.070181788719218e-05, "loss": 0.736, "step": 5524 }, { "epoch": 0.58, "learning_rate": 8.06687374431358e-05, "loss": 0.6745, "step": 5525 }, { "epoch": 0.58, "learning_rate": 8.063565919650689e-05, "loss": 0.6574, "step": 5526 }, { "epoch": 0.58, "learning_rate": 8.060258315106556e-05, "loss": 0.6049, "step": 5527 }, { "epoch": 0.58, "learning_rate": 8.056950931057156e-05, "loss": 0.648, "step": 5528 }, { "epoch": 0.58, "learning_rate": 8.053643767878452e-05, "loss": 0.6801, "step": 5529 }, { "epoch": 0.58, "learning_rate": 8.050336825946379e-05, "loss": 0.6228, "step": 5530 }, { "epoch": 0.58, "learning_rate": 8.047030105636835e-05, "loss": 0.6474, "step": 5531 }, { "epoch": 0.58, "learning_rate": 8.043723607325708e-05, "loss": 0.7144, "step": 5532 }, { "epoch": 0.58, "learning_rate": 8.040417331388862e-05, "loss": 0.6823, "step": 5533 }, { "epoch": 0.58, "learning_rate": 8.037111278202114e-05, "loss": 0.6205, "step": 5534 }, { "epoch": 0.58, "learning_rate": 8.033805448141282e-05, "loss": 0.7125, "step": 5535 }, { "epoch": 0.58, "learning_rate": 8.030499841582144e-05, "loss": 0.6726, "step": 5536 }, { "epoch": 0.58, "learning_rate": 8.027194458900453e-05, "loss": 0.6984, "step": 5537 }, { "epoch": 0.58, "learning_rate": 8.023889300471943e-05, "loss": 0.6734, "step": 5538 }, { "epoch": 0.58, "learning_rate": 8.020584366672312e-05, "loss": 0.6891, "step": 5539 }, { "epoch": 0.58, "learning_rate": 8.017279657877244e-05, "loss": 0.6912, "step": 5540 }, { "epoch": 0.58, "learning_rate": 8.013975174462397e-05, "loss": 0.6903, "step": 5541 }, { "epoch": 0.58, "learning_rate": 8.010670916803393e-05, "loss": 0.6954, "step": 5542 }, { "epoch": 0.58, "learning_rate": 8.007366885275834e-05, "loss": 0.6728, "step": 5543 }, { "epoch": 0.58, "learning_rate": 8.004063080255301e-05, "loss": 0.6659, "step": 5544 }, { "epoch": 0.58, "learning_rate": 8.000759502117337e-05, "loss": 0.7003, "step": 5545 }, { "epoch": 0.58, "learning_rate": 7.997456151237474e-05, "loss": 0.5938, "step": 5546 }, { "epoch": 0.58, "learning_rate": 7.994153027991212e-05, "loss": 0.7102, "step": 5547 }, { "epoch": 0.58, "learning_rate": 7.99085013275402e-05, "loss": 0.7254, "step": 5548 }, { "epoch": 0.58, "learning_rate": 7.987547465901345e-05, "loss": 0.6607, "step": 5549 }, { "epoch": 0.58, "learning_rate": 7.984245027808615e-05, "loss": 0.6682, "step": 5550 }, { "epoch": 0.58, "learning_rate": 7.980942818851216e-05, "loss": 0.6327, "step": 5551 }, { "epoch": 0.58, "learning_rate": 7.977640839404522e-05, "loss": 0.6149, "step": 5552 }, { "epoch": 0.58, "learning_rate": 7.974339089843882e-05, "loss": 0.6969, "step": 5553 }, { "epoch": 0.58, "learning_rate": 7.971037570544602e-05, "loss": 0.6801, "step": 5554 }, { "epoch": 0.58, "learning_rate": 7.967736281881983e-05, "loss": 0.6672, "step": 5555 }, { "epoch": 0.58, "learning_rate": 7.964435224231288e-05, "loss": 0.7222, "step": 5556 }, { "epoch": 0.58, "learning_rate": 7.961134397967747e-05, "loss": 0.6278, "step": 5557 }, { "epoch": 0.58, "learning_rate": 7.957833803466584e-05, "loss": 0.6365, "step": 5558 }, { "epoch": 0.58, "learning_rate": 7.954533441102975e-05, "loss": 0.6544, "step": 5559 }, { "epoch": 0.58, "learning_rate": 7.951233311252084e-05, "loss": 0.6878, "step": 5560 }, { "epoch": 0.58, "learning_rate": 7.947933414289048e-05, "loss": 0.6876, "step": 5561 }, { "epoch": 0.58, "learning_rate": 7.944633750588966e-05, "loss": 0.6408, "step": 5562 }, { "epoch": 0.58, "learning_rate": 7.941334320526922e-05, "loss": 0.7127, "step": 5563 }, { "epoch": 0.58, "learning_rate": 7.938035124477972e-05, "loss": 0.6478, "step": 5564 }, { "epoch": 0.58, "learning_rate": 7.934736162817136e-05, "loss": 0.6843, "step": 5565 }, { "epoch": 0.58, "learning_rate": 7.931437435919419e-05, "loss": 0.713, "step": 5566 }, { "epoch": 0.58, "learning_rate": 7.928138944159798e-05, "loss": 0.6763, "step": 5567 }, { "epoch": 0.58, "learning_rate": 7.924840687913214e-05, "loss": 0.7047, "step": 5568 }, { "epoch": 0.58, "learning_rate": 7.921542667554585e-05, "loss": 0.6309, "step": 5569 }, { "epoch": 0.58, "learning_rate": 7.918244883458814e-05, "loss": 0.7415, "step": 5570 }, { "epoch": 0.58, "learning_rate": 7.914947336000757e-05, "loss": 0.7342, "step": 5571 }, { "epoch": 0.58, "learning_rate": 7.911650025555259e-05, "loss": 0.6348, "step": 5572 }, { "epoch": 0.58, "learning_rate": 7.908352952497136e-05, "loss": 0.6676, "step": 5573 }, { "epoch": 0.58, "learning_rate": 7.905056117201166e-05, "loss": 0.6629, "step": 5574 }, { "epoch": 0.58, "learning_rate": 7.901759520042109e-05, "loss": 0.7027, "step": 5575 }, { "epoch": 0.58, "learning_rate": 7.898463161394703e-05, "loss": 0.6452, "step": 5576 }, { "epoch": 0.58, "learning_rate": 7.895167041633644e-05, "loss": 0.6566, "step": 5577 }, { "epoch": 0.58, "learning_rate": 7.891871161133617e-05, "loss": 0.7664, "step": 5578 }, { "epoch": 0.58, "learning_rate": 7.888575520269265e-05, "loss": 0.6684, "step": 5579 }, { "epoch": 0.58, "learning_rate": 7.885280119415214e-05, "loss": 0.7055, "step": 5580 }, { "epoch": 0.58, "learning_rate": 7.881984958946061e-05, "loss": 0.7258, "step": 5581 }, { "epoch": 0.58, "learning_rate": 7.878690039236372e-05, "loss": 0.7097, "step": 5582 }, { "epoch": 0.58, "learning_rate": 7.875395360660687e-05, "loss": 0.6893, "step": 5583 }, { "epoch": 0.58, "learning_rate": 7.872100923593524e-05, "loss": 0.6948, "step": 5584 }, { "epoch": 0.58, "learning_rate": 7.868806728409362e-05, "loss": 0.6942, "step": 5585 }, { "epoch": 0.58, "learning_rate": 7.865512775482667e-05, "loss": 0.6539, "step": 5586 }, { "epoch": 0.58, "learning_rate": 7.862219065187865e-05, "loss": 0.7085, "step": 5587 }, { "epoch": 0.58, "learning_rate": 7.85892559789936e-05, "loss": 0.6995, "step": 5588 }, { "epoch": 0.58, "learning_rate": 7.855632373991527e-05, "loss": 0.677, "step": 5589 }, { "epoch": 0.58, "learning_rate": 7.85233939383872e-05, "loss": 0.699, "step": 5590 }, { "epoch": 0.58, "learning_rate": 7.84904665781525e-05, "loss": 0.6929, "step": 5591 }, { "epoch": 0.58, "learning_rate": 7.845754166295417e-05, "loss": 0.6853, "step": 5592 }, { "epoch": 0.58, "learning_rate": 7.842461919653482e-05, "loss": 0.6246, "step": 5593 }, { "epoch": 0.58, "learning_rate": 7.839169918263684e-05, "loss": 0.6811, "step": 5594 }, { "epoch": 0.58, "learning_rate": 7.835878162500228e-05, "loss": 0.6753, "step": 5595 }, { "epoch": 0.58, "learning_rate": 7.832586652737304e-05, "loss": 0.6818, "step": 5596 }, { "epoch": 0.58, "learning_rate": 7.829295389349055e-05, "loss": 0.6935, "step": 5597 }, { "epoch": 0.58, "learning_rate": 7.826004372709615e-05, "loss": 0.7102, "step": 5598 }, { "epoch": 0.58, "learning_rate": 7.822713603193072e-05, "loss": 0.6721, "step": 5599 }, { "epoch": 0.58, "learning_rate": 7.819423081173503e-05, "loss": 0.6503, "step": 5600 }, { "epoch": 0.58, "learning_rate": 7.816132807024949e-05, "loss": 0.639, "step": 5601 }, { "epoch": 0.58, "learning_rate": 7.812842781121414e-05, "loss": 0.6616, "step": 5602 }, { "epoch": 0.58, "learning_rate": 7.809553003836888e-05, "loss": 0.6605, "step": 5603 }, { "epoch": 0.58, "learning_rate": 7.806263475545333e-05, "loss": 0.6479, "step": 5604 }, { "epoch": 0.58, "learning_rate": 7.802974196620668e-05, "loss": 0.6328, "step": 5605 }, { "epoch": 0.58, "learning_rate": 7.799685167436797e-05, "loss": 0.6692, "step": 5606 }, { "epoch": 0.58, "learning_rate": 7.796396388367593e-05, "loss": 0.6945, "step": 5607 }, { "epoch": 0.58, "learning_rate": 7.79310785978689e-05, "loss": 0.7076, "step": 5608 }, { "epoch": 0.58, "learning_rate": 7.78981958206851e-05, "loss": 0.6945, "step": 5609 }, { "epoch": 0.58, "learning_rate": 7.786531555586243e-05, "loss": 0.6918, "step": 5610 }, { "epoch": 0.58, "learning_rate": 7.783243780713834e-05, "loss": 0.638, "step": 5611 }, { "epoch": 0.58, "learning_rate": 7.779956257825021e-05, "loss": 0.7092, "step": 5612 }, { "epoch": 0.58, "learning_rate": 7.776668987293505e-05, "loss": 0.724, "step": 5613 }, { "epoch": 0.58, "learning_rate": 7.773381969492948e-05, "loss": 0.6336, "step": 5614 }, { "epoch": 0.58, "learning_rate": 7.770095204797003e-05, "loss": 0.7026, "step": 5615 }, { "epoch": 0.58, "learning_rate": 7.766808693579274e-05, "loss": 0.6861, "step": 5616 }, { "epoch": 0.58, "learning_rate": 7.763522436213352e-05, "loss": 0.688, "step": 5617 }, { "epoch": 0.58, "learning_rate": 7.760236433072796e-05, "loss": 0.6932, "step": 5618 }, { "epoch": 0.58, "learning_rate": 7.756950684531127e-05, "loss": 0.6239, "step": 5619 }, { "epoch": 0.58, "learning_rate": 7.753665190961843e-05, "loss": 0.5836, "step": 5620 }, { "epoch": 0.59, "learning_rate": 7.750379952738422e-05, "loss": 0.6909, "step": 5621 }, { "epoch": 0.59, "learning_rate": 7.747094970234293e-05, "loss": 0.6763, "step": 5622 }, { "epoch": 0.59, "learning_rate": 7.743810243822873e-05, "loss": 0.6801, "step": 5623 }, { "epoch": 0.59, "learning_rate": 7.74052577387755e-05, "loss": 0.7114, "step": 5624 }, { "epoch": 0.59, "learning_rate": 7.737241560771665e-05, "loss": 0.7365, "step": 5625 }, { "epoch": 0.59, "learning_rate": 7.733957604878548e-05, "loss": 0.7291, "step": 5626 }, { "epoch": 0.59, "learning_rate": 7.730673906571497e-05, "loss": 0.7174, "step": 5627 }, { "epoch": 0.59, "learning_rate": 7.727390466223769e-05, "loss": 0.6459, "step": 5628 }, { "epoch": 0.59, "learning_rate": 7.724107284208604e-05, "loss": 0.6795, "step": 5629 }, { "epoch": 0.59, "learning_rate": 7.720824360899212e-05, "loss": 0.6614, "step": 5630 }, { "epoch": 0.59, "learning_rate": 7.717541696668765e-05, "loss": 0.6545, "step": 5631 }, { "epoch": 0.59, "learning_rate": 7.714259291890415e-05, "loss": 0.6669, "step": 5632 }, { "epoch": 0.59, "learning_rate": 7.710977146937278e-05, "loss": 0.7114, "step": 5633 }, { "epoch": 0.59, "learning_rate": 7.707695262182439e-05, "loss": 0.6772, "step": 5634 }, { "epoch": 0.59, "learning_rate": 7.704413637998966e-05, "loss": 0.6653, "step": 5635 }, { "epoch": 0.59, "learning_rate": 7.701132274759879e-05, "loss": 0.7161, "step": 5636 }, { "epoch": 0.59, "learning_rate": 7.697851172838182e-05, "loss": 0.6421, "step": 5637 }, { "epoch": 0.59, "learning_rate": 7.69457033260685e-05, "loss": 0.7217, "step": 5638 }, { "epoch": 0.59, "learning_rate": 7.691289754438816e-05, "loss": 0.6848, "step": 5639 }, { "epoch": 0.59, "learning_rate": 7.68800943870699e-05, "loss": 0.6985, "step": 5640 }, { "epoch": 0.59, "learning_rate": 7.684729385784263e-05, "loss": 0.6548, "step": 5641 }, { "epoch": 0.59, "learning_rate": 7.681449596043474e-05, "loss": 0.6673, "step": 5642 }, { "epoch": 0.59, "learning_rate": 7.678170069857446e-05, "loss": 0.6417, "step": 5643 }, { "epoch": 0.59, "learning_rate": 7.67489080759898e-05, "loss": 0.6921, "step": 5644 }, { "epoch": 0.59, "learning_rate": 7.671611809640826e-05, "loss": 0.6825, "step": 5645 }, { "epoch": 0.59, "learning_rate": 7.668333076355718e-05, "loss": 0.6593, "step": 5646 }, { "epoch": 0.59, "learning_rate": 7.665054608116363e-05, "loss": 0.7403, "step": 5647 }, { "epoch": 0.59, "learning_rate": 7.66177640529542e-05, "loss": 0.7112, "step": 5648 }, { "epoch": 0.59, "learning_rate": 7.658498468265537e-05, "loss": 0.7051, "step": 5649 }, { "epoch": 0.59, "learning_rate": 7.655220797399327e-05, "loss": 0.6456, "step": 5650 }, { "epoch": 0.59, "learning_rate": 7.651943393069365e-05, "loss": 0.7206, "step": 5651 }, { "epoch": 0.59, "learning_rate": 7.648666255648201e-05, "loss": 0.6268, "step": 5652 }, { "epoch": 0.59, "learning_rate": 7.645389385508359e-05, "loss": 0.647, "step": 5653 }, { "epoch": 0.59, "learning_rate": 7.642112783022322e-05, "loss": 0.6962, "step": 5654 }, { "epoch": 0.59, "learning_rate": 7.638836448562555e-05, "loss": 0.6915, "step": 5655 }, { "epoch": 0.59, "learning_rate": 7.635560382501478e-05, "loss": 0.64, "step": 5656 }, { "epoch": 0.59, "learning_rate": 7.632284585211496e-05, "loss": 0.6377, "step": 5657 }, { "epoch": 0.59, "learning_rate": 7.629009057064972e-05, "loss": 0.6449, "step": 5658 }, { "epoch": 0.59, "learning_rate": 7.625733798434247e-05, "loss": 0.6238, "step": 5659 }, { "epoch": 0.59, "learning_rate": 7.622458809691621e-05, "loss": 0.6432, "step": 5660 }, { "epoch": 0.59, "learning_rate": 7.619184091209377e-05, "loss": 0.6571, "step": 5661 }, { "epoch": 0.59, "learning_rate": 7.61590964335975e-05, "loss": 0.6611, "step": 5662 }, { "epoch": 0.59, "learning_rate": 7.612635466514961e-05, "loss": 0.6245, "step": 5663 }, { "epoch": 0.59, "learning_rate": 7.60936156104719e-05, "loss": 0.617, "step": 5664 }, { "epoch": 0.59, "learning_rate": 7.60608792732859e-05, "loss": 0.682, "step": 5665 }, { "epoch": 0.59, "learning_rate": 7.60281456573128e-05, "loss": 0.7178, "step": 5666 }, { "epoch": 0.59, "learning_rate": 7.599541476627355e-05, "loss": 0.6416, "step": 5667 }, { "epoch": 0.59, "learning_rate": 7.596268660388868e-05, "loss": 0.6406, "step": 5668 }, { "epoch": 0.59, "learning_rate": 7.592996117387854e-05, "loss": 0.6844, "step": 5669 }, { "epoch": 0.59, "learning_rate": 7.589723847996305e-05, "loss": 0.6949, "step": 5670 }, { "epoch": 0.59, "learning_rate": 7.58645185258619e-05, "loss": 0.6667, "step": 5671 }, { "epoch": 0.59, "learning_rate": 7.58318013152944e-05, "loss": 0.7278, "step": 5672 }, { "epoch": 0.59, "learning_rate": 7.579908685197967e-05, "loss": 0.7071, "step": 5673 }, { "epoch": 0.59, "learning_rate": 7.576637513963633e-05, "loss": 0.6599, "step": 5674 }, { "epoch": 0.59, "learning_rate": 7.57336661819829e-05, "loss": 0.6793, "step": 5675 }, { "epoch": 0.59, "learning_rate": 7.570095998273737e-05, "loss": 0.7142, "step": 5676 }, { "epoch": 0.59, "learning_rate": 7.566825654561762e-05, "loss": 0.6862, "step": 5677 }, { "epoch": 0.59, "learning_rate": 7.56355558743411e-05, "loss": 0.6688, "step": 5678 }, { "epoch": 0.59, "learning_rate": 7.56028579726249e-05, "loss": 0.7143, "step": 5679 }, { "epoch": 0.59, "learning_rate": 7.557016284418591e-05, "loss": 0.6916, "step": 5680 }, { "epoch": 0.59, "learning_rate": 7.553747049274072e-05, "loss": 0.6915, "step": 5681 }, { "epoch": 0.59, "learning_rate": 7.550478092200542e-05, "loss": 0.6528, "step": 5682 }, { "epoch": 0.59, "learning_rate": 7.547209413569601e-05, "loss": 0.7132, "step": 5683 }, { "epoch": 0.59, "learning_rate": 7.543941013752806e-05, "loss": 0.7094, "step": 5684 }, { "epoch": 0.59, "learning_rate": 7.540672893121674e-05, "loss": 0.6973, "step": 5685 }, { "epoch": 0.59, "learning_rate": 7.537405052047707e-05, "loss": 0.6952, "step": 5686 }, { "epoch": 0.59, "learning_rate": 7.53413749090237e-05, "loss": 0.6723, "step": 5687 }, { "epoch": 0.59, "learning_rate": 7.530870210057086e-05, "loss": 0.6465, "step": 5688 }, { "epoch": 0.59, "learning_rate": 7.527603209883261e-05, "loss": 0.7054, "step": 5689 }, { "epoch": 0.59, "learning_rate": 7.524336490752261e-05, "loss": 0.6847, "step": 5690 }, { "epoch": 0.59, "learning_rate": 7.521070053035418e-05, "loss": 0.7197, "step": 5691 }, { "epoch": 0.59, "learning_rate": 7.517803897104035e-05, "loss": 0.6897, "step": 5692 }, { "epoch": 0.59, "learning_rate": 7.514538023329389e-05, "loss": 0.6829, "step": 5693 }, { "epoch": 0.59, "learning_rate": 7.511272432082712e-05, "loss": 0.6334, "step": 5694 }, { "epoch": 0.59, "learning_rate": 7.508007123735219e-05, "loss": 0.66, "step": 5695 }, { "epoch": 0.59, "learning_rate": 7.504742098658075e-05, "loss": 0.6351, "step": 5696 }, { "epoch": 0.59, "learning_rate": 7.50147735722243e-05, "loss": 0.6583, "step": 5697 }, { "epoch": 0.59, "learning_rate": 7.498212899799395e-05, "loss": 0.6679, "step": 5698 }, { "epoch": 0.59, "learning_rate": 7.49494872676004e-05, "loss": 0.7034, "step": 5699 }, { "epoch": 0.59, "learning_rate": 7.491684838475418e-05, "loss": 0.7181, "step": 5700 }, { "epoch": 0.59, "learning_rate": 7.488421235316543e-05, "loss": 0.6443, "step": 5701 }, { "epoch": 0.59, "learning_rate": 7.48515791765439e-05, "loss": 0.6206, "step": 5702 }, { "epoch": 0.59, "learning_rate": 7.481894885859914e-05, "loss": 0.7226, "step": 5703 }, { "epoch": 0.59, "learning_rate": 7.478632140304029e-05, "loss": 0.6633, "step": 5704 }, { "epoch": 0.59, "learning_rate": 7.475369681357614e-05, "loss": 0.7079, "step": 5705 }, { "epoch": 0.59, "learning_rate": 7.472107509391522e-05, "loss": 0.6474, "step": 5706 }, { "epoch": 0.59, "learning_rate": 7.468845624776579e-05, "loss": 0.6055, "step": 5707 }, { "epoch": 0.59, "learning_rate": 7.46558402788356e-05, "loss": 0.7277, "step": 5708 }, { "epoch": 0.59, "learning_rate": 7.462322719083225e-05, "loss": 0.6606, "step": 5709 }, { "epoch": 0.59, "learning_rate": 7.459061698746293e-05, "loss": 0.6727, "step": 5710 }, { "epoch": 0.59, "learning_rate": 7.455800967243446e-05, "loss": 0.6944, "step": 5711 }, { "epoch": 0.59, "learning_rate": 7.452540524945343e-05, "loss": 0.719, "step": 5712 }, { "epoch": 0.59, "learning_rate": 7.449280372222609e-05, "loss": 0.6629, "step": 5713 }, { "epoch": 0.59, "learning_rate": 7.446020509445825e-05, "loss": 0.7261, "step": 5714 }, { "epoch": 0.59, "learning_rate": 7.442760936985556e-05, "loss": 0.6389, "step": 5715 }, { "epoch": 0.59, "learning_rate": 7.439501655212318e-05, "loss": 0.6131, "step": 5716 }, { "epoch": 0.6, "learning_rate": 7.4362426644966e-05, "loss": 0.6057, "step": 5717 }, { "epoch": 0.6, "learning_rate": 7.432983965208865e-05, "loss": 0.677, "step": 5718 }, { "epoch": 0.6, "learning_rate": 7.42972555771953e-05, "loss": 0.6663, "step": 5719 }, { "epoch": 0.6, "learning_rate": 7.426467442398986e-05, "loss": 0.7429, "step": 5720 }, { "epoch": 0.6, "learning_rate": 7.423209619617599e-05, "loss": 0.6773, "step": 5721 }, { "epoch": 0.6, "learning_rate": 7.419952089745683e-05, "loss": 0.6923, "step": 5722 }, { "epoch": 0.6, "learning_rate": 7.41669485315353e-05, "loss": 0.7424, "step": 5723 }, { "epoch": 0.6, "learning_rate": 7.413437910211405e-05, "loss": 0.6638, "step": 5724 }, { "epoch": 0.6, "learning_rate": 7.41018126128952e-05, "loss": 0.6533, "step": 5725 }, { "epoch": 0.6, "learning_rate": 7.406924906758074e-05, "loss": 0.6475, "step": 5726 }, { "epoch": 0.6, "learning_rate": 7.403668846987224e-05, "loss": 0.6218, "step": 5727 }, { "epoch": 0.6, "learning_rate": 7.40041308234709e-05, "loss": 0.685, "step": 5728 }, { "epoch": 0.6, "learning_rate": 7.397157613207762e-05, "loss": 0.6771, "step": 5729 }, { "epoch": 0.6, "learning_rate": 7.393902439939303e-05, "loss": 0.6309, "step": 5730 }, { "epoch": 0.6, "learning_rate": 7.390647562911723e-05, "loss": 0.6981, "step": 5731 }, { "epoch": 0.6, "learning_rate": 7.38739298249502e-05, "loss": 0.6301, "step": 5732 }, { "epoch": 0.6, "learning_rate": 7.384138699059154e-05, "loss": 0.6907, "step": 5733 }, { "epoch": 0.6, "learning_rate": 7.380884712974036e-05, "loss": 0.7284, "step": 5734 }, { "epoch": 0.6, "learning_rate": 7.37763102460956e-05, "loss": 0.6072, "step": 5735 }, { "epoch": 0.6, "learning_rate": 7.374377634335576e-05, "loss": 0.675, "step": 5736 }, { "epoch": 0.6, "learning_rate": 7.371124542521907e-05, "loss": 0.6922, "step": 5737 }, { "epoch": 0.6, "learning_rate": 7.367871749538341e-05, "loss": 0.6783, "step": 5738 }, { "epoch": 0.6, "learning_rate": 7.364619255754626e-05, "loss": 0.6784, "step": 5739 }, { "epoch": 0.6, "learning_rate": 7.361367061540482e-05, "loss": 0.6919, "step": 5740 }, { "epoch": 0.6, "learning_rate": 7.358115167265593e-05, "loss": 0.6599, "step": 5741 }, { "epoch": 0.6, "learning_rate": 7.354863573299611e-05, "loss": 0.6844, "step": 5742 }, { "epoch": 0.6, "learning_rate": 7.351612280012145e-05, "loss": 0.6463, "step": 5743 }, { "epoch": 0.6, "learning_rate": 7.348361287772788e-05, "loss": 0.6817, "step": 5744 }, { "epoch": 0.6, "learning_rate": 7.345110596951077e-05, "loss": 0.6917, "step": 5745 }, { "epoch": 0.6, "learning_rate": 7.341860207916531e-05, "loss": 0.6816, "step": 5746 }, { "epoch": 0.6, "learning_rate": 7.338610121038627e-05, "loss": 0.6816, "step": 5747 }, { "epoch": 0.6, "learning_rate": 7.33536033668681e-05, "loss": 0.6968, "step": 5748 }, { "epoch": 0.6, "learning_rate": 7.332110855230489e-05, "loss": 0.6836, "step": 5749 }, { "epoch": 0.6, "learning_rate": 7.328861677039045e-05, "loss": 0.7021, "step": 5750 }, { "epoch": 0.6, "learning_rate": 7.32561280248181e-05, "loss": 0.7044, "step": 5751 }, { "epoch": 0.6, "learning_rate": 7.322364231928096e-05, "loss": 0.6279, "step": 5752 }, { "epoch": 0.6, "learning_rate": 7.319115965747181e-05, "loss": 0.6628, "step": 5753 }, { "epoch": 0.6, "learning_rate": 7.315868004308293e-05, "loss": 0.7137, "step": 5754 }, { "epoch": 0.6, "learning_rate": 7.312620347980643e-05, "loss": 0.6397, "step": 5755 }, { "epoch": 0.6, "learning_rate": 7.309372997133388e-05, "loss": 0.6903, "step": 5756 }, { "epoch": 0.6, "learning_rate": 7.30612595213567e-05, "loss": 0.6879, "step": 5757 }, { "epoch": 0.6, "learning_rate": 7.302879213356591e-05, "loss": 0.6503, "step": 5758 }, { "epoch": 0.6, "learning_rate": 7.299632781165207e-05, "loss": 0.6302, "step": 5759 }, { "epoch": 0.6, "learning_rate": 7.296386655930551e-05, "loss": 0.6602, "step": 5760 }, { "epoch": 0.6, "learning_rate": 7.29314083802162e-05, "loss": 0.6638, "step": 5761 }, { "epoch": 0.6, "learning_rate": 7.289895327807366e-05, "loss": 0.6491, "step": 5762 }, { "epoch": 0.6, "learning_rate": 7.286650125656715e-05, "loss": 0.6754, "step": 5763 }, { "epoch": 0.6, "learning_rate": 7.283405231938565e-05, "loss": 0.6647, "step": 5764 }, { "epoch": 0.6, "learning_rate": 7.280160647021762e-05, "loss": 0.6601, "step": 5765 }, { "epoch": 0.6, "learning_rate": 7.276916371275126e-05, "loss": 0.6638, "step": 5766 }, { "epoch": 0.6, "learning_rate": 7.273672405067444e-05, "loss": 0.649, "step": 5767 }, { "epoch": 0.6, "learning_rate": 7.270428748767462e-05, "loss": 0.6678, "step": 5768 }, { "epoch": 0.6, "learning_rate": 7.267185402743893e-05, "loss": 0.6513, "step": 5769 }, { "epoch": 0.6, "learning_rate": 7.263942367365422e-05, "loss": 0.749, "step": 5770 }, { "epoch": 0.6, "learning_rate": 7.260699643000681e-05, "loss": 0.71, "step": 5771 }, { "epoch": 0.6, "learning_rate": 7.257457230018287e-05, "loss": 0.6875, "step": 5772 }, { "epoch": 0.6, "learning_rate": 7.25421512878681e-05, "loss": 0.7024, "step": 5773 }, { "epoch": 0.6, "learning_rate": 7.250973339674785e-05, "loss": 0.6284, "step": 5774 }, { "epoch": 0.6, "learning_rate": 7.247731863050716e-05, "loss": 0.625, "step": 5775 }, { "epoch": 0.6, "learning_rate": 7.244490699283063e-05, "loss": 0.648, "step": 5776 }, { "epoch": 0.6, "learning_rate": 7.241249848740258e-05, "loss": 0.7027, "step": 5777 }, { "epoch": 0.6, "learning_rate": 7.238009311790706e-05, "loss": 0.7357, "step": 5778 }, { "epoch": 0.6, "learning_rate": 7.234769088802752e-05, "loss": 0.6554, "step": 5779 }, { "epoch": 0.6, "learning_rate": 7.231529180144728e-05, "loss": 0.7024, "step": 5780 }, { "epoch": 0.6, "learning_rate": 7.228289586184919e-05, "loss": 0.7109, "step": 5781 }, { "epoch": 0.6, "learning_rate": 7.225050307291574e-05, "loss": 0.6171, "step": 5782 }, { "epoch": 0.6, "learning_rate": 7.221811343832912e-05, "loss": 0.6705, "step": 5783 }, { "epoch": 0.6, "learning_rate": 7.218572696177118e-05, "loss": 0.618, "step": 5784 }, { "epoch": 0.6, "learning_rate": 7.215334364692323e-05, "loss": 0.6694, "step": 5785 }, { "epoch": 0.6, "learning_rate": 7.212096349746648e-05, "loss": 0.7265, "step": 5786 }, { "epoch": 0.6, "learning_rate": 7.208858651708164e-05, "loss": 0.6932, "step": 5787 }, { "epoch": 0.6, "learning_rate": 7.205621270944899e-05, "loss": 0.6139, "step": 5788 }, { "epoch": 0.6, "learning_rate": 7.202384207824859e-05, "loss": 0.7275, "step": 5789 }, { "epoch": 0.6, "learning_rate": 7.199147462716009e-05, "loss": 0.6837, "step": 5790 }, { "epoch": 0.6, "learning_rate": 7.195911035986273e-05, "loss": 0.6732, "step": 5791 }, { "epoch": 0.6, "learning_rate": 7.19267492800355e-05, "loss": 0.6983, "step": 5792 }, { "epoch": 0.6, "learning_rate": 7.189439139135689e-05, "loss": 0.6821, "step": 5793 }, { "epoch": 0.6, "learning_rate": 7.186203669750509e-05, "loss": 0.7267, "step": 5794 }, { "epoch": 0.6, "learning_rate": 7.182968520215799e-05, "loss": 0.6413, "step": 5795 }, { "epoch": 0.6, "learning_rate": 7.179733690899298e-05, "loss": 0.6828, "step": 5796 }, { "epoch": 0.6, "learning_rate": 7.176499182168718e-05, "loss": 0.7061, "step": 5797 }, { "epoch": 0.6, "learning_rate": 7.17326499439174e-05, "loss": 0.6875, "step": 5798 }, { "epoch": 0.6, "learning_rate": 7.170031127935995e-05, "loss": 0.6827, "step": 5799 }, { "epoch": 0.6, "learning_rate": 7.16679758316908e-05, "loss": 0.6983, "step": 5800 }, { "epoch": 0.6, "learning_rate": 7.16356436045857e-05, "loss": 0.6543, "step": 5801 }, { "epoch": 0.6, "learning_rate": 7.160331460171982e-05, "loss": 0.755, "step": 5802 }, { "epoch": 0.6, "learning_rate": 7.157098882676813e-05, "loss": 0.6654, "step": 5803 }, { "epoch": 0.6, "learning_rate": 7.153866628340519e-05, "loss": 0.6272, "step": 5804 }, { "epoch": 0.6, "learning_rate": 7.150634697530511e-05, "loss": 0.6844, "step": 5805 }, { "epoch": 0.6, "learning_rate": 7.147403090614173e-05, "loss": 0.6145, "step": 5806 }, { "epoch": 0.6, "learning_rate": 7.144171807958853e-05, "loss": 0.6871, "step": 5807 }, { "epoch": 0.6, "learning_rate": 7.140940849931847e-05, "loss": 0.6988, "step": 5808 }, { "epoch": 0.6, "learning_rate": 7.137710216900435e-05, "loss": 0.6283, "step": 5809 }, { "epoch": 0.6, "learning_rate": 7.13447990923185e-05, "loss": 0.6677, "step": 5810 }, { "epoch": 0.6, "learning_rate": 7.131249927293284e-05, "loss": 0.71, "step": 5811 }, { "epoch": 0.6, "learning_rate": 7.128020271451897e-05, "loss": 0.7217, "step": 5812 }, { "epoch": 0.61, "learning_rate": 7.124790942074814e-05, "loss": 0.6474, "step": 5813 }, { "epoch": 0.61, "learning_rate": 7.121561939529115e-05, "loss": 0.6832, "step": 5814 }, { "epoch": 0.61, "learning_rate": 7.118333264181856e-05, "loss": 0.7025, "step": 5815 }, { "epoch": 0.61, "learning_rate": 7.115104916400037e-05, "loss": 0.645, "step": 5816 }, { "epoch": 0.61, "learning_rate": 7.11187689655064e-05, "loss": 0.6465, "step": 5817 }, { "epoch": 0.61, "learning_rate": 7.108649205000597e-05, "loss": 0.7, "step": 5818 }, { "epoch": 0.61, "learning_rate": 7.105421842116809e-05, "loss": 0.6319, "step": 5819 }, { "epoch": 0.61, "learning_rate": 7.102194808266134e-05, "loss": 0.7358, "step": 5820 }, { "epoch": 0.61, "learning_rate": 7.098968103815402e-05, "loss": 0.6611, "step": 5821 }, { "epoch": 0.61, "learning_rate": 7.095741729131394e-05, "loss": 0.6724, "step": 5822 }, { "epoch": 0.61, "learning_rate": 7.09251568458086e-05, "loss": 0.6147, "step": 5823 }, { "epoch": 0.61, "learning_rate": 7.089289970530517e-05, "loss": 0.6391, "step": 5824 }, { "epoch": 0.61, "learning_rate": 7.086064587347034e-05, "loss": 0.6337, "step": 5825 }, { "epoch": 0.61, "learning_rate": 7.082839535397046e-05, "loss": 0.6763, "step": 5826 }, { "epoch": 0.61, "learning_rate": 7.079614815047159e-05, "loss": 0.7118, "step": 5827 }, { "epoch": 0.61, "learning_rate": 7.076390426663926e-05, "loss": 0.6762, "step": 5828 }, { "epoch": 0.61, "learning_rate": 7.073166370613872e-05, "loss": 0.7057, "step": 5829 }, { "epoch": 0.61, "learning_rate": 7.06994264726349e-05, "loss": 0.6794, "step": 5830 }, { "epoch": 0.61, "learning_rate": 7.066719256979219e-05, "loss": 0.6895, "step": 5831 }, { "epoch": 0.61, "learning_rate": 7.063496200127472e-05, "loss": 0.5683, "step": 5832 }, { "epoch": 0.61, "learning_rate": 7.060273477074624e-05, "loss": 0.6946, "step": 5833 }, { "epoch": 0.61, "learning_rate": 7.057051088187002e-05, "loss": 0.7584, "step": 5834 }, { "epoch": 0.61, "learning_rate": 7.053829033830911e-05, "loss": 0.714, "step": 5835 }, { "epoch": 0.61, "learning_rate": 7.0506073143726e-05, "loss": 0.6332, "step": 5836 }, { "epoch": 0.61, "learning_rate": 7.047385930178297e-05, "loss": 0.6889, "step": 5837 }, { "epoch": 0.61, "learning_rate": 7.044164881614179e-05, "loss": 0.6301, "step": 5838 }, { "epoch": 0.61, "learning_rate": 7.040944169046389e-05, "loss": 0.6616, "step": 5839 }, { "epoch": 0.61, "learning_rate": 7.037723792841034e-05, "loss": 0.637, "step": 5840 }, { "epoch": 0.61, "learning_rate": 7.034503753364188e-05, "loss": 0.7582, "step": 5841 }, { "epoch": 0.61, "learning_rate": 7.031284050981867e-05, "loss": 0.6737, "step": 5842 }, { "epoch": 0.61, "learning_rate": 7.028064686060071e-05, "loss": 0.6841, "step": 5843 }, { "epoch": 0.61, "learning_rate": 7.024845658964752e-05, "loss": 0.6837, "step": 5844 }, { "epoch": 0.61, "learning_rate": 7.02162697006182e-05, "loss": 0.7164, "step": 5845 }, { "epoch": 0.61, "learning_rate": 7.01840861971715e-05, "loss": 0.6958, "step": 5846 }, { "epoch": 0.61, "learning_rate": 7.015190608296587e-05, "loss": 0.6455, "step": 5847 }, { "epoch": 0.61, "learning_rate": 7.011972936165919e-05, "loss": 0.6832, "step": 5848 }, { "epoch": 0.61, "learning_rate": 7.008755603690912e-05, "loss": 0.6648, "step": 5849 }, { "epoch": 0.61, "learning_rate": 7.005538611237287e-05, "loss": 0.7152, "step": 5850 }, { "epoch": 0.61, "learning_rate": 7.002321959170728e-05, "loss": 0.7124, "step": 5851 }, { "epoch": 0.61, "learning_rate": 6.999105647856872e-05, "loss": 0.6977, "step": 5852 }, { "epoch": 0.61, "learning_rate": 6.995889677661333e-05, "loss": 0.704, "step": 5853 }, { "epoch": 0.61, "learning_rate": 6.99267404894967e-05, "loss": 0.6385, "step": 5854 }, { "epoch": 0.61, "learning_rate": 6.989458762087419e-05, "loss": 0.6936, "step": 5855 }, { "epoch": 0.61, "learning_rate": 6.986243817440059e-05, "loss": 0.6717, "step": 5856 }, { "epoch": 0.61, "learning_rate": 6.983029215373048e-05, "loss": 0.6836, "step": 5857 }, { "epoch": 0.61, "learning_rate": 6.979814956251794e-05, "loss": 0.6715, "step": 5858 }, { "epoch": 0.61, "learning_rate": 6.976601040441665e-05, "loss": 0.6474, "step": 5859 }, { "epoch": 0.61, "learning_rate": 6.973387468307997e-05, "loss": 0.675, "step": 5860 }, { "epoch": 0.61, "learning_rate": 6.97017424021609e-05, "loss": 0.7088, "step": 5861 }, { "epoch": 0.61, "learning_rate": 6.966961356531188e-05, "loss": 0.6769, "step": 5862 }, { "epoch": 0.61, "learning_rate": 6.963748817618514e-05, "loss": 0.6233, "step": 5863 }, { "epoch": 0.61, "learning_rate": 6.960536623843245e-05, "loss": 0.6905, "step": 5864 }, { "epoch": 0.61, "learning_rate": 6.957324775570512e-05, "loss": 0.6707, "step": 5865 }, { "epoch": 0.61, "learning_rate": 6.954113273165415e-05, "loss": 0.6615, "step": 5866 }, { "epoch": 0.61, "learning_rate": 6.950902116993019e-05, "loss": 0.7107, "step": 5867 }, { "epoch": 0.61, "learning_rate": 6.947691307418333e-05, "loss": 0.623, "step": 5868 }, { "epoch": 0.61, "learning_rate": 6.944480844806345e-05, "loss": 0.6482, "step": 5869 }, { "epoch": 0.61, "learning_rate": 6.941270729521993e-05, "loss": 0.7064, "step": 5870 }, { "epoch": 0.61, "learning_rate": 6.938060961930175e-05, "loss": 0.6975, "step": 5871 }, { "epoch": 0.61, "learning_rate": 6.934851542395754e-05, "loss": 0.6694, "step": 5872 }, { "epoch": 0.61, "learning_rate": 6.931642471283556e-05, "loss": 0.6753, "step": 5873 }, { "epoch": 0.61, "learning_rate": 6.928433748958358e-05, "loss": 0.7437, "step": 5874 }, { "epoch": 0.61, "learning_rate": 6.925225375784908e-05, "loss": 0.6704, "step": 5875 }, { "epoch": 0.61, "learning_rate": 6.9220173521279e-05, "loss": 0.652, "step": 5876 }, { "epoch": 0.61, "learning_rate": 6.918809678352006e-05, "loss": 0.6651, "step": 5877 }, { "epoch": 0.61, "learning_rate": 6.915602354821846e-05, "loss": 0.689, "step": 5878 }, { "epoch": 0.61, "learning_rate": 6.912395381901999e-05, "loss": 0.717, "step": 5879 }, { "epoch": 0.61, "learning_rate": 6.909188759957014e-05, "loss": 0.6836, "step": 5880 }, { "epoch": 0.61, "learning_rate": 6.905982489351399e-05, "loss": 0.6539, "step": 5881 }, { "epoch": 0.61, "learning_rate": 6.90277657044961e-05, "loss": 0.6759, "step": 5882 }, { "epoch": 0.61, "learning_rate": 6.899571003616071e-05, "loss": 0.6892, "step": 5883 }, { "epoch": 0.61, "learning_rate": 6.896365789215174e-05, "loss": 0.7454, "step": 5884 }, { "epoch": 0.61, "learning_rate": 6.893160927611253e-05, "loss": 0.7102, "step": 5885 }, { "epoch": 0.61, "learning_rate": 6.889956419168615e-05, "loss": 0.7509, "step": 5886 }, { "epoch": 0.61, "learning_rate": 6.88675226425153e-05, "loss": 0.703, "step": 5887 }, { "epoch": 0.61, "learning_rate": 6.883548463224215e-05, "loss": 0.7002, "step": 5888 }, { "epoch": 0.61, "learning_rate": 6.88034501645085e-05, "loss": 0.6987, "step": 5889 }, { "epoch": 0.61, "learning_rate": 6.877141924295589e-05, "loss": 0.7213, "step": 5890 }, { "epoch": 0.61, "learning_rate": 6.873939187122523e-05, "loss": 0.6688, "step": 5891 }, { "epoch": 0.61, "learning_rate": 6.870736805295716e-05, "loss": 0.7679, "step": 5892 }, { "epoch": 0.61, "learning_rate": 6.8675347791792e-05, "loss": 0.6715, "step": 5893 }, { "epoch": 0.61, "learning_rate": 6.864333109136945e-05, "loss": 0.6589, "step": 5894 }, { "epoch": 0.61, "learning_rate": 6.8611317955329e-05, "loss": 0.6829, "step": 5895 }, { "epoch": 0.61, "learning_rate": 6.85793083873096e-05, "loss": 0.6898, "step": 5896 }, { "epoch": 0.61, "learning_rate": 6.854730239094982e-05, "loss": 0.6515, "step": 5897 }, { "epoch": 0.61, "learning_rate": 6.851529996988796e-05, "loss": 0.7244, "step": 5898 }, { "epoch": 0.61, "learning_rate": 6.848330112776171e-05, "loss": 0.655, "step": 5899 }, { "epoch": 0.61, "learning_rate": 6.845130586820847e-05, "loss": 0.6486, "step": 5900 }, { "epoch": 0.61, "learning_rate": 6.841931419486527e-05, "loss": 0.6805, "step": 5901 }, { "epoch": 0.61, "learning_rate": 6.83873261113686e-05, "loss": 0.6803, "step": 5902 }, { "epoch": 0.61, "learning_rate": 6.835534162135464e-05, "loss": 0.65, "step": 5903 }, { "epoch": 0.61, "learning_rate": 6.832336072845918e-05, "loss": 0.724, "step": 5904 }, { "epoch": 0.61, "learning_rate": 6.829138343631747e-05, "loss": 0.6758, "step": 5905 }, { "epoch": 0.61, "learning_rate": 6.82594097485645e-05, "loss": 0.6746, "step": 5906 }, { "epoch": 0.61, "learning_rate": 6.822743966883482e-05, "loss": 0.6879, "step": 5907 }, { "epoch": 0.61, "learning_rate": 6.819547320076249e-05, "loss": 0.6045, "step": 5908 }, { "epoch": 0.62, "learning_rate": 6.816351034798119e-05, "loss": 0.7033, "step": 5909 }, { "epoch": 0.62, "learning_rate": 6.81315511141243e-05, "loss": 0.6929, "step": 5910 }, { "epoch": 0.62, "learning_rate": 6.809959550282458e-05, "loss": 0.6306, "step": 5911 }, { "epoch": 0.62, "learning_rate": 6.806764351771455e-05, "loss": 0.7031, "step": 5912 }, { "epoch": 0.62, "learning_rate": 6.803569516242632e-05, "loss": 0.7031, "step": 5913 }, { "epoch": 0.62, "learning_rate": 6.800375044059144e-05, "loss": 0.6527, "step": 5914 }, { "epoch": 0.62, "learning_rate": 6.797180935584118e-05, "loss": 0.649, "step": 5915 }, { "epoch": 0.62, "learning_rate": 6.793987191180635e-05, "loss": 0.6647, "step": 5916 }, { "epoch": 0.62, "learning_rate": 6.790793811211731e-05, "loss": 0.6905, "step": 5917 }, { "epoch": 0.62, "learning_rate": 6.787600796040413e-05, "loss": 0.6798, "step": 5918 }, { "epoch": 0.62, "learning_rate": 6.784408146029631e-05, "loss": 0.7247, "step": 5919 }, { "epoch": 0.62, "learning_rate": 6.781215861542302e-05, "loss": 0.7047, "step": 5920 }, { "epoch": 0.62, "learning_rate": 6.778023942941303e-05, "loss": 0.6986, "step": 5921 }, { "epoch": 0.62, "learning_rate": 6.774832390589463e-05, "loss": 0.6995, "step": 5922 }, { "epoch": 0.62, "learning_rate": 6.771641204849575e-05, "loss": 0.6623, "step": 5923 }, { "epoch": 0.62, "learning_rate": 6.768450386084389e-05, "loss": 0.6356, "step": 5924 }, { "epoch": 0.62, "learning_rate": 6.765259934656607e-05, "loss": 0.7217, "step": 5925 }, { "epoch": 0.62, "learning_rate": 6.762069850928903e-05, "loss": 0.6934, "step": 5926 }, { "epoch": 0.62, "learning_rate": 6.758880135263894e-05, "loss": 0.6753, "step": 5927 }, { "epoch": 0.62, "learning_rate": 6.755690788024165e-05, "loss": 0.7009, "step": 5928 }, { "epoch": 0.62, "learning_rate": 6.752501809572254e-05, "loss": 0.6347, "step": 5929 }, { "epoch": 0.62, "learning_rate": 6.749313200270664e-05, "loss": 0.712, "step": 5930 }, { "epoch": 0.62, "learning_rate": 6.746124960481846e-05, "loss": 0.6673, "step": 5931 }, { "epoch": 0.62, "learning_rate": 6.742937090568218e-05, "loss": 0.713, "step": 5932 }, { "epoch": 0.62, "learning_rate": 6.739749590892149e-05, "loss": 0.66, "step": 5933 }, { "epoch": 0.62, "learning_rate": 6.736562461815972e-05, "loss": 0.6403, "step": 5934 }, { "epoch": 0.62, "learning_rate": 6.733375703701976e-05, "loss": 0.666, "step": 5935 }, { "epoch": 0.62, "learning_rate": 6.730189316912401e-05, "loss": 0.6772, "step": 5936 }, { "epoch": 0.62, "learning_rate": 6.727003301809455e-05, "loss": 0.6618, "step": 5937 }, { "epoch": 0.62, "learning_rate": 6.723817658755302e-05, "loss": 0.7011, "step": 5938 }, { "epoch": 0.62, "learning_rate": 6.720632388112054e-05, "loss": 0.7371, "step": 5939 }, { "epoch": 0.62, "learning_rate": 6.717447490241793e-05, "loss": 0.7108, "step": 5940 }, { "epoch": 0.62, "learning_rate": 6.714262965506556e-05, "loss": 0.6514, "step": 5941 }, { "epoch": 0.62, "learning_rate": 6.711078814268325e-05, "loss": 0.7029, "step": 5942 }, { "epoch": 0.62, "learning_rate": 6.707895036889057e-05, "loss": 0.6774, "step": 5943 }, { "epoch": 0.62, "learning_rate": 6.704711633730662e-05, "loss": 0.7108, "step": 5944 }, { "epoch": 0.62, "learning_rate": 6.701528605154994e-05, "loss": 0.6831, "step": 5945 }, { "epoch": 0.62, "learning_rate": 6.698345951523885e-05, "loss": 0.6624, "step": 5946 }, { "epoch": 0.62, "learning_rate": 6.695163673199112e-05, "loss": 0.6713, "step": 5947 }, { "epoch": 0.62, "learning_rate": 6.691981770542406e-05, "loss": 0.6583, "step": 5948 }, { "epoch": 0.62, "learning_rate": 6.688800243915465e-05, "loss": 0.729, "step": 5949 }, { "epoch": 0.62, "learning_rate": 6.685619093679945e-05, "loss": 0.6749, "step": 5950 }, { "epoch": 0.62, "learning_rate": 6.682438320197443e-05, "loss": 0.6749, "step": 5951 }, { "epoch": 0.62, "learning_rate": 6.679257923829536e-05, "loss": 0.6913, "step": 5952 }, { "epoch": 0.62, "learning_rate": 6.676077904937741e-05, "loss": 0.6969, "step": 5953 }, { "epoch": 0.62, "learning_rate": 6.672898263883536e-05, "loss": 0.6064, "step": 5954 }, { "epoch": 0.62, "learning_rate": 6.669719001028365e-05, "loss": 0.6979, "step": 5955 }, { "epoch": 0.62, "learning_rate": 6.666540116733611e-05, "loss": 0.6858, "step": 5956 }, { "epoch": 0.62, "learning_rate": 6.663361611360634e-05, "loss": 0.7559, "step": 5957 }, { "epoch": 0.62, "learning_rate": 6.660183485270741e-05, "loss": 0.6796, "step": 5958 }, { "epoch": 0.62, "learning_rate": 6.657005738825193e-05, "loss": 0.6618, "step": 5959 }, { "epoch": 0.62, "learning_rate": 6.653828372385212e-05, "loss": 0.6462, "step": 5960 }, { "epoch": 0.62, "learning_rate": 6.65065138631198e-05, "loss": 0.6391, "step": 5961 }, { "epoch": 0.62, "learning_rate": 6.647474780966626e-05, "loss": 0.6345, "step": 5962 }, { "epoch": 0.62, "learning_rate": 6.644298556710243e-05, "loss": 0.6208, "step": 5963 }, { "epoch": 0.62, "learning_rate": 6.641122713903887e-05, "loss": 0.6353, "step": 5964 }, { "epoch": 0.62, "learning_rate": 6.637947252908554e-05, "loss": 0.6892, "step": 5965 }, { "epoch": 0.62, "learning_rate": 6.634772174085211e-05, "loss": 0.6804, "step": 5966 }, { "epoch": 0.62, "learning_rate": 6.631597477794778e-05, "loss": 0.711, "step": 5967 }, { "epoch": 0.62, "learning_rate": 6.628423164398121e-05, "loss": 0.7391, "step": 5968 }, { "epoch": 0.62, "learning_rate": 6.625249234256077e-05, "loss": 0.7376, "step": 5969 }, { "epoch": 0.62, "learning_rate": 6.622075687729436e-05, "loss": 0.6638, "step": 5970 }, { "epoch": 0.62, "learning_rate": 6.618902525178936e-05, "loss": 0.7082, "step": 5971 }, { "epoch": 0.62, "learning_rate": 6.615729746965283e-05, "loss": 0.6673, "step": 5972 }, { "epoch": 0.62, "learning_rate": 6.612557353449134e-05, "loss": 0.6785, "step": 5973 }, { "epoch": 0.62, "learning_rate": 6.609385344991094e-05, "loss": 0.6859, "step": 5974 }, { "epoch": 0.62, "learning_rate": 6.606213721951742e-05, "loss": 0.6448, "step": 5975 }, { "epoch": 0.62, "learning_rate": 6.603042484691598e-05, "loss": 0.6933, "step": 5976 }, { "epoch": 0.62, "learning_rate": 6.599871633571141e-05, "loss": 0.6958, "step": 5977 }, { "epoch": 0.62, "learning_rate": 6.596701168950818e-05, "loss": 0.605, "step": 5978 }, { "epoch": 0.62, "learning_rate": 6.593531091191015e-05, "loss": 0.6667, "step": 5979 }, { "epoch": 0.62, "learning_rate": 6.590361400652081e-05, "loss": 0.7271, "step": 5980 }, { "epoch": 0.62, "learning_rate": 6.58719209769433e-05, "loss": 0.6531, "step": 5981 }, { "epoch": 0.62, "learning_rate": 6.584023182678012e-05, "loss": 0.6746, "step": 5982 }, { "epoch": 0.62, "learning_rate": 6.580854655963353e-05, "loss": 0.6731, "step": 5983 }, { "epoch": 0.62, "learning_rate": 6.577686517910528e-05, "loss": 0.6434, "step": 5984 }, { "epoch": 0.62, "learning_rate": 6.574518768879662e-05, "loss": 0.6991, "step": 5985 }, { "epoch": 0.62, "learning_rate": 6.571351409230837e-05, "loss": 0.7731, "step": 5986 }, { "epoch": 0.62, "learning_rate": 6.568184439324101e-05, "loss": 0.6888, "step": 5987 }, { "epoch": 0.62, "learning_rate": 6.565017859519444e-05, "loss": 0.5749, "step": 5988 }, { "epoch": 0.62, "learning_rate": 6.561851670176821e-05, "loss": 0.6355, "step": 5989 }, { "epoch": 0.62, "learning_rate": 6.558685871656143e-05, "loss": 0.708, "step": 5990 }, { "epoch": 0.62, "learning_rate": 6.555520464317269e-05, "loss": 0.6357, "step": 5991 }, { "epoch": 0.62, "learning_rate": 6.552355448520018e-05, "loss": 0.6863, "step": 5992 }, { "epoch": 0.62, "learning_rate": 6.549190824624168e-05, "loss": 0.6696, "step": 5993 }, { "epoch": 0.62, "learning_rate": 6.546026592989442e-05, "loss": 0.718, "step": 5994 }, { "epoch": 0.62, "learning_rate": 6.542862753975536e-05, "loss": 0.6614, "step": 5995 }, { "epoch": 0.62, "learning_rate": 6.539699307942078e-05, "loss": 0.7115, "step": 5996 }, { "epoch": 0.62, "learning_rate": 6.536536255248673e-05, "loss": 0.6732, "step": 5997 }, { "epoch": 0.62, "learning_rate": 6.533373596254868e-05, "loss": 0.6651, "step": 5998 }, { "epoch": 0.62, "learning_rate": 6.530211331320171e-05, "loss": 0.6726, "step": 5999 }, { "epoch": 0.62, "learning_rate": 6.527049460804043e-05, "loss": 0.612, "step": 6000 }, { "epoch": 0.62, "learning_rate": 6.523887985065903e-05, "loss": 0.6644, "step": 6001 }, { "epoch": 0.62, "learning_rate": 6.520726904465117e-05, "loss": 0.6955, "step": 6002 }, { "epoch": 0.62, "learning_rate": 6.517566219361019e-05, "loss": 0.6919, "step": 6003 }, { "epoch": 0.62, "learning_rate": 6.514405930112889e-05, "loss": 0.6657, "step": 6004 }, { "epoch": 0.63, "learning_rate": 6.511246037079964e-05, "loss": 0.7234, "step": 6005 }, { "epoch": 0.63, "learning_rate": 6.50808654062143e-05, "loss": 0.6429, "step": 6006 }, { "epoch": 0.63, "learning_rate": 6.504927441096447e-05, "loss": 0.6834, "step": 6007 }, { "epoch": 0.63, "learning_rate": 6.501768738864102e-05, "loss": 0.7081, "step": 6008 }, { "epoch": 0.63, "learning_rate": 6.498610434283463e-05, "loss": 0.6671, "step": 6009 }, { "epoch": 0.63, "learning_rate": 6.495452527713538e-05, "loss": 0.6801, "step": 6010 }, { "epoch": 0.63, "learning_rate": 6.49229501951329e-05, "loss": 0.639, "step": 6011 }, { "epoch": 0.63, "learning_rate": 6.489137910041642e-05, "loss": 0.7204, "step": 6012 }, { "epoch": 0.63, "learning_rate": 6.485981199657474e-05, "loss": 0.5915, "step": 6013 }, { "epoch": 0.63, "learning_rate": 6.482824888719609e-05, "loss": 0.7287, "step": 6014 }, { "epoch": 0.63, "learning_rate": 6.479668977586839e-05, "loss": 0.6487, "step": 6015 }, { "epoch": 0.63, "learning_rate": 6.476513466617895e-05, "loss": 0.6353, "step": 6016 }, { "epoch": 0.63, "learning_rate": 6.473358356171478e-05, "loss": 0.6493, "step": 6017 }, { "epoch": 0.63, "learning_rate": 6.470203646606237e-05, "loss": 0.6628, "step": 6018 }, { "epoch": 0.63, "learning_rate": 6.467049338280766e-05, "loss": 0.6736, "step": 6019 }, { "epoch": 0.63, "learning_rate": 6.46389543155363e-05, "loss": 0.6769, "step": 6020 }, { "epoch": 0.63, "learning_rate": 6.460741926783342e-05, "loss": 0.6682, "step": 6021 }, { "epoch": 0.63, "learning_rate": 6.45758882432836e-05, "loss": 0.6954, "step": 6022 }, { "epoch": 0.63, "learning_rate": 6.454436124547112e-05, "loss": 0.6095, "step": 6023 }, { "epoch": 0.63, "learning_rate": 6.45128382779797e-05, "loss": 0.6641, "step": 6024 }, { "epoch": 0.63, "learning_rate": 6.448131934439257e-05, "loss": 0.6735, "step": 6025 }, { "epoch": 0.63, "learning_rate": 6.444980444829263e-05, "loss": 0.6409, "step": 6026 }, { "epoch": 0.63, "learning_rate": 6.441829359326223e-05, "loss": 0.6884, "step": 6027 }, { "epoch": 0.63, "learning_rate": 6.438678678288325e-05, "loss": 0.6915, "step": 6028 }, { "epoch": 0.63, "learning_rate": 6.435528402073718e-05, "loss": 0.693, "step": 6029 }, { "epoch": 0.63, "learning_rate": 6.432378531040499e-05, "loss": 0.653, "step": 6030 }, { "epoch": 0.63, "learning_rate": 6.429229065546718e-05, "loss": 0.7317, "step": 6031 }, { "epoch": 0.63, "learning_rate": 6.426080005950383e-05, "loss": 0.6515, "step": 6032 }, { "epoch": 0.63, "learning_rate": 6.422931352609461e-05, "loss": 0.6764, "step": 6033 }, { "epoch": 0.63, "learning_rate": 6.419783105881859e-05, "loss": 0.6128, "step": 6034 }, { "epoch": 0.63, "learning_rate": 6.416635266125448e-05, "loss": 0.7201, "step": 6035 }, { "epoch": 0.63, "learning_rate": 6.413487833698048e-05, "loss": 0.6741, "step": 6036 }, { "epoch": 0.63, "learning_rate": 6.410340808957437e-05, "loss": 0.6557, "step": 6037 }, { "epoch": 0.63, "learning_rate": 6.407194192261345e-05, "loss": 0.699, "step": 6038 }, { "epoch": 0.63, "learning_rate": 6.40404798396745e-05, "loss": 0.7398, "step": 6039 }, { "epoch": 0.63, "learning_rate": 6.400902184433392e-05, "loss": 0.6588, "step": 6040 }, { "epoch": 0.63, "learning_rate": 6.397756794016763e-05, "loss": 0.624, "step": 6041 }, { "epoch": 0.63, "learning_rate": 6.394611813075102e-05, "loss": 0.607, "step": 6042 }, { "epoch": 0.63, "learning_rate": 6.39146724196591e-05, "loss": 0.7052, "step": 6043 }, { "epoch": 0.63, "learning_rate": 6.388323081046636e-05, "loss": 0.6623, "step": 6044 }, { "epoch": 0.63, "learning_rate": 6.385179330674681e-05, "loss": 0.6947, "step": 6045 }, { "epoch": 0.63, "learning_rate": 6.382035991207403e-05, "loss": 0.6623, "step": 6046 }, { "epoch": 0.63, "learning_rate": 6.37889306300212e-05, "loss": 0.6954, "step": 6047 }, { "epoch": 0.63, "learning_rate": 6.375750546416082e-05, "loss": 0.642, "step": 6048 }, { "epoch": 0.63, "learning_rate": 6.372608441806518e-05, "loss": 0.6608, "step": 6049 }, { "epoch": 0.63, "learning_rate": 6.369466749530594e-05, "loss": 0.7, "step": 6050 }, { "epoch": 0.63, "learning_rate": 6.366325469945428e-05, "loss": 0.6605, "step": 6051 }, { "epoch": 0.63, "learning_rate": 6.363184603408101e-05, "loss": 0.7313, "step": 6052 }, { "epoch": 0.63, "learning_rate": 6.360044150275646e-05, "loss": 0.624, "step": 6053 }, { "epoch": 0.63, "learning_rate": 6.356904110905036e-05, "loss": 0.6656, "step": 6054 }, { "epoch": 0.63, "learning_rate": 6.353764485653216e-05, "loss": 0.7128, "step": 6055 }, { "epoch": 0.63, "learning_rate": 6.350625274877067e-05, "loss": 0.6796, "step": 6056 }, { "epoch": 0.63, "learning_rate": 6.34748647893343e-05, "loss": 0.6725, "step": 6057 }, { "epoch": 0.63, "learning_rate": 6.344348098179105e-05, "loss": 0.6877, "step": 6058 }, { "epoch": 0.63, "learning_rate": 6.341210132970833e-05, "loss": 0.627, "step": 6059 }, { "epoch": 0.63, "learning_rate": 6.338072583665314e-05, "loss": 0.7243, "step": 6060 }, { "epoch": 0.63, "learning_rate": 6.334935450619207e-05, "loss": 0.6942, "step": 6061 }, { "epoch": 0.63, "learning_rate": 6.33179873418911e-05, "loss": 0.6625, "step": 6062 }, { "epoch": 0.63, "learning_rate": 6.328662434731578e-05, "loss": 0.6902, "step": 6063 }, { "epoch": 0.63, "learning_rate": 6.325526552603129e-05, "loss": 0.6821, "step": 6064 }, { "epoch": 0.63, "learning_rate": 6.32239108816022e-05, "loss": 0.6267, "step": 6065 }, { "epoch": 0.63, "learning_rate": 6.319256041759266e-05, "loss": 0.7847, "step": 6066 }, { "epoch": 0.63, "learning_rate": 6.316121413756642e-05, "loss": 0.6617, "step": 6067 }, { "epoch": 0.63, "learning_rate": 6.31298720450866e-05, "loss": 0.6329, "step": 6068 }, { "epoch": 0.63, "learning_rate": 6.309853414371594e-05, "loss": 0.6657, "step": 6069 }, { "epoch": 0.63, "learning_rate": 6.306720043701675e-05, "loss": 0.6926, "step": 6070 }, { "epoch": 0.63, "learning_rate": 6.30358709285507e-05, "loss": 0.6529, "step": 6071 }, { "epoch": 0.63, "learning_rate": 6.300454562187913e-05, "loss": 0.6894, "step": 6072 }, { "epoch": 0.63, "learning_rate": 6.297322452056293e-05, "loss": 0.6761, "step": 6073 }, { "epoch": 0.63, "learning_rate": 6.294190762816234e-05, "loss": 0.6764, "step": 6074 }, { "epoch": 0.63, "learning_rate": 6.291059494823726e-05, "loss": 0.7029, "step": 6075 }, { "epoch": 0.63, "learning_rate": 6.287928648434706e-05, "loss": 0.6936, "step": 6076 }, { "epoch": 0.63, "learning_rate": 6.284798224005064e-05, "loss": 0.6538, "step": 6077 }, { "epoch": 0.63, "learning_rate": 6.281668221890648e-05, "loss": 0.6703, "step": 6078 }, { "epoch": 0.63, "learning_rate": 6.278538642447242e-05, "loss": 0.6309, "step": 6079 }, { "epoch": 0.63, "learning_rate": 6.2754094860306e-05, "loss": 0.6921, "step": 6080 }, { "epoch": 0.63, "learning_rate": 6.272280752996418e-05, "loss": 0.6693, "step": 6081 }, { "epoch": 0.63, "learning_rate": 6.269152443700345e-05, "loss": 0.6608, "step": 6082 }, { "epoch": 0.63, "learning_rate": 6.266024558497984e-05, "loss": 0.7815, "step": 6083 }, { "epoch": 0.63, "learning_rate": 6.262897097744891e-05, "loss": 0.6445, "step": 6084 }, { "epoch": 0.63, "learning_rate": 6.259770061796566e-05, "loss": 0.6631, "step": 6085 }, { "epoch": 0.63, "learning_rate": 6.256643451008467e-05, "loss": 0.6376, "step": 6086 }, { "epoch": 0.63, "learning_rate": 6.25351726573601e-05, "loss": 0.6914, "step": 6087 }, { "epoch": 0.63, "learning_rate": 6.250391506334547e-05, "loss": 0.5884, "step": 6088 }, { "epoch": 0.63, "learning_rate": 6.247266173159391e-05, "loss": 0.6493, "step": 6089 }, { "epoch": 0.63, "learning_rate": 6.244141266565814e-05, "loss": 0.7461, "step": 6090 }, { "epoch": 0.63, "learning_rate": 6.241016786909019e-05, "loss": 0.6968, "step": 6091 }, { "epoch": 0.63, "learning_rate": 6.23789273454418e-05, "loss": 0.5547, "step": 6092 }, { "epoch": 0.63, "learning_rate": 6.234769109826415e-05, "loss": 0.6351, "step": 6093 }, { "epoch": 0.63, "learning_rate": 6.231645913110789e-05, "loss": 0.6506, "step": 6094 }, { "epoch": 0.63, "learning_rate": 6.22852314475233e-05, "loss": 0.727, "step": 6095 }, { "epoch": 0.63, "learning_rate": 6.225400805105999e-05, "loss": 0.7435, "step": 6096 }, { "epoch": 0.63, "learning_rate": 6.222278894526726e-05, "loss": 0.67, "step": 6097 }, { "epoch": 0.63, "learning_rate": 6.21915741336939e-05, "loss": 0.6146, "step": 6098 }, { "epoch": 0.63, "learning_rate": 6.216036361988807e-05, "loss": 0.6891, "step": 6099 }, { "epoch": 0.63, "learning_rate": 6.21291574073976e-05, "loss": 0.629, "step": 6100 }, { "epoch": 0.64, "learning_rate": 6.209795549976977e-05, "loss": 0.6992, "step": 6101 }, { "epoch": 0.64, "learning_rate": 6.206675790055134e-05, "loss": 0.6597, "step": 6102 }, { "epoch": 0.64, "learning_rate": 6.203556461328862e-05, "loss": 0.7292, "step": 6103 }, { "epoch": 0.64, "learning_rate": 6.200437564152743e-05, "loss": 0.7174, "step": 6104 }, { "epoch": 0.64, "learning_rate": 6.197319098881307e-05, "loss": 0.6587, "step": 6105 }, { "epoch": 0.64, "learning_rate": 6.194201065869041e-05, "loss": 0.668, "step": 6106 }, { "epoch": 0.64, "learning_rate": 6.191083465470376e-05, "loss": 0.6057, "step": 6107 }, { "epoch": 0.64, "learning_rate": 6.187966298039696e-05, "loss": 0.6508, "step": 6108 }, { "epoch": 0.64, "learning_rate": 6.184849563931335e-05, "loss": 0.6411, "step": 6109 }, { "epoch": 0.64, "learning_rate": 6.181733263499584e-05, "loss": 0.6397, "step": 6110 }, { "epoch": 0.64, "learning_rate": 6.178617397098674e-05, "loss": 0.6811, "step": 6111 }, { "epoch": 0.64, "learning_rate": 6.175501965082796e-05, "loss": 0.6784, "step": 6112 }, { "epoch": 0.64, "learning_rate": 6.172386967806088e-05, "loss": 0.6464, "step": 6113 }, { "epoch": 0.64, "learning_rate": 6.169272405622638e-05, "loss": 0.7063, "step": 6114 }, { "epoch": 0.64, "learning_rate": 6.166158278886487e-05, "loss": 0.6417, "step": 6115 }, { "epoch": 0.64, "learning_rate": 6.163044587951619e-05, "loss": 0.7253, "step": 6116 }, { "epoch": 0.64, "learning_rate": 6.159931333171977e-05, "loss": 0.6715, "step": 6117 }, { "epoch": 0.64, "learning_rate": 6.156818514901457e-05, "loss": 0.6408, "step": 6118 }, { "epoch": 0.64, "learning_rate": 6.153706133493892e-05, "loss": 0.6327, "step": 6119 }, { "epoch": 0.64, "learning_rate": 6.150594189303079e-05, "loss": 0.6086, "step": 6120 }, { "epoch": 0.64, "learning_rate": 6.147482682682759e-05, "loss": 0.639, "step": 6121 }, { "epoch": 0.64, "learning_rate": 6.144371613986619e-05, "loss": 0.7053, "step": 6122 }, { "epoch": 0.64, "learning_rate": 6.141260983568302e-05, "loss": 0.6827, "step": 6123 }, { "epoch": 0.64, "learning_rate": 6.138150791781408e-05, "loss": 0.6519, "step": 6124 }, { "epoch": 0.64, "learning_rate": 6.13504103897947e-05, "loss": 0.6284, "step": 6125 }, { "epoch": 0.64, "learning_rate": 6.131931725515987e-05, "loss": 0.6293, "step": 6126 }, { "epoch": 0.64, "learning_rate": 6.128822851744401e-05, "loss": 0.6188, "step": 6127 }, { "epoch": 0.64, "learning_rate": 6.125714418018096e-05, "loss": 0.6562, "step": 6128 }, { "epoch": 0.64, "learning_rate": 6.122606424690422e-05, "loss": 0.6792, "step": 6129 }, { "epoch": 0.64, "learning_rate": 6.119498872114677e-05, "loss": 0.7001, "step": 6130 }, { "epoch": 0.64, "learning_rate": 6.116391760644091e-05, "loss": 0.6768, "step": 6131 }, { "epoch": 0.64, "learning_rate": 6.113285090631866e-05, "loss": 0.6184, "step": 6132 }, { "epoch": 0.64, "learning_rate": 6.11017886243114e-05, "loss": 0.6372, "step": 6133 }, { "epoch": 0.64, "learning_rate": 6.107073076395003e-05, "loss": 0.6229, "step": 6134 }, { "epoch": 0.64, "learning_rate": 6.103967732876501e-05, "loss": 0.6493, "step": 6135 }, { "epoch": 0.64, "learning_rate": 6.10086283222862e-05, "loss": 0.7282, "step": 6136 }, { "epoch": 0.64, "learning_rate": 6.097758374804304e-05, "loss": 0.6844, "step": 6137 }, { "epoch": 0.64, "learning_rate": 6.0946543609564476e-05, "loss": 0.7157, "step": 6138 }, { "epoch": 0.64, "learning_rate": 6.091550791037886e-05, "loss": 0.6402, "step": 6139 }, { "epoch": 0.64, "learning_rate": 6.0884476654014044e-05, "loss": 0.6709, "step": 6140 }, { "epoch": 0.64, "learning_rate": 6.0853449843997544e-05, "loss": 0.6594, "step": 6141 }, { "epoch": 0.64, "learning_rate": 6.0822427483856115e-05, "loss": 0.6438, "step": 6142 }, { "epoch": 0.64, "learning_rate": 6.079140957711622e-05, "loss": 0.7329, "step": 6143 }, { "epoch": 0.64, "learning_rate": 6.076039612730373e-05, "loss": 0.6814, "step": 6144 }, { "epoch": 0.64, "learning_rate": 6.0729387137943984e-05, "loss": 0.665, "step": 6145 }, { "epoch": 0.64, "learning_rate": 6.069838261256182e-05, "loss": 0.6807, "step": 6146 }, { "epoch": 0.64, "learning_rate": 6.066738255468167e-05, "loss": 0.5714, "step": 6147 }, { "epoch": 0.64, "learning_rate": 6.0636386967827295e-05, "loss": 0.6636, "step": 6148 }, { "epoch": 0.64, "learning_rate": 6.0605395855522075e-05, "loss": 0.7254, "step": 6149 }, { "epoch": 0.64, "learning_rate": 6.0574409221288874e-05, "loss": 0.6507, "step": 6150 }, { "epoch": 0.64, "learning_rate": 6.054342706864994e-05, "loss": 0.5872, "step": 6151 }, { "epoch": 0.64, "learning_rate": 6.051244940112709e-05, "loss": 0.6033, "step": 6152 }, { "epoch": 0.64, "learning_rate": 6.0481476222241694e-05, "loss": 0.6659, "step": 6153 }, { "epoch": 0.64, "learning_rate": 6.0450507535514456e-05, "loss": 0.6402, "step": 6154 }, { "epoch": 0.64, "learning_rate": 6.041954334446573e-05, "loss": 0.6561, "step": 6155 }, { "epoch": 0.64, "learning_rate": 6.0388583652615216e-05, "loss": 0.701, "step": 6156 }, { "epoch": 0.64, "learning_rate": 6.035762846348221e-05, "loss": 0.6901, "step": 6157 }, { "epoch": 0.64, "learning_rate": 6.032667778058547e-05, "loss": 0.7145, "step": 6158 }, { "epoch": 0.64, "learning_rate": 6.02957316074432e-05, "loss": 0.68, "step": 6159 }, { "epoch": 0.64, "learning_rate": 6.026478994757311e-05, "loss": 0.6627, "step": 6160 }, { "epoch": 0.64, "learning_rate": 6.0233852804492474e-05, "loss": 0.6843, "step": 6161 }, { "epoch": 0.64, "learning_rate": 6.020292018171788e-05, "loss": 0.7106, "step": 6162 }, { "epoch": 0.64, "learning_rate": 6.0171992082765586e-05, "loss": 0.6324, "step": 6163 }, { "epoch": 0.64, "learning_rate": 6.0141068511151266e-05, "loss": 0.5935, "step": 6164 }, { "epoch": 0.64, "learning_rate": 6.011014947039002e-05, "loss": 0.6965, "step": 6165 }, { "epoch": 0.64, "learning_rate": 6.007923496399648e-05, "loss": 0.6368, "step": 6166 }, { "epoch": 0.64, "learning_rate": 6.004832499548485e-05, "loss": 0.6972, "step": 6167 }, { "epoch": 0.64, "learning_rate": 6.0017419568368626e-05, "loss": 0.7113, "step": 6168 }, { "epoch": 0.64, "learning_rate": 5.9986518686160955e-05, "loss": 0.631, "step": 6169 }, { "epoch": 0.64, "learning_rate": 5.995562235237444e-05, "loss": 0.6863, "step": 6170 }, { "epoch": 0.64, "learning_rate": 5.992473057052107e-05, "loss": 0.6802, "step": 6171 }, { "epoch": 0.64, "learning_rate": 5.989384334411239e-05, "loss": 0.6764, "step": 6172 }, { "epoch": 0.64, "learning_rate": 5.986296067665948e-05, "loss": 0.5872, "step": 6173 }, { "epoch": 0.64, "learning_rate": 5.983208257167278e-05, "loss": 0.6635, "step": 6174 }, { "epoch": 0.64, "learning_rate": 5.9801209032662306e-05, "loss": 0.7144, "step": 6175 }, { "epoch": 0.64, "learning_rate": 5.9770340063137486e-05, "loss": 0.636, "step": 6176 }, { "epoch": 0.64, "learning_rate": 5.9739475666607304e-05, "loss": 0.6877, "step": 6177 }, { "epoch": 0.64, "learning_rate": 5.9708615846580165e-05, "loss": 0.6212, "step": 6178 }, { "epoch": 0.64, "learning_rate": 5.967776060656397e-05, "loss": 0.7044, "step": 6179 }, { "epoch": 0.64, "learning_rate": 5.96469099500661e-05, "loss": 0.6604, "step": 6180 }, { "epoch": 0.64, "learning_rate": 5.9616063880593455e-05, "loss": 0.6146, "step": 6181 }, { "epoch": 0.64, "learning_rate": 5.958522240165231e-05, "loss": 0.7057, "step": 6182 }, { "epoch": 0.64, "learning_rate": 5.9554385516748536e-05, "loss": 0.7036, "step": 6183 }, { "epoch": 0.64, "learning_rate": 5.952355322938742e-05, "loss": 0.6626, "step": 6184 }, { "epoch": 0.64, "learning_rate": 5.9492725543073726e-05, "loss": 0.6398, "step": 6185 }, { "epoch": 0.64, "learning_rate": 5.946190246131169e-05, "loss": 0.6734, "step": 6186 }, { "epoch": 0.64, "learning_rate": 5.9431083987605106e-05, "loss": 0.6618, "step": 6187 }, { "epoch": 0.64, "learning_rate": 5.9400270125457105e-05, "loss": 0.7086, "step": 6188 }, { "epoch": 0.64, "learning_rate": 5.93694608783704e-05, "loss": 0.6534, "step": 6189 }, { "epoch": 0.64, "learning_rate": 5.9338656249847135e-05, "loss": 0.6912, "step": 6190 }, { "epoch": 0.64, "learning_rate": 5.930785624338897e-05, "loss": 0.6682, "step": 6191 }, { "epoch": 0.64, "learning_rate": 5.927706086249695e-05, "loss": 0.5949, "step": 6192 }, { "epoch": 0.64, "learning_rate": 5.924627011067173e-05, "loss": 0.7146, "step": 6193 }, { "epoch": 0.64, "learning_rate": 5.921548399141329e-05, "loss": 0.6571, "step": 6194 }, { "epoch": 0.64, "learning_rate": 5.918470250822123e-05, "loss": 0.7143, "step": 6195 }, { "epoch": 0.64, "learning_rate": 5.9153925664594456e-05, "loss": 0.6676, "step": 6196 }, { "epoch": 0.65, "learning_rate": 5.912315346403153e-05, "loss": 0.624, "step": 6197 }, { "epoch": 0.65, "learning_rate": 5.909238591003038e-05, "loss": 0.6932, "step": 6198 }, { "epoch": 0.65, "learning_rate": 5.906162300608835e-05, "loss": 0.7088, "step": 6199 }, { "epoch": 0.65, "learning_rate": 5.90308647557024e-05, "loss": 0.5762, "step": 6200 }, { "epoch": 0.65, "learning_rate": 5.90001111623689e-05, "loss": 0.619, "step": 6201 }, { "epoch": 0.65, "learning_rate": 5.8969362229583606e-05, "loss": 0.6297, "step": 6202 }, { "epoch": 0.65, "learning_rate": 5.893861796084187e-05, "loss": 0.6816, "step": 6203 }, { "epoch": 0.65, "learning_rate": 5.890787835963847e-05, "loss": 0.7028, "step": 6204 }, { "epoch": 0.65, "learning_rate": 5.8877143429467595e-05, "loss": 0.6233, "step": 6205 }, { "epoch": 0.65, "learning_rate": 5.884641317382298e-05, "loss": 0.7204, "step": 6206 }, { "epoch": 0.65, "learning_rate": 5.8815687596197846e-05, "loss": 0.6826, "step": 6207 }, { "epoch": 0.65, "learning_rate": 5.878496670008474e-05, "loss": 0.695, "step": 6208 }, { "epoch": 0.65, "learning_rate": 5.875425048897586e-05, "loss": 0.6706, "step": 6209 }, { "epoch": 0.65, "learning_rate": 5.872353896636278e-05, "loss": 0.6489, "step": 6210 }, { "epoch": 0.65, "learning_rate": 5.869283213573646e-05, "loss": 0.6729, "step": 6211 }, { "epoch": 0.65, "learning_rate": 5.86621300005875e-05, "loss": 0.6606, "step": 6212 }, { "epoch": 0.65, "learning_rate": 5.8631432564405886e-05, "loss": 0.6492, "step": 6213 }, { "epoch": 0.65, "learning_rate": 5.860073983068099e-05, "loss": 0.6742, "step": 6214 }, { "epoch": 0.65, "learning_rate": 5.8570051802901815e-05, "loss": 0.699, "step": 6215 }, { "epoch": 0.65, "learning_rate": 5.8539368484556666e-05, "loss": 0.603, "step": 6216 }, { "epoch": 0.65, "learning_rate": 5.850868987913338e-05, "loss": 0.6414, "step": 6217 }, { "epoch": 0.65, "learning_rate": 5.847801599011933e-05, "loss": 0.7003, "step": 6218 }, { "epoch": 0.65, "learning_rate": 5.8447346821001203e-05, "loss": 0.6262, "step": 6219 }, { "epoch": 0.65, "learning_rate": 5.841668237526527e-05, "loss": 0.6546, "step": 6220 }, { "epoch": 0.65, "learning_rate": 5.838602265639728e-05, "loss": 0.6986, "step": 6221 }, { "epoch": 0.65, "learning_rate": 5.835536766788228e-05, "loss": 0.6687, "step": 6222 }, { "epoch": 0.65, "learning_rate": 5.832471741320495e-05, "loss": 0.6351, "step": 6223 }, { "epoch": 0.65, "learning_rate": 5.829407189584944e-05, "loss": 0.6886, "step": 6224 }, { "epoch": 0.65, "learning_rate": 5.82634311192992e-05, "loss": 0.6687, "step": 6225 }, { "epoch": 0.65, "learning_rate": 5.823279508703723e-05, "loss": 0.7293, "step": 6226 }, { "epoch": 0.65, "learning_rate": 5.820216380254606e-05, "loss": 0.6265, "step": 6227 }, { "epoch": 0.65, "learning_rate": 5.8171537269307544e-05, "loss": 0.6592, "step": 6228 }, { "epoch": 0.65, "learning_rate": 5.81409154908031e-05, "loss": 0.6586, "step": 6229 }, { "epoch": 0.65, "learning_rate": 5.8110298470513635e-05, "loss": 0.6952, "step": 6230 }, { "epoch": 0.65, "learning_rate": 5.807968621191935e-05, "loss": 0.6792, "step": 6231 }, { "epoch": 0.65, "learning_rate": 5.804907871850005e-05, "loss": 0.6744, "step": 6232 }, { "epoch": 0.65, "learning_rate": 5.801847599373502e-05, "loss": 0.614, "step": 6233 }, { "epoch": 0.65, "learning_rate": 5.798787804110284e-05, "loss": 0.65, "step": 6234 }, { "epoch": 0.65, "learning_rate": 5.795728486408172e-05, "loss": 0.707, "step": 6235 }, { "epoch": 0.65, "learning_rate": 5.792669646614919e-05, "loss": 0.6099, "step": 6236 }, { "epoch": 0.65, "learning_rate": 5.789611285078234e-05, "loss": 0.6576, "step": 6237 }, { "epoch": 0.65, "learning_rate": 5.786553402145769e-05, "loss": 0.6292, "step": 6238 }, { "epoch": 0.65, "learning_rate": 5.78349599816512e-05, "loss": 0.6897, "step": 6239 }, { "epoch": 0.65, "learning_rate": 5.780439073483824e-05, "loss": 0.6521, "step": 6240 }, { "epoch": 0.65, "learning_rate": 5.777382628449376e-05, "loss": 0.6649, "step": 6241 }, { "epoch": 0.65, "learning_rate": 5.7743266634091995e-05, "loss": 0.691, "step": 6242 }, { "epoch": 0.65, "learning_rate": 5.77127117871068e-05, "loss": 0.7037, "step": 6243 }, { "epoch": 0.65, "learning_rate": 5.768216174701142e-05, "loss": 0.6648, "step": 6244 }, { "epoch": 0.65, "learning_rate": 5.765161651727849e-05, "loss": 0.7004, "step": 6245 }, { "epoch": 0.65, "learning_rate": 5.7621076101380165e-05, "loss": 0.6181, "step": 6246 }, { "epoch": 0.65, "learning_rate": 5.759054050278812e-05, "loss": 0.6878, "step": 6247 }, { "epoch": 0.65, "learning_rate": 5.7560009724973286e-05, "loss": 0.6652, "step": 6248 }, { "epoch": 0.65, "learning_rate": 5.752948377140623e-05, "loss": 0.6323, "step": 6249 }, { "epoch": 0.65, "learning_rate": 5.7498962645556934e-05, "loss": 0.6733, "step": 6250 }, { "epoch": 0.65, "learning_rate": 5.746844635089477e-05, "loss": 0.7154, "step": 6251 }, { "epoch": 0.65, "learning_rate": 5.743793489088853e-05, "loss": 0.7114, "step": 6252 }, { "epoch": 0.65, "learning_rate": 5.740742826900664e-05, "loss": 0.6382, "step": 6253 }, { "epoch": 0.65, "learning_rate": 5.737692648871674e-05, "loss": 0.6955, "step": 6254 }, { "epoch": 0.65, "learning_rate": 5.734642955348613e-05, "loss": 0.6582, "step": 6255 }, { "epoch": 0.65, "learning_rate": 5.731593746678139e-05, "loss": 0.6871, "step": 6256 }, { "epoch": 0.65, "learning_rate": 5.728545023206864e-05, "loss": 0.6759, "step": 6257 }, { "epoch": 0.65, "learning_rate": 5.725496785281349e-05, "loss": 0.6955, "step": 6258 }, { "epoch": 0.65, "learning_rate": 5.722449033248086e-05, "loss": 0.6884, "step": 6259 }, { "epoch": 0.65, "learning_rate": 5.7194017674535224e-05, "loss": 0.7057, "step": 6260 }, { "epoch": 0.65, "learning_rate": 5.716354988244055e-05, "loss": 0.6386, "step": 6261 }, { "epoch": 0.65, "learning_rate": 5.7133086959660044e-05, "loss": 0.6355, "step": 6262 }, { "epoch": 0.65, "learning_rate": 5.710262890965663e-05, "loss": 0.612, "step": 6263 }, { "epoch": 0.65, "learning_rate": 5.7072175735892416e-05, "loss": 0.6561, "step": 6264 }, { "epoch": 0.65, "learning_rate": 5.70417274418292e-05, "loss": 0.6336, "step": 6265 }, { "epoch": 0.65, "learning_rate": 5.701128403092799e-05, "loss": 0.6033, "step": 6266 }, { "epoch": 0.65, "learning_rate": 5.698084550664948e-05, "loss": 0.6092, "step": 6267 }, { "epoch": 0.65, "learning_rate": 5.695041187245357e-05, "loss": 0.689, "step": 6268 }, { "epoch": 0.65, "learning_rate": 5.691998313179976e-05, "loss": 0.626, "step": 6269 }, { "epoch": 0.65, "learning_rate": 5.688955928814701e-05, "loss": 0.679, "step": 6270 }, { "epoch": 0.65, "learning_rate": 5.685914034495359e-05, "loss": 0.66, "step": 6271 }, { "epoch": 0.65, "learning_rate": 5.6828726305677295e-05, "loss": 0.6752, "step": 6272 }, { "epoch": 0.65, "learning_rate": 5.679831717377542e-05, "loss": 0.6938, "step": 6273 }, { "epoch": 0.65, "learning_rate": 5.676791295270456e-05, "loss": 0.6868, "step": 6274 }, { "epoch": 0.65, "learning_rate": 5.673751364592092e-05, "loss": 0.6909, "step": 6275 }, { "epoch": 0.65, "learning_rate": 5.670711925687995e-05, "loss": 0.7334, "step": 6276 }, { "epoch": 0.65, "learning_rate": 5.667672978903673e-05, "loss": 0.69, "step": 6277 }, { "epoch": 0.65, "learning_rate": 5.664634524584568e-05, "loss": 0.6311, "step": 6278 }, { "epoch": 0.65, "learning_rate": 5.661596563076063e-05, "loss": 0.7472, "step": 6279 }, { "epoch": 0.65, "learning_rate": 5.658559094723492e-05, "loss": 0.6878, "step": 6280 }, { "epoch": 0.65, "learning_rate": 5.655522119872138e-05, "loss": 0.566, "step": 6281 }, { "epoch": 0.65, "learning_rate": 5.6524856388672084e-05, "loss": 0.6052, "step": 6282 }, { "epoch": 0.65, "learning_rate": 5.649449652053875e-05, "loss": 0.6065, "step": 6283 }, { "epoch": 0.65, "learning_rate": 5.646414159777248e-05, "loss": 0.6909, "step": 6284 }, { "epoch": 0.65, "learning_rate": 5.6433791623823696e-05, "loss": 0.6149, "step": 6285 }, { "epoch": 0.65, "learning_rate": 5.640344660214238e-05, "loss": 0.799, "step": 6286 }, { "epoch": 0.65, "learning_rate": 5.6373106536177975e-05, "loss": 0.7502, "step": 6287 }, { "epoch": 0.65, "learning_rate": 5.6342771429379215e-05, "loss": 0.692, "step": 6288 }, { "epoch": 0.65, "learning_rate": 5.631244128519444e-05, "loss": 0.685, "step": 6289 }, { "epoch": 0.65, "learning_rate": 5.6282116107071305e-05, "loss": 0.7348, "step": 6290 }, { "epoch": 0.65, "learning_rate": 5.62517958984569e-05, "loss": 0.7018, "step": 6291 }, { "epoch": 0.65, "learning_rate": 5.622148066279786e-05, "loss": 0.686, "step": 6292 }, { "epoch": 0.66, "learning_rate": 5.619117040354014e-05, "loss": 0.5811, "step": 6293 }, { "epoch": 0.66, "learning_rate": 5.616086512412917e-05, "loss": 0.6907, "step": 6294 }, { "epoch": 0.66, "learning_rate": 5.613056482800989e-05, "loss": 0.6722, "step": 6295 }, { "epoch": 0.66, "learning_rate": 5.61002695186265e-05, "loss": 0.6578, "step": 6296 }, { "epoch": 0.66, "learning_rate": 5.606997919942279e-05, "loss": 0.6549, "step": 6297 }, { "epoch": 0.66, "learning_rate": 5.603969387384196e-05, "loss": 0.6319, "step": 6298 }, { "epoch": 0.66, "learning_rate": 5.600941354532654e-05, "loss": 0.7112, "step": 6299 }, { "epoch": 0.66, "learning_rate": 5.5979138217318586e-05, "loss": 0.6549, "step": 6300 }, { "epoch": 0.66, "learning_rate": 5.594886789325961e-05, "loss": 0.661, "step": 6301 }, { "epoch": 0.66, "learning_rate": 5.591860257659043e-05, "loss": 0.6454, "step": 6302 }, { "epoch": 0.66, "learning_rate": 5.588834227075146e-05, "loss": 0.7076, "step": 6303 }, { "epoch": 0.66, "learning_rate": 5.585808697918239e-05, "loss": 0.6659, "step": 6304 }, { "epoch": 0.66, "learning_rate": 5.582783670532239e-05, "loss": 0.7075, "step": 6305 }, { "epoch": 0.66, "learning_rate": 5.57975914526101e-05, "loss": 0.6293, "step": 6306 }, { "epoch": 0.66, "learning_rate": 5.576735122448362e-05, "loss": 0.6863, "step": 6307 }, { "epoch": 0.66, "learning_rate": 5.573711602438032e-05, "loss": 0.6886, "step": 6308 }, { "epoch": 0.66, "learning_rate": 5.570688585573718e-05, "loss": 0.7242, "step": 6309 }, { "epoch": 0.66, "learning_rate": 5.567666072199053e-05, "loss": 0.6661, "step": 6310 }, { "epoch": 0.66, "learning_rate": 5.564644062657607e-05, "loss": 0.7366, "step": 6311 }, { "epoch": 0.66, "learning_rate": 5.561622557292906e-05, "loss": 0.6537, "step": 6312 }, { "epoch": 0.66, "learning_rate": 5.558601556448404e-05, "loss": 0.6279, "step": 6313 }, { "epoch": 0.66, "learning_rate": 5.555581060467507e-05, "loss": 0.6683, "step": 6314 }, { "epoch": 0.66, "learning_rate": 5.552561069693568e-05, "loss": 0.6797, "step": 6315 }, { "epoch": 0.66, "learning_rate": 5.5495415844698706e-05, "loss": 0.6974, "step": 6316 }, { "epoch": 0.66, "learning_rate": 5.546522605139641e-05, "loss": 0.6318, "step": 6317 }, { "epoch": 0.66, "learning_rate": 5.5435041320460644e-05, "loss": 0.6961, "step": 6318 }, { "epoch": 0.66, "learning_rate": 5.540486165532247e-05, "loss": 0.6962, "step": 6319 }, { "epoch": 0.66, "learning_rate": 5.537468705941253e-05, "loss": 0.707, "step": 6320 }, { "epoch": 0.66, "learning_rate": 5.5344517536160856e-05, "loss": 0.6443, "step": 6321 }, { "epoch": 0.66, "learning_rate": 5.531435308899684e-05, "loss": 0.7269, "step": 6322 }, { "epoch": 0.66, "learning_rate": 5.528419372134934e-05, "loss": 0.7091, "step": 6323 }, { "epoch": 0.66, "learning_rate": 5.525403943664672e-05, "loss": 0.6672, "step": 6324 }, { "epoch": 0.66, "learning_rate": 5.522389023831658e-05, "loss": 0.6533, "step": 6325 }, { "epoch": 0.66, "learning_rate": 5.519374612978609e-05, "loss": 0.6714, "step": 6326 }, { "epoch": 0.66, "learning_rate": 5.516360711448183e-05, "loss": 0.6812, "step": 6327 }, { "epoch": 0.66, "learning_rate": 5.513347319582973e-05, "loss": 0.5781, "step": 6328 }, { "epoch": 0.66, "learning_rate": 5.510334437725517e-05, "loss": 0.6187, "step": 6329 }, { "epoch": 0.66, "learning_rate": 5.5073220662183004e-05, "loss": 0.7227, "step": 6330 }, { "epoch": 0.66, "learning_rate": 5.504310205403739e-05, "loss": 0.702, "step": 6331 }, { "epoch": 0.66, "learning_rate": 5.501298855624206e-05, "loss": 0.7234, "step": 6332 }, { "epoch": 0.66, "learning_rate": 5.4982880172219996e-05, "loss": 0.6953, "step": 6333 }, { "epoch": 0.66, "learning_rate": 5.4952776905393756e-05, "loss": 0.6067, "step": 6334 }, { "epoch": 0.66, "learning_rate": 5.4922678759185244e-05, "loss": 0.6669, "step": 6335 }, { "epoch": 0.66, "learning_rate": 5.48925857370157e-05, "loss": 0.6659, "step": 6336 }, { "epoch": 0.66, "learning_rate": 5.486249784230595e-05, "loss": 0.6523, "step": 6337 }, { "epoch": 0.66, "learning_rate": 5.483241507847616e-05, "loss": 0.6601, "step": 6338 }, { "epoch": 0.66, "learning_rate": 5.480233744894583e-05, "loss": 0.6263, "step": 6339 }, { "epoch": 0.66, "learning_rate": 5.477226495713401e-05, "loss": 0.6626, "step": 6340 }, { "epoch": 0.66, "learning_rate": 5.474219760645907e-05, "loss": 0.753, "step": 6341 }, { "epoch": 0.66, "learning_rate": 5.4712135400338884e-05, "loss": 0.7527, "step": 6342 }, { "epoch": 0.66, "learning_rate": 5.4682078342190614e-05, "loss": 0.6823, "step": 6343 }, { "epoch": 0.66, "learning_rate": 5.465202643543099e-05, "loss": 0.6785, "step": 6344 }, { "epoch": 0.66, "learning_rate": 5.4621979683476024e-05, "loss": 0.7077, "step": 6345 }, { "epoch": 0.66, "learning_rate": 5.459193808974119e-05, "loss": 0.6855, "step": 6346 }, { "epoch": 0.66, "learning_rate": 5.4561901657641455e-05, "loss": 0.6956, "step": 6347 }, { "epoch": 0.66, "learning_rate": 5.4531870390591046e-05, "loss": 0.6566, "step": 6348 }, { "epoch": 0.66, "learning_rate": 5.450184429200371e-05, "loss": 0.6942, "step": 6349 }, { "epoch": 0.66, "learning_rate": 5.447182336529263e-05, "loss": 0.6686, "step": 6350 }, { "epoch": 0.66, "learning_rate": 5.4441807613870266e-05, "loss": 0.6876, "step": 6351 }, { "epoch": 0.66, "learning_rate": 5.441179704114866e-05, "loss": 0.628, "step": 6352 }, { "epoch": 0.66, "learning_rate": 5.4381791650539095e-05, "loss": 0.6828, "step": 6353 }, { "epoch": 0.66, "learning_rate": 5.435179144545244e-05, "loss": 0.6741, "step": 6354 }, { "epoch": 0.66, "learning_rate": 5.4321796429298844e-05, "loss": 0.6379, "step": 6355 }, { "epoch": 0.66, "learning_rate": 5.429180660548785e-05, "loss": 0.7147, "step": 6356 }, { "epoch": 0.66, "learning_rate": 5.4261821977428527e-05, "loss": 0.6297, "step": 6357 }, { "epoch": 0.66, "learning_rate": 5.423184254852931e-05, "loss": 0.6739, "step": 6358 }, { "epoch": 0.66, "learning_rate": 5.4201868322197976e-05, "loss": 0.6139, "step": 6359 }, { "epoch": 0.66, "learning_rate": 5.417189930184179e-05, "loss": 0.6445, "step": 6360 }, { "epoch": 0.66, "learning_rate": 5.414193549086744e-05, "loss": 0.6926, "step": 6361 }, { "epoch": 0.66, "learning_rate": 5.411197689268088e-05, "loss": 0.6496, "step": 6362 }, { "epoch": 0.66, "learning_rate": 5.408202351068764e-05, "loss": 0.6896, "step": 6363 }, { "epoch": 0.66, "learning_rate": 5.405207534829261e-05, "loss": 0.6072, "step": 6364 }, { "epoch": 0.66, "learning_rate": 5.4022132408899985e-05, "loss": 0.6861, "step": 6365 }, { "epoch": 0.66, "learning_rate": 5.399219469591352e-05, "loss": 0.5981, "step": 6366 }, { "epoch": 0.66, "learning_rate": 5.396226221273628e-05, "loss": 0.6764, "step": 6367 }, { "epoch": 0.66, "learning_rate": 5.3932334962770694e-05, "loss": 0.6633, "step": 6368 }, { "epoch": 0.66, "learning_rate": 5.390241294941871e-05, "loss": 0.7261, "step": 6369 }, { "epoch": 0.66, "learning_rate": 5.3872496176081675e-05, "loss": 0.6637, "step": 6370 }, { "epoch": 0.66, "learning_rate": 5.384258464616021e-05, "loss": 0.7181, "step": 6371 }, { "epoch": 0.66, "learning_rate": 5.38126783630545e-05, "loss": 0.656, "step": 6372 }, { "epoch": 0.66, "learning_rate": 5.378277733016398e-05, "loss": 0.7243, "step": 6373 }, { "epoch": 0.66, "learning_rate": 5.37528815508876e-05, "loss": 0.6504, "step": 6374 }, { "epoch": 0.66, "learning_rate": 5.3722991028623746e-05, "loss": 0.7315, "step": 6375 }, { "epoch": 0.66, "learning_rate": 5.3693105766770046e-05, "loss": 0.6785, "step": 6376 }, { "epoch": 0.66, "learning_rate": 5.3663225768723647e-05, "loss": 0.6683, "step": 6377 }, { "epoch": 0.66, "learning_rate": 5.363335103788113e-05, "loss": 0.6605, "step": 6378 }, { "epoch": 0.66, "learning_rate": 5.360348157763835e-05, "loss": 0.7272, "step": 6379 }, { "epoch": 0.66, "learning_rate": 5.357361739139069e-05, "loss": 0.6324, "step": 6380 }, { "epoch": 0.66, "learning_rate": 5.3543758482532856e-05, "loss": 0.7608, "step": 6381 }, { "epoch": 0.66, "learning_rate": 5.351390485445895e-05, "loss": 0.7293, "step": 6382 }, { "epoch": 0.66, "learning_rate": 5.348405651056251e-05, "loss": 0.6654, "step": 6383 }, { "epoch": 0.66, "learning_rate": 5.345421345423651e-05, "loss": 0.7125, "step": 6384 }, { "epoch": 0.66, "learning_rate": 5.3424375688873215e-05, "loss": 0.7012, "step": 6385 }, { "epoch": 0.66, "learning_rate": 5.339454321786438e-05, "loss": 0.6341, "step": 6386 }, { "epoch": 0.66, "learning_rate": 5.336471604460116e-05, "loss": 0.7296, "step": 6387 }, { "epoch": 0.66, "learning_rate": 5.3334894172473994e-05, "loss": 0.6368, "step": 6388 }, { "epoch": 0.67, "learning_rate": 5.3305077604872864e-05, "loss": 0.6574, "step": 6389 }, { "epoch": 0.67, "learning_rate": 5.3275266345187104e-05, "loss": 0.6492, "step": 6390 }, { "epoch": 0.67, "learning_rate": 5.324546039680536e-05, "loss": 0.6416, "step": 6391 }, { "epoch": 0.67, "learning_rate": 5.32156597631158e-05, "loss": 0.6998, "step": 6392 }, { "epoch": 0.67, "learning_rate": 5.3185864447505893e-05, "loss": 0.6388, "step": 6393 }, { "epoch": 0.67, "learning_rate": 5.3156074453362526e-05, "loss": 0.6742, "step": 6394 }, { "epoch": 0.67, "learning_rate": 5.3126289784072036e-05, "loss": 0.6679, "step": 6395 }, { "epoch": 0.67, "learning_rate": 5.309651044302007e-05, "loss": 0.6656, "step": 6396 }, { "epoch": 0.67, "learning_rate": 5.30667364335917e-05, "loss": 0.7242, "step": 6397 }, { "epoch": 0.67, "learning_rate": 5.303696775917151e-05, "loss": 0.6096, "step": 6398 }, { "epoch": 0.67, "learning_rate": 5.300720442314323e-05, "loss": 0.6812, "step": 6399 }, { "epoch": 0.67, "learning_rate": 5.29774464288902e-05, "loss": 0.7061, "step": 6400 }, { "epoch": 0.67, "learning_rate": 5.2947693779795115e-05, "loss": 0.6491, "step": 6401 }, { "epoch": 0.67, "learning_rate": 5.2917946479239935e-05, "loss": 0.6477, "step": 6402 }, { "epoch": 0.67, "learning_rate": 5.288820453060612e-05, "loss": 0.7409, "step": 6403 }, { "epoch": 0.67, "learning_rate": 5.28584679372746e-05, "loss": 0.6796, "step": 6404 }, { "epoch": 0.67, "learning_rate": 5.2828736702625515e-05, "loss": 0.691, "step": 6405 }, { "epoch": 0.67, "learning_rate": 5.2799010830038445e-05, "loss": 0.6425, "step": 6406 }, { "epoch": 0.67, "learning_rate": 5.2769290322892486e-05, "loss": 0.6943, "step": 6407 }, { "epoch": 0.67, "learning_rate": 5.273957518456596e-05, "loss": 0.6652, "step": 6408 }, { "epoch": 0.67, "learning_rate": 5.2709865418436674e-05, "loss": 0.6189, "step": 6409 }, { "epoch": 0.67, "learning_rate": 5.268016102788185e-05, "loss": 0.6932, "step": 6410 }, { "epoch": 0.67, "learning_rate": 5.265046201627799e-05, "loss": 0.6323, "step": 6411 }, { "epoch": 0.67, "learning_rate": 5.2620768387001095e-05, "loss": 0.6095, "step": 6412 }, { "epoch": 0.67, "learning_rate": 5.259108014342644e-05, "loss": 0.6939, "step": 6413 }, { "epoch": 0.67, "learning_rate": 5.256139728892881e-05, "loss": 0.6936, "step": 6414 }, { "epoch": 0.67, "learning_rate": 5.253171982688234e-05, "loss": 0.667, "step": 6415 }, { "epoch": 0.67, "learning_rate": 5.250204776066046e-05, "loss": 0.6675, "step": 6416 }, { "epoch": 0.67, "learning_rate": 5.247238109363612e-05, "loss": 0.6726, "step": 6417 }, { "epoch": 0.67, "learning_rate": 5.244271982918156e-05, "loss": 0.6686, "step": 6418 }, { "epoch": 0.67, "learning_rate": 5.241306397066847e-05, "loss": 0.6094, "step": 6419 }, { "epoch": 0.67, "learning_rate": 5.238341352146787e-05, "loss": 0.6842, "step": 6420 }, { "epoch": 0.67, "learning_rate": 5.235376848495024e-05, "loss": 0.6796, "step": 6421 }, { "epoch": 0.67, "learning_rate": 5.23241288644853e-05, "loss": 0.6901, "step": 6422 }, { "epoch": 0.67, "learning_rate": 5.229449466344234e-05, "loss": 0.6809, "step": 6423 }, { "epoch": 0.67, "learning_rate": 5.226486588518995e-05, "loss": 0.6327, "step": 6424 }, { "epoch": 0.67, "learning_rate": 5.223524253309602e-05, "loss": 0.6325, "step": 6425 }, { "epoch": 0.67, "learning_rate": 5.220562461052796e-05, "loss": 0.6548, "step": 6426 }, { "epoch": 0.67, "learning_rate": 5.217601212085252e-05, "loss": 0.7193, "step": 6427 }, { "epoch": 0.67, "learning_rate": 5.214640506743577e-05, "loss": 0.6947, "step": 6428 }, { "epoch": 0.67, "learning_rate": 5.2116803453643223e-05, "loss": 0.571, "step": 6429 }, { "epoch": 0.67, "learning_rate": 5.20872072828398e-05, "loss": 0.6447, "step": 6430 }, { "epoch": 0.67, "learning_rate": 5.2057616558389745e-05, "loss": 0.7131, "step": 6431 }, { "epoch": 0.67, "learning_rate": 5.2028031283656686e-05, "loss": 0.6725, "step": 6432 }, { "epoch": 0.67, "learning_rate": 5.1998451462003604e-05, "loss": 0.6385, "step": 6433 }, { "epoch": 0.67, "learning_rate": 5.1968877096792956e-05, "loss": 0.6718, "step": 6434 }, { "epoch": 0.67, "learning_rate": 5.193930819138655e-05, "loss": 0.7144, "step": 6435 }, { "epoch": 0.67, "learning_rate": 5.1909744749145486e-05, "loss": 0.6533, "step": 6436 }, { "epoch": 0.67, "learning_rate": 5.188018677343033e-05, "loss": 0.6153, "step": 6437 }, { "epoch": 0.67, "learning_rate": 5.185063426760104e-05, "loss": 0.6801, "step": 6438 }, { "epoch": 0.67, "learning_rate": 5.182108723501686e-05, "loss": 0.7471, "step": 6439 }, { "epoch": 0.67, "learning_rate": 5.179154567903648e-05, "loss": 0.7155, "step": 6440 }, { "epoch": 0.67, "learning_rate": 5.1762009603018e-05, "loss": 0.7051, "step": 6441 }, { "epoch": 0.67, "learning_rate": 5.173247901031879e-05, "loss": 0.6375, "step": 6442 }, { "epoch": 0.67, "learning_rate": 5.1702953904295716e-05, "loss": 0.6436, "step": 6443 }, { "epoch": 0.67, "learning_rate": 5.16734342883049e-05, "loss": 0.6795, "step": 6444 }, { "epoch": 0.67, "learning_rate": 5.164392016570196e-05, "loss": 0.7509, "step": 6445 }, { "epoch": 0.67, "learning_rate": 5.1614411539841767e-05, "loss": 0.6727, "step": 6446 }, { "epoch": 0.67, "learning_rate": 5.1584908414078714e-05, "loss": 0.691, "step": 6447 }, { "epoch": 0.67, "learning_rate": 5.1555410791766404e-05, "loss": 0.701, "step": 6448 }, { "epoch": 0.67, "learning_rate": 5.1525918676257935e-05, "loss": 0.6901, "step": 6449 }, { "epoch": 0.67, "learning_rate": 5.1496432070905777e-05, "loss": 0.6884, "step": 6450 }, { "epoch": 0.67, "learning_rate": 5.146695097906164e-05, "loss": 0.6688, "step": 6451 }, { "epoch": 0.67, "learning_rate": 5.143747540407684e-05, "loss": 0.6625, "step": 6452 }, { "epoch": 0.67, "learning_rate": 5.140800534930181e-05, "loss": 0.6557, "step": 6453 }, { "epoch": 0.67, "learning_rate": 5.137854081808652e-05, "loss": 0.6444, "step": 6454 }, { "epoch": 0.67, "learning_rate": 5.134908181378031e-05, "loss": 0.7118, "step": 6455 }, { "epoch": 0.67, "learning_rate": 5.1319628339731775e-05, "loss": 0.6906, "step": 6456 }, { "epoch": 0.67, "learning_rate": 5.129018039928903e-05, "loss": 0.6266, "step": 6457 }, { "epoch": 0.67, "learning_rate": 5.126073799579947e-05, "loss": 0.6964, "step": 6458 }, { "epoch": 0.67, "learning_rate": 5.12313011326098e-05, "loss": 0.7001, "step": 6459 }, { "epoch": 0.67, "learning_rate": 5.120186981306625e-05, "loss": 0.7, "step": 6460 }, { "epoch": 0.67, "learning_rate": 5.117244404051436e-05, "loss": 0.6201, "step": 6461 }, { "epoch": 0.67, "learning_rate": 5.114302381829894e-05, "loss": 0.7172, "step": 6462 }, { "epoch": 0.67, "learning_rate": 5.111360914976433e-05, "loss": 0.6946, "step": 6463 }, { "epoch": 0.67, "learning_rate": 5.108420003825415e-05, "loss": 0.6652, "step": 6464 }, { "epoch": 0.67, "learning_rate": 5.105479648711134e-05, "loss": 0.6914, "step": 6465 }, { "epoch": 0.67, "learning_rate": 5.1025398499678324e-05, "loss": 0.7117, "step": 6466 }, { "epoch": 0.67, "learning_rate": 5.0996006079296854e-05, "loss": 0.6859, "step": 6467 }, { "epoch": 0.67, "learning_rate": 5.0966619229307966e-05, "loss": 0.6349, "step": 6468 }, { "epoch": 0.67, "learning_rate": 5.0937237953052184e-05, "loss": 0.6414, "step": 6469 }, { "epoch": 0.67, "learning_rate": 5.090786225386933e-05, "loss": 0.7082, "step": 6470 }, { "epoch": 0.67, "learning_rate": 5.087849213509855e-05, "loss": 0.6547, "step": 6471 }, { "epoch": 0.67, "learning_rate": 5.0849127600078494e-05, "loss": 0.6515, "step": 6472 }, { "epoch": 0.67, "learning_rate": 5.081976865214703e-05, "loss": 0.6633, "step": 6473 }, { "epoch": 0.67, "learning_rate": 5.079041529464147e-05, "loss": 0.6685, "step": 6474 }, { "epoch": 0.67, "learning_rate": 5.076106753089852e-05, "loss": 0.6648, "step": 6475 }, { "epoch": 0.67, "learning_rate": 5.0731725364254135e-05, "loss": 0.6901, "step": 6476 }, { "epoch": 0.67, "learning_rate": 5.0702388798043745e-05, "loss": 0.6618, "step": 6477 }, { "epoch": 0.67, "learning_rate": 5.067305783560212e-05, "loss": 0.6337, "step": 6478 }, { "epoch": 0.67, "learning_rate": 5.064373248026333e-05, "loss": 0.6598, "step": 6479 }, { "epoch": 0.67, "learning_rate": 5.061441273536087e-05, "loss": 0.6747, "step": 6480 }, { "epoch": 0.67, "learning_rate": 5.058509860422762e-05, "loss": 0.6142, "step": 6481 }, { "epoch": 0.67, "learning_rate": 5.0555790090195755e-05, "loss": 0.702, "step": 6482 }, { "epoch": 0.67, "learning_rate": 5.052648719659678e-05, "loss": 0.7158, "step": 6483 }, { "epoch": 0.67, "learning_rate": 5.049718992676174e-05, "loss": 0.6391, "step": 6484 }, { "epoch": 0.68, "learning_rate": 5.0467898284020786e-05, "loss": 0.5821, "step": 6485 }, { "epoch": 0.68, "learning_rate": 5.0438612271703634e-05, "loss": 0.6974, "step": 6486 }, { "epoch": 0.68, "learning_rate": 5.040933189313932e-05, "loss": 0.6916, "step": 6487 }, { "epoch": 0.68, "learning_rate": 5.0380057151656145e-05, "loss": 0.6423, "step": 6488 }, { "epoch": 0.68, "learning_rate": 5.035078805058187e-05, "loss": 0.6919, "step": 6489 }, { "epoch": 0.68, "learning_rate": 5.0321524593243616e-05, "loss": 0.6138, "step": 6490 }, { "epoch": 0.68, "learning_rate": 5.0292266782967725e-05, "loss": 0.6433, "step": 6491 }, { "epoch": 0.68, "learning_rate": 5.026301462308011e-05, "loss": 0.6547, "step": 6492 }, { "epoch": 0.68, "learning_rate": 5.023376811690583e-05, "loss": 0.6531, "step": 6493 }, { "epoch": 0.68, "learning_rate": 5.0204527267769474e-05, "loss": 0.6521, "step": 6494 }, { "epoch": 0.68, "learning_rate": 5.0175292078994854e-05, "loss": 0.7003, "step": 6495 }, { "epoch": 0.68, "learning_rate": 5.014606255390526e-05, "loss": 0.6639, "step": 6496 }, { "epoch": 0.68, "learning_rate": 5.011683869582321e-05, "loss": 0.6818, "step": 6497 }, { "epoch": 0.68, "learning_rate": 5.0087620508070724e-05, "loss": 0.6837, "step": 6498 }, { "epoch": 0.68, "learning_rate": 5.0058407993969e-05, "loss": 0.6242, "step": 6499 }, { "epoch": 0.68, "learning_rate": 5.0029201156838756e-05, "loss": 0.7044, "step": 6500 }, { "epoch": 0.68, "learning_rate": 5.000000000000002e-05, "loss": 0.6138, "step": 6501 }, { "epoch": 0.68, "learning_rate": 4.9970804526772084e-05, "loss": 0.6632, "step": 6502 }, { "epoch": 0.68, "learning_rate": 4.994161474047368e-05, "loss": 0.6923, "step": 6503 }, { "epoch": 0.68, "learning_rate": 4.9912430644422946e-05, "loss": 0.6679, "step": 6504 }, { "epoch": 0.68, "learning_rate": 4.988325224193721e-05, "loss": 0.6542, "step": 6505 }, { "epoch": 0.68, "learning_rate": 4.9854079536333277e-05, "loss": 0.6726, "step": 6506 }, { "epoch": 0.68, "learning_rate": 4.982491253092732e-05, "loss": 0.703, "step": 6507 }, { "epoch": 0.68, "learning_rate": 4.979575122903478e-05, "loss": 0.7087, "step": 6508 }, { "epoch": 0.68, "learning_rate": 4.9766595633970434e-05, "loss": 0.6592, "step": 6509 }, { "epoch": 0.68, "learning_rate": 4.973744574904856e-05, "loss": 0.6878, "step": 6510 }, { "epoch": 0.68, "learning_rate": 4.9708301577582615e-05, "loss": 0.7057, "step": 6511 }, { "epoch": 0.68, "learning_rate": 4.967916312288553e-05, "loss": 0.6766, "step": 6512 }, { "epoch": 0.68, "learning_rate": 4.9650030388269484e-05, "loss": 0.5982, "step": 6513 }, { "epoch": 0.68, "learning_rate": 4.9620903377046104e-05, "loss": 0.6677, "step": 6514 }, { "epoch": 0.68, "learning_rate": 4.959178209252634e-05, "loss": 0.668, "step": 6515 }, { "epoch": 0.68, "learning_rate": 4.9562666538020406e-05, "loss": 0.6764, "step": 6516 }, { "epoch": 0.68, "learning_rate": 4.953355671683797e-05, "loss": 0.6508, "step": 6517 }, { "epoch": 0.68, "learning_rate": 4.950445263228805e-05, "loss": 0.6019, "step": 6518 }, { "epoch": 0.68, "learning_rate": 4.947535428767889e-05, "loss": 0.6616, "step": 6519 }, { "epoch": 0.68, "learning_rate": 4.944626168631824e-05, "loss": 0.6723, "step": 6520 }, { "epoch": 0.68, "learning_rate": 4.9417174831513055e-05, "loss": 0.6187, "step": 6521 }, { "epoch": 0.68, "learning_rate": 4.938809372656976e-05, "loss": 0.6456, "step": 6522 }, { "epoch": 0.68, "learning_rate": 4.935901837479402e-05, "loss": 0.6562, "step": 6523 }, { "epoch": 0.68, "learning_rate": 4.932994877949093e-05, "loss": 0.7714, "step": 6524 }, { "epoch": 0.68, "learning_rate": 4.930088494396487e-05, "loss": 0.721, "step": 6525 }, { "epoch": 0.68, "learning_rate": 4.9271826871519575e-05, "loss": 0.631, "step": 6526 }, { "epoch": 0.68, "learning_rate": 4.9242774565458214e-05, "loss": 0.6795, "step": 6527 }, { "epoch": 0.68, "learning_rate": 4.921372802908315e-05, "loss": 0.6749, "step": 6528 }, { "epoch": 0.68, "learning_rate": 4.918468726569619e-05, "loss": 0.6933, "step": 6529 }, { "epoch": 0.68, "learning_rate": 4.9155652278598504e-05, "loss": 0.7182, "step": 6530 }, { "epoch": 0.68, "learning_rate": 4.912662307109051e-05, "loss": 0.6762, "step": 6531 }, { "epoch": 0.68, "learning_rate": 4.909759964647206e-05, "loss": 0.6849, "step": 6532 }, { "epoch": 0.68, "learning_rate": 4.906858200804226e-05, "loss": 0.6496, "step": 6533 }, { "epoch": 0.68, "learning_rate": 4.903957015909968e-05, "loss": 0.689, "step": 6534 }, { "epoch": 0.68, "learning_rate": 4.901056410294211e-05, "loss": 0.6898, "step": 6535 }, { "epoch": 0.68, "learning_rate": 4.898156384286673e-05, "loss": 0.675, "step": 6536 }, { "epoch": 0.68, "learning_rate": 4.8952569382170056e-05, "loss": 0.7127, "step": 6537 }, { "epoch": 0.68, "learning_rate": 4.8923580724148035e-05, "loss": 0.6834, "step": 6538 }, { "epoch": 0.68, "learning_rate": 4.889459787209576e-05, "loss": 0.6586, "step": 6539 }, { "epoch": 0.68, "learning_rate": 4.886562082930784e-05, "loss": 0.5988, "step": 6540 }, { "epoch": 0.68, "learning_rate": 4.883664959907817e-05, "loss": 0.6759, "step": 6541 }, { "epoch": 0.68, "learning_rate": 4.880768418469992e-05, "loss": 0.6711, "step": 6542 }, { "epoch": 0.68, "learning_rate": 4.8778724589465685e-05, "loss": 0.7307, "step": 6543 }, { "epoch": 0.68, "learning_rate": 4.874977081666741e-05, "loss": 0.6509, "step": 6544 }, { "epoch": 0.68, "learning_rate": 4.872082286959625e-05, "loss": 0.6594, "step": 6545 }, { "epoch": 0.68, "learning_rate": 4.869188075154286e-05, "loss": 0.6963, "step": 6546 }, { "epoch": 0.68, "learning_rate": 4.8662944465797124e-05, "loss": 0.6635, "step": 6547 }, { "epoch": 0.68, "learning_rate": 4.863401401564824e-05, "loss": 0.6716, "step": 6548 }, { "epoch": 0.68, "learning_rate": 4.860508940438485e-05, "loss": 0.6556, "step": 6549 }, { "epoch": 0.68, "learning_rate": 4.857617063529491e-05, "loss": 0.71, "step": 6550 }, { "epoch": 0.68, "learning_rate": 4.854725771166561e-05, "loss": 0.6658, "step": 6551 }, { "epoch": 0.68, "learning_rate": 4.851835063678362e-05, "loss": 0.7109, "step": 6552 }, { "epoch": 0.68, "learning_rate": 4.848944941393479e-05, "loss": 0.7618, "step": 6553 }, { "epoch": 0.68, "learning_rate": 4.846055404640442e-05, "loss": 0.6352, "step": 6554 }, { "epoch": 0.68, "learning_rate": 4.843166453747715e-05, "loss": 0.6369, "step": 6555 }, { "epoch": 0.68, "learning_rate": 4.840278089043686e-05, "loss": 0.6396, "step": 6556 }, { "epoch": 0.68, "learning_rate": 4.837390310856683e-05, "loss": 0.6911, "step": 6557 }, { "epoch": 0.68, "learning_rate": 4.834503119514971e-05, "loss": 0.6663, "step": 6558 }, { "epoch": 0.68, "learning_rate": 4.8316165153467395e-05, "loss": 0.6224, "step": 6559 }, { "epoch": 0.68, "learning_rate": 4.828730498680113e-05, "loss": 0.6431, "step": 6560 }, { "epoch": 0.68, "learning_rate": 4.8258450698431556e-05, "loss": 0.6704, "step": 6561 }, { "epoch": 0.68, "learning_rate": 4.8229602291638555e-05, "loss": 0.6755, "step": 6562 }, { "epoch": 0.68, "learning_rate": 4.820075976970142e-05, "loss": 0.6157, "step": 6563 }, { "epoch": 0.68, "learning_rate": 4.817192313589878e-05, "loss": 0.655, "step": 6564 }, { "epoch": 0.68, "learning_rate": 4.814309239350848e-05, "loss": 0.6234, "step": 6565 }, { "epoch": 0.68, "learning_rate": 4.8114267545807835e-05, "loss": 0.6711, "step": 6566 }, { "epoch": 0.68, "learning_rate": 4.808544859607343e-05, "loss": 0.6781, "step": 6567 }, { "epoch": 0.68, "learning_rate": 4.805663554758113e-05, "loss": 0.685, "step": 6568 }, { "epoch": 0.68, "learning_rate": 4.802782840360621e-05, "loss": 0.62, "step": 6569 }, { "epoch": 0.68, "learning_rate": 4.799902716742327e-05, "loss": 0.6927, "step": 6570 }, { "epoch": 0.68, "learning_rate": 4.797023184230616e-05, "loss": 0.7335, "step": 6571 }, { "epoch": 0.68, "learning_rate": 4.794144243152815e-05, "loss": 0.6817, "step": 6572 }, { "epoch": 0.68, "learning_rate": 4.7912658938361786e-05, "loss": 0.7159, "step": 6573 }, { "epoch": 0.68, "learning_rate": 4.78838813660789e-05, "loss": 0.73, "step": 6574 }, { "epoch": 0.68, "learning_rate": 4.785510971795078e-05, "loss": 0.6708, "step": 6575 }, { "epoch": 0.68, "learning_rate": 4.782634399724788e-05, "loss": 0.6802, "step": 6576 }, { "epoch": 0.68, "learning_rate": 4.779758420724012e-05, "loss": 0.6805, "step": 6577 }, { "epoch": 0.68, "learning_rate": 4.776883035119672e-05, "loss": 0.6959, "step": 6578 }, { "epoch": 0.68, "learning_rate": 4.77400824323861e-05, "loss": 0.5889, "step": 6579 }, { "epoch": 0.68, "learning_rate": 4.771134045407617e-05, "loss": 0.6585, "step": 6580 }, { "epoch": 0.69, "learning_rate": 4.7682604419534105e-05, "loss": 0.6706, "step": 6581 }, { "epoch": 0.69, "learning_rate": 4.765387433202633e-05, "loss": 0.6459, "step": 6582 }, { "epoch": 0.69, "learning_rate": 4.76251501948187e-05, "loss": 0.7156, "step": 6583 }, { "epoch": 0.69, "learning_rate": 4.7596432011176374e-05, "loss": 0.6659, "step": 6584 }, { "epoch": 0.69, "learning_rate": 4.7567719784363785e-05, "loss": 0.6628, "step": 6585 }, { "epoch": 0.69, "learning_rate": 4.753901351764468e-05, "loss": 0.6728, "step": 6586 }, { "epoch": 0.69, "learning_rate": 4.751031321428223e-05, "loss": 0.7039, "step": 6587 }, { "epoch": 0.69, "learning_rate": 4.748161887753879e-05, "loss": 0.7374, "step": 6588 }, { "epoch": 0.69, "learning_rate": 4.7452930510676153e-05, "loss": 0.5747, "step": 6589 }, { "epoch": 0.69, "learning_rate": 4.742424811695542e-05, "loss": 0.6715, "step": 6590 }, { "epoch": 0.69, "learning_rate": 4.739557169963691e-05, "loss": 0.6577, "step": 6591 }, { "epoch": 0.69, "learning_rate": 4.7366901261980404e-05, "loss": 0.6824, "step": 6592 }, { "epoch": 0.69, "learning_rate": 4.733823680724486e-05, "loss": 0.7018, "step": 6593 }, { "epoch": 0.69, "learning_rate": 4.7309578338688684e-05, "loss": 0.7111, "step": 6594 }, { "epoch": 0.69, "learning_rate": 4.728092585956957e-05, "loss": 0.634, "step": 6595 }, { "epoch": 0.69, "learning_rate": 4.725227937314444e-05, "loss": 0.6253, "step": 6596 }, { "epoch": 0.69, "learning_rate": 4.722363888266966e-05, "loss": 0.7313, "step": 6597 }, { "epoch": 0.69, "learning_rate": 4.719500439140081e-05, "loss": 0.6888, "step": 6598 }, { "epoch": 0.69, "learning_rate": 4.716637590259291e-05, "loss": 0.6178, "step": 6599 }, { "epoch": 0.69, "learning_rate": 4.713775341950012e-05, "loss": 0.7254, "step": 6600 }, { "epoch": 0.69, "learning_rate": 4.710913694537612e-05, "loss": 0.6732, "step": 6601 }, { "epoch": 0.69, "learning_rate": 4.708052648347373e-05, "loss": 0.6733, "step": 6602 }, { "epoch": 0.69, "learning_rate": 4.705192203704519e-05, "loss": 0.6886, "step": 6603 }, { "epoch": 0.69, "learning_rate": 4.7023323609342096e-05, "loss": 0.6388, "step": 6604 }, { "epoch": 0.69, "learning_rate": 4.699473120361519e-05, "loss": 0.6427, "step": 6605 }, { "epoch": 0.69, "learning_rate": 4.6966144823114686e-05, "loss": 0.7142, "step": 6606 }, { "epoch": 0.69, "learning_rate": 4.693756447109009e-05, "loss": 0.716, "step": 6607 }, { "epoch": 0.69, "learning_rate": 4.6908990150790134e-05, "loss": 0.6822, "step": 6608 }, { "epoch": 0.69, "learning_rate": 4.6880421865462985e-05, "loss": 0.7199, "step": 6609 }, { "epoch": 0.69, "learning_rate": 4.6851859618356e-05, "loss": 0.5512, "step": 6610 }, { "epoch": 0.69, "learning_rate": 4.682330341271597e-05, "loss": 0.6141, "step": 6611 }, { "epoch": 0.69, "learning_rate": 4.6794753251788925e-05, "loss": 0.6984, "step": 6612 }, { "epoch": 0.69, "learning_rate": 4.676620913882017e-05, "loss": 0.671, "step": 6613 }, { "epoch": 0.69, "learning_rate": 4.673767107705444e-05, "loss": 0.6907, "step": 6614 }, { "epoch": 0.69, "learning_rate": 4.670913906973572e-05, "loss": 0.6841, "step": 6615 }, { "epoch": 0.69, "learning_rate": 4.668061312010726e-05, "loss": 0.7208, "step": 6616 }, { "epoch": 0.69, "learning_rate": 4.6652093231411706e-05, "loss": 0.7215, "step": 6617 }, { "epoch": 0.69, "learning_rate": 4.662357940689101e-05, "loss": 0.6324, "step": 6618 }, { "epoch": 0.69, "learning_rate": 4.659507164978631e-05, "loss": 0.6862, "step": 6619 }, { "epoch": 0.69, "learning_rate": 4.6566569963338205e-05, "loss": 0.7147, "step": 6620 }, { "epoch": 0.69, "learning_rate": 4.653807435078656e-05, "loss": 0.7134, "step": 6621 }, { "epoch": 0.69, "learning_rate": 4.6509584815370485e-05, "loss": 0.692, "step": 6622 }, { "epoch": 0.69, "learning_rate": 4.6481101360328514e-05, "loss": 0.6885, "step": 6623 }, { "epoch": 0.69, "learning_rate": 4.645262398889838e-05, "loss": 0.6654, "step": 6624 }, { "epoch": 0.69, "learning_rate": 4.6424152704317136e-05, "loss": 0.6933, "step": 6625 }, { "epoch": 0.69, "learning_rate": 4.6395687509821214e-05, "loss": 0.6178, "step": 6626 }, { "epoch": 0.69, "learning_rate": 4.636722840864636e-05, "loss": 0.7093, "step": 6627 }, { "epoch": 0.69, "learning_rate": 4.63387754040275e-05, "loss": 0.6217, "step": 6628 }, { "epoch": 0.69, "learning_rate": 4.631032849919898e-05, "loss": 0.6473, "step": 6629 }, { "epoch": 0.69, "learning_rate": 4.628188769739448e-05, "loss": 0.6576, "step": 6630 }, { "epoch": 0.69, "learning_rate": 4.6253453001846835e-05, "loss": 0.6672, "step": 6631 }, { "epoch": 0.69, "learning_rate": 4.622502441578837e-05, "loss": 0.6478, "step": 6632 }, { "epoch": 0.69, "learning_rate": 4.6196601942450545e-05, "loss": 0.6581, "step": 6633 }, { "epoch": 0.69, "learning_rate": 4.6168185585064226e-05, "loss": 0.6778, "step": 6634 }, { "epoch": 0.69, "learning_rate": 4.613977534685964e-05, "loss": 0.6476, "step": 6635 }, { "epoch": 0.69, "learning_rate": 4.611137123106616e-05, "loss": 0.6532, "step": 6636 }, { "epoch": 0.69, "learning_rate": 4.6082973240912533e-05, "loss": 0.6901, "step": 6637 }, { "epoch": 0.69, "learning_rate": 4.605458137962689e-05, "loss": 0.6052, "step": 6638 }, { "epoch": 0.69, "learning_rate": 4.6026195650436535e-05, "loss": 0.658, "step": 6639 }, { "epoch": 0.69, "learning_rate": 4.599781605656815e-05, "loss": 0.6115, "step": 6640 }, { "epoch": 0.69, "learning_rate": 4.596944260124776e-05, "loss": 0.6534, "step": 6641 }, { "epoch": 0.69, "learning_rate": 4.5941075287700566e-05, "loss": 0.7127, "step": 6642 }, { "epoch": 0.69, "learning_rate": 4.5912714119151166e-05, "loss": 0.669, "step": 6643 }, { "epoch": 0.69, "learning_rate": 4.588435909882348e-05, "loss": 0.6613, "step": 6644 }, { "epoch": 0.69, "learning_rate": 4.585601022994063e-05, "loss": 0.6838, "step": 6645 }, { "epoch": 0.69, "learning_rate": 4.58276675157251e-05, "loss": 0.6919, "step": 6646 }, { "epoch": 0.69, "learning_rate": 4.5799330959398735e-05, "loss": 0.7144, "step": 6647 }, { "epoch": 0.69, "learning_rate": 4.577100056418252e-05, "loss": 0.6519, "step": 6648 }, { "epoch": 0.69, "learning_rate": 4.574267633329692e-05, "loss": 0.6925, "step": 6649 }, { "epoch": 0.69, "learning_rate": 4.5714358269961566e-05, "loss": 0.6579, "step": 6650 }, { "epoch": 0.69, "learning_rate": 4.568604637739541e-05, "loss": 0.7117, "step": 6651 }, { "epoch": 0.69, "learning_rate": 4.5657740658816796e-05, "loss": 0.6887, "step": 6652 }, { "epoch": 0.69, "learning_rate": 4.562944111744322e-05, "loss": 0.6259, "step": 6653 }, { "epoch": 0.69, "learning_rate": 4.560114775649159e-05, "loss": 0.6253, "step": 6654 }, { "epoch": 0.69, "learning_rate": 4.557286057917812e-05, "loss": 0.6917, "step": 6655 }, { "epoch": 0.69, "learning_rate": 4.5544579588718195e-05, "loss": 0.7032, "step": 6656 }, { "epoch": 0.69, "learning_rate": 4.5516304788326626e-05, "loss": 0.6205, "step": 6657 }, { "epoch": 0.69, "learning_rate": 4.5488036181217496e-05, "loss": 0.7873, "step": 6658 }, { "epoch": 0.69, "learning_rate": 4.545977377060409e-05, "loss": 0.6425, "step": 6659 }, { "epoch": 0.69, "learning_rate": 4.54315175596991e-05, "loss": 0.6688, "step": 6660 }, { "epoch": 0.69, "learning_rate": 4.54032675517145e-05, "loss": 0.7298, "step": 6661 }, { "epoch": 0.69, "learning_rate": 4.53750237498615e-05, "loss": 0.6781, "step": 6662 }, { "epoch": 0.69, "learning_rate": 4.5346786157350606e-05, "loss": 0.7003, "step": 6663 }, { "epoch": 0.69, "learning_rate": 4.5318554777391705e-05, "loss": 0.6732, "step": 6664 }, { "epoch": 0.69, "learning_rate": 4.529032961319387e-05, "loss": 0.6188, "step": 6665 }, { "epoch": 0.69, "learning_rate": 4.526211066796553e-05, "loss": 0.6904, "step": 6666 }, { "epoch": 0.69, "learning_rate": 4.523389794491445e-05, "loss": 0.6554, "step": 6667 }, { "epoch": 0.69, "learning_rate": 4.520569144724755e-05, "loss": 0.761, "step": 6668 }, { "epoch": 0.69, "learning_rate": 4.517749117817116e-05, "loss": 0.6333, "step": 6669 }, { "epoch": 0.69, "learning_rate": 4.514929714089091e-05, "loss": 0.7128, "step": 6670 }, { "epoch": 0.69, "learning_rate": 4.51211093386116e-05, "loss": 0.7035, "step": 6671 }, { "epoch": 0.69, "learning_rate": 4.509292777453749e-05, "loss": 0.7592, "step": 6672 }, { "epoch": 0.69, "learning_rate": 4.5064752451871936e-05, "loss": 0.7254, "step": 6673 }, { "epoch": 0.69, "learning_rate": 4.5036583373817786e-05, "loss": 0.679, "step": 6674 }, { "epoch": 0.69, "learning_rate": 4.500842054357701e-05, "loss": 0.5985, "step": 6675 }, { "epoch": 0.69, "learning_rate": 4.4980263964351e-05, "loss": 0.6656, "step": 6676 }, { "epoch": 0.7, "learning_rate": 4.495211363934031e-05, "loss": 0.6865, "step": 6677 }, { "epoch": 0.7, "learning_rate": 4.4923969571744916e-05, "loss": 0.72, "step": 6678 }, { "epoch": 0.7, "learning_rate": 4.489583176476396e-05, "loss": 0.6802, "step": 6679 }, { "epoch": 0.7, "learning_rate": 4.486770022159595e-05, "loss": 0.6973, "step": 6680 }, { "epoch": 0.7, "learning_rate": 4.48395749454387e-05, "loss": 0.6532, "step": 6681 }, { "epoch": 0.7, "learning_rate": 4.481145593948921e-05, "loss": 0.675, "step": 6682 }, { "epoch": 0.7, "learning_rate": 4.478334320694385e-05, "loss": 0.6455, "step": 6683 }, { "epoch": 0.7, "learning_rate": 4.475523675099831e-05, "loss": 0.6064, "step": 6684 }, { "epoch": 0.7, "learning_rate": 4.472713657484742e-05, "loss": 0.7083, "step": 6685 }, { "epoch": 0.7, "learning_rate": 4.469904268168548e-05, "loss": 0.6388, "step": 6686 }, { "epoch": 0.7, "learning_rate": 4.46709550747059e-05, "loss": 0.6793, "step": 6687 }, { "epoch": 0.7, "learning_rate": 4.4642873757101554e-05, "loss": 0.6908, "step": 6688 }, { "epoch": 0.7, "learning_rate": 4.461479873206441e-05, "loss": 0.6589, "step": 6689 }, { "epoch": 0.7, "learning_rate": 4.458673000278589e-05, "loss": 0.7441, "step": 6690 }, { "epoch": 0.7, "learning_rate": 4.455866757245658e-05, "loss": 0.6478, "step": 6691 }, { "epoch": 0.7, "learning_rate": 4.453061144426647e-05, "loss": 0.6652, "step": 6692 }, { "epoch": 0.7, "learning_rate": 4.450256162140466e-05, "loss": 0.6987, "step": 6693 }, { "epoch": 0.7, "learning_rate": 4.447451810705969e-05, "loss": 0.6301, "step": 6694 }, { "epoch": 0.7, "learning_rate": 4.4446480904419376e-05, "loss": 0.7174, "step": 6695 }, { "epoch": 0.7, "learning_rate": 4.441845001667068e-05, "loss": 0.6666, "step": 6696 }, { "epoch": 0.7, "learning_rate": 4.439042544699997e-05, "loss": 0.6856, "step": 6697 }, { "epoch": 0.7, "learning_rate": 4.4362407198592905e-05, "loss": 0.6683, "step": 6698 }, { "epoch": 0.7, "learning_rate": 4.433439527463431e-05, "loss": 0.7258, "step": 6699 }, { "epoch": 0.7, "learning_rate": 4.430638967830843e-05, "loss": 0.7374, "step": 6700 }, { "epoch": 0.7, "learning_rate": 4.42783904127987e-05, "loss": 0.7094, "step": 6701 }, { "epoch": 0.7, "learning_rate": 4.425039748128781e-05, "loss": 0.6975, "step": 6702 }, { "epoch": 0.7, "learning_rate": 4.422241088695781e-05, "loss": 0.6375, "step": 6703 }, { "epoch": 0.7, "learning_rate": 4.4194430632990046e-05, "loss": 0.6875, "step": 6704 }, { "epoch": 0.7, "learning_rate": 4.416645672256501e-05, "loss": 0.6161, "step": 6705 }, { "epoch": 0.7, "learning_rate": 4.413848915886261e-05, "loss": 0.691, "step": 6706 }, { "epoch": 0.7, "learning_rate": 4.4110527945062006e-05, "loss": 0.7079, "step": 6707 }, { "epoch": 0.7, "learning_rate": 4.408257308434155e-05, "loss": 0.6756, "step": 6708 }, { "epoch": 0.7, "learning_rate": 4.4054624579878955e-05, "loss": 0.6222, "step": 6709 }, { "epoch": 0.7, "learning_rate": 4.402668243485123e-05, "loss": 0.6391, "step": 6710 }, { "epoch": 0.7, "learning_rate": 4.399874665243455e-05, "loss": 0.6751, "step": 6711 }, { "epoch": 0.7, "learning_rate": 4.3970817235804515e-05, "loss": 0.6508, "step": 6712 }, { "epoch": 0.7, "learning_rate": 4.394289418813585e-05, "loss": 0.6776, "step": 6713 }, { "epoch": 0.7, "learning_rate": 4.391497751260271e-05, "loss": 0.6634, "step": 6714 }, { "epoch": 0.7, "learning_rate": 4.388706721237837e-05, "loss": 0.7173, "step": 6715 }, { "epoch": 0.7, "learning_rate": 4.385916329063546e-05, "loss": 0.6575, "step": 6716 }, { "epoch": 0.7, "learning_rate": 4.383126575054591e-05, "loss": 0.6857, "step": 6717 }, { "epoch": 0.7, "learning_rate": 4.380337459528092e-05, "loss": 0.6547, "step": 6718 }, { "epoch": 0.7, "learning_rate": 4.3775489828010875e-05, "loss": 0.6166, "step": 6719 }, { "epoch": 0.7, "learning_rate": 4.374761145190553e-05, "loss": 0.6973, "step": 6720 }, { "epoch": 0.7, "learning_rate": 4.371973947013392e-05, "loss": 0.6825, "step": 6721 }, { "epoch": 0.7, "learning_rate": 4.369187388586425e-05, "loss": 0.6948, "step": 6722 }, { "epoch": 0.7, "learning_rate": 4.366401470226409e-05, "loss": 0.6666, "step": 6723 }, { "epoch": 0.7, "learning_rate": 4.3636161922500284e-05, "loss": 0.67, "step": 6724 }, { "epoch": 0.7, "learning_rate": 4.3608315549738865e-05, "loss": 0.661, "step": 6725 }, { "epoch": 0.7, "learning_rate": 4.3580475587145254e-05, "loss": 0.6127, "step": 6726 }, { "epoch": 0.7, "learning_rate": 4.355264203788405e-05, "loss": 0.6687, "step": 6727 }, { "epoch": 0.7, "learning_rate": 4.3524814905119104e-05, "loss": 0.7185, "step": 6728 }, { "epoch": 0.7, "learning_rate": 4.349699419201364e-05, "loss": 0.6805, "step": 6729 }, { "epoch": 0.7, "learning_rate": 4.346917990173013e-05, "loss": 0.6824, "step": 6730 }, { "epoch": 0.7, "learning_rate": 4.3441372037430214e-05, "loss": 0.6888, "step": 6731 }, { "epoch": 0.7, "learning_rate": 4.3413570602274956e-05, "loss": 0.6544, "step": 6732 }, { "epoch": 0.7, "learning_rate": 4.3385775599424514e-05, "loss": 0.732, "step": 6733 }, { "epoch": 0.7, "learning_rate": 4.3357987032038464e-05, "loss": 0.6829, "step": 6734 }, { "epoch": 0.7, "learning_rate": 4.333020490327561e-05, "loss": 0.6691, "step": 6735 }, { "epoch": 0.7, "learning_rate": 4.330242921629395e-05, "loss": 0.5803, "step": 6736 }, { "epoch": 0.7, "learning_rate": 4.327465997425084e-05, "loss": 0.6934, "step": 6737 }, { "epoch": 0.7, "learning_rate": 4.32468971803029e-05, "loss": 0.6558, "step": 6738 }, { "epoch": 0.7, "learning_rate": 4.3219140837605976e-05, "loss": 0.6644, "step": 6739 }, { "epoch": 0.7, "learning_rate": 4.319139094931514e-05, "loss": 0.6762, "step": 6740 }, { "epoch": 0.7, "learning_rate": 4.3163647518584846e-05, "loss": 0.6441, "step": 6741 }, { "epoch": 0.7, "learning_rate": 4.313591054856869e-05, "loss": 0.6451, "step": 6742 }, { "epoch": 0.7, "learning_rate": 4.310818004241964e-05, "loss": 0.643, "step": 6743 }, { "epoch": 0.7, "learning_rate": 4.3080456003289905e-05, "loss": 0.7426, "step": 6744 }, { "epoch": 0.7, "learning_rate": 4.3052738434330875e-05, "loss": 0.6218, "step": 6745 }, { "epoch": 0.7, "learning_rate": 4.30250273386933e-05, "loss": 0.6218, "step": 6746 }, { "epoch": 0.7, "learning_rate": 4.2997322719527197e-05, "loss": 0.6819, "step": 6747 }, { "epoch": 0.7, "learning_rate": 4.296962457998175e-05, "loss": 0.7167, "step": 6748 }, { "epoch": 0.7, "learning_rate": 4.294193292320547e-05, "loss": 0.6621, "step": 6749 }, { "epoch": 0.7, "learning_rate": 4.2914247752346216e-05, "loss": 0.7153, "step": 6750 }, { "epoch": 0.7, "learning_rate": 4.288656907055094e-05, "loss": 0.7227, "step": 6751 }, { "epoch": 0.7, "learning_rate": 4.285889688096594e-05, "loss": 0.7196, "step": 6752 }, { "epoch": 0.7, "learning_rate": 4.283123118673682e-05, "loss": 0.662, "step": 6753 }, { "epoch": 0.7, "learning_rate": 4.280357199100834e-05, "loss": 0.6692, "step": 6754 }, { "epoch": 0.7, "learning_rate": 4.277591929692466e-05, "loss": 0.6138, "step": 6755 }, { "epoch": 0.7, "learning_rate": 4.274827310762903e-05, "loss": 0.6746, "step": 6756 }, { "epoch": 0.7, "learning_rate": 4.272063342626412e-05, "loss": 0.5892, "step": 6757 }, { "epoch": 0.7, "learning_rate": 4.2693000255971804e-05, "loss": 0.6367, "step": 6758 }, { "epoch": 0.7, "learning_rate": 4.2665373599893154e-05, "loss": 0.6708, "step": 6759 }, { "epoch": 0.7, "learning_rate": 4.263775346116857e-05, "loss": 0.6152, "step": 6760 }, { "epoch": 0.7, "learning_rate": 4.261013984293773e-05, "loss": 0.6701, "step": 6761 }, { "epoch": 0.7, "learning_rate": 4.258253274833949e-05, "loss": 0.693, "step": 6762 }, { "epoch": 0.7, "learning_rate": 4.255493218051202e-05, "loss": 0.6431, "step": 6763 }, { "epoch": 0.7, "learning_rate": 4.2527338142592785e-05, "loss": 0.6761, "step": 6764 }, { "epoch": 0.7, "learning_rate": 4.249975063771841e-05, "loss": 0.6755, "step": 6765 }, { "epoch": 0.7, "learning_rate": 4.247216966902482e-05, "loss": 0.6651, "step": 6766 }, { "epoch": 0.7, "learning_rate": 4.2444595239647254e-05, "loss": 0.6677, "step": 6767 }, { "epoch": 0.7, "learning_rate": 4.2417027352720096e-05, "loss": 0.6759, "step": 6768 }, { "epoch": 0.7, "learning_rate": 4.238946601137707e-05, "loss": 0.6052, "step": 6769 }, { "epoch": 0.7, "learning_rate": 4.236191121875118e-05, "loss": 0.6119, "step": 6770 }, { "epoch": 0.7, "learning_rate": 4.2334362977974587e-05, "loss": 0.7349, "step": 6771 }, { "epoch": 0.7, "learning_rate": 4.23068212921788e-05, "loss": 0.6932, "step": 6772 }, { "epoch": 0.71, "learning_rate": 4.2279286164494505e-05, "loss": 0.6185, "step": 6773 }, { "epoch": 0.71, "learning_rate": 4.2251757598051675e-05, "loss": 0.7302, "step": 6774 }, { "epoch": 0.71, "learning_rate": 4.222423559597962e-05, "loss": 0.7141, "step": 6775 }, { "epoch": 0.71, "learning_rate": 4.219672016140673e-05, "loss": 0.6865, "step": 6776 }, { "epoch": 0.71, "learning_rate": 4.216921129746084e-05, "loss": 0.6709, "step": 6777 }, { "epoch": 0.71, "learning_rate": 4.214170900726888e-05, "loss": 0.6772, "step": 6778 }, { "epoch": 0.71, "learning_rate": 4.2114213293957085e-05, "loss": 0.7045, "step": 6779 }, { "epoch": 0.71, "learning_rate": 4.208672416065097e-05, "loss": 0.713, "step": 6780 }, { "epoch": 0.71, "learning_rate": 4.205924161047533e-05, "loss": 0.7234, "step": 6781 }, { "epoch": 0.71, "learning_rate": 4.2031765646554097e-05, "loss": 0.707, "step": 6782 }, { "epoch": 0.71, "learning_rate": 4.2004296272010566e-05, "loss": 0.6488, "step": 6783 }, { "epoch": 0.71, "learning_rate": 4.197683348996726e-05, "loss": 0.7096, "step": 6784 }, { "epoch": 0.71, "learning_rate": 4.194937730354588e-05, "loss": 0.7588, "step": 6785 }, { "epoch": 0.71, "learning_rate": 4.192192771586746e-05, "loss": 0.6066, "step": 6786 }, { "epoch": 0.71, "learning_rate": 4.1894484730052296e-05, "loss": 0.5879, "step": 6787 }, { "epoch": 0.71, "learning_rate": 4.186704834921981e-05, "loss": 0.6119, "step": 6788 }, { "epoch": 0.71, "learning_rate": 4.1839618576488836e-05, "loss": 0.66, "step": 6789 }, { "epoch": 0.71, "learning_rate": 4.181219541497731e-05, "loss": 0.7252, "step": 6790 }, { "epoch": 0.71, "learning_rate": 4.178477886780254e-05, "loss": 0.6808, "step": 6791 }, { "epoch": 0.71, "learning_rate": 4.175736893808101e-05, "loss": 0.7248, "step": 6792 }, { "epoch": 0.71, "learning_rate": 4.172996562892843e-05, "loss": 0.6907, "step": 6793 }, { "epoch": 0.71, "learning_rate": 4.170256894345981e-05, "loss": 0.6748, "step": 6794 }, { "epoch": 0.71, "learning_rate": 4.167517888478943e-05, "loss": 0.65, "step": 6795 }, { "epoch": 0.71, "learning_rate": 4.164779545603074e-05, "loss": 0.6891, "step": 6796 }, { "epoch": 0.71, "learning_rate": 4.1620418660296465e-05, "loss": 0.6148, "step": 6797 }, { "epoch": 0.71, "learning_rate": 4.159304850069866e-05, "loss": 0.6939, "step": 6798 }, { "epoch": 0.71, "learning_rate": 4.156568498034846e-05, "loss": 0.6711, "step": 6799 }, { "epoch": 0.71, "learning_rate": 4.153832810235638e-05, "loss": 0.651, "step": 6800 }, { "epoch": 0.71, "learning_rate": 4.151097786983218e-05, "loss": 0.6963, "step": 6801 }, { "epoch": 0.71, "learning_rate": 4.148363428588472e-05, "loss": 0.6644, "step": 6802 }, { "epoch": 0.71, "learning_rate": 4.1456297353622306e-05, "loss": 0.7203, "step": 6803 }, { "epoch": 0.71, "learning_rate": 4.142896707615235e-05, "loss": 0.7039, "step": 6804 }, { "epoch": 0.71, "learning_rate": 4.140164345658151e-05, "loss": 0.6516, "step": 6805 }, { "epoch": 0.71, "learning_rate": 4.137432649801574e-05, "loss": 0.6237, "step": 6806 }, { "epoch": 0.71, "learning_rate": 4.1347016203560265e-05, "loss": 0.6708, "step": 6807 }, { "epoch": 0.71, "learning_rate": 4.131971257631944e-05, "loss": 0.6982, "step": 6808 }, { "epoch": 0.71, "learning_rate": 4.129241561939695e-05, "loss": 0.7017, "step": 6809 }, { "epoch": 0.71, "learning_rate": 4.126512533589576e-05, "loss": 0.6143, "step": 6810 }, { "epoch": 0.71, "learning_rate": 4.1237841728917935e-05, "loss": 0.6671, "step": 6811 }, { "epoch": 0.71, "learning_rate": 4.121056480156492e-05, "loss": 0.6869, "step": 6812 }, { "epoch": 0.71, "learning_rate": 4.11832945569373e-05, "loss": 0.6767, "step": 6813 }, { "epoch": 0.71, "learning_rate": 4.115603099813495e-05, "loss": 0.7229, "step": 6814 }, { "epoch": 0.71, "learning_rate": 4.112877412825704e-05, "loss": 0.6561, "step": 6815 }, { "epoch": 0.71, "learning_rate": 4.1101523950401876e-05, "loss": 0.6681, "step": 6816 }, { "epoch": 0.71, "learning_rate": 4.1074280467667e-05, "loss": 0.6279, "step": 6817 }, { "epoch": 0.71, "learning_rate": 4.1047043683149324e-05, "loss": 0.7187, "step": 6818 }, { "epoch": 0.71, "learning_rate": 4.101981359994482e-05, "loss": 0.6707, "step": 6819 }, { "epoch": 0.71, "learning_rate": 4.099259022114886e-05, "loss": 0.7369, "step": 6820 }, { "epoch": 0.71, "learning_rate": 4.0965373549856004e-05, "loss": 0.7053, "step": 6821 }, { "epoch": 0.71, "learning_rate": 4.093816358915996e-05, "loss": 0.6832, "step": 6822 }, { "epoch": 0.71, "learning_rate": 4.091096034215377e-05, "loss": 0.7024, "step": 6823 }, { "epoch": 0.71, "learning_rate": 4.088376381192974e-05, "loss": 0.6607, "step": 6824 }, { "epoch": 0.71, "learning_rate": 4.0856574001579296e-05, "loss": 0.6837, "step": 6825 }, { "epoch": 0.71, "learning_rate": 4.082939091419318e-05, "loss": 0.6902, "step": 6826 }, { "epoch": 0.71, "learning_rate": 4.0802214552861385e-05, "loss": 0.6016, "step": 6827 }, { "epoch": 0.71, "learning_rate": 4.0775044920673086e-05, "loss": 0.5871, "step": 6828 }, { "epoch": 0.71, "learning_rate": 4.0747882020716685e-05, "loss": 0.6646, "step": 6829 }, { "epoch": 0.71, "learning_rate": 4.072072585607991e-05, "loss": 0.6657, "step": 6830 }, { "epoch": 0.71, "learning_rate": 4.06935764298496e-05, "loss": 0.6619, "step": 6831 }, { "epoch": 0.71, "learning_rate": 4.066643374511195e-05, "loss": 0.6664, "step": 6832 }, { "epoch": 0.71, "learning_rate": 4.0639297804952256e-05, "loss": 0.6531, "step": 6833 }, { "epoch": 0.71, "learning_rate": 4.061216861245518e-05, "loss": 0.7479, "step": 6834 }, { "epoch": 0.71, "learning_rate": 4.058504617070457e-05, "loss": 0.739, "step": 6835 }, { "epoch": 0.71, "learning_rate": 4.0557930482783425e-05, "loss": 0.6168, "step": 6836 }, { "epoch": 0.71, "learning_rate": 4.053082155177408e-05, "loss": 0.6421, "step": 6837 }, { "epoch": 0.71, "learning_rate": 4.0503719380758124e-05, "loss": 0.6738, "step": 6838 }, { "epoch": 0.71, "learning_rate": 4.0476623972816216e-05, "loss": 0.6067, "step": 6839 }, { "epoch": 0.71, "learning_rate": 4.044953533102842e-05, "loss": 0.6758, "step": 6840 }, { "epoch": 0.71, "learning_rate": 4.042245345847398e-05, "loss": 0.6746, "step": 6841 }, { "epoch": 0.71, "learning_rate": 4.0395378358231304e-05, "loss": 0.6795, "step": 6842 }, { "epoch": 0.71, "learning_rate": 4.036831003337808e-05, "loss": 0.6795, "step": 6843 }, { "epoch": 0.71, "learning_rate": 4.0341248486991256e-05, "loss": 0.6432, "step": 6844 }, { "epoch": 0.71, "learning_rate": 4.031419372214693e-05, "loss": 0.717, "step": 6845 }, { "epoch": 0.71, "learning_rate": 4.028714574192051e-05, "loss": 0.656, "step": 6846 }, { "epoch": 0.71, "learning_rate": 4.0260104549386635e-05, "loss": 0.6164, "step": 6847 }, { "epoch": 0.71, "learning_rate": 4.0233070147619056e-05, "loss": 0.6676, "step": 6848 }, { "epoch": 0.71, "learning_rate": 4.020604253969088e-05, "loss": 0.6293, "step": 6849 }, { "epoch": 0.71, "learning_rate": 4.0179021728674425e-05, "loss": 0.6442, "step": 6850 }, { "epoch": 0.71, "learning_rate": 4.0152007717641147e-05, "loss": 0.6578, "step": 6851 }, { "epoch": 0.71, "learning_rate": 4.0125000509661845e-05, "loss": 0.6858, "step": 6852 }, { "epoch": 0.71, "learning_rate": 4.0098000107806425e-05, "loss": 0.6493, "step": 6853 }, { "epoch": 0.71, "learning_rate": 4.007100651514415e-05, "loss": 0.6691, "step": 6854 }, { "epoch": 0.71, "learning_rate": 4.0044019734743365e-05, "loss": 0.6762, "step": 6855 }, { "epoch": 0.71, "learning_rate": 4.00170397696718e-05, "loss": 0.6495, "step": 6856 }, { "epoch": 0.71, "learning_rate": 3.9990066622996245e-05, "loss": 0.6965, "step": 6857 }, { "epoch": 0.71, "learning_rate": 3.9963100297782886e-05, "loss": 0.6794, "step": 6858 }, { "epoch": 0.71, "learning_rate": 3.9936140797096955e-05, "loss": 0.7049, "step": 6859 }, { "epoch": 0.71, "learning_rate": 3.990918812400305e-05, "loss": 0.6763, "step": 6860 }, { "epoch": 0.71, "learning_rate": 3.9882242281564964e-05, "loss": 0.6589, "step": 6861 }, { "epoch": 0.71, "learning_rate": 3.9855303272845615e-05, "loss": 0.6775, "step": 6862 }, { "epoch": 0.71, "learning_rate": 3.9828371100907266e-05, "loss": 0.6884, "step": 6863 }, { "epoch": 0.71, "learning_rate": 3.98014457688114e-05, "loss": 0.6523, "step": 6864 }, { "epoch": 0.71, "learning_rate": 3.977452727961859e-05, "loss": 0.7106, "step": 6865 }, { "epoch": 0.71, "learning_rate": 3.97476156363888e-05, "loss": 0.6157, "step": 6866 }, { "epoch": 0.71, "learning_rate": 3.972071084218106e-05, "loss": 0.6842, "step": 6867 }, { "epoch": 0.71, "learning_rate": 3.969381290005378e-05, "loss": 0.6479, "step": 6868 }, { "epoch": 0.71, "learning_rate": 3.966692181306444e-05, "loss": 0.6181, "step": 6869 }, { "epoch": 0.72, "learning_rate": 3.9640037584269864e-05, "loss": 0.7398, "step": 6870 }, { "epoch": 0.72, "learning_rate": 3.9613160216725976e-05, "loss": 0.703, "step": 6871 }, { "epoch": 0.72, "learning_rate": 3.958628971348805e-05, "loss": 0.638, "step": 6872 }, { "epoch": 0.72, "learning_rate": 3.955942607761046e-05, "loss": 0.6952, "step": 6873 }, { "epoch": 0.72, "learning_rate": 3.953256931214689e-05, "loss": 0.6481, "step": 6874 }, { "epoch": 0.72, "learning_rate": 3.9505719420150245e-05, "loss": 0.6322, "step": 6875 }, { "epoch": 0.72, "learning_rate": 3.947887640467252e-05, "loss": 0.6871, "step": 6876 }, { "epoch": 0.72, "learning_rate": 3.9452040268765076e-05, "loss": 0.644, "step": 6877 }, { "epoch": 0.72, "learning_rate": 3.9425211015478456e-05, "loss": 0.6396, "step": 6878 }, { "epoch": 0.72, "learning_rate": 3.939838864786235e-05, "loss": 0.7178, "step": 6879 }, { "epoch": 0.72, "learning_rate": 3.937157316896577e-05, "loss": 0.6211, "step": 6880 }, { "epoch": 0.72, "learning_rate": 3.934476458183687e-05, "loss": 0.6919, "step": 6881 }, { "epoch": 0.72, "learning_rate": 3.931796288952299e-05, "loss": 0.7177, "step": 6882 }, { "epoch": 0.72, "learning_rate": 3.9291168095070775e-05, "loss": 0.6917, "step": 6883 }, { "epoch": 0.72, "learning_rate": 3.926438020152609e-05, "loss": 0.6668, "step": 6884 }, { "epoch": 0.72, "learning_rate": 3.923759921193391e-05, "loss": 0.6276, "step": 6885 }, { "epoch": 0.72, "learning_rate": 3.921082512933851e-05, "loss": 0.6627, "step": 6886 }, { "epoch": 0.72, "learning_rate": 3.9184057956783405e-05, "loss": 0.6206, "step": 6887 }, { "epoch": 0.72, "learning_rate": 3.915729769731121e-05, "loss": 0.6705, "step": 6888 }, { "epoch": 0.72, "learning_rate": 3.913054435396385e-05, "loss": 0.7056, "step": 6889 }, { "epoch": 0.72, "learning_rate": 3.9103797929782484e-05, "loss": 0.6954, "step": 6890 }, { "epoch": 0.72, "learning_rate": 3.9077058427807343e-05, "loss": 0.6487, "step": 6891 }, { "epoch": 0.72, "learning_rate": 3.905032585107806e-05, "loss": 0.6511, "step": 6892 }, { "epoch": 0.72, "learning_rate": 3.902360020263335e-05, "loss": 0.6947, "step": 6893 }, { "epoch": 0.72, "learning_rate": 3.899688148551113e-05, "loss": 0.6234, "step": 6894 }, { "epoch": 0.72, "learning_rate": 3.897016970274864e-05, "loss": 0.6504, "step": 6895 }, { "epoch": 0.72, "learning_rate": 3.894346485738222e-05, "loss": 0.6409, "step": 6896 }, { "epoch": 0.72, "learning_rate": 3.891676695244748e-05, "loss": 0.663, "step": 6897 }, { "epoch": 0.72, "learning_rate": 3.889007599097929e-05, "loss": 0.6765, "step": 6898 }, { "epoch": 0.72, "learning_rate": 3.8863391976011576e-05, "loss": 0.6843, "step": 6899 }, { "epoch": 0.72, "learning_rate": 3.883671491057762e-05, "loss": 0.6513, "step": 6900 }, { "epoch": 0.72, "learning_rate": 3.88100447977099e-05, "loss": 0.6312, "step": 6901 }, { "epoch": 0.72, "learning_rate": 3.8783381640439985e-05, "loss": 0.7405, "step": 6902 }, { "epoch": 0.72, "learning_rate": 3.875672544179878e-05, "loss": 0.6863, "step": 6903 }, { "epoch": 0.72, "learning_rate": 3.873007620481638e-05, "loss": 0.6639, "step": 6904 }, { "epoch": 0.72, "learning_rate": 3.870343393252201e-05, "loss": 0.6251, "step": 6905 }, { "epoch": 0.72, "learning_rate": 3.86767986279442e-05, "loss": 0.6459, "step": 6906 }, { "epoch": 0.72, "learning_rate": 3.8650170294110625e-05, "loss": 0.7338, "step": 6907 }, { "epoch": 0.72, "learning_rate": 3.8623548934048146e-05, "loss": 0.7148, "step": 6908 }, { "epoch": 0.72, "learning_rate": 3.859693455078291e-05, "loss": 0.6322, "step": 6909 }, { "epoch": 0.72, "learning_rate": 3.8570327147340276e-05, "loss": 0.6881, "step": 6910 }, { "epoch": 0.72, "learning_rate": 3.85437267267447e-05, "loss": 0.6508, "step": 6911 }, { "epoch": 0.72, "learning_rate": 3.8517133292019956e-05, "loss": 0.6655, "step": 6912 }, { "epoch": 0.72, "learning_rate": 3.849054684618892e-05, "loss": 0.6557, "step": 6913 }, { "epoch": 0.72, "learning_rate": 3.846396739227378e-05, "loss": 0.6758, "step": 6914 }, { "epoch": 0.72, "learning_rate": 3.84373949332959e-05, "loss": 0.6715, "step": 6915 }, { "epoch": 0.72, "learning_rate": 3.841082947227578e-05, "loss": 0.6467, "step": 6916 }, { "epoch": 0.72, "learning_rate": 3.8384271012233173e-05, "loss": 0.7268, "step": 6917 }, { "epoch": 0.72, "learning_rate": 3.835771955618712e-05, "loss": 0.605, "step": 6918 }, { "epoch": 0.72, "learning_rate": 3.8331175107155714e-05, "loss": 0.6672, "step": 6919 }, { "epoch": 0.72, "learning_rate": 3.830463766815629e-05, "loss": 0.6682, "step": 6920 }, { "epoch": 0.72, "learning_rate": 3.827810724220551e-05, "loss": 0.6542, "step": 6921 }, { "epoch": 0.72, "learning_rate": 3.825158383231906e-05, "loss": 0.6794, "step": 6922 }, { "epoch": 0.72, "learning_rate": 3.8225067441511943e-05, "loss": 0.7067, "step": 6923 }, { "epoch": 0.72, "learning_rate": 3.8198558072798384e-05, "loss": 0.6769, "step": 6924 }, { "epoch": 0.72, "learning_rate": 3.8172055729191694e-05, "loss": 0.6707, "step": 6925 }, { "epoch": 0.72, "learning_rate": 3.814556041370447e-05, "loss": 0.7258, "step": 6926 }, { "epoch": 0.72, "learning_rate": 3.811907212934854e-05, "loss": 0.647, "step": 6927 }, { "epoch": 0.72, "learning_rate": 3.8092590879134826e-05, "loss": 0.6617, "step": 6928 }, { "epoch": 0.72, "learning_rate": 3.806611666607353e-05, "loss": 0.6781, "step": 6929 }, { "epoch": 0.72, "learning_rate": 3.8039649493174066e-05, "loss": 0.6518, "step": 6930 }, { "epoch": 0.72, "learning_rate": 3.8013189363445e-05, "loss": 0.6476, "step": 6931 }, { "epoch": 0.72, "learning_rate": 3.798673627989407e-05, "loss": 0.6827, "step": 6932 }, { "epoch": 0.72, "learning_rate": 3.796029024552832e-05, "loss": 0.6725, "step": 6933 }, { "epoch": 0.72, "learning_rate": 3.793385126335386e-05, "loss": 0.6886, "step": 6934 }, { "epoch": 0.72, "learning_rate": 3.790741933637615e-05, "loss": 0.6232, "step": 6935 }, { "epoch": 0.72, "learning_rate": 3.788099446759968e-05, "loss": 0.6335, "step": 6936 }, { "epoch": 0.72, "learning_rate": 3.7854576660028275e-05, "loss": 0.6804, "step": 6937 }, { "epoch": 0.72, "learning_rate": 3.7828165916664926e-05, "loss": 0.6475, "step": 6938 }, { "epoch": 0.72, "learning_rate": 3.780176224051174e-05, "loss": 0.6724, "step": 6939 }, { "epoch": 0.72, "learning_rate": 3.7775365634570116e-05, "loss": 0.6264, "step": 6940 }, { "epoch": 0.72, "learning_rate": 3.7748976101840636e-05, "loss": 0.6795, "step": 6941 }, { "epoch": 0.72, "learning_rate": 3.7722593645323e-05, "loss": 0.6677, "step": 6942 }, { "epoch": 0.72, "learning_rate": 3.7696218268016237e-05, "loss": 0.6609, "step": 6943 }, { "epoch": 0.72, "learning_rate": 3.7669849972918405e-05, "loss": 0.6624, "step": 6944 }, { "epoch": 0.72, "learning_rate": 3.764348876302694e-05, "loss": 0.7103, "step": 6945 }, { "epoch": 0.72, "learning_rate": 3.761713464133828e-05, "loss": 0.7283, "step": 6946 }, { "epoch": 0.72, "learning_rate": 3.759078761084824e-05, "loss": 0.7343, "step": 6947 }, { "epoch": 0.72, "learning_rate": 3.7564447674551694e-05, "loss": 0.6952, "step": 6948 }, { "epoch": 0.72, "learning_rate": 3.75381148354428e-05, "loss": 0.6832, "step": 6949 }, { "epoch": 0.72, "learning_rate": 3.751178909651483e-05, "loss": 0.6572, "step": 6950 }, { "epoch": 0.72, "learning_rate": 3.74854704607603e-05, "loss": 0.7035, "step": 6951 }, { "epoch": 0.72, "learning_rate": 3.745915893117096e-05, "loss": 0.7284, "step": 6952 }, { "epoch": 0.72, "learning_rate": 3.743285451073761e-05, "loss": 0.6928, "step": 6953 }, { "epoch": 0.72, "learning_rate": 3.7406557202450386e-05, "loss": 0.7187, "step": 6954 }, { "epoch": 0.72, "learning_rate": 3.738026700929859e-05, "loss": 0.6823, "step": 6955 }, { "epoch": 0.72, "learning_rate": 3.735398393427061e-05, "loss": 0.663, "step": 6956 }, { "epoch": 0.72, "learning_rate": 3.7327707980354176e-05, "loss": 0.67, "step": 6957 }, { "epoch": 0.72, "learning_rate": 3.73014391505361e-05, "loss": 0.6666, "step": 6958 }, { "epoch": 0.72, "learning_rate": 3.727517744780238e-05, "loss": 0.687, "step": 6959 }, { "epoch": 0.72, "learning_rate": 3.7248922875138295e-05, "loss": 0.6707, "step": 6960 }, { "epoch": 0.72, "learning_rate": 3.7222675435528265e-05, "loss": 0.6107, "step": 6961 }, { "epoch": 0.72, "learning_rate": 3.7196435131955845e-05, "loss": 0.6467, "step": 6962 }, { "epoch": 0.72, "learning_rate": 3.717020196740385e-05, "loss": 0.6755, "step": 6963 }, { "epoch": 0.72, "learning_rate": 3.7143975944854316e-05, "loss": 0.7052, "step": 6964 }, { "epoch": 0.72, "learning_rate": 3.7117757067288326e-05, "loss": 0.6499, "step": 6965 }, { "epoch": 0.73, "learning_rate": 3.7091545337686285e-05, "loss": 0.6679, "step": 6966 }, { "epoch": 0.73, "learning_rate": 3.7065340759027764e-05, "loss": 0.6723, "step": 6967 }, { "epoch": 0.73, "learning_rate": 3.7039143334291426e-05, "loss": 0.6148, "step": 6968 }, { "epoch": 0.73, "learning_rate": 3.701295306645527e-05, "loss": 0.6501, "step": 6969 }, { "epoch": 0.73, "learning_rate": 3.698676995849636e-05, "loss": 0.6884, "step": 6970 }, { "epoch": 0.73, "learning_rate": 3.696059401339095e-05, "loss": 0.6719, "step": 6971 }, { "epoch": 0.73, "learning_rate": 3.693442523411459e-05, "loss": 0.6756, "step": 6972 }, { "epoch": 0.73, "learning_rate": 3.6908263623641884e-05, "loss": 0.6388, "step": 6973 }, { "epoch": 0.73, "learning_rate": 3.688210918494669e-05, "loss": 0.709, "step": 6974 }, { "epoch": 0.73, "learning_rate": 3.68559619210021e-05, "loss": 0.6766, "step": 6975 }, { "epoch": 0.73, "learning_rate": 3.682982183478025e-05, "loss": 0.6736, "step": 6976 }, { "epoch": 0.73, "learning_rate": 3.680368892925258e-05, "loss": 0.6396, "step": 6977 }, { "epoch": 0.73, "learning_rate": 3.677756320738971e-05, "loss": 0.6537, "step": 6978 }, { "epoch": 0.73, "learning_rate": 3.675144467216134e-05, "loss": 0.6889, "step": 6979 }, { "epoch": 0.73, "learning_rate": 3.672533332653646e-05, "loss": 0.6165, "step": 6980 }, { "epoch": 0.73, "learning_rate": 3.669922917348322e-05, "loss": 0.6438, "step": 6981 }, { "epoch": 0.73, "learning_rate": 3.66731322159689e-05, "loss": 0.6738, "step": 6982 }, { "epoch": 0.73, "learning_rate": 3.6647042456960036e-05, "loss": 0.6836, "step": 6983 }, { "epoch": 0.73, "learning_rate": 3.662095989942229e-05, "loss": 0.6982, "step": 6984 }, { "epoch": 0.73, "learning_rate": 3.65948845463205e-05, "loss": 0.6367, "step": 6985 }, { "epoch": 0.73, "learning_rate": 3.656881640061872e-05, "loss": 0.6875, "step": 6986 }, { "epoch": 0.73, "learning_rate": 3.654275546528022e-05, "loss": 0.7123, "step": 6987 }, { "epoch": 0.73, "learning_rate": 3.651670174326734e-05, "loss": 0.7016, "step": 6988 }, { "epoch": 0.73, "learning_rate": 3.6490655237541726e-05, "loss": 0.6441, "step": 6989 }, { "epoch": 0.73, "learning_rate": 3.6464615951064074e-05, "loss": 0.673, "step": 6990 }, { "epoch": 0.73, "learning_rate": 3.6438583886794375e-05, "loss": 0.6212, "step": 6991 }, { "epoch": 0.73, "learning_rate": 3.641255904769176e-05, "loss": 0.7152, "step": 6992 }, { "epoch": 0.73, "learning_rate": 3.638654143671448e-05, "loss": 0.6485, "step": 6993 }, { "epoch": 0.73, "learning_rate": 3.636053105682006e-05, "loss": 0.6768, "step": 6994 }, { "epoch": 0.73, "learning_rate": 3.6334527910965154e-05, "loss": 0.6684, "step": 6995 }, { "epoch": 0.73, "learning_rate": 3.63085320021056e-05, "loss": 0.6491, "step": 6996 }, { "epoch": 0.73, "learning_rate": 3.628254333319636e-05, "loss": 0.6772, "step": 6997 }, { "epoch": 0.73, "learning_rate": 3.625656190719169e-05, "loss": 0.7113, "step": 6998 }, { "epoch": 0.73, "learning_rate": 3.62305877270449e-05, "loss": 0.679, "step": 6999 }, { "epoch": 0.73, "learning_rate": 3.620462079570854e-05, "loss": 0.7021, "step": 7000 }, { "epoch": 0.73, "learning_rate": 3.61786611161344e-05, "loss": 0.6796, "step": 7001 }, { "epoch": 0.73, "learning_rate": 3.6152708691273284e-05, "loss": 0.6309, "step": 7002 }, { "epoch": 0.73, "learning_rate": 3.612676352407529e-05, "loss": 0.6477, "step": 7003 }, { "epoch": 0.73, "learning_rate": 3.610082561748972e-05, "loss": 0.6531, "step": 7004 }, { "epoch": 0.73, "learning_rate": 3.60748949744649e-05, "loss": 0.7575, "step": 7005 }, { "epoch": 0.73, "learning_rate": 3.6048971597948476e-05, "loss": 0.6697, "step": 7006 }, { "epoch": 0.73, "learning_rate": 3.602305549088724e-05, "loss": 0.6841, "step": 7007 }, { "epoch": 0.73, "learning_rate": 3.59971466562271e-05, "loss": 0.6439, "step": 7008 }, { "epoch": 0.73, "learning_rate": 3.597124509691314e-05, "loss": 0.6867, "step": 7009 }, { "epoch": 0.73, "learning_rate": 3.5945350815889714e-05, "loss": 0.6286, "step": 7010 }, { "epoch": 0.73, "learning_rate": 3.591946381610022e-05, "loss": 0.6254, "step": 7011 }, { "epoch": 0.73, "learning_rate": 3.589358410048734e-05, "loss": 0.628, "step": 7012 }, { "epoch": 0.73, "learning_rate": 3.586771167199283e-05, "loss": 0.709, "step": 7013 }, { "epoch": 0.73, "learning_rate": 3.58418465335577e-05, "loss": 0.6984, "step": 7014 }, { "epoch": 0.73, "learning_rate": 3.5815988688122124e-05, "loss": 0.6035, "step": 7015 }, { "epoch": 0.73, "learning_rate": 3.5790138138625363e-05, "loss": 0.7002, "step": 7016 }, { "epoch": 0.73, "learning_rate": 3.576429488800591e-05, "loss": 0.6332, "step": 7017 }, { "epoch": 0.73, "learning_rate": 3.5738458939201504e-05, "loss": 0.6065, "step": 7018 }, { "epoch": 0.73, "learning_rate": 3.5712630295148864e-05, "loss": 0.6817, "step": 7019 }, { "epoch": 0.73, "learning_rate": 3.568680895878409e-05, "loss": 0.652, "step": 7020 }, { "epoch": 0.73, "learning_rate": 3.566099493304226e-05, "loss": 0.6945, "step": 7021 }, { "epoch": 0.73, "learning_rate": 3.5635188220857784e-05, "loss": 0.612, "step": 7022 }, { "epoch": 0.73, "learning_rate": 3.5609388825164114e-05, "loss": 0.6813, "step": 7023 }, { "epoch": 0.73, "learning_rate": 3.558359674889398e-05, "loss": 0.7204, "step": 7024 }, { "epoch": 0.73, "learning_rate": 3.555781199497916e-05, "loss": 0.6707, "step": 7025 }, { "epoch": 0.73, "learning_rate": 3.55320345663507e-05, "loss": 0.6774, "step": 7026 }, { "epoch": 0.73, "learning_rate": 3.55062644659388e-05, "loss": 0.6868, "step": 7027 }, { "epoch": 0.73, "learning_rate": 3.548050169667275e-05, "loss": 0.6831, "step": 7028 }, { "epoch": 0.73, "learning_rate": 3.545474626148113e-05, "loss": 0.6526, "step": 7029 }, { "epoch": 0.73, "learning_rate": 3.542899816329154e-05, "loss": 0.7181, "step": 7030 }, { "epoch": 0.73, "learning_rate": 3.540325740503086e-05, "loss": 0.7258, "step": 7031 }, { "epoch": 0.73, "learning_rate": 3.537752398962514e-05, "loss": 0.6326, "step": 7032 }, { "epoch": 0.73, "learning_rate": 3.535179791999948e-05, "loss": 0.656, "step": 7033 }, { "epoch": 0.73, "learning_rate": 3.532607919907828e-05, "loss": 0.6633, "step": 7034 }, { "epoch": 0.73, "learning_rate": 3.530036782978502e-05, "loss": 0.6819, "step": 7035 }, { "epoch": 0.73, "learning_rate": 3.527466381504233e-05, "loss": 0.6125, "step": 7036 }, { "epoch": 0.73, "learning_rate": 3.524896715777208e-05, "loss": 0.6841, "step": 7037 }, { "epoch": 0.73, "learning_rate": 3.522327786089531e-05, "loss": 0.6534, "step": 7038 }, { "epoch": 0.73, "learning_rate": 3.5197595927332094e-05, "loss": 0.728, "step": 7039 }, { "epoch": 0.73, "learning_rate": 3.5171921360001795e-05, "loss": 0.7033, "step": 7040 }, { "epoch": 0.73, "learning_rate": 3.514625416182292e-05, "loss": 0.7242, "step": 7041 }, { "epoch": 0.73, "learning_rate": 3.512059433571307e-05, "loss": 0.673, "step": 7042 }, { "epoch": 0.73, "learning_rate": 3.5094941884589074e-05, "loss": 0.6877, "step": 7043 }, { "epoch": 0.73, "learning_rate": 3.506929681136695e-05, "loss": 0.5882, "step": 7044 }, { "epoch": 0.73, "learning_rate": 3.5043659118961745e-05, "loss": 0.6334, "step": 7045 }, { "epoch": 0.73, "learning_rate": 3.501802881028783e-05, "loss": 0.6165, "step": 7046 }, { "epoch": 0.73, "learning_rate": 3.4992405888258584e-05, "loss": 0.6747, "step": 7047 }, { "epoch": 0.73, "learning_rate": 3.496679035578671e-05, "loss": 0.7197, "step": 7048 }, { "epoch": 0.73, "learning_rate": 3.494118221578392e-05, "loss": 0.6907, "step": 7049 }, { "epoch": 0.73, "learning_rate": 3.491558147116113e-05, "loss": 0.66, "step": 7050 }, { "epoch": 0.73, "learning_rate": 3.4889988124828465e-05, "loss": 0.6929, "step": 7051 }, { "epoch": 0.73, "learning_rate": 3.486440217969521e-05, "loss": 0.7047, "step": 7052 }, { "epoch": 0.73, "learning_rate": 3.483882363866971e-05, "loss": 0.6609, "step": 7053 }, { "epoch": 0.73, "learning_rate": 3.481325250465958e-05, "loss": 0.6901, "step": 7054 }, { "epoch": 0.73, "learning_rate": 3.478768878057156e-05, "loss": 0.5982, "step": 7055 }, { "epoch": 0.73, "learning_rate": 3.476213246931147e-05, "loss": 0.7457, "step": 7056 }, { "epoch": 0.73, "learning_rate": 3.4736583573784397e-05, "loss": 0.6829, "step": 7057 }, { "epoch": 0.73, "learning_rate": 3.4711042096894574e-05, "loss": 0.6682, "step": 7058 }, { "epoch": 0.73, "learning_rate": 3.468550804154528e-05, "loss": 0.6308, "step": 7059 }, { "epoch": 0.73, "learning_rate": 3.465998141063911e-05, "loss": 0.6498, "step": 7060 }, { "epoch": 0.73, "learning_rate": 3.463446220707768e-05, "loss": 0.6853, "step": 7061 }, { "epoch": 0.74, "learning_rate": 3.46089504337618e-05, "loss": 0.6787, "step": 7062 }, { "epoch": 0.74, "learning_rate": 3.4583446093591466e-05, "loss": 0.6446, "step": 7063 }, { "epoch": 0.74, "learning_rate": 3.455794918946585e-05, "loss": 0.6463, "step": 7064 }, { "epoch": 0.74, "learning_rate": 3.453245972428319e-05, "loss": 0.6409, "step": 7065 }, { "epoch": 0.74, "learning_rate": 3.450697770094096e-05, "loss": 0.6848, "step": 7066 }, { "epoch": 0.74, "learning_rate": 3.4481503122335776e-05, "loss": 0.6077, "step": 7067 }, { "epoch": 0.74, "learning_rate": 3.4456035991363336e-05, "loss": 0.7345, "step": 7068 }, { "epoch": 0.74, "learning_rate": 3.443057631091859e-05, "loss": 0.5802, "step": 7069 }, { "epoch": 0.74, "learning_rate": 3.440512408389557e-05, "loss": 0.662, "step": 7070 }, { "epoch": 0.74, "learning_rate": 3.4379679313187486e-05, "loss": 0.6093, "step": 7071 }, { "epoch": 0.74, "learning_rate": 3.435424200168675e-05, "loss": 0.6898, "step": 7072 }, { "epoch": 0.74, "learning_rate": 3.432881215228484e-05, "loss": 0.6945, "step": 7073 }, { "epoch": 0.74, "learning_rate": 3.430338976787238e-05, "loss": 0.7108, "step": 7074 }, { "epoch": 0.74, "learning_rate": 3.427797485133928e-05, "loss": 0.6436, "step": 7075 }, { "epoch": 0.74, "learning_rate": 3.425256740557443e-05, "loss": 0.5998, "step": 7076 }, { "epoch": 0.74, "learning_rate": 3.422716743346598e-05, "loss": 0.624, "step": 7077 }, { "epoch": 0.74, "learning_rate": 3.420177493790123e-05, "loss": 0.6947, "step": 7078 }, { "epoch": 0.74, "learning_rate": 3.417638992176655e-05, "loss": 0.6366, "step": 7079 }, { "epoch": 0.74, "learning_rate": 3.415101238794753e-05, "loss": 0.6939, "step": 7080 }, { "epoch": 0.74, "learning_rate": 3.412564233932893e-05, "loss": 0.689, "step": 7081 }, { "epoch": 0.74, "learning_rate": 3.410027977879456e-05, "loss": 0.6461, "step": 7082 }, { "epoch": 0.74, "learning_rate": 3.407492470922748e-05, "loss": 0.6745, "step": 7083 }, { "epoch": 0.74, "learning_rate": 3.4049577133509845e-05, "loss": 0.7204, "step": 7084 }, { "epoch": 0.74, "learning_rate": 3.402423705452299e-05, "loss": 0.6289, "step": 7085 }, { "epoch": 0.74, "learning_rate": 3.399890447514731e-05, "loss": 0.6714, "step": 7086 }, { "epoch": 0.74, "learning_rate": 3.3973579398262503e-05, "loss": 0.7057, "step": 7087 }, { "epoch": 0.74, "learning_rate": 3.394826182674724e-05, "loss": 0.733, "step": 7088 }, { "epoch": 0.74, "learning_rate": 3.3922951763479516e-05, "loss": 0.6774, "step": 7089 }, { "epoch": 0.74, "learning_rate": 3.389764921133629e-05, "loss": 0.6686, "step": 7090 }, { "epoch": 0.74, "learning_rate": 3.387235417319381e-05, "loss": 0.7456, "step": 7091 }, { "epoch": 0.74, "learning_rate": 3.384706665192745e-05, "loss": 0.6978, "step": 7092 }, { "epoch": 0.74, "learning_rate": 3.3821786650411633e-05, "loss": 0.715, "step": 7093 }, { "epoch": 0.74, "learning_rate": 3.3796514171520024e-05, "loss": 0.6492, "step": 7094 }, { "epoch": 0.74, "learning_rate": 3.3771249218125424e-05, "loss": 0.7289, "step": 7095 }, { "epoch": 0.74, "learning_rate": 3.37459917930997e-05, "loss": 0.6416, "step": 7096 }, { "epoch": 0.74, "learning_rate": 3.372074189931399e-05, "loss": 0.6746, "step": 7097 }, { "epoch": 0.74, "learning_rate": 3.369549953963843e-05, "loss": 0.6939, "step": 7098 }, { "epoch": 0.74, "learning_rate": 3.3670264716942446e-05, "loss": 0.6335, "step": 7099 }, { "epoch": 0.74, "learning_rate": 3.3645037434094474e-05, "loss": 0.5831, "step": 7100 }, { "epoch": 0.74, "learning_rate": 3.361981769396222e-05, "loss": 0.6404, "step": 7101 }, { "epoch": 0.74, "learning_rate": 3.359460549941239e-05, "loss": 0.6652, "step": 7102 }, { "epoch": 0.74, "learning_rate": 3.356940085331095e-05, "loss": 0.6645, "step": 7103 }, { "epoch": 0.74, "learning_rate": 3.354420375852301e-05, "loss": 0.6587, "step": 7104 }, { "epoch": 0.74, "learning_rate": 3.3519014217912704e-05, "loss": 0.6884, "step": 7105 }, { "epoch": 0.74, "learning_rate": 3.349383223434342e-05, "loss": 0.68, "step": 7106 }, { "epoch": 0.74, "learning_rate": 3.346865781067767e-05, "loss": 0.6305, "step": 7107 }, { "epoch": 0.74, "learning_rate": 3.3443490949777046e-05, "loss": 0.6644, "step": 7108 }, { "epoch": 0.74, "learning_rate": 3.341833165450237e-05, "loss": 0.6382, "step": 7109 }, { "epoch": 0.74, "learning_rate": 3.339317992771349e-05, "loss": 0.7174, "step": 7110 }, { "epoch": 0.74, "learning_rate": 3.336803577226952e-05, "loss": 0.6451, "step": 7111 }, { "epoch": 0.74, "learning_rate": 3.334289919102863e-05, "loss": 0.7164, "step": 7112 }, { "epoch": 0.74, "learning_rate": 3.331777018684811e-05, "loss": 0.6709, "step": 7113 }, { "epoch": 0.74, "learning_rate": 3.3292648762584465e-05, "loss": 0.701, "step": 7114 }, { "epoch": 0.74, "learning_rate": 3.326753492109335e-05, "loss": 0.6881, "step": 7115 }, { "epoch": 0.74, "learning_rate": 3.324242866522941e-05, "loss": 0.6106, "step": 7116 }, { "epoch": 0.74, "learning_rate": 3.321732999784659e-05, "loss": 0.6691, "step": 7117 }, { "epoch": 0.74, "learning_rate": 3.3192238921797945e-05, "loss": 0.6601, "step": 7118 }, { "epoch": 0.74, "learning_rate": 3.316715543993555e-05, "loss": 0.6678, "step": 7119 }, { "epoch": 0.74, "learning_rate": 3.314207955511075e-05, "loss": 0.7116, "step": 7120 }, { "epoch": 0.74, "learning_rate": 3.311701127017399e-05, "loss": 0.7035, "step": 7121 }, { "epoch": 0.74, "learning_rate": 3.3091950587974796e-05, "loss": 0.5937, "step": 7122 }, { "epoch": 0.74, "learning_rate": 3.3066897511361914e-05, "loss": 0.6727, "step": 7123 }, { "epoch": 0.74, "learning_rate": 3.3041852043183144e-05, "loss": 0.651, "step": 7124 }, { "epoch": 0.74, "learning_rate": 3.301681418628549e-05, "loss": 0.6306, "step": 7125 }, { "epoch": 0.74, "learning_rate": 3.299178394351503e-05, "loss": 0.6956, "step": 7126 }, { "epoch": 0.74, "learning_rate": 3.296676131771704e-05, "loss": 0.7083, "step": 7127 }, { "epoch": 0.74, "learning_rate": 3.294174631173587e-05, "loss": 0.7086, "step": 7128 }, { "epoch": 0.74, "learning_rate": 3.291673892841506e-05, "loss": 0.6983, "step": 7129 }, { "epoch": 0.74, "learning_rate": 3.2891739170597215e-05, "loss": 0.6743, "step": 7130 }, { "epoch": 0.74, "learning_rate": 3.2866747041124124e-05, "loss": 0.7104, "step": 7131 }, { "epoch": 0.74, "learning_rate": 3.284176254283674e-05, "loss": 0.6687, "step": 7132 }, { "epoch": 0.74, "learning_rate": 3.2816785678575055e-05, "loss": 0.7123, "step": 7133 }, { "epoch": 0.74, "learning_rate": 3.2791816451178256e-05, "loss": 0.6976, "step": 7134 }, { "epoch": 0.74, "learning_rate": 3.27668548634847e-05, "loss": 0.6918, "step": 7135 }, { "epoch": 0.74, "learning_rate": 3.274190091833175e-05, "loss": 0.6896, "step": 7136 }, { "epoch": 0.74, "learning_rate": 3.271695461855604e-05, "loss": 0.6288, "step": 7137 }, { "epoch": 0.74, "learning_rate": 3.269201596699324e-05, "loss": 0.708, "step": 7138 }, { "epoch": 0.74, "learning_rate": 3.266708496647816e-05, "loss": 0.6005, "step": 7139 }, { "epoch": 0.74, "learning_rate": 3.264216161984478e-05, "loss": 0.6595, "step": 7140 }, { "epoch": 0.74, "learning_rate": 3.2617245929926234e-05, "loss": 0.6633, "step": 7141 }, { "epoch": 0.74, "learning_rate": 3.259233789955467e-05, "loss": 0.6666, "step": 7142 }, { "epoch": 0.74, "learning_rate": 3.2567437531561486e-05, "loss": 0.6595, "step": 7143 }, { "epoch": 0.74, "learning_rate": 3.254254482877719e-05, "loss": 0.7317, "step": 7144 }, { "epoch": 0.74, "learning_rate": 3.251765979403131e-05, "loss": 0.734, "step": 7145 }, { "epoch": 0.74, "learning_rate": 3.249278243015264e-05, "loss": 0.6314, "step": 7146 }, { "epoch": 0.74, "learning_rate": 3.2467912739969054e-05, "loss": 0.7407, "step": 7147 }, { "epoch": 0.74, "learning_rate": 3.244305072630749e-05, "loss": 0.6519, "step": 7148 }, { "epoch": 0.74, "learning_rate": 3.241819639199414e-05, "loss": 0.693, "step": 7149 }, { "epoch": 0.74, "learning_rate": 3.2393349739854204e-05, "loss": 0.6933, "step": 7150 }, { "epoch": 0.74, "learning_rate": 3.2368510772712034e-05, "loss": 0.7154, "step": 7151 }, { "epoch": 0.74, "learning_rate": 3.23436794933912e-05, "loss": 0.6676, "step": 7152 }, { "epoch": 0.74, "learning_rate": 3.231885590471426e-05, "loss": 0.7172, "step": 7153 }, { "epoch": 0.74, "learning_rate": 3.2294040009502994e-05, "loss": 0.6592, "step": 7154 }, { "epoch": 0.74, "learning_rate": 3.226923181057831e-05, "loss": 0.6744, "step": 7155 }, { "epoch": 0.74, "learning_rate": 3.224443131076015e-05, "loss": 0.6734, "step": 7156 }, { "epoch": 0.74, "learning_rate": 3.221963851286768e-05, "loss": 0.6388, "step": 7157 }, { "epoch": 0.75, "learning_rate": 3.2194853419719175e-05, "loss": 0.6493, "step": 7158 }, { "epoch": 0.75, "learning_rate": 3.2170076034131945e-05, "loss": 0.6251, "step": 7159 }, { "epoch": 0.75, "learning_rate": 3.2145306358922536e-05, "loss": 0.6432, "step": 7160 }, { "epoch": 0.75, "learning_rate": 3.2120544396906594e-05, "loss": 0.6542, "step": 7161 }, { "epoch": 0.75, "learning_rate": 3.209579015089884e-05, "loss": 0.6519, "step": 7162 }, { "epoch": 0.75, "learning_rate": 3.2071043623713106e-05, "loss": 0.6777, "step": 7163 }, { "epoch": 0.75, "learning_rate": 3.2046304818162455e-05, "loss": 0.6645, "step": 7164 }, { "epoch": 0.75, "learning_rate": 3.202157373705893e-05, "loss": 0.7822, "step": 7165 }, { "epoch": 0.75, "learning_rate": 3.1996850383213794e-05, "loss": 0.7043, "step": 7166 }, { "epoch": 0.75, "learning_rate": 3.197213475943747e-05, "loss": 0.6556, "step": 7167 }, { "epoch": 0.75, "learning_rate": 3.1947426868539334e-05, "loss": 0.7529, "step": 7168 }, { "epoch": 0.75, "learning_rate": 3.1922726713328074e-05, "loss": 0.6565, "step": 7169 }, { "epoch": 0.75, "learning_rate": 3.189803429661133e-05, "loss": 0.7095, "step": 7170 }, { "epoch": 0.75, "learning_rate": 3.1873349621196006e-05, "loss": 0.7113, "step": 7171 }, { "epoch": 0.75, "learning_rate": 3.184867268988807e-05, "loss": 0.7161, "step": 7172 }, { "epoch": 0.75, "learning_rate": 3.182400350549254e-05, "loss": 0.6772, "step": 7173 }, { "epoch": 0.75, "learning_rate": 3.179934207081366e-05, "loss": 0.6347, "step": 7174 }, { "epoch": 0.75, "learning_rate": 3.1774688388654786e-05, "loss": 0.6509, "step": 7175 }, { "epoch": 0.75, "learning_rate": 3.1750042461818295e-05, "loss": 0.6975, "step": 7176 }, { "epoch": 0.75, "learning_rate": 3.1725404293105753e-05, "loss": 0.7028, "step": 7177 }, { "epoch": 0.75, "learning_rate": 3.170077388531787e-05, "loss": 0.6947, "step": 7178 }, { "epoch": 0.75, "learning_rate": 3.167615124125438e-05, "loss": 0.6981, "step": 7179 }, { "epoch": 0.75, "learning_rate": 3.165153636371424e-05, "loss": 0.6773, "step": 7180 }, { "epoch": 0.75, "learning_rate": 3.162692925549549e-05, "loss": 0.7035, "step": 7181 }, { "epoch": 0.75, "learning_rate": 3.160232991939522e-05, "loss": 0.6973, "step": 7182 }, { "epoch": 0.75, "learning_rate": 3.157773835820973e-05, "loss": 0.6964, "step": 7183 }, { "epoch": 0.75, "learning_rate": 3.155315457473442e-05, "loss": 0.7451, "step": 7184 }, { "epoch": 0.75, "learning_rate": 3.152857857176372e-05, "loss": 0.6823, "step": 7185 }, { "epoch": 0.75, "learning_rate": 3.150401035209127e-05, "loss": 0.6644, "step": 7186 }, { "epoch": 0.75, "learning_rate": 3.147944991850983e-05, "loss": 0.6498, "step": 7187 }, { "epoch": 0.75, "learning_rate": 3.1454897273811214e-05, "loss": 0.7202, "step": 7188 }, { "epoch": 0.75, "learning_rate": 3.1430352420786356e-05, "loss": 0.6466, "step": 7189 }, { "epoch": 0.75, "learning_rate": 3.1405815362225296e-05, "loss": 0.6523, "step": 7190 }, { "epoch": 0.75, "learning_rate": 3.138128610091727e-05, "loss": 0.7286, "step": 7191 }, { "epoch": 0.75, "learning_rate": 3.1356764639650584e-05, "loss": 0.6635, "step": 7192 }, { "epoch": 0.75, "learning_rate": 3.133225098121258e-05, "loss": 0.6711, "step": 7193 }, { "epoch": 0.75, "learning_rate": 3.130774512838984e-05, "loss": 0.6777, "step": 7194 }, { "epoch": 0.75, "learning_rate": 3.128324708396799e-05, "loss": 0.6885, "step": 7195 }, { "epoch": 0.75, "learning_rate": 3.125875685073175e-05, "loss": 0.64, "step": 7196 }, { "epoch": 0.75, "learning_rate": 3.123427443146499e-05, "loss": 0.7319, "step": 7197 }, { "epoch": 0.75, "learning_rate": 3.1209799828950716e-05, "loss": 0.6629, "step": 7198 }, { "epoch": 0.75, "learning_rate": 3.1185333045970956e-05, "loss": 0.7309, "step": 7199 }, { "epoch": 0.75, "learning_rate": 3.116087408530695e-05, "loss": 0.6931, "step": 7200 }, { "epoch": 0.75, "learning_rate": 3.1136422949738954e-05, "loss": 0.7196, "step": 7201 }, { "epoch": 0.75, "learning_rate": 3.111197964204644e-05, "loss": 0.6427, "step": 7202 }, { "epoch": 0.75, "learning_rate": 3.108754416500786e-05, "loss": 0.6861, "step": 7203 }, { "epoch": 0.75, "learning_rate": 3.106311652140094e-05, "loss": 0.6863, "step": 7204 }, { "epoch": 0.75, "learning_rate": 3.103869671400234e-05, "loss": 0.715, "step": 7205 }, { "epoch": 0.75, "learning_rate": 3.101428474558794e-05, "loss": 0.6916, "step": 7206 }, { "epoch": 0.75, "learning_rate": 3.0989880618932746e-05, "loss": 0.6695, "step": 7207 }, { "epoch": 0.75, "learning_rate": 3.096548433681077e-05, "loss": 0.6554, "step": 7208 }, { "epoch": 0.75, "learning_rate": 3.094109590199524e-05, "loss": 0.6652, "step": 7209 }, { "epoch": 0.75, "learning_rate": 3.0916715317258395e-05, "loss": 0.6689, "step": 7210 }, { "epoch": 0.75, "learning_rate": 3.0892342585371646e-05, "loss": 0.635, "step": 7211 }, { "epoch": 0.75, "learning_rate": 3.086797770910553e-05, "loss": 0.6666, "step": 7212 }, { "epoch": 0.75, "learning_rate": 3.084362069122961e-05, "loss": 0.693, "step": 7213 }, { "epoch": 0.75, "learning_rate": 3.081927153451266e-05, "loss": 0.6254, "step": 7214 }, { "epoch": 0.75, "learning_rate": 3.0794930241722455e-05, "loss": 0.6091, "step": 7215 }, { "epoch": 0.75, "learning_rate": 3.077059681562591e-05, "loss": 0.6517, "step": 7216 }, { "epoch": 0.75, "learning_rate": 3.074627125898908e-05, "loss": 0.6954, "step": 7217 }, { "epoch": 0.75, "learning_rate": 3.0721953574577136e-05, "loss": 0.6552, "step": 7218 }, { "epoch": 0.75, "learning_rate": 3.069764376515427e-05, "loss": 0.6957, "step": 7219 }, { "epoch": 0.75, "learning_rate": 3.067334183348385e-05, "loss": 0.6877, "step": 7220 }, { "epoch": 0.75, "learning_rate": 3.064904778232838e-05, "loss": 0.6518, "step": 7221 }, { "epoch": 0.75, "learning_rate": 3.062476161444934e-05, "loss": 0.7261, "step": 7222 }, { "epoch": 0.75, "learning_rate": 3.060048333260742e-05, "loss": 0.6932, "step": 7223 }, { "epoch": 0.75, "learning_rate": 3.057621293956244e-05, "loss": 0.66, "step": 7224 }, { "epoch": 0.75, "learning_rate": 3.0551950438073194e-05, "loss": 0.6616, "step": 7225 }, { "epoch": 0.75, "learning_rate": 3.0527695830897704e-05, "loss": 0.738, "step": 7226 }, { "epoch": 0.75, "learning_rate": 3.050344912079304e-05, "loss": 0.7426, "step": 7227 }, { "epoch": 0.75, "learning_rate": 3.0479210310515328e-05, "loss": 0.6612, "step": 7228 }, { "epoch": 0.75, "learning_rate": 3.0454979402819916e-05, "loss": 0.6303, "step": 7229 }, { "epoch": 0.75, "learning_rate": 3.0430756400461114e-05, "loss": 0.6765, "step": 7230 }, { "epoch": 0.75, "learning_rate": 3.040654130619246e-05, "loss": 0.6635, "step": 7231 }, { "epoch": 0.75, "learning_rate": 3.038233412276654e-05, "loss": 0.6792, "step": 7232 }, { "epoch": 0.75, "learning_rate": 3.0358134852934994e-05, "loss": 0.7154, "step": 7233 }, { "epoch": 0.75, "learning_rate": 3.0333943499448626e-05, "loss": 0.7211, "step": 7234 }, { "epoch": 0.75, "learning_rate": 3.0309760065057368e-05, "loss": 0.6765, "step": 7235 }, { "epoch": 0.75, "learning_rate": 3.0285584552510128e-05, "loss": 0.6061, "step": 7236 }, { "epoch": 0.75, "learning_rate": 3.0261416964555023e-05, "loss": 0.6979, "step": 7237 }, { "epoch": 0.75, "learning_rate": 3.023725730393927e-05, "loss": 0.6752, "step": 7238 }, { "epoch": 0.75, "learning_rate": 3.021310557340912e-05, "loss": 0.731, "step": 7239 }, { "epoch": 0.75, "learning_rate": 3.0188961775709922e-05, "loss": 0.6895, "step": 7240 }, { "epoch": 0.75, "learning_rate": 3.0164825913586225e-05, "loss": 0.6575, "step": 7241 }, { "epoch": 0.75, "learning_rate": 3.014069798978153e-05, "loss": 0.6285, "step": 7242 }, { "epoch": 0.75, "learning_rate": 3.0116578007038555e-05, "loss": 0.6973, "step": 7243 }, { "epoch": 0.75, "learning_rate": 3.0092465968099093e-05, "loss": 0.671, "step": 7244 }, { "epoch": 0.75, "learning_rate": 3.0068361875703954e-05, "loss": 0.7158, "step": 7245 }, { "epoch": 0.75, "learning_rate": 3.0044265732593135e-05, "loss": 0.6437, "step": 7246 }, { "epoch": 0.75, "learning_rate": 3.0020177541505735e-05, "loss": 0.7314, "step": 7247 }, { "epoch": 0.75, "learning_rate": 2.999609730517985e-05, "loss": 0.6616, "step": 7248 }, { "epoch": 0.75, "learning_rate": 2.997202502635278e-05, "loss": 0.5977, "step": 7249 }, { "epoch": 0.75, "learning_rate": 2.9947960707760825e-05, "loss": 0.6708, "step": 7250 }, { "epoch": 0.75, "learning_rate": 2.9923904352139464e-05, "loss": 0.6438, "step": 7251 }, { "epoch": 0.75, "learning_rate": 2.9899855962223257e-05, "loss": 0.6185, "step": 7252 }, { "epoch": 0.75, "learning_rate": 2.987581554074581e-05, "loss": 0.6667, "step": 7253 }, { "epoch": 0.76, "learning_rate": 2.9851783090439823e-05, "loss": 0.7003, "step": 7254 }, { "epoch": 0.76, "learning_rate": 2.9827758614037183e-05, "loss": 0.6299, "step": 7255 }, { "epoch": 0.76, "learning_rate": 2.980374211426874e-05, "loss": 0.6633, "step": 7256 }, { "epoch": 0.76, "learning_rate": 2.9779733593864522e-05, "loss": 0.618, "step": 7257 }, { "epoch": 0.76, "learning_rate": 2.975573305555368e-05, "loss": 0.6823, "step": 7258 }, { "epoch": 0.76, "learning_rate": 2.9731740502064344e-05, "loss": 0.6103, "step": 7259 }, { "epoch": 0.76, "learning_rate": 2.9707755936123816e-05, "loss": 0.7192, "step": 7260 }, { "epoch": 0.76, "learning_rate": 2.9683779360458518e-05, "loss": 0.6063, "step": 7261 }, { "epoch": 0.76, "learning_rate": 2.9659810777793863e-05, "loss": 0.6255, "step": 7262 }, { "epoch": 0.76, "learning_rate": 2.963585019085443e-05, "loss": 0.7125, "step": 7263 }, { "epoch": 0.76, "learning_rate": 2.9611897602363915e-05, "loss": 0.641, "step": 7264 }, { "epoch": 0.76, "learning_rate": 2.9587953015045033e-05, "loss": 0.67, "step": 7265 }, { "epoch": 0.76, "learning_rate": 2.9564016431619568e-05, "loss": 0.6769, "step": 7266 }, { "epoch": 0.76, "learning_rate": 2.954008785480853e-05, "loss": 0.6772, "step": 7267 }, { "epoch": 0.76, "learning_rate": 2.951616728733185e-05, "loss": 0.7214, "step": 7268 }, { "epoch": 0.76, "learning_rate": 2.9492254731908718e-05, "loss": 0.6579, "step": 7269 }, { "epoch": 0.76, "learning_rate": 2.9468350191257245e-05, "loss": 0.6788, "step": 7270 }, { "epoch": 0.76, "learning_rate": 2.944445366809475e-05, "loss": 0.6704, "step": 7271 }, { "epoch": 0.76, "learning_rate": 2.9420565165137637e-05, "loss": 0.6499, "step": 7272 }, { "epoch": 0.76, "learning_rate": 2.9396684685101307e-05, "loss": 0.6775, "step": 7273 }, { "epoch": 0.76, "learning_rate": 2.937281223070032e-05, "loss": 0.6714, "step": 7274 }, { "epoch": 0.76, "learning_rate": 2.9348947804648362e-05, "loss": 0.6583, "step": 7275 }, { "epoch": 0.76, "learning_rate": 2.932509140965809e-05, "loss": 0.6818, "step": 7276 }, { "epoch": 0.76, "learning_rate": 2.9301243048441375e-05, "loss": 0.6934, "step": 7277 }, { "epoch": 0.76, "learning_rate": 2.9277402723709037e-05, "loss": 0.7083, "step": 7278 }, { "epoch": 0.76, "learning_rate": 2.9253570438171128e-05, "loss": 0.585, "step": 7279 }, { "epoch": 0.76, "learning_rate": 2.9229746194536666e-05, "loss": 0.6996, "step": 7280 }, { "epoch": 0.76, "learning_rate": 2.920592999551386e-05, "loss": 0.6626, "step": 7281 }, { "epoch": 0.76, "learning_rate": 2.9182121843809886e-05, "loss": 0.71, "step": 7282 }, { "epoch": 0.76, "learning_rate": 2.91583217421311e-05, "loss": 0.7129, "step": 7283 }, { "epoch": 0.76, "learning_rate": 2.9134529693182944e-05, "loss": 0.616, "step": 7284 }, { "epoch": 0.76, "learning_rate": 2.911074569966986e-05, "loss": 0.6853, "step": 7285 }, { "epoch": 0.76, "learning_rate": 2.9086969764295436e-05, "loss": 0.6459, "step": 7286 }, { "epoch": 0.76, "learning_rate": 2.906320188976239e-05, "loss": 0.6429, "step": 7287 }, { "epoch": 0.76, "learning_rate": 2.9039442078772404e-05, "loss": 0.6826, "step": 7288 }, { "epoch": 0.76, "learning_rate": 2.901569033402636e-05, "loss": 0.6545, "step": 7289 }, { "epoch": 0.76, "learning_rate": 2.89919466582241e-05, "loss": 0.6458, "step": 7290 }, { "epoch": 0.76, "learning_rate": 2.896821105406471e-05, "loss": 0.6767, "step": 7291 }, { "epoch": 0.76, "learning_rate": 2.8944483524246212e-05, "loss": 0.6041, "step": 7292 }, { "epoch": 0.76, "learning_rate": 2.8920764071465756e-05, "loss": 0.7025, "step": 7293 }, { "epoch": 0.76, "learning_rate": 2.88970526984196e-05, "loss": 0.6686, "step": 7294 }, { "epoch": 0.76, "learning_rate": 2.887334940780312e-05, "loss": 0.7474, "step": 7295 }, { "epoch": 0.76, "learning_rate": 2.8849654202310638e-05, "loss": 0.6799, "step": 7296 }, { "epoch": 0.76, "learning_rate": 2.8825967084635676e-05, "loss": 0.7129, "step": 7297 }, { "epoch": 0.76, "learning_rate": 2.8802288057470837e-05, "loss": 0.7061, "step": 7298 }, { "epoch": 0.76, "learning_rate": 2.8778617123507713e-05, "loss": 0.6859, "step": 7299 }, { "epoch": 0.76, "learning_rate": 2.875495428543704e-05, "loss": 0.6262, "step": 7300 }, { "epoch": 0.76, "learning_rate": 2.8731299545948687e-05, "loss": 0.6442, "step": 7301 }, { "epoch": 0.76, "learning_rate": 2.8707652907731452e-05, "loss": 0.6299, "step": 7302 }, { "epoch": 0.76, "learning_rate": 2.8684014373473378e-05, "loss": 0.6191, "step": 7303 }, { "epoch": 0.76, "learning_rate": 2.866038394586148e-05, "loss": 0.691, "step": 7304 }, { "epoch": 0.76, "learning_rate": 2.8636761627581832e-05, "loss": 0.6717, "step": 7305 }, { "epoch": 0.76, "learning_rate": 2.8613147421319684e-05, "loss": 0.7092, "step": 7306 }, { "epoch": 0.76, "learning_rate": 2.858954132975934e-05, "loss": 0.6633, "step": 7307 }, { "epoch": 0.76, "learning_rate": 2.856594335558409e-05, "loss": 0.6, "step": 7308 }, { "epoch": 0.76, "learning_rate": 2.854235350147645e-05, "loss": 0.6499, "step": 7309 }, { "epoch": 0.76, "learning_rate": 2.8518771770117845e-05, "loss": 0.6773, "step": 7310 }, { "epoch": 0.76, "learning_rate": 2.8495198164188896e-05, "loss": 0.677, "step": 7311 }, { "epoch": 0.76, "learning_rate": 2.847163268636932e-05, "loss": 0.6703, "step": 7312 }, { "epoch": 0.76, "learning_rate": 2.8448075339337765e-05, "loss": 0.6935, "step": 7313 }, { "epoch": 0.76, "learning_rate": 2.842452612577211e-05, "loss": 0.6279, "step": 7314 }, { "epoch": 0.76, "learning_rate": 2.8400985048349247e-05, "loss": 0.692, "step": 7315 }, { "epoch": 0.76, "learning_rate": 2.8377452109745095e-05, "loss": 0.6631, "step": 7316 }, { "epoch": 0.76, "learning_rate": 2.8353927312634765e-05, "loss": 0.6837, "step": 7317 }, { "epoch": 0.76, "learning_rate": 2.833041065969233e-05, "loss": 0.623, "step": 7318 }, { "epoch": 0.76, "learning_rate": 2.8306902153590943e-05, "loss": 0.702, "step": 7319 }, { "epoch": 0.76, "learning_rate": 2.8283401797002916e-05, "loss": 0.6291, "step": 7320 }, { "epoch": 0.76, "learning_rate": 2.825990959259961e-05, "loss": 0.6005, "step": 7321 }, { "epoch": 0.76, "learning_rate": 2.823642554305137e-05, "loss": 0.6262, "step": 7322 }, { "epoch": 0.76, "learning_rate": 2.821294965102772e-05, "loss": 0.6244, "step": 7323 }, { "epoch": 0.76, "learning_rate": 2.8189481919197237e-05, "loss": 0.6379, "step": 7324 }, { "epoch": 0.76, "learning_rate": 2.8166022350227495e-05, "loss": 0.6846, "step": 7325 }, { "epoch": 0.76, "learning_rate": 2.8142570946785217e-05, "loss": 0.7403, "step": 7326 }, { "epoch": 0.76, "learning_rate": 2.811912771153623e-05, "loss": 0.6136, "step": 7327 }, { "epoch": 0.76, "learning_rate": 2.809569264714529e-05, "loss": 0.6584, "step": 7328 }, { "epoch": 0.76, "learning_rate": 2.8072265756276396e-05, "loss": 0.7047, "step": 7329 }, { "epoch": 0.76, "learning_rate": 2.8048847041592476e-05, "loss": 0.6511, "step": 7330 }, { "epoch": 0.76, "learning_rate": 2.8025436505755586e-05, "loss": 0.6792, "step": 7331 }, { "epoch": 0.76, "learning_rate": 2.8002034151426903e-05, "loss": 0.7717, "step": 7332 }, { "epoch": 0.76, "learning_rate": 2.7978639981266565e-05, "loss": 0.6562, "step": 7333 }, { "epoch": 0.76, "learning_rate": 2.795525399793386e-05, "loss": 0.6185, "step": 7334 }, { "epoch": 0.76, "learning_rate": 2.793187620408717e-05, "loss": 0.6361, "step": 7335 }, { "epoch": 0.76, "learning_rate": 2.790850660238382e-05, "loss": 0.6918, "step": 7336 }, { "epoch": 0.76, "learning_rate": 2.7885145195480345e-05, "loss": 0.7062, "step": 7337 }, { "epoch": 0.76, "learning_rate": 2.7861791986032294e-05, "loss": 0.7123, "step": 7338 }, { "epoch": 0.76, "learning_rate": 2.783844697669422e-05, "loss": 0.7067, "step": 7339 }, { "epoch": 0.76, "learning_rate": 2.781511017011984e-05, "loss": 0.713, "step": 7340 }, { "epoch": 0.76, "learning_rate": 2.7791781568961916e-05, "loss": 0.6326, "step": 7341 }, { "epoch": 0.76, "learning_rate": 2.7768461175872263e-05, "loss": 0.6889, "step": 7342 }, { "epoch": 0.76, "learning_rate": 2.7745148993501703e-05, "loss": 0.6962, "step": 7343 }, { "epoch": 0.76, "learning_rate": 2.7721845024500248e-05, "loss": 0.6981, "step": 7344 }, { "epoch": 0.76, "learning_rate": 2.7698549271516848e-05, "loss": 0.7238, "step": 7345 }, { "epoch": 0.76, "learning_rate": 2.767526173719963e-05, "loss": 0.6822, "step": 7346 }, { "epoch": 0.76, "learning_rate": 2.7651982424195767e-05, "loss": 0.6202, "step": 7347 }, { "epoch": 0.76, "learning_rate": 2.7628711335151403e-05, "loss": 0.6662, "step": 7348 }, { "epoch": 0.76, "learning_rate": 2.760544847271186e-05, "loss": 0.6292, "step": 7349 }, { "epoch": 0.77, "learning_rate": 2.758219383952144e-05, "loss": 0.6557, "step": 7350 }, { "epoch": 0.77, "learning_rate": 2.755894743822358e-05, "loss": 0.6964, "step": 7351 }, { "epoch": 0.77, "learning_rate": 2.7535709271460774e-05, "loss": 0.6697, "step": 7352 }, { "epoch": 0.77, "learning_rate": 2.7512479341874485e-05, "loss": 0.6966, "step": 7353 }, { "epoch": 0.77, "learning_rate": 2.748925765210538e-05, "loss": 0.6577, "step": 7354 }, { "epoch": 0.77, "learning_rate": 2.7466044204793063e-05, "loss": 0.6729, "step": 7355 }, { "epoch": 0.77, "learning_rate": 2.7442839002576316e-05, "loss": 0.6777, "step": 7356 }, { "epoch": 0.77, "learning_rate": 2.7419642048092863e-05, "loss": 0.6405, "step": 7357 }, { "epoch": 0.77, "learning_rate": 2.739645334397962e-05, "loss": 0.6605, "step": 7358 }, { "epoch": 0.77, "learning_rate": 2.7373272892872427e-05, "loss": 0.6578, "step": 7359 }, { "epoch": 0.77, "learning_rate": 2.73501006974063e-05, "loss": 0.614, "step": 7360 }, { "epoch": 0.77, "learning_rate": 2.7326936760215295e-05, "loss": 0.7322, "step": 7361 }, { "epoch": 0.77, "learning_rate": 2.7303781083932446e-05, "loss": 0.6714, "step": 7362 }, { "epoch": 0.77, "learning_rate": 2.728063367118995e-05, "loss": 0.6512, "step": 7363 }, { "epoch": 0.77, "learning_rate": 2.7257494524619043e-05, "loss": 0.6842, "step": 7364 }, { "epoch": 0.77, "learning_rate": 2.7234363646849958e-05, "loss": 0.6775, "step": 7365 }, { "epoch": 0.77, "learning_rate": 2.7211241040512048e-05, "loss": 0.7315, "step": 7366 }, { "epoch": 0.77, "learning_rate": 2.7188126708233754e-05, "loss": 0.6584, "step": 7367 }, { "epoch": 0.77, "learning_rate": 2.716502065264248e-05, "loss": 0.6913, "step": 7368 }, { "epoch": 0.77, "learning_rate": 2.714192287636478e-05, "loss": 0.653, "step": 7369 }, { "epoch": 0.77, "learning_rate": 2.7118833382026166e-05, "loss": 0.6427, "step": 7370 }, { "epoch": 0.77, "learning_rate": 2.709575217225132e-05, "loss": 0.6844, "step": 7371 }, { "epoch": 0.77, "learning_rate": 2.7072679249663956e-05, "loss": 0.6618, "step": 7372 }, { "epoch": 0.77, "learning_rate": 2.7049614616886775e-05, "loss": 0.6174, "step": 7373 }, { "epoch": 0.77, "learning_rate": 2.7026558276541602e-05, "loss": 0.6529, "step": 7374 }, { "epoch": 0.77, "learning_rate": 2.700351023124934e-05, "loss": 0.6827, "step": 7375 }, { "epoch": 0.77, "learning_rate": 2.6980470483629838e-05, "loss": 0.6233, "step": 7376 }, { "epoch": 0.77, "learning_rate": 2.6957439036302135e-05, "loss": 0.6332, "step": 7377 }, { "epoch": 0.77, "learning_rate": 2.693441589188427e-05, "loss": 0.7233, "step": 7378 }, { "epoch": 0.77, "learning_rate": 2.691140105299328e-05, "loss": 0.6565, "step": 7379 }, { "epoch": 0.77, "learning_rate": 2.6888394522245375e-05, "loss": 0.6524, "step": 7380 }, { "epoch": 0.77, "learning_rate": 2.686539630225573e-05, "loss": 0.6372, "step": 7381 }, { "epoch": 0.77, "learning_rate": 2.6842406395638565e-05, "loss": 0.6815, "step": 7382 }, { "epoch": 0.77, "learning_rate": 2.6819424805007243e-05, "loss": 0.6193, "step": 7383 }, { "epoch": 0.77, "learning_rate": 2.6796451532974143e-05, "loss": 0.6847, "step": 7384 }, { "epoch": 0.77, "learning_rate": 2.6773486582150642e-05, "loss": 0.6896, "step": 7385 }, { "epoch": 0.77, "learning_rate": 2.675052995514723e-05, "loss": 0.687, "step": 7386 }, { "epoch": 0.77, "learning_rate": 2.6727581654573485e-05, "loss": 0.6161, "step": 7387 }, { "epoch": 0.77, "learning_rate": 2.6704641683037923e-05, "loss": 0.6812, "step": 7388 }, { "epoch": 0.77, "learning_rate": 2.6681710043148244e-05, "loss": 0.6738, "step": 7389 }, { "epoch": 0.77, "learning_rate": 2.6658786737511077e-05, "loss": 0.6991, "step": 7390 }, { "epoch": 0.77, "learning_rate": 2.663587176873219e-05, "loss": 0.6434, "step": 7391 }, { "epoch": 0.77, "learning_rate": 2.6612965139416424e-05, "loss": 0.6512, "step": 7392 }, { "epoch": 0.77, "learning_rate": 2.6590066852167537e-05, "loss": 0.7175, "step": 7393 }, { "epoch": 0.77, "learning_rate": 2.656717690958852e-05, "loss": 0.662, "step": 7394 }, { "epoch": 0.77, "learning_rate": 2.6544295314281288e-05, "loss": 0.6765, "step": 7395 }, { "epoch": 0.77, "learning_rate": 2.652142206884679e-05, "loss": 0.6882, "step": 7396 }, { "epoch": 0.77, "learning_rate": 2.649855717588512e-05, "loss": 0.6283, "step": 7397 }, { "epoch": 0.77, "learning_rate": 2.6475700637995426e-05, "loss": 0.6814, "step": 7398 }, { "epoch": 0.77, "learning_rate": 2.645285245777578e-05, "loss": 0.6367, "step": 7399 }, { "epoch": 0.77, "learning_rate": 2.643001263782343e-05, "loss": 0.7133, "step": 7400 }, { "epoch": 0.77, "learning_rate": 2.6407181180734654e-05, "loss": 0.6734, "step": 7401 }, { "epoch": 0.77, "learning_rate": 2.6384358089104687e-05, "loss": 0.6557, "step": 7402 }, { "epoch": 0.77, "learning_rate": 2.636154336552793e-05, "loss": 0.6958, "step": 7403 }, { "epoch": 0.77, "learning_rate": 2.6338737012597793e-05, "loss": 0.6811, "step": 7404 }, { "epoch": 0.77, "learning_rate": 2.6315939032906667e-05, "loss": 0.6564, "step": 7405 }, { "epoch": 0.77, "learning_rate": 2.6293149429046126e-05, "loss": 0.691, "step": 7406 }, { "epoch": 0.77, "learning_rate": 2.6270368203606667e-05, "loss": 0.656, "step": 7407 }, { "epoch": 0.77, "learning_rate": 2.6247595359177856e-05, "loss": 0.6791, "step": 7408 }, { "epoch": 0.77, "learning_rate": 2.6224830898348408e-05, "loss": 0.7264, "step": 7409 }, { "epoch": 0.77, "learning_rate": 2.6202074823705924e-05, "loss": 0.6494, "step": 7410 }, { "epoch": 0.77, "learning_rate": 2.6179327137837183e-05, "loss": 0.614, "step": 7411 }, { "epoch": 0.77, "learning_rate": 2.6156587843327985e-05, "loss": 0.674, "step": 7412 }, { "epoch": 0.77, "learning_rate": 2.6133856942763114e-05, "loss": 0.6491, "step": 7413 }, { "epoch": 0.77, "learning_rate": 2.611113443872646e-05, "loss": 0.6694, "step": 7414 }, { "epoch": 0.77, "learning_rate": 2.6088420333800967e-05, "loss": 0.7129, "step": 7415 }, { "epoch": 0.77, "learning_rate": 2.606571463056855e-05, "loss": 0.7152, "step": 7416 }, { "epoch": 0.77, "learning_rate": 2.6043017331610232e-05, "loss": 0.7241, "step": 7417 }, { "epoch": 0.77, "learning_rate": 2.6020328439506103e-05, "loss": 0.7053, "step": 7418 }, { "epoch": 0.77, "learning_rate": 2.5997647956835226e-05, "loss": 0.6558, "step": 7419 }, { "epoch": 0.77, "learning_rate": 2.597497588617572e-05, "loss": 0.6777, "step": 7420 }, { "epoch": 0.77, "learning_rate": 2.5952312230104813e-05, "loss": 0.6612, "step": 7421 }, { "epoch": 0.77, "learning_rate": 2.5929656991198703e-05, "loss": 0.6653, "step": 7422 }, { "epoch": 0.77, "learning_rate": 2.5907010172032654e-05, "loss": 0.6907, "step": 7423 }, { "epoch": 0.77, "learning_rate": 2.588437177518104e-05, "loss": 0.6773, "step": 7424 }, { "epoch": 0.77, "learning_rate": 2.5861741803217145e-05, "loss": 0.6893, "step": 7425 }, { "epoch": 0.77, "learning_rate": 2.583912025871339e-05, "loss": 0.6357, "step": 7426 }, { "epoch": 0.77, "learning_rate": 2.5816507144241263e-05, "loss": 0.6552, "step": 7427 }, { "epoch": 0.77, "learning_rate": 2.579390246237118e-05, "loss": 0.6405, "step": 7428 }, { "epoch": 0.77, "learning_rate": 2.577130621567272e-05, "loss": 0.6452, "step": 7429 }, { "epoch": 0.77, "learning_rate": 2.5748718406714388e-05, "loss": 0.5951, "step": 7430 }, { "epoch": 0.77, "learning_rate": 2.572613903806387e-05, "loss": 0.6555, "step": 7431 }, { "epoch": 0.77, "learning_rate": 2.5703568112287724e-05, "loss": 0.6583, "step": 7432 }, { "epoch": 0.77, "learning_rate": 2.5681005631951726e-05, "loss": 0.6895, "step": 7433 }, { "epoch": 0.77, "learning_rate": 2.5658451599620513e-05, "loss": 0.6899, "step": 7434 }, { "epoch": 0.77, "learning_rate": 2.5635906017857937e-05, "loss": 0.6851, "step": 7435 }, { "epoch": 0.77, "learning_rate": 2.5613368889226728e-05, "loss": 0.6682, "step": 7436 }, { "epoch": 0.77, "learning_rate": 2.559084021628877e-05, "loss": 0.697, "step": 7437 }, { "epoch": 0.77, "learning_rate": 2.5568320001604984e-05, "loss": 0.6495, "step": 7438 }, { "epoch": 0.77, "learning_rate": 2.5545808247735213e-05, "loss": 0.6371, "step": 7439 }, { "epoch": 0.77, "learning_rate": 2.552330495723846e-05, "loss": 0.6976, "step": 7440 }, { "epoch": 0.77, "learning_rate": 2.5500810132672758e-05, "loss": 0.6487, "step": 7441 }, { "epoch": 0.77, "learning_rate": 2.547832377659507e-05, "loss": 0.6593, "step": 7442 }, { "epoch": 0.77, "learning_rate": 2.5455845891561514e-05, "loss": 0.7162, "step": 7443 }, { "epoch": 0.77, "learning_rate": 2.5433376480127223e-05, "loss": 0.5524, "step": 7444 }, { "epoch": 0.77, "learning_rate": 2.5410915544846325e-05, "loss": 0.6566, "step": 7445 }, { "epoch": 0.78, "learning_rate": 2.538846308827195e-05, "loss": 0.6087, "step": 7446 }, { "epoch": 0.78, "learning_rate": 2.5366019112956407e-05, "loss": 0.7739, "step": 7447 }, { "epoch": 0.78, "learning_rate": 2.5343583621450885e-05, "loss": 0.6438, "step": 7448 }, { "epoch": 0.78, "learning_rate": 2.532115661630572e-05, "loss": 0.692, "step": 7449 }, { "epoch": 0.78, "learning_rate": 2.5298738100070196e-05, "loss": 0.6781, "step": 7450 }, { "epoch": 0.78, "learning_rate": 2.5276328075292698e-05, "loss": 0.6053, "step": 7451 }, { "epoch": 0.78, "learning_rate": 2.5253926544520656e-05, "loss": 0.7126, "step": 7452 }, { "epoch": 0.78, "learning_rate": 2.523153351030044e-05, "loss": 0.6883, "step": 7453 }, { "epoch": 0.78, "learning_rate": 2.5209148975177543e-05, "loss": 0.7089, "step": 7454 }, { "epoch": 0.78, "learning_rate": 2.51867729416965e-05, "loss": 0.7249, "step": 7455 }, { "epoch": 0.78, "learning_rate": 2.5164405412400792e-05, "loss": 0.6947, "step": 7456 }, { "epoch": 0.78, "learning_rate": 2.514204638983303e-05, "loss": 0.6125, "step": 7457 }, { "epoch": 0.78, "learning_rate": 2.5119695876534755e-05, "loss": 0.6598, "step": 7458 }, { "epoch": 0.78, "learning_rate": 2.509735387504667e-05, "loss": 0.6537, "step": 7459 }, { "epoch": 0.78, "learning_rate": 2.5075020387908375e-05, "loss": 0.7085, "step": 7460 }, { "epoch": 0.78, "learning_rate": 2.5052695417658632e-05, "loss": 0.6933, "step": 7461 }, { "epoch": 0.78, "learning_rate": 2.50303789668351e-05, "loss": 0.698, "step": 7462 }, { "epoch": 0.78, "learning_rate": 2.5008071037974567e-05, "loss": 0.7073, "step": 7463 }, { "epoch": 0.78, "learning_rate": 2.4985771633612864e-05, "loss": 0.6449, "step": 7464 }, { "epoch": 0.78, "learning_rate": 2.4963480756284752e-05, "loss": 0.5938, "step": 7465 }, { "epoch": 0.78, "learning_rate": 2.4941198408524115e-05, "loss": 0.652, "step": 7466 }, { "epoch": 0.78, "learning_rate": 2.4918924592863868e-05, "loss": 0.6722, "step": 7467 }, { "epoch": 0.78, "learning_rate": 2.4896659311835857e-05, "loss": 0.6941, "step": 7468 }, { "epoch": 0.78, "learning_rate": 2.48744025679711e-05, "loss": 0.7119, "step": 7469 }, { "epoch": 0.78, "learning_rate": 2.4852154363799485e-05, "loss": 0.635, "step": 7470 }, { "epoch": 0.78, "learning_rate": 2.482991470185011e-05, "loss": 0.6909, "step": 7471 }, { "epoch": 0.78, "learning_rate": 2.4807683584650943e-05, "loss": 0.6146, "step": 7472 }, { "epoch": 0.78, "learning_rate": 2.4785461014729037e-05, "loss": 0.6696, "step": 7473 }, { "epoch": 0.78, "learning_rate": 2.47632469946105e-05, "loss": 0.6389, "step": 7474 }, { "epoch": 0.78, "learning_rate": 2.4741041526820484e-05, "loss": 0.6439, "step": 7475 }, { "epoch": 0.78, "learning_rate": 2.4718844613883075e-05, "loss": 0.7202, "step": 7476 }, { "epoch": 0.78, "learning_rate": 2.469665625832147e-05, "loss": 0.6929, "step": 7477 }, { "epoch": 0.78, "learning_rate": 2.4674476462657903e-05, "loss": 0.7008, "step": 7478 }, { "epoch": 0.78, "learning_rate": 2.465230522941353e-05, "loss": 0.6679, "step": 7479 }, { "epoch": 0.78, "learning_rate": 2.463014256110865e-05, "loss": 0.6631, "step": 7480 }, { "epoch": 0.78, "learning_rate": 2.4607988460262565e-05, "loss": 0.7167, "step": 7481 }, { "epoch": 0.78, "learning_rate": 2.458584292939351e-05, "loss": 0.6762, "step": 7482 }, { "epoch": 0.78, "learning_rate": 2.4563705971018903e-05, "loss": 0.6635, "step": 7483 }, { "epoch": 0.78, "learning_rate": 2.454157758765504e-05, "loss": 0.6611, "step": 7484 }, { "epoch": 0.78, "learning_rate": 2.4519457781817303e-05, "loss": 0.6717, "step": 7485 }, { "epoch": 0.78, "learning_rate": 2.4497346556020107e-05, "loss": 0.6861, "step": 7486 }, { "epoch": 0.78, "learning_rate": 2.4475243912776924e-05, "loss": 0.6317, "step": 7487 }, { "epoch": 0.78, "learning_rate": 2.4453149854600155e-05, "loss": 0.7066, "step": 7488 }, { "epoch": 0.78, "learning_rate": 2.443106438400132e-05, "loss": 0.6701, "step": 7489 }, { "epoch": 0.78, "learning_rate": 2.440898750349089e-05, "loss": 0.6792, "step": 7490 }, { "epoch": 0.78, "learning_rate": 2.4386919215578407e-05, "loss": 0.7162, "step": 7491 }, { "epoch": 0.78, "learning_rate": 2.4364859522772454e-05, "loss": 0.6706, "step": 7492 }, { "epoch": 0.78, "learning_rate": 2.4342808427580553e-05, "loss": 0.6655, "step": 7493 }, { "epoch": 0.78, "learning_rate": 2.4320765932509326e-05, "loss": 0.6485, "step": 7494 }, { "epoch": 0.78, "learning_rate": 2.429873204006441e-05, "loss": 0.6771, "step": 7495 }, { "epoch": 0.78, "learning_rate": 2.4276706752750432e-05, "loss": 0.6668, "step": 7496 }, { "epoch": 0.78, "learning_rate": 2.4254690073071028e-05, "loss": 0.7, "step": 7497 }, { "epoch": 0.78, "learning_rate": 2.423268200352893e-05, "loss": 0.5927, "step": 7498 }, { "epoch": 0.78, "learning_rate": 2.4210682546625786e-05, "loss": 0.6565, "step": 7499 }, { "epoch": 0.78, "learning_rate": 2.4188691704862367e-05, "loss": 0.5835, "step": 7500 }, { "epoch": 0.78, "learning_rate": 2.4166709480738426e-05, "loss": 0.645, "step": 7501 }, { "epoch": 0.78, "learning_rate": 2.41447358767527e-05, "loss": 0.6921, "step": 7502 }, { "epoch": 0.78, "learning_rate": 2.412277089540299e-05, "loss": 0.668, "step": 7503 }, { "epoch": 0.78, "learning_rate": 2.4100814539186134e-05, "loss": 0.6589, "step": 7504 }, { "epoch": 0.78, "learning_rate": 2.40788668105979e-05, "loss": 0.6955, "step": 7505 }, { "epoch": 0.78, "learning_rate": 2.405692771213317e-05, "loss": 0.6754, "step": 7506 }, { "epoch": 0.78, "learning_rate": 2.403499724628584e-05, "loss": 0.6678, "step": 7507 }, { "epoch": 0.78, "learning_rate": 2.4013075415548757e-05, "loss": 0.6209, "step": 7508 }, { "epoch": 0.78, "learning_rate": 2.39911622224138e-05, "loss": 0.6926, "step": 7509 }, { "epoch": 0.78, "learning_rate": 2.3969257669371947e-05, "loss": 0.6071, "step": 7510 }, { "epoch": 0.78, "learning_rate": 2.3947361758913088e-05, "loss": 0.6098, "step": 7511 }, { "epoch": 0.78, "learning_rate": 2.3925474493526236e-05, "loss": 0.6934, "step": 7512 }, { "epoch": 0.78, "learning_rate": 2.3903595875699282e-05, "loss": 0.6858, "step": 7513 }, { "epoch": 0.78, "learning_rate": 2.3881725907919282e-05, "loss": 0.7252, "step": 7514 }, { "epoch": 0.78, "learning_rate": 2.3859864592672243e-05, "loss": 0.6561, "step": 7515 }, { "epoch": 0.78, "learning_rate": 2.383801193244316e-05, "loss": 0.6376, "step": 7516 }, { "epoch": 0.78, "learning_rate": 2.3816167929716072e-05, "loss": 0.6227, "step": 7517 }, { "epoch": 0.78, "learning_rate": 2.3794332586974087e-05, "loss": 0.5833, "step": 7518 }, { "epoch": 0.78, "learning_rate": 2.3772505906699205e-05, "loss": 0.6741, "step": 7519 }, { "epoch": 0.78, "learning_rate": 2.3750687891372548e-05, "loss": 0.6932, "step": 7520 }, { "epoch": 0.78, "learning_rate": 2.3728878543474254e-05, "loss": 0.6507, "step": 7521 }, { "epoch": 0.78, "learning_rate": 2.3707077865483394e-05, "loss": 0.6946, "step": 7522 }, { "epoch": 0.78, "learning_rate": 2.368528585987809e-05, "loss": 0.6581, "step": 7523 }, { "epoch": 0.78, "learning_rate": 2.366350252913553e-05, "loss": 0.6699, "step": 7524 }, { "epoch": 0.78, "learning_rate": 2.3641727875731824e-05, "loss": 0.7206, "step": 7525 }, { "epoch": 0.78, "learning_rate": 2.3619961902142172e-05, "loss": 0.6485, "step": 7526 }, { "epoch": 0.78, "learning_rate": 2.359820461084078e-05, "loss": 0.6476, "step": 7527 }, { "epoch": 0.78, "learning_rate": 2.3576456004300806e-05, "loss": 0.6369, "step": 7528 }, { "epoch": 0.78, "learning_rate": 2.3554716084994512e-05, "loss": 0.6956, "step": 7529 }, { "epoch": 0.78, "learning_rate": 2.353298485539307e-05, "loss": 0.6941, "step": 7530 }, { "epoch": 0.78, "learning_rate": 2.351126231796673e-05, "loss": 0.7263, "step": 7531 }, { "epoch": 0.78, "learning_rate": 2.3489548475184786e-05, "loss": 0.6723, "step": 7532 }, { "epoch": 0.78, "learning_rate": 2.3467843329515437e-05, "loss": 0.6797, "step": 7533 }, { "epoch": 0.78, "learning_rate": 2.3446146883426024e-05, "loss": 0.5998, "step": 7534 }, { "epoch": 0.78, "learning_rate": 2.3424459139382748e-05, "loss": 0.6776, "step": 7535 }, { "epoch": 0.78, "learning_rate": 2.3402780099850972e-05, "loss": 0.6166, "step": 7536 }, { "epoch": 0.78, "learning_rate": 2.338110976729494e-05, "loss": 0.6414, "step": 7537 }, { "epoch": 0.78, "learning_rate": 2.3359448144178042e-05, "loss": 0.7012, "step": 7538 }, { "epoch": 0.78, "learning_rate": 2.3337795232962523e-05, "loss": 0.646, "step": 7539 }, { "epoch": 0.78, "learning_rate": 2.3316151036109758e-05, "loss": 0.6688, "step": 7540 }, { "epoch": 0.78, "learning_rate": 2.329451555608011e-05, "loss": 0.6826, "step": 7541 }, { "epoch": 0.79, "learning_rate": 2.327288879533288e-05, "loss": 0.6895, "step": 7542 }, { "epoch": 0.79, "learning_rate": 2.325127075632647e-05, "loss": 0.6447, "step": 7543 }, { "epoch": 0.79, "learning_rate": 2.3229661441518257e-05, "loss": 0.6527, "step": 7544 }, { "epoch": 0.79, "learning_rate": 2.3208060853364576e-05, "loss": 0.6068, "step": 7545 }, { "epoch": 0.79, "learning_rate": 2.3186468994320875e-05, "loss": 0.7261, "step": 7546 }, { "epoch": 0.79, "learning_rate": 2.3164885866841478e-05, "loss": 0.6947, "step": 7547 }, { "epoch": 0.79, "learning_rate": 2.314331147337986e-05, "loss": 0.6444, "step": 7548 }, { "epoch": 0.79, "learning_rate": 2.3121745816388385e-05, "loss": 0.6966, "step": 7549 }, { "epoch": 0.79, "learning_rate": 2.3100188898318454e-05, "loss": 0.7245, "step": 7550 }, { "epoch": 0.79, "learning_rate": 2.3078640721620503e-05, "loss": 0.7076, "step": 7551 }, { "epoch": 0.79, "learning_rate": 2.305710128874401e-05, "loss": 0.7196, "step": 7552 }, { "epoch": 0.79, "learning_rate": 2.3035570602137336e-05, "loss": 0.6817, "step": 7553 }, { "epoch": 0.79, "learning_rate": 2.3014048664247955e-05, "loss": 0.695, "step": 7554 }, { "epoch": 0.79, "learning_rate": 2.299253547752235e-05, "loss": 0.6636, "step": 7555 }, { "epoch": 0.79, "learning_rate": 2.29710310444059e-05, "loss": 0.6724, "step": 7556 }, { "epoch": 0.79, "learning_rate": 2.29495353673431e-05, "loss": 0.659, "step": 7557 }, { "epoch": 0.79, "learning_rate": 2.2928048448777438e-05, "loss": 0.7026, "step": 7558 }, { "epoch": 0.79, "learning_rate": 2.290657029115133e-05, "loss": 0.6657, "step": 7559 }, { "epoch": 0.79, "learning_rate": 2.2885100896906287e-05, "loss": 0.6432, "step": 7560 }, { "epoch": 0.79, "learning_rate": 2.2863640268482768e-05, "loss": 0.6563, "step": 7561 }, { "epoch": 0.79, "learning_rate": 2.2842188408320218e-05, "loss": 0.7075, "step": 7562 }, { "epoch": 0.79, "learning_rate": 2.282074531885715e-05, "loss": 0.6337, "step": 7563 }, { "epoch": 0.79, "learning_rate": 2.2799311002531064e-05, "loss": 0.655, "step": 7564 }, { "epoch": 0.79, "learning_rate": 2.277788546177839e-05, "loss": 0.6623, "step": 7565 }, { "epoch": 0.79, "learning_rate": 2.2756468699034662e-05, "loss": 0.6847, "step": 7566 }, { "epoch": 0.79, "learning_rate": 2.273506071673439e-05, "loss": 0.6911, "step": 7567 }, { "epoch": 0.79, "learning_rate": 2.2713661517311003e-05, "loss": 0.6485, "step": 7568 }, { "epoch": 0.79, "learning_rate": 2.269227110319706e-05, "loss": 0.6484, "step": 7569 }, { "epoch": 0.79, "learning_rate": 2.2670889476823997e-05, "loss": 0.659, "step": 7570 }, { "epoch": 0.79, "learning_rate": 2.2649516640622335e-05, "loss": 0.6543, "step": 7571 }, { "epoch": 0.79, "learning_rate": 2.262815259702161e-05, "loss": 0.6588, "step": 7572 }, { "epoch": 0.79, "learning_rate": 2.2606797348450293e-05, "loss": 0.6416, "step": 7573 }, { "epoch": 0.79, "learning_rate": 2.2585450897335834e-05, "loss": 0.5867, "step": 7574 }, { "epoch": 0.79, "learning_rate": 2.256411324610481e-05, "loss": 0.7219, "step": 7575 }, { "epoch": 0.79, "learning_rate": 2.254278439718266e-05, "loss": 0.6384, "step": 7576 }, { "epoch": 0.79, "learning_rate": 2.2521464352993906e-05, "loss": 0.6933, "step": 7577 }, { "epoch": 0.79, "learning_rate": 2.2500153115962063e-05, "loss": 0.6739, "step": 7578 }, { "epoch": 0.79, "learning_rate": 2.2478850688509578e-05, "loss": 0.6837, "step": 7579 }, { "epoch": 0.79, "learning_rate": 2.2457557073057976e-05, "loss": 0.6743, "step": 7580 }, { "epoch": 0.79, "learning_rate": 2.243627227202778e-05, "loss": 0.6655, "step": 7581 }, { "epoch": 0.79, "learning_rate": 2.2414996287838418e-05, "loss": 0.6463, "step": 7582 }, { "epoch": 0.79, "learning_rate": 2.2393729122908402e-05, "loss": 0.6876, "step": 7583 }, { "epoch": 0.79, "learning_rate": 2.2372470779655265e-05, "loss": 0.707, "step": 7584 }, { "epoch": 0.79, "learning_rate": 2.2351221260495402e-05, "loss": 0.7487, "step": 7585 }, { "epoch": 0.79, "learning_rate": 2.2329980567844376e-05, "loss": 0.6606, "step": 7586 }, { "epoch": 0.79, "learning_rate": 2.2308748704116632e-05, "loss": 0.6307, "step": 7587 }, { "epoch": 0.79, "learning_rate": 2.2287525671725616e-05, "loss": 0.7072, "step": 7588 }, { "epoch": 0.79, "learning_rate": 2.2266311473083833e-05, "loss": 0.7267, "step": 7589 }, { "epoch": 0.79, "learning_rate": 2.224510611060272e-05, "loss": 0.6512, "step": 7590 }, { "epoch": 0.79, "learning_rate": 2.222390958669275e-05, "loss": 0.6611, "step": 7591 }, { "epoch": 0.79, "learning_rate": 2.22027219037634e-05, "loss": 0.6685, "step": 7592 }, { "epoch": 0.79, "learning_rate": 2.2181543064223077e-05, "loss": 0.6196, "step": 7593 }, { "epoch": 0.79, "learning_rate": 2.2160373070479255e-05, "loss": 0.5951, "step": 7594 }, { "epoch": 0.79, "learning_rate": 2.2139211924938396e-05, "loss": 0.61, "step": 7595 }, { "epoch": 0.79, "learning_rate": 2.2118059630005883e-05, "loss": 0.6773, "step": 7596 }, { "epoch": 0.79, "learning_rate": 2.209691618808617e-05, "loss": 0.6848, "step": 7597 }, { "epoch": 0.79, "learning_rate": 2.2075781601582712e-05, "loss": 0.648, "step": 7598 }, { "epoch": 0.79, "learning_rate": 2.205465587289788e-05, "loss": 0.6691, "step": 7599 }, { "epoch": 0.79, "learning_rate": 2.203353900443308e-05, "loss": 0.6986, "step": 7600 }, { "epoch": 0.79, "learning_rate": 2.201243099858874e-05, "loss": 0.6788, "step": 7601 }, { "epoch": 0.79, "learning_rate": 2.199133185776422e-05, "loss": 0.68, "step": 7602 }, { "epoch": 0.79, "learning_rate": 2.197024158435793e-05, "loss": 0.7357, "step": 7603 }, { "epoch": 0.79, "learning_rate": 2.194916018076727e-05, "loss": 0.6199, "step": 7604 }, { "epoch": 0.79, "learning_rate": 2.192808764938856e-05, "loss": 0.6597, "step": 7605 }, { "epoch": 0.79, "learning_rate": 2.190702399261718e-05, "loss": 0.7003, "step": 7606 }, { "epoch": 0.79, "learning_rate": 2.1885969212847523e-05, "loss": 0.6429, "step": 7607 }, { "epoch": 0.79, "learning_rate": 2.1864923312472874e-05, "loss": 0.697, "step": 7608 }, { "epoch": 0.79, "learning_rate": 2.1843886293885617e-05, "loss": 0.6731, "step": 7609 }, { "epoch": 0.79, "learning_rate": 2.182285815947702e-05, "loss": 0.6853, "step": 7610 }, { "epoch": 0.79, "learning_rate": 2.180183891163745e-05, "loss": 0.6385, "step": 7611 }, { "epoch": 0.79, "learning_rate": 2.178082855275617e-05, "loss": 0.5801, "step": 7612 }, { "epoch": 0.79, "learning_rate": 2.1759827085221528e-05, "loss": 0.6937, "step": 7613 }, { "epoch": 0.79, "learning_rate": 2.1738834511420735e-05, "loss": 0.6887, "step": 7614 }, { "epoch": 0.79, "learning_rate": 2.1717850833740138e-05, "loss": 0.7281, "step": 7615 }, { "epoch": 0.79, "learning_rate": 2.169687605456493e-05, "loss": 0.7107, "step": 7616 }, { "epoch": 0.79, "learning_rate": 2.1675910176279402e-05, "loss": 0.687, "step": 7617 }, { "epoch": 0.79, "learning_rate": 2.1654953201266802e-05, "loss": 0.6604, "step": 7618 }, { "epoch": 0.79, "learning_rate": 2.163400513190931e-05, "loss": 0.6847, "step": 7619 }, { "epoch": 0.79, "learning_rate": 2.1613065970588165e-05, "loss": 0.6868, "step": 7620 }, { "epoch": 0.79, "learning_rate": 2.1592135719683592e-05, "loss": 0.6743, "step": 7621 }, { "epoch": 0.79, "learning_rate": 2.1571214381574732e-05, "loss": 0.6628, "step": 7622 }, { "epoch": 0.79, "learning_rate": 2.155030195863982e-05, "loss": 0.6536, "step": 7623 }, { "epoch": 0.79, "learning_rate": 2.1529398453255945e-05, "loss": 0.6426, "step": 7624 }, { "epoch": 0.79, "learning_rate": 2.1508503867799323e-05, "loss": 0.7031, "step": 7625 }, { "epoch": 0.79, "learning_rate": 2.1487618204645054e-05, "loss": 0.6454, "step": 7626 }, { "epoch": 0.79, "learning_rate": 2.146674146616723e-05, "loss": 0.5965, "step": 7627 }, { "epoch": 0.79, "learning_rate": 2.144587365473899e-05, "loss": 0.7226, "step": 7628 }, { "epoch": 0.79, "learning_rate": 2.1425014772732444e-05, "loss": 0.6144, "step": 7629 }, { "epoch": 0.79, "learning_rate": 2.1404164822518613e-05, "loss": 0.7331, "step": 7630 }, { "epoch": 0.79, "learning_rate": 2.1383323806467593e-05, "loss": 0.6715, "step": 7631 }, { "epoch": 0.79, "learning_rate": 2.1362491726948452e-05, "loss": 0.6894, "step": 7632 }, { "epoch": 0.79, "learning_rate": 2.1341668586329154e-05, "loss": 0.6981, "step": 7633 }, { "epoch": 0.79, "learning_rate": 2.1320854386976762e-05, "loss": 0.6992, "step": 7634 }, { "epoch": 0.79, "learning_rate": 2.1300049131257273e-05, "loss": 0.68, "step": 7635 }, { "epoch": 0.79, "learning_rate": 2.1279252821535623e-05, "loss": 0.7078, "step": 7636 }, { "epoch": 0.79, "learning_rate": 2.1258465460175837e-05, "loss": 0.6999, "step": 7637 }, { "epoch": 0.8, "learning_rate": 2.1237687049540822e-05, "loss": 0.6783, "step": 7638 }, { "epoch": 0.8, "learning_rate": 2.121691759199248e-05, "loss": 0.6924, "step": 7639 }, { "epoch": 0.8, "learning_rate": 2.1196157089891756e-05, "loss": 0.686, "step": 7640 }, { "epoch": 0.8, "learning_rate": 2.117540554559857e-05, "loss": 0.7157, "step": 7641 }, { "epoch": 0.8, "learning_rate": 2.115466296147173e-05, "loss": 0.6954, "step": 7642 }, { "epoch": 0.8, "learning_rate": 2.1133929339869118e-05, "loss": 0.6649, "step": 7643 }, { "epoch": 0.8, "learning_rate": 2.1113204683147614e-05, "loss": 0.619, "step": 7644 }, { "epoch": 0.8, "learning_rate": 2.1092488993662972e-05, "loss": 0.6967, "step": 7645 }, { "epoch": 0.8, "learning_rate": 2.1071782273770035e-05, "loss": 0.6791, "step": 7646 }, { "epoch": 0.8, "learning_rate": 2.105108452582255e-05, "loss": 0.7398, "step": 7647 }, { "epoch": 0.8, "learning_rate": 2.103039575217328e-05, "loss": 0.7006, "step": 7648 }, { "epoch": 0.8, "learning_rate": 2.1009715955174014e-05, "loss": 0.64, "step": 7649 }, { "epoch": 0.8, "learning_rate": 2.0989045137175422e-05, "loss": 0.6977, "step": 7650 }, { "epoch": 0.8, "learning_rate": 2.0968383300527182e-05, "loss": 0.7014, "step": 7651 }, { "epoch": 0.8, "learning_rate": 2.094773044757804e-05, "loss": 0.6438, "step": 7652 }, { "epoch": 0.8, "learning_rate": 2.092708658067557e-05, "loss": 0.6899, "step": 7653 }, { "epoch": 0.8, "learning_rate": 2.090645170216645e-05, "loss": 0.6752, "step": 7654 }, { "epoch": 0.8, "learning_rate": 2.0885825814396308e-05, "loss": 0.6856, "step": 7655 }, { "epoch": 0.8, "learning_rate": 2.08652089197097e-05, "loss": 0.7029, "step": 7656 }, { "epoch": 0.8, "learning_rate": 2.0844601020450204e-05, "loss": 0.6874, "step": 7657 }, { "epoch": 0.8, "learning_rate": 2.0824002118960405e-05, "loss": 0.6906, "step": 7658 }, { "epoch": 0.8, "learning_rate": 2.0803412217581762e-05, "loss": 0.6838, "step": 7659 }, { "epoch": 0.8, "learning_rate": 2.0782831318654806e-05, "loss": 0.6199, "step": 7660 }, { "epoch": 0.8, "learning_rate": 2.0762259424519036e-05, "loss": 0.7107, "step": 7661 }, { "epoch": 0.8, "learning_rate": 2.0741696537512855e-05, "loss": 0.7305, "step": 7662 }, { "epoch": 0.8, "learning_rate": 2.0721142659973746e-05, "loss": 0.6826, "step": 7663 }, { "epoch": 0.8, "learning_rate": 2.0700597794238086e-05, "loss": 0.6716, "step": 7664 }, { "epoch": 0.8, "learning_rate": 2.0680061942641227e-05, "loss": 0.6641, "step": 7665 }, { "epoch": 0.8, "learning_rate": 2.0659535107517582e-05, "loss": 0.7276, "step": 7666 }, { "epoch": 0.8, "learning_rate": 2.0639017291200423e-05, "loss": 0.6604, "step": 7667 }, { "epoch": 0.8, "learning_rate": 2.061850849602208e-05, "loss": 0.6861, "step": 7668 }, { "epoch": 0.8, "learning_rate": 2.059800872431388e-05, "loss": 0.7034, "step": 7669 }, { "epoch": 0.8, "learning_rate": 2.0577517978405993e-05, "loss": 0.6919, "step": 7670 }, { "epoch": 0.8, "learning_rate": 2.0557036260627706e-05, "loss": 0.7356, "step": 7671 }, { "epoch": 0.8, "learning_rate": 2.053656357330722e-05, "loss": 0.5944, "step": 7672 }, { "epoch": 0.8, "learning_rate": 2.051609991877168e-05, "loss": 0.7079, "step": 7673 }, { "epoch": 0.8, "learning_rate": 2.0495645299347245e-05, "loss": 0.6071, "step": 7674 }, { "epoch": 0.8, "learning_rate": 2.047519971735907e-05, "loss": 0.7115, "step": 7675 }, { "epoch": 0.8, "learning_rate": 2.045476317513123e-05, "loss": 0.6437, "step": 7676 }, { "epoch": 0.8, "learning_rate": 2.043433567498675e-05, "loss": 0.6288, "step": 7677 }, { "epoch": 0.8, "learning_rate": 2.0413917219247737e-05, "loss": 0.6389, "step": 7678 }, { "epoch": 0.8, "learning_rate": 2.0393507810235145e-05, "loss": 0.6866, "step": 7679 }, { "epoch": 0.8, "learning_rate": 2.037310745026898e-05, "loss": 0.7175, "step": 7680 }, { "epoch": 0.8, "learning_rate": 2.0352716141668215e-05, "loss": 0.6489, "step": 7681 }, { "epoch": 0.8, "learning_rate": 2.0332333886750744e-05, "loss": 0.7024, "step": 7682 }, { "epoch": 0.8, "learning_rate": 2.0311960687833466e-05, "loss": 0.6921, "step": 7683 }, { "epoch": 0.8, "learning_rate": 2.0291596547232293e-05, "loss": 0.7426, "step": 7684 }, { "epoch": 0.8, "learning_rate": 2.0271241467262004e-05, "loss": 0.6026, "step": 7685 }, { "epoch": 0.8, "learning_rate": 2.0250895450236452e-05, "loss": 0.6758, "step": 7686 }, { "epoch": 0.8, "learning_rate": 2.0230558498468357e-05, "loss": 0.6911, "step": 7687 }, { "epoch": 0.8, "learning_rate": 2.021023061426953e-05, "loss": 0.6715, "step": 7688 }, { "epoch": 0.8, "learning_rate": 2.0189911799950632e-05, "loss": 0.6979, "step": 7689 }, { "epoch": 0.8, "learning_rate": 2.0169602057821403e-05, "loss": 0.578, "step": 7690 }, { "epoch": 0.8, "learning_rate": 2.0149301390190433e-05, "loss": 0.6973, "step": 7691 }, { "epoch": 0.8, "learning_rate": 2.0129009799365417e-05, "loss": 0.6624, "step": 7692 }, { "epoch": 0.8, "learning_rate": 2.0108727287652863e-05, "loss": 0.6249, "step": 7693 }, { "epoch": 0.8, "learning_rate": 2.0088453857358368e-05, "loss": 0.6372, "step": 7694 }, { "epoch": 0.8, "learning_rate": 2.0068189510786494e-05, "loss": 0.6672, "step": 7695 }, { "epoch": 0.8, "learning_rate": 2.0047934250240673e-05, "loss": 0.7033, "step": 7696 }, { "epoch": 0.8, "learning_rate": 2.0027688078023398e-05, "loss": 0.7044, "step": 7697 }, { "epoch": 0.8, "learning_rate": 2.0007450996436116e-05, "loss": 0.6944, "step": 7698 }, { "epoch": 0.8, "learning_rate": 1.9987223007779164e-05, "loss": 0.6452, "step": 7699 }, { "epoch": 0.8, "learning_rate": 1.9967004114351973e-05, "loss": 0.7236, "step": 7700 }, { "epoch": 0.8, "learning_rate": 1.9946794318452788e-05, "loss": 0.66, "step": 7701 }, { "epoch": 0.8, "learning_rate": 1.9926593622378987e-05, "loss": 0.6801, "step": 7702 }, { "epoch": 0.8, "learning_rate": 1.990640202842674e-05, "loss": 0.662, "step": 7703 }, { "epoch": 0.8, "learning_rate": 1.988621953889136e-05, "loss": 0.6787, "step": 7704 }, { "epoch": 0.8, "learning_rate": 1.9866046156066954e-05, "loss": 0.6588, "step": 7705 }, { "epoch": 0.8, "learning_rate": 1.9845881882246743e-05, "loss": 0.687, "step": 7706 }, { "epoch": 0.8, "learning_rate": 1.982572671972278e-05, "loss": 0.6702, "step": 7707 }, { "epoch": 0.8, "learning_rate": 1.9805580670786185e-05, "loss": 0.6527, "step": 7708 }, { "epoch": 0.8, "learning_rate": 1.9785443737727028e-05, "loss": 0.6342, "step": 7709 }, { "epoch": 0.8, "learning_rate": 1.976531592283426e-05, "loss": 0.6732, "step": 7710 }, { "epoch": 0.8, "learning_rate": 1.9745197228395896e-05, "loss": 0.7299, "step": 7711 }, { "epoch": 0.8, "learning_rate": 1.972508765669887e-05, "loss": 0.649, "step": 7712 }, { "epoch": 0.8, "learning_rate": 1.970498721002906e-05, "loss": 0.6955, "step": 7713 }, { "epoch": 0.8, "learning_rate": 1.968489589067136e-05, "loss": 0.6644, "step": 7714 }, { "epoch": 0.8, "learning_rate": 1.966481370090958e-05, "loss": 0.6943, "step": 7715 }, { "epoch": 0.8, "learning_rate": 1.9644740643026473e-05, "loss": 0.7217, "step": 7716 }, { "epoch": 0.8, "learning_rate": 1.9624676719303824e-05, "loss": 0.7237, "step": 7717 }, { "epoch": 0.8, "learning_rate": 1.960462193202236e-05, "loss": 0.6555, "step": 7718 }, { "epoch": 0.8, "learning_rate": 1.958457628346171e-05, "loss": 0.7269, "step": 7719 }, { "epoch": 0.8, "learning_rate": 1.9564539775900525e-05, "loss": 0.6385, "step": 7720 }, { "epoch": 0.8, "learning_rate": 1.954451241161642e-05, "loss": 0.6802, "step": 7721 }, { "epoch": 0.8, "learning_rate": 1.9524494192885912e-05, "loss": 0.7, "step": 7722 }, { "epoch": 0.8, "learning_rate": 1.950448512198454e-05, "loss": 0.6717, "step": 7723 }, { "epoch": 0.8, "learning_rate": 1.9484485201186797e-05, "loss": 0.6188, "step": 7724 }, { "epoch": 0.8, "learning_rate": 1.9464494432766077e-05, "loss": 0.6028, "step": 7725 }, { "epoch": 0.8, "learning_rate": 1.944451281899482e-05, "loss": 0.6857, "step": 7726 }, { "epoch": 0.8, "learning_rate": 1.9424540362144328e-05, "loss": 0.6877, "step": 7727 }, { "epoch": 0.8, "learning_rate": 1.9404577064484975e-05, "loss": 0.6324, "step": 7728 }, { "epoch": 0.8, "learning_rate": 1.938462292828599e-05, "loss": 0.6697, "step": 7729 }, { "epoch": 0.8, "learning_rate": 1.936467795581559e-05, "loss": 0.693, "step": 7730 }, { "epoch": 0.8, "learning_rate": 1.9344742149341e-05, "loss": 0.6323, "step": 7731 }, { "epoch": 0.8, "learning_rate": 1.932481551112837e-05, "loss": 0.6262, "step": 7732 }, { "epoch": 0.8, "learning_rate": 1.9304898043442765e-05, "loss": 0.6394, "step": 7733 }, { "epoch": 0.81, "learning_rate": 1.9284989748548276e-05, "loss": 0.612, "step": 7734 }, { "epoch": 0.81, "learning_rate": 1.9265090628707947e-05, "loss": 0.6146, "step": 7735 }, { "epoch": 0.81, "learning_rate": 1.9245200686183708e-05, "loss": 0.6972, "step": 7736 }, { "epoch": 0.81, "learning_rate": 1.9225319923236506e-05, "loss": 0.6462, "step": 7737 }, { "epoch": 0.81, "learning_rate": 1.9205448342126266e-05, "loss": 0.6522, "step": 7738 }, { "epoch": 0.81, "learning_rate": 1.9185585945111784e-05, "loss": 0.649, "step": 7739 }, { "epoch": 0.81, "learning_rate": 1.9165732734450914e-05, "loss": 0.6814, "step": 7740 }, { "epoch": 0.81, "learning_rate": 1.9145888712400384e-05, "loss": 0.6723, "step": 7741 }, { "epoch": 0.81, "learning_rate": 1.9126053881215888e-05, "loss": 0.6999, "step": 7742 }, { "epoch": 0.81, "learning_rate": 1.9106228243152114e-05, "loss": 0.7339, "step": 7743 }, { "epoch": 0.81, "learning_rate": 1.908641180046271e-05, "loss": 0.692, "step": 7744 }, { "epoch": 0.81, "learning_rate": 1.9066604555400224e-05, "loss": 0.6755, "step": 7745 }, { "epoch": 0.81, "learning_rate": 1.904680651021622e-05, "loss": 0.6599, "step": 7746 }, { "epoch": 0.81, "learning_rate": 1.902701766716114e-05, "loss": 0.709, "step": 7747 }, { "epoch": 0.81, "learning_rate": 1.9007238028484455e-05, "loss": 0.6191, "step": 7748 }, { "epoch": 0.81, "learning_rate": 1.8987467596434584e-05, "loss": 0.6767, "step": 7749 }, { "epoch": 0.81, "learning_rate": 1.8967706373258808e-05, "loss": 0.662, "step": 7750 }, { "epoch": 0.81, "learning_rate": 1.894795436120349e-05, "loss": 0.7078, "step": 7751 }, { "epoch": 0.81, "learning_rate": 1.8928211562513875e-05, "loss": 0.5944, "step": 7752 }, { "epoch": 0.81, "learning_rate": 1.890847797943417e-05, "loss": 0.6918, "step": 7753 }, { "epoch": 0.81, "learning_rate": 1.88887536142075e-05, "loss": 0.6906, "step": 7754 }, { "epoch": 0.81, "learning_rate": 1.8869038469076027e-05, "loss": 0.6678, "step": 7755 }, { "epoch": 0.81, "learning_rate": 1.8849332546280774e-05, "loss": 0.6204, "step": 7756 }, { "epoch": 0.81, "learning_rate": 1.8829635848061766e-05, "loss": 0.6912, "step": 7757 }, { "epoch": 0.81, "learning_rate": 1.8809948376658003e-05, "loss": 0.6707, "step": 7758 }, { "epoch": 0.81, "learning_rate": 1.8790270134307363e-05, "loss": 0.6588, "step": 7759 }, { "epoch": 0.81, "learning_rate": 1.877060112324672e-05, "loss": 0.7009, "step": 7760 }, { "epoch": 0.81, "learning_rate": 1.8750941345711946e-05, "loss": 0.6826, "step": 7761 }, { "epoch": 0.81, "learning_rate": 1.873129080393774e-05, "loss": 0.6678, "step": 7762 }, { "epoch": 0.81, "learning_rate": 1.8711649500157847e-05, "loss": 0.6311, "step": 7763 }, { "epoch": 0.81, "learning_rate": 1.869201743660498e-05, "loss": 0.64, "step": 7764 }, { "epoch": 0.81, "learning_rate": 1.8672394615510712e-05, "loss": 0.7065, "step": 7765 }, { "epoch": 0.81, "learning_rate": 1.8652781039105617e-05, "loss": 0.6052, "step": 7766 }, { "epoch": 0.81, "learning_rate": 1.8633176709619227e-05, "loss": 0.6579, "step": 7767 }, { "epoch": 0.81, "learning_rate": 1.8613581629279986e-05, "loss": 0.7111, "step": 7768 }, { "epoch": 0.81, "learning_rate": 1.8593995800315355e-05, "loss": 0.6818, "step": 7769 }, { "epoch": 0.81, "learning_rate": 1.8574419224951644e-05, "loss": 0.7419, "step": 7770 }, { "epoch": 0.81, "learning_rate": 1.8554851905414195e-05, "loss": 0.7035, "step": 7771 }, { "epoch": 0.81, "learning_rate": 1.8535293843927294e-05, "loss": 0.6936, "step": 7772 }, { "epoch": 0.81, "learning_rate": 1.8515745042714096e-05, "loss": 0.6649, "step": 7773 }, { "epoch": 0.81, "learning_rate": 1.849620550399678e-05, "loss": 0.6622, "step": 7774 }, { "epoch": 0.81, "learning_rate": 1.8476675229996476e-05, "loss": 0.5644, "step": 7775 }, { "epoch": 0.81, "learning_rate": 1.845715422293318e-05, "loss": 0.7241, "step": 7776 }, { "epoch": 0.81, "learning_rate": 1.843764248502593e-05, "loss": 0.7161, "step": 7777 }, { "epoch": 0.81, "learning_rate": 1.841814001849267e-05, "loss": 0.6457, "step": 7778 }, { "epoch": 0.81, "learning_rate": 1.839864682555028e-05, "loss": 0.7013, "step": 7779 }, { "epoch": 0.81, "learning_rate": 1.837916290841456e-05, "loss": 0.6656, "step": 7780 }, { "epoch": 0.81, "learning_rate": 1.8359688269300346e-05, "loss": 0.6464, "step": 7781 }, { "epoch": 0.81, "learning_rate": 1.83402229104213e-05, "loss": 0.6169, "step": 7782 }, { "epoch": 0.81, "learning_rate": 1.8320766833990144e-05, "loss": 0.5871, "step": 7783 }, { "epoch": 0.81, "learning_rate": 1.8301320042218496e-05, "loss": 0.6883, "step": 7784 }, { "epoch": 0.81, "learning_rate": 1.8281882537316874e-05, "loss": 0.6029, "step": 7785 }, { "epoch": 0.81, "learning_rate": 1.8262454321494825e-05, "loss": 0.6423, "step": 7786 }, { "epoch": 0.81, "learning_rate": 1.824303539696076e-05, "loss": 0.6704, "step": 7787 }, { "epoch": 0.81, "learning_rate": 1.822362576592208e-05, "loss": 0.6702, "step": 7788 }, { "epoch": 0.81, "learning_rate": 1.8204225430585163e-05, "loss": 0.6679, "step": 7789 }, { "epoch": 0.81, "learning_rate": 1.8184834393155237e-05, "loss": 0.6382, "step": 7790 }, { "epoch": 0.81, "learning_rate": 1.8165452655836557e-05, "loss": 0.6996, "step": 7791 }, { "epoch": 0.81, "learning_rate": 1.8146080220832275e-05, "loss": 0.6897, "step": 7792 }, { "epoch": 0.81, "learning_rate": 1.812671709034448e-05, "loss": 0.646, "step": 7793 }, { "epoch": 0.81, "learning_rate": 1.810736326657423e-05, "loss": 0.6893, "step": 7794 }, { "epoch": 0.81, "learning_rate": 1.8088018751721557e-05, "loss": 0.7188, "step": 7795 }, { "epoch": 0.81, "learning_rate": 1.806868354798533e-05, "loss": 0.6911, "step": 7796 }, { "epoch": 0.81, "learning_rate": 1.804935765756347e-05, "loss": 0.6496, "step": 7797 }, { "epoch": 0.81, "learning_rate": 1.8030041082652805e-05, "loss": 0.6826, "step": 7798 }, { "epoch": 0.81, "learning_rate": 1.8010733825449044e-05, "loss": 0.6709, "step": 7799 }, { "epoch": 0.81, "learning_rate": 1.799143588814691e-05, "loss": 0.6944, "step": 7800 }, { "epoch": 0.81, "learning_rate": 1.7972147272940076e-05, "loss": 0.671, "step": 7801 }, { "epoch": 0.81, "learning_rate": 1.795286798202106e-05, "loss": 0.7074, "step": 7802 }, { "epoch": 0.81, "learning_rate": 1.793359801758143e-05, "loss": 0.6232, "step": 7803 }, { "epoch": 0.81, "learning_rate": 1.7914337381811617e-05, "loss": 0.6895, "step": 7804 }, { "epoch": 0.81, "learning_rate": 1.7895086076901046e-05, "loss": 0.6349, "step": 7805 }, { "epoch": 0.81, "learning_rate": 1.787584410503804e-05, "loss": 0.7137, "step": 7806 }, { "epoch": 0.81, "learning_rate": 1.7856611468409855e-05, "loss": 0.6833, "step": 7807 }, { "epoch": 0.81, "learning_rate": 1.783738816920273e-05, "loss": 0.6778, "step": 7808 }, { "epoch": 0.81, "learning_rate": 1.7818174209601834e-05, "loss": 0.6348, "step": 7809 }, { "epoch": 0.81, "learning_rate": 1.7798969591791236e-05, "loss": 0.722, "step": 7810 }, { "epoch": 0.81, "learning_rate": 1.7779774317953967e-05, "loss": 0.7052, "step": 7811 }, { "epoch": 0.81, "learning_rate": 1.7760588390272038e-05, "loss": 0.6924, "step": 7812 }, { "epoch": 0.81, "learning_rate": 1.774141181092629e-05, "loss": 0.6681, "step": 7813 }, { "epoch": 0.81, "learning_rate": 1.7722244582096605e-05, "loss": 0.6821, "step": 7814 }, { "epoch": 0.81, "learning_rate": 1.770308670596179e-05, "loss": 0.6306, "step": 7815 }, { "epoch": 0.81, "learning_rate": 1.76839381846995e-05, "loss": 0.6967, "step": 7816 }, { "epoch": 0.81, "learning_rate": 1.7664799020486455e-05, "loss": 0.6337, "step": 7817 }, { "epoch": 0.81, "learning_rate": 1.7645669215498217e-05, "loss": 0.6672, "step": 7818 }, { "epoch": 0.81, "learning_rate": 1.762654877190929e-05, "loss": 0.6158, "step": 7819 }, { "epoch": 0.81, "learning_rate": 1.760743769189315e-05, "loss": 0.7134, "step": 7820 }, { "epoch": 0.81, "learning_rate": 1.7588335977622227e-05, "loss": 0.6823, "step": 7821 }, { "epoch": 0.81, "learning_rate": 1.7569243631267816e-05, "loss": 0.6671, "step": 7822 }, { "epoch": 0.81, "learning_rate": 1.7550160655000204e-05, "loss": 0.6277, "step": 7823 }, { "epoch": 0.81, "learning_rate": 1.7531087050988615e-05, "loss": 0.6991, "step": 7824 }, { "epoch": 0.81, "learning_rate": 1.7512022821401142e-05, "loss": 0.6868, "step": 7825 }, { "epoch": 0.81, "learning_rate": 1.7492967968404915e-05, "loss": 0.6764, "step": 7826 }, { "epoch": 0.81, "learning_rate": 1.7473922494165875e-05, "loss": 0.6814, "step": 7827 }, { "epoch": 0.81, "learning_rate": 1.7454886400849e-05, "loss": 0.6632, "step": 7828 }, { "epoch": 0.81, "learning_rate": 1.7435859690618195e-05, "loss": 0.655, "step": 7829 }, { "epoch": 0.82, "learning_rate": 1.7416842365636233e-05, "loss": 0.6553, "step": 7830 }, { "epoch": 0.82, "learning_rate": 1.7397834428064828e-05, "loss": 0.6694, "step": 7831 }, { "epoch": 0.82, "learning_rate": 1.7378835880064714e-05, "loss": 0.6694, "step": 7832 }, { "epoch": 0.82, "learning_rate": 1.735984672379545e-05, "loss": 0.6688, "step": 7833 }, { "epoch": 0.82, "learning_rate": 1.734086696141559e-05, "loss": 0.7235, "step": 7834 }, { "epoch": 0.82, "learning_rate": 1.732189659508263e-05, "loss": 0.6313, "step": 7835 }, { "epoch": 0.82, "learning_rate": 1.7302935626952933e-05, "loss": 0.6768, "step": 7836 }, { "epoch": 0.82, "learning_rate": 1.7283984059181855e-05, "loss": 0.636, "step": 7837 }, { "epoch": 0.82, "learning_rate": 1.7265041893923695e-05, "loss": 0.6459, "step": 7838 }, { "epoch": 0.82, "learning_rate": 1.724610913333159e-05, "loss": 0.6969, "step": 7839 }, { "epoch": 0.82, "learning_rate": 1.72271857795577e-05, "loss": 0.6919, "step": 7840 }, { "epoch": 0.82, "learning_rate": 1.7208271834753097e-05, "loss": 0.6317, "step": 7841 }, { "epoch": 0.82, "learning_rate": 1.718936730106776e-05, "loss": 0.6673, "step": 7842 }, { "epoch": 0.82, "learning_rate": 1.7170472180650587e-05, "loss": 0.6356, "step": 7843 }, { "epoch": 0.82, "learning_rate": 1.7151586475649473e-05, "loss": 0.6998, "step": 7844 }, { "epoch": 0.82, "learning_rate": 1.713271018821113e-05, "loss": 0.651, "step": 7845 }, { "epoch": 0.82, "learning_rate": 1.711384332048135e-05, "loss": 0.6917, "step": 7846 }, { "epoch": 0.82, "learning_rate": 1.7094985874604707e-05, "loss": 0.7087, "step": 7847 }, { "epoch": 0.82, "learning_rate": 1.7076137852724784e-05, "loss": 0.669, "step": 7848 }, { "epoch": 0.82, "learning_rate": 1.7057299256984115e-05, "loss": 0.5856, "step": 7849 }, { "epoch": 0.82, "learning_rate": 1.7038470089524072e-05, "loss": 0.671, "step": 7850 }, { "epoch": 0.82, "learning_rate": 1.7019650352485028e-05, "loss": 0.6197, "step": 7851 }, { "epoch": 0.82, "learning_rate": 1.7000840048006295e-05, "loss": 0.6014, "step": 7852 }, { "epoch": 0.82, "learning_rate": 1.698203917822604e-05, "loss": 0.7136, "step": 7853 }, { "epoch": 0.82, "learning_rate": 1.6963247745281396e-05, "loss": 0.6151, "step": 7854 }, { "epoch": 0.82, "learning_rate": 1.694446575130848e-05, "loss": 0.6591, "step": 7855 }, { "epoch": 0.82, "learning_rate": 1.692569319844226e-05, "loss": 0.5971, "step": 7856 }, { "epoch": 0.82, "learning_rate": 1.6906930088816596e-05, "loss": 0.6918, "step": 7857 }, { "epoch": 0.82, "learning_rate": 1.6888176424564416e-05, "loss": 0.7133, "step": 7858 }, { "epoch": 0.82, "learning_rate": 1.6869432207817425e-05, "loss": 0.6358, "step": 7859 }, { "epoch": 0.82, "learning_rate": 1.6850697440706353e-05, "loss": 0.6572, "step": 7860 }, { "epoch": 0.82, "learning_rate": 1.683197212536084e-05, "loss": 0.6277, "step": 7861 }, { "epoch": 0.82, "learning_rate": 1.681325626390938e-05, "loss": 0.6425, "step": 7862 }, { "epoch": 0.82, "learning_rate": 1.679454985847949e-05, "loss": 0.6497, "step": 7863 }, { "epoch": 0.82, "learning_rate": 1.6775852911197575e-05, "loss": 0.6551, "step": 7864 }, { "epoch": 0.82, "learning_rate": 1.6757165424188913e-05, "loss": 0.6473, "step": 7865 }, { "epoch": 0.82, "learning_rate": 1.6738487399577808e-05, "loss": 0.6346, "step": 7866 }, { "epoch": 0.82, "learning_rate": 1.671981883948738e-05, "loss": 0.6522, "step": 7867 }, { "epoch": 0.82, "learning_rate": 1.6701159746039762e-05, "loss": 0.6081, "step": 7868 }, { "epoch": 0.82, "learning_rate": 1.6682510121355954e-05, "loss": 0.6742, "step": 7869 }, { "epoch": 0.82, "learning_rate": 1.6663869967555924e-05, "loss": 0.6679, "step": 7870 }, { "epoch": 0.82, "learning_rate": 1.6645239286758496e-05, "loss": 0.6554, "step": 7871 }, { "epoch": 0.82, "learning_rate": 1.6626618081081514e-05, "loss": 0.6033, "step": 7872 }, { "epoch": 0.82, "learning_rate": 1.6608006352641636e-05, "loss": 0.6694, "step": 7873 }, { "epoch": 0.82, "learning_rate": 1.658940410355454e-05, "loss": 0.6574, "step": 7874 }, { "epoch": 0.82, "learning_rate": 1.657081133593479e-05, "loss": 0.6902, "step": 7875 }, { "epoch": 0.82, "learning_rate": 1.6552228051895825e-05, "loss": 0.6896, "step": 7876 }, { "epoch": 0.82, "learning_rate": 1.6533654253550078e-05, "loss": 0.6855, "step": 7877 }, { "epoch": 0.82, "learning_rate": 1.65150899430089e-05, "loss": 0.7095, "step": 7878 }, { "epoch": 0.82, "learning_rate": 1.6496535122382474e-05, "loss": 0.6652, "step": 7879 }, { "epoch": 0.82, "learning_rate": 1.6477989793780023e-05, "loss": 0.7149, "step": 7880 }, { "epoch": 0.82, "learning_rate": 1.645945395930959e-05, "loss": 0.6898, "step": 7881 }, { "epoch": 0.82, "learning_rate": 1.644092762107823e-05, "loss": 0.6829, "step": 7882 }, { "epoch": 0.82, "learning_rate": 1.642241078119182e-05, "loss": 0.6335, "step": 7883 }, { "epoch": 0.82, "learning_rate": 1.6403903441755274e-05, "loss": 0.641, "step": 7884 }, { "epoch": 0.82, "learning_rate": 1.6385405604872307e-05, "loss": 0.7044, "step": 7885 }, { "epoch": 0.82, "learning_rate": 1.6366917272645656e-05, "loss": 0.6512, "step": 7886 }, { "epoch": 0.82, "learning_rate": 1.6348438447176873e-05, "loss": 0.6602, "step": 7887 }, { "epoch": 0.82, "learning_rate": 1.6329969130566513e-05, "loss": 0.6901, "step": 7888 }, { "epoch": 0.82, "learning_rate": 1.6311509324914065e-05, "loss": 0.6317, "step": 7889 }, { "epoch": 0.82, "learning_rate": 1.6293059032317837e-05, "loss": 0.6506, "step": 7890 }, { "epoch": 0.82, "learning_rate": 1.627461825487514e-05, "loss": 0.6775, "step": 7891 }, { "epoch": 0.82, "learning_rate": 1.6256186994682198e-05, "loss": 0.6718, "step": 7892 }, { "epoch": 0.82, "learning_rate": 1.6237765253834094e-05, "loss": 0.7424, "step": 7893 }, { "epoch": 0.82, "learning_rate": 1.621935303442491e-05, "loss": 0.7337, "step": 7894 }, { "epoch": 0.82, "learning_rate": 1.6200950338547573e-05, "loss": 0.6981, "step": 7895 }, { "epoch": 0.82, "learning_rate": 1.6182557168293956e-05, "loss": 0.6064, "step": 7896 }, { "epoch": 0.82, "learning_rate": 1.6164173525754844e-05, "loss": 0.6348, "step": 7897 }, { "epoch": 0.82, "learning_rate": 1.6145799413020002e-05, "loss": 0.604, "step": 7898 }, { "epoch": 0.82, "learning_rate": 1.612743483217798e-05, "loss": 0.5991, "step": 7899 }, { "epoch": 0.82, "learning_rate": 1.6109079785316372e-05, "loss": 0.7136, "step": 7900 }, { "epoch": 0.82, "learning_rate": 1.6090734274521635e-05, "loss": 0.6788, "step": 7901 }, { "epoch": 0.82, "learning_rate": 1.607239830187911e-05, "loss": 0.6932, "step": 7902 }, { "epoch": 0.82, "learning_rate": 1.605407186947312e-05, "loss": 0.719, "step": 7903 }, { "epoch": 0.82, "learning_rate": 1.6035754979386874e-05, "loss": 0.6254, "step": 7904 }, { "epoch": 0.82, "learning_rate": 1.6017447633702464e-05, "loss": 0.5909, "step": 7905 }, { "epoch": 0.82, "learning_rate": 1.599914983450096e-05, "loss": 0.6834, "step": 7906 }, { "epoch": 0.82, "learning_rate": 1.5980861583862306e-05, "loss": 0.6609, "step": 7907 }, { "epoch": 0.82, "learning_rate": 1.596258288386533e-05, "loss": 0.7267, "step": 7908 }, { "epoch": 0.82, "learning_rate": 1.594431373658786e-05, "loss": 0.6506, "step": 7909 }, { "epoch": 0.82, "learning_rate": 1.592605414410655e-05, "loss": 0.6768, "step": 7910 }, { "epoch": 0.82, "learning_rate": 1.5907804108497028e-05, "loss": 0.6921, "step": 7911 }, { "epoch": 0.82, "learning_rate": 1.5889563631833836e-05, "loss": 0.6572, "step": 7912 }, { "epoch": 0.82, "learning_rate": 1.5871332716190378e-05, "loss": 0.6943, "step": 7913 }, { "epoch": 0.82, "learning_rate": 1.5853111363639016e-05, "loss": 0.7179, "step": 7914 }, { "epoch": 0.82, "learning_rate": 1.583489957625103e-05, "loss": 0.7001, "step": 7915 }, { "epoch": 0.82, "learning_rate": 1.5816697356096543e-05, "loss": 0.6516, "step": 7916 }, { "epoch": 0.82, "learning_rate": 1.579850470524469e-05, "loss": 0.6173, "step": 7917 }, { "epoch": 0.82, "learning_rate": 1.5780321625763472e-05, "loss": 0.6752, "step": 7918 }, { "epoch": 0.82, "learning_rate": 1.5762148119719756e-05, "loss": 0.6874, "step": 7919 }, { "epoch": 0.82, "learning_rate": 1.5743984189179418e-05, "loss": 0.6944, "step": 7920 }, { "epoch": 0.82, "learning_rate": 1.5725829836207162e-05, "loss": 0.7374, "step": 7921 }, { "epoch": 0.82, "learning_rate": 1.5707685062866607e-05, "loss": 0.6292, "step": 7922 }, { "epoch": 0.82, "learning_rate": 1.5689549871220343e-05, "loss": 0.6923, "step": 7923 }, { "epoch": 0.82, "learning_rate": 1.5671424263329858e-05, "loss": 0.5505, "step": 7924 }, { "epoch": 0.82, "learning_rate": 1.565330824125548e-05, "loss": 0.6982, "step": 7925 }, { "epoch": 0.83, "learning_rate": 1.5635201807056555e-05, "loss": 0.6105, "step": 7926 }, { "epoch": 0.83, "learning_rate": 1.561710496279122e-05, "loss": 0.6446, "step": 7927 }, { "epoch": 0.83, "learning_rate": 1.5599017710516617e-05, "loss": 0.6658, "step": 7928 }, { "epoch": 0.83, "learning_rate": 1.558094005228877e-05, "loss": 0.6245, "step": 7929 }, { "epoch": 0.83, "learning_rate": 1.5562871990162586e-05, "loss": 0.6783, "step": 7930 }, { "epoch": 0.83, "learning_rate": 1.5544813526191916e-05, "loss": 0.6346, "step": 7931 }, { "epoch": 0.83, "learning_rate": 1.5526764662429516e-05, "loss": 0.6832, "step": 7932 }, { "epoch": 0.83, "learning_rate": 1.5508725400927028e-05, "loss": 0.7021, "step": 7933 }, { "epoch": 0.83, "learning_rate": 1.5490695743734986e-05, "loss": 0.6791, "step": 7934 }, { "epoch": 0.83, "learning_rate": 1.5472675692902916e-05, "loss": 0.6399, "step": 7935 }, { "epoch": 0.83, "learning_rate": 1.545466525047914e-05, "loss": 0.7045, "step": 7936 }, { "epoch": 0.83, "learning_rate": 1.5436664418510972e-05, "loss": 0.634, "step": 7937 }, { "epoch": 0.83, "learning_rate": 1.5418673199044643e-05, "loss": 0.7349, "step": 7938 }, { "epoch": 0.83, "learning_rate": 1.5400691594125194e-05, "loss": 0.6936, "step": 7939 }, { "epoch": 0.83, "learning_rate": 1.5382719605796645e-05, "loss": 0.6475, "step": 7940 }, { "epoch": 0.83, "learning_rate": 1.536475723610197e-05, "loss": 0.6924, "step": 7941 }, { "epoch": 0.83, "learning_rate": 1.5346804487082923e-05, "loss": 0.6773, "step": 7942 }, { "epoch": 0.83, "learning_rate": 1.5328861360780245e-05, "loss": 0.6327, "step": 7943 }, { "epoch": 0.83, "learning_rate": 1.5310927859233613e-05, "loss": 0.6381, "step": 7944 }, { "epoch": 0.83, "learning_rate": 1.5293003984481545e-05, "loss": 0.6701, "step": 7945 }, { "epoch": 0.83, "learning_rate": 1.5275089738561453e-05, "loss": 0.6613, "step": 7946 }, { "epoch": 0.83, "learning_rate": 1.5257185123509742e-05, "loss": 0.6792, "step": 7947 }, { "epoch": 0.83, "learning_rate": 1.5239290141361617e-05, "loss": 0.6929, "step": 7948 }, { "epoch": 0.83, "learning_rate": 1.5221404794151295e-05, "loss": 0.6814, "step": 7949 }, { "epoch": 0.83, "learning_rate": 1.5203529083911794e-05, "loss": 0.6649, "step": 7950 }, { "epoch": 0.83, "learning_rate": 1.5185663012675111e-05, "loss": 0.6089, "step": 7951 }, { "epoch": 0.83, "learning_rate": 1.5167806582472132e-05, "loss": 0.7521, "step": 7952 }, { "epoch": 0.83, "learning_rate": 1.5149959795332613e-05, "loss": 0.6468, "step": 7953 }, { "epoch": 0.83, "learning_rate": 1.5132122653285242e-05, "loss": 0.6773, "step": 7954 }, { "epoch": 0.83, "learning_rate": 1.5114295158357627e-05, "loss": 0.6582, "step": 7955 }, { "epoch": 0.83, "learning_rate": 1.5096477312576229e-05, "loss": 0.6797, "step": 7956 }, { "epoch": 0.83, "learning_rate": 1.5078669117966482e-05, "loss": 0.679, "step": 7957 }, { "epoch": 0.83, "learning_rate": 1.5060870576552643e-05, "loss": 0.6743, "step": 7958 }, { "epoch": 0.83, "learning_rate": 1.504308169035794e-05, "loss": 0.6702, "step": 7959 }, { "epoch": 0.83, "learning_rate": 1.5025302461404444e-05, "loss": 0.6315, "step": 7960 }, { "epoch": 0.83, "learning_rate": 1.5007532891713206e-05, "loss": 0.6197, "step": 7961 }, { "epoch": 0.83, "learning_rate": 1.4989772983304074e-05, "loss": 0.7008, "step": 7962 }, { "epoch": 0.83, "learning_rate": 1.4972022738195878e-05, "loss": 0.6861, "step": 7963 }, { "epoch": 0.83, "learning_rate": 1.4954282158406373e-05, "loss": 0.6579, "step": 7964 }, { "epoch": 0.83, "learning_rate": 1.4936551245952101e-05, "loss": 0.6459, "step": 7965 }, { "epoch": 0.83, "learning_rate": 1.4918830002848638e-05, "loss": 0.7229, "step": 7966 }, { "epoch": 0.83, "learning_rate": 1.4901118431110339e-05, "loss": 0.7154, "step": 7967 }, { "epoch": 0.83, "learning_rate": 1.488341653275055e-05, "loss": 0.6589, "step": 7968 }, { "epoch": 0.83, "learning_rate": 1.4865724309781492e-05, "loss": 0.6839, "step": 7969 }, { "epoch": 0.83, "learning_rate": 1.484804176421425e-05, "loss": 0.6128, "step": 7970 }, { "epoch": 0.83, "learning_rate": 1.4830368898058866e-05, "loss": 0.691, "step": 7971 }, { "epoch": 0.83, "learning_rate": 1.481270571332426e-05, "loss": 0.6028, "step": 7972 }, { "epoch": 0.83, "learning_rate": 1.479505221201819e-05, "loss": 0.5791, "step": 7973 }, { "epoch": 0.83, "learning_rate": 1.4777408396147408e-05, "loss": 0.6352, "step": 7974 }, { "epoch": 0.83, "learning_rate": 1.4759774267717553e-05, "loss": 0.6378, "step": 7975 }, { "epoch": 0.83, "learning_rate": 1.4742149828733076e-05, "loss": 0.6627, "step": 7976 }, { "epoch": 0.83, "learning_rate": 1.4724535081197422e-05, "loss": 0.6284, "step": 7977 }, { "epoch": 0.83, "learning_rate": 1.470693002711292e-05, "loss": 0.7381, "step": 7978 }, { "epoch": 0.83, "learning_rate": 1.4689334668480714e-05, "loss": 0.5842, "step": 7979 }, { "epoch": 0.83, "learning_rate": 1.4671749007300951e-05, "loss": 0.644, "step": 7980 }, { "epoch": 0.83, "learning_rate": 1.465417304557264e-05, "loss": 0.6438, "step": 7981 }, { "epoch": 0.83, "learning_rate": 1.4636606785293638e-05, "loss": 0.6497, "step": 7982 }, { "epoch": 0.83, "learning_rate": 1.4619050228460795e-05, "loss": 0.6518, "step": 7983 }, { "epoch": 0.83, "learning_rate": 1.460150337706977e-05, "loss": 0.6052, "step": 7984 }, { "epoch": 0.83, "learning_rate": 1.4583966233115132e-05, "loss": 0.6612, "step": 7985 }, { "epoch": 0.83, "learning_rate": 1.456643879859042e-05, "loss": 0.6459, "step": 7986 }, { "epoch": 0.83, "learning_rate": 1.4548921075487964e-05, "loss": 0.6301, "step": 7987 }, { "epoch": 0.83, "learning_rate": 1.453141306579906e-05, "loss": 0.5882, "step": 7988 }, { "epoch": 0.83, "learning_rate": 1.4513914771513914e-05, "loss": 0.7177, "step": 7989 }, { "epoch": 0.83, "learning_rate": 1.4496426194621549e-05, "loss": 0.6204, "step": 7990 }, { "epoch": 0.83, "learning_rate": 1.447894733710995e-05, "loss": 0.5877, "step": 7991 }, { "epoch": 0.83, "learning_rate": 1.4461478200965994e-05, "loss": 0.6702, "step": 7992 }, { "epoch": 0.83, "learning_rate": 1.4444018788175406e-05, "loss": 0.6703, "step": 7993 }, { "epoch": 0.83, "learning_rate": 1.4426569100722853e-05, "loss": 0.6224, "step": 7994 }, { "epoch": 0.83, "learning_rate": 1.4409129140591904e-05, "loss": 0.6518, "step": 7995 }, { "epoch": 0.83, "learning_rate": 1.4391698909764938e-05, "loss": 0.6755, "step": 7996 }, { "epoch": 0.83, "learning_rate": 1.4374278410223363e-05, "loss": 0.6442, "step": 7997 }, { "epoch": 0.83, "learning_rate": 1.4356867643947346e-05, "loss": 0.6567, "step": 7998 }, { "epoch": 0.83, "learning_rate": 1.433946661291602e-05, "loss": 0.6786, "step": 7999 }, { "epoch": 0.83, "learning_rate": 1.4322075319107397e-05, "loss": 0.6124, "step": 8000 }, { "epoch": 0.83, "learning_rate": 1.430469376449841e-05, "loss": 0.6154, "step": 8001 }, { "epoch": 0.83, "learning_rate": 1.4287321951064824e-05, "loss": 0.6776, "step": 8002 }, { "epoch": 0.83, "learning_rate": 1.4269959880781347e-05, "loss": 0.6553, "step": 8003 }, { "epoch": 0.83, "learning_rate": 1.425260755562159e-05, "loss": 0.6995, "step": 8004 }, { "epoch": 0.83, "learning_rate": 1.4235264977557982e-05, "loss": 0.62, "step": 8005 }, { "epoch": 0.83, "learning_rate": 1.421793214856193e-05, "loss": 0.6172, "step": 8006 }, { "epoch": 0.83, "learning_rate": 1.4200609070603676e-05, "loss": 0.6934, "step": 8007 }, { "epoch": 0.83, "learning_rate": 1.4183295745652358e-05, "loss": 0.6582, "step": 8008 }, { "epoch": 0.83, "learning_rate": 1.416599217567608e-05, "loss": 0.6447, "step": 8009 }, { "epoch": 0.83, "learning_rate": 1.4148698362641732e-05, "loss": 0.6024, "step": 8010 }, { "epoch": 0.83, "learning_rate": 1.4131414308515112e-05, "loss": 0.6207, "step": 8011 }, { "epoch": 0.83, "learning_rate": 1.4114140015261001e-05, "loss": 0.699, "step": 8012 }, { "epoch": 0.83, "learning_rate": 1.4096875484842954e-05, "loss": 0.6686, "step": 8013 }, { "epoch": 0.83, "learning_rate": 1.4079620719223485e-05, "loss": 0.7042, "step": 8014 }, { "epoch": 0.83, "learning_rate": 1.4062375720364018e-05, "loss": 0.6425, "step": 8015 }, { "epoch": 0.83, "learning_rate": 1.4045140490224762e-05, "loss": 0.7279, "step": 8016 }, { "epoch": 0.83, "learning_rate": 1.4027915030764927e-05, "loss": 0.6515, "step": 8017 }, { "epoch": 0.83, "learning_rate": 1.4010699343942578e-05, "loss": 0.6453, "step": 8018 }, { "epoch": 0.83, "learning_rate": 1.3993493431714633e-05, "loss": 0.6977, "step": 8019 }, { "epoch": 0.83, "learning_rate": 1.3976297296036933e-05, "loss": 0.7128, "step": 8020 }, { "epoch": 0.83, "learning_rate": 1.3959110938864228e-05, "loss": 0.6396, "step": 8021 }, { "epoch": 0.84, "learning_rate": 1.39419343621501e-05, "loss": 0.699, "step": 8022 }, { "epoch": 0.84, "learning_rate": 1.3924767567847041e-05, "loss": 0.635, "step": 8023 }, { "epoch": 0.84, "learning_rate": 1.390761055790647e-05, "loss": 0.7192, "step": 8024 }, { "epoch": 0.84, "learning_rate": 1.3890463334278624e-05, "loss": 0.7314, "step": 8025 }, { "epoch": 0.84, "learning_rate": 1.3873325898912714e-05, "loss": 0.5954, "step": 8026 }, { "epoch": 0.84, "learning_rate": 1.3856198253756737e-05, "loss": 0.6869, "step": 8027 }, { "epoch": 0.84, "learning_rate": 1.3839080400757653e-05, "loss": 0.7314, "step": 8028 }, { "epoch": 0.84, "learning_rate": 1.3821972341861323e-05, "loss": 0.6085, "step": 8029 }, { "epoch": 0.84, "learning_rate": 1.3804874079012398e-05, "loss": 0.6239, "step": 8030 }, { "epoch": 0.84, "learning_rate": 1.3787785614154502e-05, "loss": 0.668, "step": 8031 }, { "epoch": 0.84, "learning_rate": 1.3770706949230139e-05, "loss": 0.7107, "step": 8032 }, { "epoch": 0.84, "learning_rate": 1.375363808618063e-05, "loss": 0.647, "step": 8033 }, { "epoch": 0.84, "learning_rate": 1.3736579026946294e-05, "loss": 0.6981, "step": 8034 }, { "epoch": 0.84, "learning_rate": 1.371952977346621e-05, "loss": 0.696, "step": 8035 }, { "epoch": 0.84, "learning_rate": 1.3702490327678452e-05, "loss": 0.6485, "step": 8036 }, { "epoch": 0.84, "learning_rate": 1.3685460691519902e-05, "loss": 0.6636, "step": 8037 }, { "epoch": 0.84, "learning_rate": 1.3668440866926369e-05, "loss": 0.6729, "step": 8038 }, { "epoch": 0.84, "learning_rate": 1.3651430855832525e-05, "loss": 0.6481, "step": 8039 }, { "epoch": 0.84, "learning_rate": 1.3634430660171938e-05, "loss": 0.685, "step": 8040 }, { "epoch": 0.84, "learning_rate": 1.361744028187707e-05, "loss": 0.6657, "step": 8041 }, { "epoch": 0.84, "learning_rate": 1.3600459722879245e-05, "loss": 0.745, "step": 8042 }, { "epoch": 0.84, "learning_rate": 1.3583488985108672e-05, "loss": 0.6481, "step": 8043 }, { "epoch": 0.84, "learning_rate": 1.3566528070494478e-05, "loss": 0.5975, "step": 8044 }, { "epoch": 0.84, "learning_rate": 1.3549576980964617e-05, "loss": 0.6461, "step": 8045 }, { "epoch": 0.84, "learning_rate": 1.3532635718445996e-05, "loss": 0.6926, "step": 8046 }, { "epoch": 0.84, "learning_rate": 1.3515704284864328e-05, "loss": 0.6613, "step": 8047 }, { "epoch": 0.84, "learning_rate": 1.3498782682144273e-05, "loss": 0.6811, "step": 8048 }, { "epoch": 0.84, "learning_rate": 1.3481870912209337e-05, "loss": 0.6538, "step": 8049 }, { "epoch": 0.84, "learning_rate": 1.3464968976981896e-05, "loss": 0.7069, "step": 8050 }, { "epoch": 0.84, "learning_rate": 1.3448076878383243e-05, "loss": 0.7228, "step": 8051 }, { "epoch": 0.84, "learning_rate": 1.3431194618333575e-05, "loss": 0.6507, "step": 8052 }, { "epoch": 0.84, "learning_rate": 1.3414322198751895e-05, "loss": 0.6984, "step": 8053 }, { "epoch": 0.84, "learning_rate": 1.339745962155613e-05, "loss": 0.6558, "step": 8054 }, { "epoch": 0.84, "learning_rate": 1.3380606888663128e-05, "loss": 0.6877, "step": 8055 }, { "epoch": 0.84, "learning_rate": 1.3363764001988532e-05, "loss": 0.6955, "step": 8056 }, { "epoch": 0.84, "learning_rate": 1.3346930963446914e-05, "loss": 0.6352, "step": 8057 }, { "epoch": 0.84, "learning_rate": 1.3330107774951762e-05, "loss": 0.6813, "step": 8058 }, { "epoch": 0.84, "learning_rate": 1.3313294438415346e-05, "loss": 0.6243, "step": 8059 }, { "epoch": 0.84, "learning_rate": 1.3296490955748941e-05, "loss": 0.6225, "step": 8060 }, { "epoch": 0.84, "learning_rate": 1.3279697328862572e-05, "loss": 0.6938, "step": 8061 }, { "epoch": 0.84, "learning_rate": 1.3262913559665268e-05, "loss": 0.66, "step": 8062 }, { "epoch": 0.84, "learning_rate": 1.3246139650064826e-05, "loss": 0.649, "step": 8063 }, { "epoch": 0.84, "learning_rate": 1.3229375601968009e-05, "loss": 0.6682, "step": 8064 }, { "epoch": 0.84, "learning_rate": 1.321262141728039e-05, "loss": 0.6903, "step": 8065 }, { "epoch": 0.84, "learning_rate": 1.3195877097906494e-05, "loss": 0.6752, "step": 8066 }, { "epoch": 0.84, "learning_rate": 1.3179142645749642e-05, "loss": 0.6737, "step": 8067 }, { "epoch": 0.84, "learning_rate": 1.31624180627121e-05, "loss": 0.6793, "step": 8068 }, { "epoch": 0.84, "learning_rate": 1.3145703350695005e-05, "loss": 0.6519, "step": 8069 }, { "epoch": 0.84, "learning_rate": 1.3128998511598322e-05, "loss": 0.6808, "step": 8070 }, { "epoch": 0.84, "learning_rate": 1.3112303547320937e-05, "loss": 0.6238, "step": 8071 }, { "epoch": 0.84, "learning_rate": 1.3095618459760639e-05, "loss": 0.7082, "step": 8072 }, { "epoch": 0.84, "learning_rate": 1.3078943250814001e-05, "loss": 0.6902, "step": 8073 }, { "epoch": 0.84, "learning_rate": 1.3062277922376576e-05, "loss": 0.7286, "step": 8074 }, { "epoch": 0.84, "learning_rate": 1.3045622476342733e-05, "loss": 0.6428, "step": 8075 }, { "epoch": 0.84, "learning_rate": 1.3028976914605717e-05, "loss": 0.6734, "step": 8076 }, { "epoch": 0.84, "learning_rate": 1.301234123905768e-05, "loss": 0.625, "step": 8077 }, { "epoch": 0.84, "learning_rate": 1.2995715451589652e-05, "loss": 0.6749, "step": 8078 }, { "epoch": 0.84, "learning_rate": 1.2979099554091501e-05, "loss": 0.6785, "step": 8079 }, { "epoch": 0.84, "learning_rate": 1.2962493548451981e-05, "loss": 0.6806, "step": 8080 }, { "epoch": 0.84, "learning_rate": 1.2945897436558785e-05, "loss": 0.7213, "step": 8081 }, { "epoch": 0.84, "learning_rate": 1.2929311220298379e-05, "loss": 0.7261, "step": 8082 }, { "epoch": 0.84, "learning_rate": 1.2912734901556167e-05, "loss": 0.6718, "step": 8083 }, { "epoch": 0.84, "learning_rate": 1.2896168482216442e-05, "loss": 0.7223, "step": 8084 }, { "epoch": 0.84, "learning_rate": 1.2879611964162308e-05, "loss": 0.5808, "step": 8085 }, { "epoch": 0.84, "learning_rate": 1.2863065349275826e-05, "loss": 0.6549, "step": 8086 }, { "epoch": 0.84, "learning_rate": 1.284652863943786e-05, "loss": 0.7019, "step": 8087 }, { "epoch": 0.84, "learning_rate": 1.2830001836528138e-05, "loss": 0.6694, "step": 8088 }, { "epoch": 0.84, "learning_rate": 1.2813484942425369e-05, "loss": 0.6352, "step": 8089 }, { "epoch": 0.84, "learning_rate": 1.2796977959007006e-05, "loss": 0.6778, "step": 8090 }, { "epoch": 0.84, "learning_rate": 1.2780480888149459e-05, "loss": 0.6528, "step": 8091 }, { "epoch": 0.84, "learning_rate": 1.2763993731727996e-05, "loss": 0.5959, "step": 8092 }, { "epoch": 0.84, "learning_rate": 1.2747516491616728e-05, "loss": 0.6411, "step": 8093 }, { "epoch": 0.84, "learning_rate": 1.273104916968867e-05, "loss": 0.6549, "step": 8094 }, { "epoch": 0.84, "learning_rate": 1.271459176781572e-05, "loss": 0.7115, "step": 8095 }, { "epoch": 0.84, "learning_rate": 1.2698144287868586e-05, "loss": 0.6383, "step": 8096 }, { "epoch": 0.84, "learning_rate": 1.2681706731716913e-05, "loss": 0.7124, "step": 8097 }, { "epoch": 0.84, "learning_rate": 1.266527910122921e-05, "loss": 0.6769, "step": 8098 }, { "epoch": 0.84, "learning_rate": 1.2648861398272815e-05, "loss": 0.6329, "step": 8099 }, { "epoch": 0.84, "learning_rate": 1.263245362471397e-05, "loss": 0.6384, "step": 8100 }, { "epoch": 0.84, "learning_rate": 1.261605578241779e-05, "loss": 0.6527, "step": 8101 }, { "epoch": 0.84, "learning_rate": 1.2599667873248233e-05, "loss": 0.6812, "step": 8102 }, { "epoch": 0.84, "learning_rate": 1.2583289899068174e-05, "loss": 0.691, "step": 8103 }, { "epoch": 0.84, "learning_rate": 1.2566921861739344e-05, "loss": 0.596, "step": 8104 }, { "epoch": 0.84, "learning_rate": 1.2550563763122291e-05, "loss": 0.6497, "step": 8105 }, { "epoch": 0.84, "learning_rate": 1.2534215605076528e-05, "loss": 0.667, "step": 8106 }, { "epoch": 0.84, "learning_rate": 1.2517877389460341e-05, "loss": 0.6648, "step": 8107 }, { "epoch": 0.84, "learning_rate": 1.250154911813094e-05, "loss": 0.6451, "step": 8108 }, { "epoch": 0.84, "learning_rate": 1.2485230792944436e-05, "loss": 0.6994, "step": 8109 }, { "epoch": 0.84, "learning_rate": 1.2468922415755712e-05, "loss": 0.6128, "step": 8110 }, { "epoch": 0.84, "learning_rate": 1.2452623988418633e-05, "loss": 0.5927, "step": 8111 }, { "epoch": 0.84, "learning_rate": 1.2436335512785814e-05, "loss": 0.6065, "step": 8112 }, { "epoch": 0.84, "learning_rate": 1.2420056990708872e-05, "loss": 0.6785, "step": 8113 }, { "epoch": 0.84, "learning_rate": 1.2403788424038155e-05, "loss": 0.6775, "step": 8114 }, { "epoch": 0.84, "learning_rate": 1.2387529814623011e-05, "loss": 0.6127, "step": 8115 }, { "epoch": 0.84, "learning_rate": 1.2371281164311533e-05, "loss": 0.6648, "step": 8116 }, { "epoch": 0.84, "learning_rate": 1.2355042474950773e-05, "loss": 0.6667, "step": 8117 }, { "epoch": 0.85, "learning_rate": 1.2338813748386635e-05, "loss": 0.6413, "step": 8118 }, { "epoch": 0.85, "learning_rate": 1.2322594986463832e-05, "loss": 0.7077, "step": 8119 }, { "epoch": 0.85, "learning_rate": 1.2306386191026009e-05, "loss": 0.6507, "step": 8120 }, { "epoch": 0.85, "learning_rate": 1.2290187363915674e-05, "loss": 0.6676, "step": 8121 }, { "epoch": 0.85, "learning_rate": 1.227399850697415e-05, "loss": 0.6568, "step": 8122 }, { "epoch": 0.85, "learning_rate": 1.2257819622041666e-05, "loss": 0.6618, "step": 8123 }, { "epoch": 0.85, "learning_rate": 1.2241650710957341e-05, "loss": 0.5513, "step": 8124 }, { "epoch": 0.85, "learning_rate": 1.2225491775559117e-05, "loss": 0.6595, "step": 8125 }, { "epoch": 0.85, "learning_rate": 1.2209342817683811e-05, "loss": 0.6849, "step": 8126 }, { "epoch": 0.85, "learning_rate": 1.219320383916709e-05, "loss": 0.6123, "step": 8127 }, { "epoch": 0.85, "learning_rate": 1.2177074841843528e-05, "loss": 0.6263, "step": 8128 }, { "epoch": 0.85, "learning_rate": 1.216095582754656e-05, "loss": 0.6974, "step": 8129 }, { "epoch": 0.85, "learning_rate": 1.2144846798108433e-05, "loss": 0.6899, "step": 8130 }, { "epoch": 0.85, "learning_rate": 1.2128747755360314e-05, "loss": 0.7016, "step": 8131 }, { "epoch": 0.85, "learning_rate": 1.211265870113224e-05, "loss": 0.7139, "step": 8132 }, { "epoch": 0.85, "learning_rate": 1.2096579637253047e-05, "loss": 0.6141, "step": 8133 }, { "epoch": 0.85, "learning_rate": 1.2080510565550507e-05, "loss": 0.6248, "step": 8134 }, { "epoch": 0.85, "learning_rate": 1.2064451487851235e-05, "loss": 0.5887, "step": 8135 }, { "epoch": 0.85, "learning_rate": 1.2048402405980664e-05, "loss": 0.6226, "step": 8136 }, { "epoch": 0.85, "learning_rate": 1.2032363321763174e-05, "loss": 0.674, "step": 8137 }, { "epoch": 0.85, "learning_rate": 1.201633423702192e-05, "loss": 0.7023, "step": 8138 }, { "epoch": 0.85, "learning_rate": 1.2000315153579e-05, "loss": 0.6471, "step": 8139 }, { "epoch": 0.85, "learning_rate": 1.1984306073255302e-05, "loss": 0.6821, "step": 8140 }, { "epoch": 0.85, "learning_rate": 1.196830699787066e-05, "loss": 0.6791, "step": 8141 }, { "epoch": 0.85, "learning_rate": 1.1952317929243684e-05, "loss": 0.6917, "step": 8142 }, { "epoch": 0.85, "learning_rate": 1.1936338869191888e-05, "loss": 0.6785, "step": 8143 }, { "epoch": 0.85, "learning_rate": 1.1920369819531685e-05, "loss": 0.6936, "step": 8144 }, { "epoch": 0.85, "learning_rate": 1.1904410782078268e-05, "loss": 0.7264, "step": 8145 }, { "epoch": 0.85, "learning_rate": 1.1888461758645786e-05, "loss": 0.6673, "step": 8146 }, { "epoch": 0.85, "learning_rate": 1.1872522751047144e-05, "loss": 0.6094, "step": 8147 }, { "epoch": 0.85, "learning_rate": 1.185659376109418e-05, "loss": 0.7129, "step": 8148 }, { "epoch": 0.85, "learning_rate": 1.1840674790597618e-05, "loss": 0.6885, "step": 8149 }, { "epoch": 0.85, "learning_rate": 1.1824765841366947e-05, "loss": 0.6997, "step": 8150 }, { "epoch": 0.85, "learning_rate": 1.1808866915210626e-05, "loss": 0.6926, "step": 8151 }, { "epoch": 0.85, "learning_rate": 1.1792978013935884e-05, "loss": 0.6653, "step": 8152 }, { "epoch": 0.85, "learning_rate": 1.1777099139348846e-05, "loss": 0.6915, "step": 8153 }, { "epoch": 0.85, "learning_rate": 1.1761230293254511e-05, "loss": 0.6448, "step": 8154 }, { "epoch": 0.85, "learning_rate": 1.1745371477456735e-05, "loss": 0.6689, "step": 8155 }, { "epoch": 0.85, "learning_rate": 1.1729522693758199e-05, "loss": 0.6764, "step": 8156 }, { "epoch": 0.85, "learning_rate": 1.1713683943960485e-05, "loss": 0.6527, "step": 8157 }, { "epoch": 0.85, "learning_rate": 1.1697855229864041e-05, "loss": 0.7426, "step": 8158 }, { "epoch": 0.85, "learning_rate": 1.1682036553268105e-05, "loss": 0.649, "step": 8159 }, { "epoch": 0.85, "learning_rate": 1.166622791597084e-05, "loss": 0.6738, "step": 8160 }, { "epoch": 0.85, "learning_rate": 1.1650429319769285e-05, "loss": 0.6568, "step": 8161 }, { "epoch": 0.85, "learning_rate": 1.1634640766459248e-05, "loss": 0.6511, "step": 8162 }, { "epoch": 0.85, "learning_rate": 1.1618862257835495e-05, "loss": 0.5946, "step": 8163 }, { "epoch": 0.85, "learning_rate": 1.1603093795691578e-05, "loss": 0.6613, "step": 8164 }, { "epoch": 0.85, "learning_rate": 1.1587335381819909e-05, "loss": 0.6363, "step": 8165 }, { "epoch": 0.85, "learning_rate": 1.1571587018011843e-05, "loss": 0.7002, "step": 8166 }, { "epoch": 0.85, "learning_rate": 1.155584870605746e-05, "loss": 0.6237, "step": 8167 }, { "epoch": 0.85, "learning_rate": 1.1540120447745817e-05, "loss": 0.7039, "step": 8168 }, { "epoch": 0.85, "learning_rate": 1.1524402244864785e-05, "loss": 0.6401, "step": 8169 }, { "epoch": 0.85, "learning_rate": 1.1508694099201055e-05, "loss": 0.719, "step": 8170 }, { "epoch": 0.85, "learning_rate": 1.1492996012540225e-05, "loss": 0.7264, "step": 8171 }, { "epoch": 0.85, "learning_rate": 1.147730798666674e-05, "loss": 0.7002, "step": 8172 }, { "epoch": 0.85, "learning_rate": 1.1461630023363867e-05, "loss": 0.641, "step": 8173 }, { "epoch": 0.85, "learning_rate": 1.1445962124413768e-05, "loss": 0.7063, "step": 8174 }, { "epoch": 0.85, "learning_rate": 1.1430304291597471e-05, "loss": 0.6942, "step": 8175 }, { "epoch": 0.85, "learning_rate": 1.1414656526694811e-05, "loss": 0.6993, "step": 8176 }, { "epoch": 0.85, "learning_rate": 1.1399018831484498e-05, "loss": 0.6757, "step": 8177 }, { "epoch": 0.85, "learning_rate": 1.1383391207744121e-05, "loss": 0.6697, "step": 8178 }, { "epoch": 0.85, "learning_rate": 1.136777365725008e-05, "loss": 0.5992, "step": 8179 }, { "epoch": 0.85, "learning_rate": 1.135216618177768e-05, "loss": 0.6529, "step": 8180 }, { "epoch": 0.85, "learning_rate": 1.1336568783101076e-05, "loss": 0.6403, "step": 8181 }, { "epoch": 0.85, "learning_rate": 1.1320981462993208e-05, "loss": 0.6888, "step": 8182 }, { "epoch": 0.85, "learning_rate": 1.1305404223225958e-05, "loss": 0.6815, "step": 8183 }, { "epoch": 0.85, "learning_rate": 1.1289837065570031e-05, "loss": 0.6358, "step": 8184 }, { "epoch": 0.85, "learning_rate": 1.1274279991794944e-05, "loss": 0.6792, "step": 8185 }, { "epoch": 0.85, "learning_rate": 1.1258733003669153e-05, "loss": 0.6847, "step": 8186 }, { "epoch": 0.85, "learning_rate": 1.1243196102959863e-05, "loss": 0.6652, "step": 8187 }, { "epoch": 0.85, "learning_rate": 1.122766929143323e-05, "loss": 0.653, "step": 8188 }, { "epoch": 0.85, "learning_rate": 1.1212152570854217e-05, "loss": 0.7099, "step": 8189 }, { "epoch": 0.85, "learning_rate": 1.1196645942986627e-05, "loss": 0.7304, "step": 8190 }, { "epoch": 0.85, "learning_rate": 1.1181149409593128e-05, "loss": 0.6871, "step": 8191 }, { "epoch": 0.85, "learning_rate": 1.1165662972435287e-05, "loss": 0.6992, "step": 8192 }, { "epoch": 0.85, "learning_rate": 1.1150186633273418e-05, "loss": 0.6527, "step": 8193 }, { "epoch": 0.85, "learning_rate": 1.1134720393866793e-05, "loss": 0.644, "step": 8194 }, { "epoch": 0.85, "learning_rate": 1.1119264255973504e-05, "loss": 0.5953, "step": 8195 }, { "epoch": 0.85, "learning_rate": 1.1103818221350447e-05, "loss": 0.6445, "step": 8196 }, { "epoch": 0.85, "learning_rate": 1.1088382291753419e-05, "loss": 0.6831, "step": 8197 }, { "epoch": 0.85, "learning_rate": 1.1072956468937091e-05, "loss": 0.604, "step": 8198 }, { "epoch": 0.85, "learning_rate": 1.1057540754654905e-05, "loss": 0.6292, "step": 8199 }, { "epoch": 0.85, "learning_rate": 1.1042135150659205e-05, "loss": 0.6403, "step": 8200 }, { "epoch": 0.85, "learning_rate": 1.1026739658701223e-05, "loss": 0.67, "step": 8201 }, { "epoch": 0.85, "learning_rate": 1.1011354280530971e-05, "loss": 0.679, "step": 8202 }, { "epoch": 0.85, "learning_rate": 1.0995979017897307e-05, "loss": 0.6615, "step": 8203 }, { "epoch": 0.85, "learning_rate": 1.098061387254803e-05, "loss": 0.7267, "step": 8204 }, { "epoch": 0.85, "learning_rate": 1.0965258846229675e-05, "loss": 0.6544, "step": 8205 }, { "epoch": 0.85, "learning_rate": 1.0949913940687729e-05, "loss": 0.6755, "step": 8206 }, { "epoch": 0.85, "learning_rate": 1.0934579157666436e-05, "loss": 0.6431, "step": 8207 }, { "epoch": 0.85, "learning_rate": 1.091925449890896e-05, "loss": 0.642, "step": 8208 }, { "epoch": 0.85, "learning_rate": 1.0903939966157305e-05, "loss": 0.679, "step": 8209 }, { "epoch": 0.85, "learning_rate": 1.0888635561152272e-05, "loss": 0.6677, "step": 8210 }, { "epoch": 0.85, "learning_rate": 1.0873341285633576e-05, "loss": 0.6676, "step": 8211 }, { "epoch": 0.85, "learning_rate": 1.085805714133975e-05, "loss": 0.7023, "step": 8212 }, { "epoch": 0.85, "learning_rate": 1.084278313000815e-05, "loss": 0.674, "step": 8213 }, { "epoch": 0.86, "learning_rate": 1.082751925337504e-05, "loss": 0.705, "step": 8214 }, { "epoch": 0.86, "learning_rate": 1.0812265513175467e-05, "loss": 0.6054, "step": 8215 }, { "epoch": 0.86, "learning_rate": 1.079702191114339e-05, "loss": 0.6828, "step": 8216 }, { "epoch": 0.86, "learning_rate": 1.0781788449011543e-05, "loss": 0.6312, "step": 8217 }, { "epoch": 0.86, "learning_rate": 1.0766565128511597e-05, "loss": 0.7541, "step": 8218 }, { "epoch": 0.86, "learning_rate": 1.0751351951373967e-05, "loss": 0.6751, "step": 8219 }, { "epoch": 0.86, "learning_rate": 1.0736148919327994e-05, "loss": 0.7107, "step": 8220 }, { "epoch": 0.86, "learning_rate": 1.072095603410187e-05, "loss": 0.723, "step": 8221 }, { "epoch": 0.86, "learning_rate": 1.070577329742255e-05, "loss": 0.6835, "step": 8222 }, { "epoch": 0.86, "learning_rate": 1.069060071101592e-05, "loss": 0.6353, "step": 8223 }, { "epoch": 0.86, "learning_rate": 1.0675438276606698e-05, "loss": 0.6933, "step": 8224 }, { "epoch": 0.86, "learning_rate": 1.0660285995918384e-05, "loss": 0.6602, "step": 8225 }, { "epoch": 0.86, "learning_rate": 1.0645143870673413e-05, "loss": 0.7082, "step": 8226 }, { "epoch": 0.86, "learning_rate": 1.0630011902592996e-05, "loss": 0.5956, "step": 8227 }, { "epoch": 0.86, "learning_rate": 1.0614890093397244e-05, "loss": 0.7132, "step": 8228 }, { "epoch": 0.86, "learning_rate": 1.0599778444805076e-05, "loss": 0.6897, "step": 8229 }, { "epoch": 0.86, "learning_rate": 1.0584676958534245e-05, "loss": 0.6608, "step": 8230 }, { "epoch": 0.86, "learning_rate": 1.0569585636301382e-05, "loss": 0.6738, "step": 8231 }, { "epoch": 0.86, "learning_rate": 1.055450447982198e-05, "loss": 0.7216, "step": 8232 }, { "epoch": 0.86, "learning_rate": 1.0539433490810314e-05, "loss": 0.66, "step": 8233 }, { "epoch": 0.86, "learning_rate": 1.0524372670979543e-05, "loss": 0.6943, "step": 8234 }, { "epoch": 0.86, "learning_rate": 1.0509322022041679e-05, "loss": 0.6676, "step": 8235 }, { "epoch": 0.86, "learning_rate": 1.0494281545707541e-05, "loss": 0.6149, "step": 8236 }, { "epoch": 0.86, "learning_rate": 1.0479251243686816e-05, "loss": 0.6983, "step": 8237 }, { "epoch": 0.86, "learning_rate": 1.0464231117688073e-05, "loss": 0.6274, "step": 8238 }, { "epoch": 0.86, "learning_rate": 1.0449221169418621e-05, "loss": 0.6606, "step": 8239 }, { "epoch": 0.86, "learning_rate": 1.043422140058472e-05, "loss": 0.7182, "step": 8240 }, { "epoch": 0.86, "learning_rate": 1.0419231812891417e-05, "loss": 0.6607, "step": 8241 }, { "epoch": 0.86, "learning_rate": 1.0404252408042581e-05, "loss": 0.6749, "step": 8242 }, { "epoch": 0.86, "learning_rate": 1.0389283187740972e-05, "loss": 0.6651, "step": 8243 }, { "epoch": 0.86, "learning_rate": 1.0374324153688208e-05, "loss": 0.617, "step": 8244 }, { "epoch": 0.86, "learning_rate": 1.0359375307584673e-05, "loss": 0.635, "step": 8245 }, { "epoch": 0.86, "learning_rate": 1.0344436651129663e-05, "loss": 0.6897, "step": 8246 }, { "epoch": 0.86, "learning_rate": 1.0329508186021253e-05, "loss": 0.6696, "step": 8247 }, { "epoch": 0.86, "learning_rate": 1.0314589913956418e-05, "loss": 0.6699, "step": 8248 }, { "epoch": 0.86, "learning_rate": 1.0299681836630982e-05, "loss": 0.7011, "step": 8249 }, { "epoch": 0.86, "learning_rate": 1.0284783955739518e-05, "loss": 0.7183, "step": 8250 }, { "epoch": 0.86, "learning_rate": 1.0269896272975533e-05, "loss": 0.6875, "step": 8251 }, { "epoch": 0.86, "learning_rate": 1.0255018790031357e-05, "loss": 0.7348, "step": 8252 }, { "epoch": 0.86, "learning_rate": 1.0240151508598128e-05, "loss": 0.6768, "step": 8253 }, { "epoch": 0.86, "learning_rate": 1.0225294430365828e-05, "loss": 0.6515, "step": 8254 }, { "epoch": 0.86, "learning_rate": 1.0210447557023328e-05, "loss": 0.7403, "step": 8255 }, { "epoch": 0.86, "learning_rate": 1.0195610890258279e-05, "loss": 0.698, "step": 8256 }, { "epoch": 0.86, "learning_rate": 1.0180784431757195e-05, "loss": 0.6505, "step": 8257 }, { "epoch": 0.86, "learning_rate": 1.0165968183205466e-05, "loss": 0.6452, "step": 8258 }, { "epoch": 0.86, "learning_rate": 1.0151162146287252e-05, "loss": 0.6764, "step": 8259 }, { "epoch": 0.86, "learning_rate": 1.0136366322685597e-05, "loss": 0.6895, "step": 8260 }, { "epoch": 0.86, "learning_rate": 1.0121580714082402e-05, "loss": 0.6497, "step": 8261 }, { "epoch": 0.86, "learning_rate": 1.0106805322158341e-05, "loss": 0.6285, "step": 8262 }, { "epoch": 0.86, "learning_rate": 1.0092040148592974e-05, "loss": 0.6418, "step": 8263 }, { "epoch": 0.86, "learning_rate": 1.0077285195064723e-05, "loss": 0.6763, "step": 8264 }, { "epoch": 0.86, "learning_rate": 1.006254046325078e-05, "loss": 0.6457, "step": 8265 }, { "epoch": 0.86, "learning_rate": 1.0047805954827239e-05, "loss": 0.6731, "step": 8266 }, { "epoch": 0.86, "learning_rate": 1.003308167146898e-05, "loss": 0.6311, "step": 8267 }, { "epoch": 0.86, "learning_rate": 1.0018367614849744e-05, "loss": 0.6155, "step": 8268 }, { "epoch": 0.86, "learning_rate": 1.0003663786642137e-05, "loss": 0.6617, "step": 8269 }, { "epoch": 0.86, "learning_rate": 9.988970188517543e-06, "loss": 0.6372, "step": 8270 }, { "epoch": 0.86, "learning_rate": 9.974286822146229e-06, "loss": 0.6866, "step": 8271 }, { "epoch": 0.86, "learning_rate": 9.959613689197312e-06, "loss": 0.6284, "step": 8272 }, { "epoch": 0.86, "learning_rate": 9.944950791338681e-06, "loss": 0.6617, "step": 8273 }, { "epoch": 0.86, "learning_rate": 9.930298130237104e-06, "loss": 0.6268, "step": 8274 }, { "epoch": 0.86, "learning_rate": 9.915655707558225e-06, "loss": 0.7122, "step": 8275 }, { "epoch": 0.86, "learning_rate": 9.901023524966425e-06, "loss": 0.7034, "step": 8276 }, { "epoch": 0.86, "learning_rate": 9.886401584124993e-06, "loss": 0.6838, "step": 8277 }, { "epoch": 0.86, "learning_rate": 9.87178988669607e-06, "loss": 0.687, "step": 8278 }, { "epoch": 0.86, "learning_rate": 9.85718843434057e-06, "loss": 0.6681, "step": 8279 }, { "epoch": 0.86, "learning_rate": 9.842597228718264e-06, "loss": 0.6296, "step": 8280 }, { "epoch": 0.86, "learning_rate": 9.828016271487805e-06, "loss": 0.6552, "step": 8281 }, { "epoch": 0.86, "learning_rate": 9.81344556430659e-06, "loss": 0.6326, "step": 8282 }, { "epoch": 0.86, "learning_rate": 9.798885108830946e-06, "loss": 0.5631, "step": 8283 }, { "epoch": 0.86, "learning_rate": 9.784334906715975e-06, "loss": 0.6632, "step": 8284 }, { "epoch": 0.86, "learning_rate": 9.76979495961562e-06, "loss": 0.7027, "step": 8285 }, { "epoch": 0.86, "learning_rate": 9.7552652691827e-06, "loss": 0.6843, "step": 8286 }, { "epoch": 0.86, "learning_rate": 9.74074583706881e-06, "loss": 0.6602, "step": 8287 }, { "epoch": 0.86, "learning_rate": 9.726236664924415e-06, "loss": 0.6916, "step": 8288 }, { "epoch": 0.86, "learning_rate": 9.71173775439882e-06, "loss": 0.6815, "step": 8289 }, { "epoch": 0.86, "learning_rate": 9.697249107140117e-06, "loss": 0.6516, "step": 8290 }, { "epoch": 0.86, "learning_rate": 9.682770724795288e-06, "loss": 0.6128, "step": 8291 }, { "epoch": 0.86, "learning_rate": 9.668302609010105e-06, "loss": 0.66, "step": 8292 }, { "epoch": 0.86, "learning_rate": 9.65384476142922e-06, "loss": 0.6268, "step": 8293 }, { "epoch": 0.86, "learning_rate": 9.639397183696042e-06, "loss": 0.6073, "step": 8294 }, { "epoch": 0.86, "learning_rate": 9.62495987745291e-06, "loss": 0.6513, "step": 8295 }, { "epoch": 0.86, "learning_rate": 9.610532844340902e-06, "loss": 0.6562, "step": 8296 }, { "epoch": 0.86, "learning_rate": 9.596116085999984e-06, "loss": 0.7182, "step": 8297 }, { "epoch": 0.86, "learning_rate": 9.581709604068966e-06, "loss": 0.6604, "step": 8298 }, { "epoch": 0.86, "learning_rate": 9.567313400185428e-06, "loss": 0.6967, "step": 8299 }, { "epoch": 0.86, "learning_rate": 9.55292747598584e-06, "loss": 0.6365, "step": 8300 }, { "epoch": 0.86, "learning_rate": 9.538551833105491e-06, "loss": 0.659, "step": 8301 }, { "epoch": 0.86, "learning_rate": 9.524186473178465e-06, "loss": 0.6721, "step": 8302 }, { "epoch": 0.86, "learning_rate": 9.509831397837731e-06, "loss": 0.6175, "step": 8303 }, { "epoch": 0.86, "learning_rate": 9.49548660871502e-06, "loss": 0.6563, "step": 8304 }, { "epoch": 0.86, "learning_rate": 9.481152107440993e-06, "loss": 0.6641, "step": 8305 }, { "epoch": 0.86, "learning_rate": 9.466827895645059e-06, "loss": 0.6893, "step": 8306 }, { "epoch": 0.86, "learning_rate": 9.452513974955456e-06, "loss": 0.7039, "step": 8307 }, { "epoch": 0.86, "learning_rate": 9.43821034699931e-06, "loss": 0.677, "step": 8308 }, { "epoch": 0.86, "learning_rate": 9.42391701340255e-06, "loss": 0.6596, "step": 8309 }, { "epoch": 0.86, "learning_rate": 9.409633975789911e-06, "loss": 0.6938, "step": 8310 }, { "epoch": 0.87, "learning_rate": 9.395361235784984e-06, "loss": 0.7241, "step": 8311 }, { "epoch": 0.87, "learning_rate": 9.381098795010201e-06, "loss": 0.7121, "step": 8312 }, { "epoch": 0.87, "learning_rate": 9.36684665508677e-06, "loss": 0.6472, "step": 8313 }, { "epoch": 0.87, "learning_rate": 9.35260481763478e-06, "loss": 0.6833, "step": 8314 }, { "epoch": 0.87, "learning_rate": 9.33837328427316e-06, "loss": 0.6858, "step": 8315 }, { "epoch": 0.87, "learning_rate": 9.324152056619606e-06, "loss": 0.6586, "step": 8316 }, { "epoch": 0.87, "learning_rate": 9.30994113629069e-06, "loss": 0.6972, "step": 8317 }, { "epoch": 0.87, "learning_rate": 9.295740524901797e-06, "loss": 0.682, "step": 8318 }, { "epoch": 0.87, "learning_rate": 9.281550224067126e-06, "loss": 0.6698, "step": 8319 }, { "epoch": 0.87, "learning_rate": 9.267370235399731e-06, "loss": 0.6578, "step": 8320 }, { "epoch": 0.87, "learning_rate": 9.25320056051151e-06, "loss": 0.6073, "step": 8321 }, { "epoch": 0.87, "learning_rate": 9.23904120101311e-06, "loss": 0.6566, "step": 8322 }, { "epoch": 0.87, "learning_rate": 9.224892158514108e-06, "loss": 0.6678, "step": 8323 }, { "epoch": 0.87, "learning_rate": 9.21075343462281e-06, "loss": 0.6266, "step": 8324 }, { "epoch": 0.87, "learning_rate": 9.196625030946426e-06, "loss": 0.639, "step": 8325 }, { "epoch": 0.87, "learning_rate": 9.182506949090963e-06, "loss": 0.6872, "step": 8326 }, { "epoch": 0.87, "learning_rate": 9.168399190661237e-06, "loss": 0.6131, "step": 8327 }, { "epoch": 0.87, "learning_rate": 9.154301757260918e-06, "loss": 0.6882, "step": 8328 }, { "epoch": 0.87, "learning_rate": 9.140214650492507e-06, "loss": 0.6648, "step": 8329 }, { "epoch": 0.87, "learning_rate": 9.126137871957285e-06, "loss": 0.6656, "step": 8330 }, { "epoch": 0.87, "learning_rate": 9.112071423255431e-06, "loss": 0.6974, "step": 8331 }, { "epoch": 0.87, "learning_rate": 9.098015305985884e-06, "loss": 0.6442, "step": 8332 }, { "epoch": 0.87, "learning_rate": 9.083969521746415e-06, "loss": 0.7142, "step": 8333 }, { "epoch": 0.87, "learning_rate": 9.069934072133669e-06, "loss": 0.6321, "step": 8334 }, { "epoch": 0.87, "learning_rate": 9.055908958743097e-06, "loss": 0.638, "step": 8335 }, { "epoch": 0.87, "learning_rate": 9.041894183168919e-06, "loss": 0.6457, "step": 8336 }, { "epoch": 0.87, "learning_rate": 9.027889747004259e-06, "loss": 0.707, "step": 8337 }, { "epoch": 0.87, "learning_rate": 9.013895651841042e-06, "loss": 0.6733, "step": 8338 }, { "epoch": 0.87, "learning_rate": 8.999911899269986e-06, "loss": 0.6823, "step": 8339 }, { "epoch": 0.87, "learning_rate": 8.985938490880652e-06, "loss": 0.6872, "step": 8340 }, { "epoch": 0.87, "learning_rate": 8.971975428261447e-06, "loss": 0.6842, "step": 8341 }, { "epoch": 0.87, "learning_rate": 8.95802271299957e-06, "loss": 0.6395, "step": 8342 }, { "epoch": 0.87, "learning_rate": 8.944080346681071e-06, "loss": 0.7154, "step": 8343 }, { "epoch": 0.87, "learning_rate": 8.930148330890808e-06, "loss": 0.6936, "step": 8344 }, { "epoch": 0.87, "learning_rate": 8.916226667212424e-06, "loss": 0.7124, "step": 8345 }, { "epoch": 0.87, "learning_rate": 8.902315357228485e-06, "loss": 0.6575, "step": 8346 }, { "epoch": 0.87, "learning_rate": 8.888414402520273e-06, "loss": 0.6496, "step": 8347 }, { "epoch": 0.87, "learning_rate": 8.874523804667967e-06, "loss": 0.6886, "step": 8348 }, { "epoch": 0.87, "learning_rate": 8.860643565250548e-06, "loss": 0.6678, "step": 8349 }, { "epoch": 0.87, "learning_rate": 8.846773685845777e-06, "loss": 0.6821, "step": 8350 }, { "epoch": 0.87, "learning_rate": 8.832914168030305e-06, "loss": 0.5891, "step": 8351 }, { "epoch": 0.87, "learning_rate": 8.81906501337958e-06, "loss": 0.6745, "step": 8352 }, { "epoch": 0.87, "learning_rate": 8.805226223467833e-06, "loss": 0.6761, "step": 8353 }, { "epoch": 0.87, "learning_rate": 8.791397799868173e-06, "loss": 0.6683, "step": 8354 }, { "epoch": 0.87, "learning_rate": 8.77757974415252e-06, "loss": 0.5839, "step": 8355 }, { "epoch": 0.87, "learning_rate": 8.763772057891594e-06, "loss": 0.6157, "step": 8356 }, { "epoch": 0.87, "learning_rate": 8.74997474265492e-06, "loss": 0.6534, "step": 8357 }, { "epoch": 0.87, "learning_rate": 8.736187800010898e-06, "loss": 0.6325, "step": 8358 }, { "epoch": 0.87, "learning_rate": 8.722411231526695e-06, "loss": 0.6658, "step": 8359 }, { "epoch": 0.87, "learning_rate": 8.708645038768349e-06, "loss": 0.6303, "step": 8360 }, { "epoch": 0.87, "learning_rate": 8.694889223300696e-06, "loss": 0.6713, "step": 8361 }, { "epoch": 0.87, "learning_rate": 8.681143786687352e-06, "loss": 0.6985, "step": 8362 }, { "epoch": 0.87, "learning_rate": 8.667408730490844e-06, "loss": 0.7657, "step": 8363 }, { "epoch": 0.87, "learning_rate": 8.653684056272415e-06, "loss": 0.6657, "step": 8364 }, { "epoch": 0.87, "learning_rate": 8.639969765592216e-06, "loss": 0.6885, "step": 8365 }, { "epoch": 0.87, "learning_rate": 8.626265860009175e-06, "loss": 0.6448, "step": 8366 }, { "epoch": 0.87, "learning_rate": 8.612572341081026e-06, "loss": 0.7287, "step": 8367 }, { "epoch": 0.87, "learning_rate": 8.59888921036437e-06, "loss": 0.6429, "step": 8368 }, { "epoch": 0.87, "learning_rate": 8.58521646941457e-06, "loss": 0.6308, "step": 8369 }, { "epoch": 0.87, "learning_rate": 8.571554119785863e-06, "loss": 0.6729, "step": 8370 }, { "epoch": 0.87, "learning_rate": 8.55790216303125e-06, "loss": 0.6875, "step": 8371 }, { "epoch": 0.87, "learning_rate": 8.544260600702615e-06, "loss": 0.7135, "step": 8372 }, { "epoch": 0.87, "learning_rate": 8.53062943435058e-06, "loss": 0.6501, "step": 8373 }, { "epoch": 0.87, "learning_rate": 8.517008665524661e-06, "loss": 0.696, "step": 8374 }, { "epoch": 0.87, "learning_rate": 8.503398295773168e-06, "loss": 0.6785, "step": 8375 }, { "epoch": 0.87, "learning_rate": 8.489798326643195e-06, "loss": 0.7056, "step": 8376 }, { "epoch": 0.87, "learning_rate": 8.476208759680693e-06, "loss": 0.6598, "step": 8377 }, { "epoch": 0.87, "learning_rate": 8.462629596430439e-06, "loss": 0.6766, "step": 8378 }, { "epoch": 0.87, "learning_rate": 8.449060838435963e-06, "loss": 0.6613, "step": 8379 }, { "epoch": 0.87, "learning_rate": 8.435502487239688e-06, "loss": 0.6176, "step": 8380 }, { "epoch": 0.87, "learning_rate": 8.421954544382826e-06, "loss": 0.6567, "step": 8381 }, { "epoch": 0.87, "learning_rate": 8.408417011405389e-06, "loss": 0.742, "step": 8382 }, { "epoch": 0.87, "learning_rate": 8.394889889846214e-06, "loss": 0.7078, "step": 8383 }, { "epoch": 0.87, "learning_rate": 8.381373181242947e-06, "loss": 0.7056, "step": 8384 }, { "epoch": 0.87, "learning_rate": 8.36786688713208e-06, "loss": 0.676, "step": 8385 }, { "epoch": 0.87, "learning_rate": 8.354371009048922e-06, "loss": 0.5847, "step": 8386 }, { "epoch": 0.87, "learning_rate": 8.340885548527545e-06, "loss": 0.7199, "step": 8387 }, { "epoch": 0.87, "learning_rate": 8.327410507100885e-06, "loss": 0.6243, "step": 8388 }, { "epoch": 0.87, "learning_rate": 8.31394588630069e-06, "loss": 0.6432, "step": 8389 }, { "epoch": 0.87, "learning_rate": 8.300491687657496e-06, "loss": 0.6393, "step": 8390 }, { "epoch": 0.87, "learning_rate": 8.287047912700675e-06, "loss": 0.6934, "step": 8391 }, { "epoch": 0.87, "learning_rate": 8.273614562958432e-06, "loss": 0.6685, "step": 8392 }, { "epoch": 0.87, "learning_rate": 8.260191639957727e-06, "loss": 0.7162, "step": 8393 }, { "epoch": 0.87, "learning_rate": 8.246779145224415e-06, "loss": 0.6575, "step": 8394 }, { "epoch": 0.87, "learning_rate": 8.233377080283111e-06, "loss": 0.6332, "step": 8395 }, { "epoch": 0.87, "learning_rate": 8.219985446657219e-06, "loss": 0.7188, "step": 8396 }, { "epoch": 0.87, "learning_rate": 8.206604245869043e-06, "loss": 0.6351, "step": 8397 }, { "epoch": 0.87, "learning_rate": 8.193233479439644e-06, "loss": 0.6756, "step": 8398 }, { "epoch": 0.87, "learning_rate": 8.179873148888884e-06, "loss": 0.6841, "step": 8399 }, { "epoch": 0.87, "learning_rate": 8.166523255735481e-06, "loss": 0.6755, "step": 8400 }, { "epoch": 0.87, "learning_rate": 8.153183801496966e-06, "loss": 0.6448, "step": 8401 }, { "epoch": 0.87, "learning_rate": 8.139854787689616e-06, "loss": 0.7071, "step": 8402 }, { "epoch": 0.87, "learning_rate": 8.126536215828617e-06, "loss": 0.6972, "step": 8403 }, { "epoch": 0.87, "learning_rate": 8.113228087427882e-06, "loss": 0.6608, "step": 8404 }, { "epoch": 0.87, "learning_rate": 8.0999304040002e-06, "loss": 0.7201, "step": 8405 }, { "epoch": 0.87, "learning_rate": 8.086643167057151e-06, "loss": 0.6699, "step": 8406 }, { "epoch": 0.88, "learning_rate": 8.073366378109092e-06, "loss": 0.634, "step": 8407 }, { "epoch": 0.88, "learning_rate": 8.060100038665275e-06, "loss": 0.6719, "step": 8408 }, { "epoch": 0.88, "learning_rate": 8.04684415023368e-06, "loss": 0.7049, "step": 8409 }, { "epoch": 0.88, "learning_rate": 8.033598714321123e-06, "loss": 0.6533, "step": 8410 }, { "epoch": 0.88, "learning_rate": 8.020363732433266e-06, "loss": 0.6204, "step": 8411 }, { "epoch": 0.88, "learning_rate": 8.007139206074566e-06, "loss": 0.658, "step": 8412 }, { "epoch": 0.88, "learning_rate": 7.993925136748248e-06, "loss": 0.7133, "step": 8413 }, { "epoch": 0.88, "learning_rate": 7.980721525956413e-06, "loss": 0.7265, "step": 8414 }, { "epoch": 0.88, "learning_rate": 7.96752837519995e-06, "loss": 0.645, "step": 8415 }, { "epoch": 0.88, "learning_rate": 7.954345685978525e-06, "loss": 0.611, "step": 8416 }, { "epoch": 0.88, "learning_rate": 7.941173459790664e-06, "loss": 0.6505, "step": 8417 }, { "epoch": 0.88, "learning_rate": 7.928011698133697e-06, "loss": 0.6951, "step": 8418 }, { "epoch": 0.88, "learning_rate": 7.91486040250371e-06, "loss": 0.6201, "step": 8419 }, { "epoch": 0.88, "learning_rate": 7.901719574395694e-06, "loss": 0.5938, "step": 8420 }, { "epoch": 0.88, "learning_rate": 7.888589215303355e-06, "loss": 0.5961, "step": 8421 }, { "epoch": 0.88, "learning_rate": 7.875469326719242e-06, "loss": 0.6983, "step": 8422 }, { "epoch": 0.88, "learning_rate": 7.862359910134765e-06, "loss": 0.6735, "step": 8423 }, { "epoch": 0.88, "learning_rate": 7.84926096704005e-06, "loss": 0.6782, "step": 8424 }, { "epoch": 0.88, "learning_rate": 7.83617249892411e-06, "loss": 0.6161, "step": 8425 }, { "epoch": 0.88, "learning_rate": 7.823094507274764e-06, "loss": 0.6321, "step": 8426 }, { "epoch": 0.88, "learning_rate": 7.810026993578567e-06, "loss": 0.6795, "step": 8427 }, { "epoch": 0.88, "learning_rate": 7.796969959320954e-06, "loss": 0.6786, "step": 8428 }, { "epoch": 0.88, "learning_rate": 7.783923405986171e-06, "loss": 0.6736, "step": 8429 }, { "epoch": 0.88, "learning_rate": 7.77088733505721e-06, "loss": 0.7043, "step": 8430 }, { "epoch": 0.88, "learning_rate": 7.757861748015926e-06, "loss": 0.6556, "step": 8431 }, { "epoch": 0.88, "learning_rate": 7.744846646342985e-06, "loss": 0.6435, "step": 8432 }, { "epoch": 0.88, "learning_rate": 7.731842031517823e-06, "loss": 0.6955, "step": 8433 }, { "epoch": 0.88, "learning_rate": 7.718847905018688e-06, "loss": 0.7693, "step": 8434 }, { "epoch": 0.88, "learning_rate": 7.705864268322682e-06, "loss": 0.6655, "step": 8435 }, { "epoch": 0.88, "learning_rate": 7.692891122905666e-06, "loss": 0.6692, "step": 8436 }, { "epoch": 0.88, "learning_rate": 7.679928470242315e-06, "loss": 0.6543, "step": 8437 }, { "epoch": 0.88, "learning_rate": 7.666976311806163e-06, "loss": 0.706, "step": 8438 }, { "epoch": 0.88, "learning_rate": 7.654034649069475e-06, "loss": 0.6866, "step": 8439 }, { "epoch": 0.88, "learning_rate": 7.641103483503354e-06, "loss": 0.69, "step": 8440 }, { "epoch": 0.88, "learning_rate": 7.628182816577756e-06, "loss": 0.69, "step": 8441 }, { "epoch": 0.88, "learning_rate": 7.615272649761351e-06, "loss": 0.6253, "step": 8442 }, { "epoch": 0.88, "learning_rate": 7.602372984521711e-06, "loss": 0.6403, "step": 8443 }, { "epoch": 0.88, "learning_rate": 7.5894838223251386e-06, "loss": 0.6664, "step": 8444 }, { "epoch": 0.88, "learning_rate": 7.576605164636785e-06, "loss": 0.6432, "step": 8445 }, { "epoch": 0.88, "learning_rate": 7.563737012920591e-06, "loss": 0.6962, "step": 8446 }, { "epoch": 0.88, "learning_rate": 7.550879368639319e-06, "loss": 0.634, "step": 8447 }, { "epoch": 0.88, "learning_rate": 7.5380322332545105e-06, "loss": 0.7044, "step": 8448 }, { "epoch": 0.88, "learning_rate": 7.525195608226543e-06, "loss": 0.6234, "step": 8449 }, { "epoch": 0.88, "learning_rate": 7.512369495014571e-06, "loss": 0.6113, "step": 8450 }, { "epoch": 0.88, "learning_rate": 7.499553895076561e-06, "loss": 0.6887, "step": 8451 }, { "epoch": 0.88, "learning_rate": 7.486748809869326e-06, "loss": 0.6323, "step": 8452 }, { "epoch": 0.88, "learning_rate": 7.473954240848413e-06, "loss": 0.699, "step": 8453 }, { "epoch": 0.88, "learning_rate": 7.461170189468214e-06, "loss": 0.6594, "step": 8454 }, { "epoch": 0.88, "learning_rate": 7.448396657181944e-06, "loss": 0.6683, "step": 8455 }, { "epoch": 0.88, "learning_rate": 7.435633645441565e-06, "loss": 0.6548, "step": 8456 }, { "epoch": 0.88, "learning_rate": 7.422881155697892e-06, "loss": 0.6823, "step": 8457 }, { "epoch": 0.88, "learning_rate": 7.410139189400555e-06, "loss": 0.6378, "step": 8458 }, { "epoch": 0.88, "learning_rate": 7.397407747997931e-06, "loss": 0.6582, "step": 8459 }, { "epoch": 0.88, "learning_rate": 7.384686832937226e-06, "loss": 0.6364, "step": 8460 }, { "epoch": 0.88, "learning_rate": 7.371976445664485e-06, "loss": 0.6971, "step": 8461 }, { "epoch": 0.88, "learning_rate": 7.359276587624486e-06, "loss": 0.6423, "step": 8462 }, { "epoch": 0.88, "learning_rate": 7.3465872602608845e-06, "loss": 0.6359, "step": 8463 }, { "epoch": 0.88, "learning_rate": 7.333908465016082e-06, "loss": 0.6529, "step": 8464 }, { "epoch": 0.88, "learning_rate": 7.321240203331303e-06, "loss": 0.7061, "step": 8465 }, { "epoch": 0.88, "learning_rate": 7.308582476646608e-06, "loss": 0.6504, "step": 8466 }, { "epoch": 0.88, "learning_rate": 7.295935286400801e-06, "loss": 0.6759, "step": 8467 }, { "epoch": 0.88, "learning_rate": 7.283298634031522e-06, "loss": 0.6717, "step": 8468 }, { "epoch": 0.88, "learning_rate": 7.2706725209752195e-06, "loss": 0.6636, "step": 8469 }, { "epoch": 0.88, "learning_rate": 7.258056948667113e-06, "loss": 0.621, "step": 8470 }, { "epoch": 0.88, "learning_rate": 7.245451918541257e-06, "loss": 0.6681, "step": 8471 }, { "epoch": 0.88, "learning_rate": 7.232857432030482e-06, "loss": 0.6855, "step": 8472 }, { "epoch": 0.88, "learning_rate": 7.220273490566443e-06, "loss": 0.7041, "step": 8473 }, { "epoch": 0.88, "learning_rate": 7.207700095579573e-06, "loss": 0.603, "step": 8474 }, { "epoch": 0.88, "learning_rate": 7.195137248499129e-06, "loss": 0.6323, "step": 8475 }, { "epoch": 0.88, "learning_rate": 7.1825849507531464e-06, "loss": 0.6584, "step": 8476 }, { "epoch": 0.88, "learning_rate": 7.170043203768472e-06, "loss": 0.6763, "step": 8477 }, { "epoch": 0.88, "learning_rate": 7.157512008970768e-06, "loss": 0.6151, "step": 8478 }, { "epoch": 0.88, "learning_rate": 7.14499136778447e-06, "loss": 0.6169, "step": 8479 }, { "epoch": 0.88, "learning_rate": 7.13248128163283e-06, "loss": 0.6543, "step": 8480 }, { "epoch": 0.88, "learning_rate": 7.119981751937909e-06, "loss": 0.6262, "step": 8481 }, { "epoch": 0.88, "learning_rate": 7.107492780120539e-06, "loss": 0.6867, "step": 8482 }, { "epoch": 0.88, "learning_rate": 7.095014367600395e-06, "loss": 0.6514, "step": 8483 }, { "epoch": 0.88, "learning_rate": 7.082546515795874e-06, "loss": 0.6333, "step": 8484 }, { "epoch": 0.88, "learning_rate": 7.070089226124288e-06, "loss": 0.7009, "step": 8485 }, { "epoch": 0.88, "learning_rate": 7.057642500001649e-06, "loss": 0.7212, "step": 8486 }, { "epoch": 0.88, "learning_rate": 7.045206338842803e-06, "loss": 0.6281, "step": 8487 }, { "epoch": 0.88, "learning_rate": 7.032780744061396e-06, "loss": 0.6599, "step": 8488 }, { "epoch": 0.88, "learning_rate": 7.020365717069888e-06, "loss": 0.6392, "step": 8489 }, { "epoch": 0.88, "learning_rate": 7.0079612592795055e-06, "loss": 0.6686, "step": 8490 }, { "epoch": 0.88, "learning_rate": 6.995567372100298e-06, "loss": 0.6919, "step": 8491 }, { "epoch": 0.88, "learning_rate": 6.983184056941127e-06, "loss": 0.6643, "step": 8492 }, { "epoch": 0.88, "learning_rate": 6.970811315209591e-06, "loss": 0.6065, "step": 8493 }, { "epoch": 0.88, "learning_rate": 6.958449148312151e-06, "loss": 0.6913, "step": 8494 }, { "epoch": 0.88, "learning_rate": 6.946097557654052e-06, "loss": 0.6136, "step": 8495 }, { "epoch": 0.88, "learning_rate": 6.933756544639292e-06, "loss": 0.6589, "step": 8496 }, { "epoch": 0.88, "learning_rate": 6.921426110670748e-06, "loss": 0.7056, "step": 8497 }, { "epoch": 0.88, "learning_rate": 6.909106257150022e-06, "loss": 0.7456, "step": 8498 }, { "epoch": 0.88, "learning_rate": 6.896796985477516e-06, "loss": 0.6807, "step": 8499 }, { "epoch": 0.88, "learning_rate": 6.884498297052477e-06, "loss": 0.6207, "step": 8500 }, { "epoch": 0.88, "learning_rate": 6.872210193272943e-06, "loss": 0.6579, "step": 8501 }, { "epoch": 0.88, "learning_rate": 6.859932675535696e-06, "loss": 0.6763, "step": 8502 }, { "epoch": 0.89, "learning_rate": 6.847665745236376e-06, "loss": 0.6816, "step": 8503 }, { "epoch": 0.89, "learning_rate": 6.835409403769355e-06, "loss": 0.6715, "step": 8504 }, { "epoch": 0.89, "learning_rate": 6.823163652527875e-06, "loss": 0.5934, "step": 8505 }, { "epoch": 0.89, "learning_rate": 6.810928492903934e-06, "loss": 0.6318, "step": 8506 }, { "epoch": 0.89, "learning_rate": 6.798703926288297e-06, "loss": 0.6815, "step": 8507 }, { "epoch": 0.89, "learning_rate": 6.786489954070596e-06, "loss": 0.7225, "step": 8508 }, { "epoch": 0.89, "learning_rate": 6.7742865776392104e-06, "loss": 0.6091, "step": 8509 }, { "epoch": 0.89, "learning_rate": 6.76209379838132e-06, "loss": 0.664, "step": 8510 }, { "epoch": 0.89, "learning_rate": 6.749911617682891e-06, "loss": 0.6436, "step": 8511 }, { "epoch": 0.89, "learning_rate": 6.737740036928741e-06, "loss": 0.6063, "step": 8512 }, { "epoch": 0.89, "learning_rate": 6.725579057502385e-06, "loss": 0.6318, "step": 8513 }, { "epoch": 0.89, "learning_rate": 6.713428680786216e-06, "loss": 0.6608, "step": 8514 }, { "epoch": 0.89, "learning_rate": 6.701288908161407e-06, "loss": 0.6883, "step": 8515 }, { "epoch": 0.89, "learning_rate": 6.689159741007889e-06, "loss": 0.7057, "step": 8516 }, { "epoch": 0.89, "learning_rate": 6.6770411807044244e-06, "loss": 0.6431, "step": 8517 }, { "epoch": 0.89, "learning_rate": 6.664933228628567e-06, "loss": 0.7344, "step": 8518 }, { "epoch": 0.89, "learning_rate": 6.652835886156627e-06, "loss": 0.6771, "step": 8519 }, { "epoch": 0.89, "learning_rate": 6.64074915466375e-06, "loss": 0.6813, "step": 8520 }, { "epoch": 0.89, "learning_rate": 6.628673035523891e-06, "loss": 0.6706, "step": 8521 }, { "epoch": 0.89, "learning_rate": 6.616607530109709e-06, "loss": 0.6844, "step": 8522 }, { "epoch": 0.89, "learning_rate": 6.604552639792771e-06, "loss": 0.689, "step": 8523 }, { "epoch": 0.89, "learning_rate": 6.5925083659433615e-06, "loss": 0.6899, "step": 8524 }, { "epoch": 0.89, "learning_rate": 6.580474709930562e-06, "loss": 0.6297, "step": 8525 }, { "epoch": 0.89, "learning_rate": 6.568451673122311e-06, "loss": 0.6093, "step": 8526 }, { "epoch": 0.89, "learning_rate": 6.556439256885238e-06, "loss": 0.6665, "step": 8527 }, { "epoch": 0.89, "learning_rate": 6.54443746258484e-06, "loss": 0.6656, "step": 8528 }, { "epoch": 0.89, "learning_rate": 6.532446291585426e-06, "loss": 0.6447, "step": 8529 }, { "epoch": 0.89, "learning_rate": 6.520465745250004e-06, "loss": 0.649, "step": 8530 }, { "epoch": 0.89, "learning_rate": 6.508495824940453e-06, "loss": 0.6893, "step": 8531 }, { "epoch": 0.89, "learning_rate": 6.49653653201745e-06, "loss": 0.6811, "step": 8532 }, { "epoch": 0.89, "learning_rate": 6.484587867840375e-06, "loss": 0.6281, "step": 8533 }, { "epoch": 0.89, "learning_rate": 6.472649833767497e-06, "loss": 0.7499, "step": 8534 }, { "epoch": 0.89, "learning_rate": 6.460722431155841e-06, "loss": 0.6331, "step": 8535 }, { "epoch": 0.89, "learning_rate": 6.448805661361223e-06, "loss": 0.6884, "step": 8536 }, { "epoch": 0.89, "learning_rate": 6.4368995257382155e-06, "loss": 0.6567, "step": 8537 }, { "epoch": 0.89, "learning_rate": 6.425004025640247e-06, "loss": 0.6516, "step": 8538 }, { "epoch": 0.89, "learning_rate": 6.41311916241949e-06, "loss": 0.6098, "step": 8539 }, { "epoch": 0.89, "learning_rate": 6.40124493742692e-06, "loss": 0.7085, "step": 8540 }, { "epoch": 0.89, "learning_rate": 6.389381352012336e-06, "loss": 0.6746, "step": 8541 }, { "epoch": 0.89, "learning_rate": 6.377528407524269e-06, "loss": 0.6734, "step": 8542 }, { "epoch": 0.89, "learning_rate": 6.365686105310076e-06, "loss": 0.6696, "step": 8543 }, { "epoch": 0.89, "learning_rate": 6.353854446715901e-06, "loss": 0.7086, "step": 8544 }, { "epoch": 0.89, "learning_rate": 6.342033433086669e-06, "loss": 0.6412, "step": 8545 }, { "epoch": 0.89, "learning_rate": 6.330223065766117e-06, "loss": 0.6709, "step": 8546 }, { "epoch": 0.89, "learning_rate": 6.3184233460967245e-06, "loss": 0.6275, "step": 8547 }, { "epoch": 0.89, "learning_rate": 6.306634275419832e-06, "loss": 0.7093, "step": 8548 }, { "epoch": 0.89, "learning_rate": 6.294855855075499e-06, "loss": 0.7019, "step": 8549 }, { "epoch": 0.89, "learning_rate": 6.283088086402622e-06, "loss": 0.6708, "step": 8550 }, { "epoch": 0.89, "learning_rate": 6.271330970738842e-06, "loss": 0.6612, "step": 8551 }, { "epoch": 0.89, "learning_rate": 6.2595845094206575e-06, "loss": 0.6556, "step": 8552 }, { "epoch": 0.89, "learning_rate": 6.247848703783277e-06, "loss": 0.6133, "step": 8553 }, { "epoch": 0.89, "learning_rate": 6.236123555160755e-06, "loss": 0.7072, "step": 8554 }, { "epoch": 0.89, "learning_rate": 6.224409064885928e-06, "loss": 0.6399, "step": 8555 }, { "epoch": 0.89, "learning_rate": 6.212705234290372e-06, "loss": 0.6952, "step": 8556 }, { "epoch": 0.89, "learning_rate": 6.201012064704504e-06, "loss": 0.6718, "step": 8557 }, { "epoch": 0.89, "learning_rate": 6.189329557457535e-06, "loss": 0.5791, "step": 8558 }, { "epoch": 0.89, "learning_rate": 6.177657713877416e-06, "loss": 0.7298, "step": 8559 }, { "epoch": 0.89, "learning_rate": 6.165996535290919e-06, "loss": 0.6109, "step": 8560 }, { "epoch": 0.89, "learning_rate": 6.1543460230235825e-06, "loss": 0.6779, "step": 8561 }, { "epoch": 0.89, "learning_rate": 6.142706178399782e-06, "loss": 0.6706, "step": 8562 }, { "epoch": 0.89, "learning_rate": 6.131077002742613e-06, "loss": 0.6362, "step": 8563 }, { "epoch": 0.89, "learning_rate": 6.119458497373986e-06, "loss": 0.7682, "step": 8564 }, { "epoch": 0.89, "learning_rate": 6.107850663614611e-06, "loss": 0.6286, "step": 8565 }, { "epoch": 0.89, "learning_rate": 6.096253502784e-06, "loss": 0.6708, "step": 8566 }, { "epoch": 0.89, "learning_rate": 6.084667016200385e-06, "loss": 0.7119, "step": 8567 }, { "epoch": 0.89, "learning_rate": 6.073091205180847e-06, "loss": 0.6944, "step": 8568 }, { "epoch": 0.89, "learning_rate": 6.061526071041257e-06, "loss": 0.6749, "step": 8569 }, { "epoch": 0.89, "learning_rate": 6.049971615096217e-06, "loss": 0.6874, "step": 8570 }, { "epoch": 0.89, "learning_rate": 6.038427838659155e-06, "loss": 0.734, "step": 8571 }, { "epoch": 0.89, "learning_rate": 6.026894743042288e-06, "loss": 0.7095, "step": 8572 }, { "epoch": 0.89, "learning_rate": 6.015372329556601e-06, "loss": 0.7067, "step": 8573 }, { "epoch": 0.89, "learning_rate": 6.00386059951189e-06, "loss": 0.5888, "step": 8574 }, { "epoch": 0.89, "learning_rate": 5.992359554216697e-06, "loss": 0.6902, "step": 8575 }, { "epoch": 0.89, "learning_rate": 5.980869194978356e-06, "loss": 0.6613, "step": 8576 }, { "epoch": 0.89, "learning_rate": 5.969389523103031e-06, "loss": 0.7051, "step": 8577 }, { "epoch": 0.89, "learning_rate": 5.957920539895656e-06, "loss": 0.6917, "step": 8578 }, { "epoch": 0.89, "learning_rate": 5.94646224665989e-06, "loss": 0.6213, "step": 8579 }, { "epoch": 0.89, "learning_rate": 5.935014644698245e-06, "loss": 0.7357, "step": 8580 }, { "epoch": 0.89, "learning_rate": 5.923577735312014e-06, "loss": 0.6052, "step": 8581 }, { "epoch": 0.89, "learning_rate": 5.912151519801213e-06, "loss": 0.6798, "step": 8582 }, { "epoch": 0.89, "learning_rate": 5.900735999464735e-06, "loss": 0.6441, "step": 8583 }, { "epoch": 0.89, "learning_rate": 5.889331175600166e-06, "loss": 0.7344, "step": 8584 }, { "epoch": 0.89, "learning_rate": 5.877937049503934e-06, "loss": 0.692, "step": 8585 }, { "epoch": 0.89, "learning_rate": 5.866553622471249e-06, "loss": 0.7276, "step": 8586 }, { "epoch": 0.89, "learning_rate": 5.855180895796087e-06, "loss": 0.6345, "step": 8587 }, { "epoch": 0.89, "learning_rate": 5.8438188707711675e-06, "loss": 0.6297, "step": 8588 }, { "epoch": 0.89, "learning_rate": 5.832467548688103e-06, "loss": 0.7053, "step": 8589 }, { "epoch": 0.89, "learning_rate": 5.821126930837162e-06, "loss": 0.7055, "step": 8590 }, { "epoch": 0.89, "learning_rate": 5.80979701850749e-06, "loss": 0.6622, "step": 8591 }, { "epoch": 0.89, "learning_rate": 5.798477812987002e-06, "loss": 0.6008, "step": 8592 }, { "epoch": 0.89, "learning_rate": 5.787169315562324e-06, "loss": 0.6677, "step": 8593 }, { "epoch": 0.89, "learning_rate": 5.775871527518962e-06, "loss": 0.6425, "step": 8594 }, { "epoch": 0.89, "learning_rate": 5.764584450141153e-06, "loss": 0.6583, "step": 8595 }, { "epoch": 0.89, "learning_rate": 5.7533080847119055e-06, "loss": 0.6579, "step": 8596 }, { "epoch": 0.89, "learning_rate": 5.74204243251305e-06, "loss": 0.6354, "step": 8597 }, { "epoch": 0.89, "learning_rate": 5.7307874948251736e-06, "loss": 0.6489, "step": 8598 }, { "epoch": 0.9, "learning_rate": 5.719543272927641e-06, "loss": 0.6695, "step": 8599 }, { "epoch": 0.9, "learning_rate": 5.708309768098618e-06, "loss": 0.6033, "step": 8600 }, { "epoch": 0.9, "learning_rate": 5.697086981615052e-06, "loss": 0.6748, "step": 8601 }, { "epoch": 0.9, "learning_rate": 5.6858749147526204e-06, "loss": 0.6707, "step": 8602 }, { "epoch": 0.9, "learning_rate": 5.67467356878586e-06, "loss": 0.6814, "step": 8603 }, { "epoch": 0.9, "learning_rate": 5.663482944988041e-06, "loss": 0.6618, "step": 8604 }, { "epoch": 0.9, "learning_rate": 5.652303044631224e-06, "loss": 0.6959, "step": 8605 }, { "epoch": 0.9, "learning_rate": 5.6411338689862705e-06, "loss": 0.6035, "step": 8606 }, { "epoch": 0.9, "learning_rate": 5.629975419322775e-06, "loss": 0.6639, "step": 8607 }, { "epoch": 0.9, "learning_rate": 5.618827696909168e-06, "loss": 0.6235, "step": 8608 }, { "epoch": 0.9, "learning_rate": 5.6076907030126356e-06, "loss": 0.6668, "step": 8609 }, { "epoch": 0.9, "learning_rate": 5.596564438899132e-06, "loss": 0.6667, "step": 8610 }, { "epoch": 0.9, "learning_rate": 5.585448905833401e-06, "loss": 0.6434, "step": 8611 }, { "epoch": 0.9, "learning_rate": 5.574344105078999e-06, "loss": 0.6594, "step": 8612 }, { "epoch": 0.9, "learning_rate": 5.563250037898204e-06, "loss": 0.6252, "step": 8613 }, { "epoch": 0.9, "learning_rate": 5.5521667055521086e-06, "loss": 0.6164, "step": 8614 }, { "epoch": 0.9, "learning_rate": 5.541094109300593e-06, "loss": 0.6921, "step": 8615 }, { "epoch": 0.9, "learning_rate": 5.530032250402284e-06, "loss": 0.7163, "step": 8616 }, { "epoch": 0.9, "learning_rate": 5.518981130114609e-06, "loss": 0.6606, "step": 8617 }, { "epoch": 0.9, "learning_rate": 5.507940749693796e-06, "loss": 0.6393, "step": 8618 }, { "epoch": 0.9, "learning_rate": 5.496911110394809e-06, "loss": 0.6434, "step": 8619 }, { "epoch": 0.9, "learning_rate": 5.485892213471422e-06, "loss": 0.7019, "step": 8620 }, { "epoch": 0.9, "learning_rate": 5.474884060176178e-06, "loss": 0.6719, "step": 8621 }, { "epoch": 0.9, "learning_rate": 5.463886651760386e-06, "loss": 0.7158, "step": 8622 }, { "epoch": 0.9, "learning_rate": 5.452899989474159e-06, "loss": 0.6766, "step": 8623 }, { "epoch": 0.9, "learning_rate": 5.441924074566362e-06, "loss": 0.6147, "step": 8624 }, { "epoch": 0.9, "learning_rate": 5.430958908284667e-06, "loss": 0.6558, "step": 8625 }, { "epoch": 0.9, "learning_rate": 5.420004491875497e-06, "loss": 0.6704, "step": 8626 }, { "epoch": 0.9, "learning_rate": 5.409060826584078e-06, "loss": 0.5834, "step": 8627 }, { "epoch": 0.9, "learning_rate": 5.398127913654383e-06, "loss": 0.7637, "step": 8628 }, { "epoch": 0.9, "learning_rate": 5.3872057543291945e-06, "loss": 0.6531, "step": 8629 }, { "epoch": 0.9, "learning_rate": 5.376294349850042e-06, "loss": 0.6719, "step": 8630 }, { "epoch": 0.9, "learning_rate": 5.365393701457255e-06, "loss": 0.6615, "step": 8631 }, { "epoch": 0.9, "learning_rate": 5.354503810389966e-06, "loss": 0.635, "step": 8632 }, { "epoch": 0.9, "learning_rate": 5.343624677886005e-06, "loss": 0.7111, "step": 8633 }, { "epoch": 0.9, "learning_rate": 5.332756305182051e-06, "loss": 0.6243, "step": 8634 }, { "epoch": 0.9, "learning_rate": 5.321898693513538e-06, "loss": 0.6818, "step": 8635 }, { "epoch": 0.9, "learning_rate": 5.311051844114667e-06, "loss": 0.6404, "step": 8636 }, { "epoch": 0.9, "learning_rate": 5.300215758218441e-06, "loss": 0.6517, "step": 8637 }, { "epoch": 0.9, "learning_rate": 5.289390437056596e-06, "loss": 0.6187, "step": 8638 }, { "epoch": 0.9, "learning_rate": 5.278575881859693e-06, "loss": 0.6874, "step": 8639 }, { "epoch": 0.9, "learning_rate": 5.267772093857015e-06, "loss": 0.651, "step": 8640 }, { "epoch": 0.9, "learning_rate": 5.256979074276691e-06, "loss": 0.6624, "step": 8641 }, { "epoch": 0.9, "learning_rate": 5.246196824345562e-06, "loss": 0.6709, "step": 8642 }, { "epoch": 0.9, "learning_rate": 5.23542534528928e-06, "loss": 0.669, "step": 8643 }, { "epoch": 0.9, "learning_rate": 5.2246646383322554e-06, "loss": 0.661, "step": 8644 }, { "epoch": 0.9, "learning_rate": 5.213914704697687e-06, "loss": 0.6708, "step": 8645 }, { "epoch": 0.9, "learning_rate": 5.203175545607552e-06, "loss": 0.5937, "step": 8646 }, { "epoch": 0.9, "learning_rate": 5.192447162282576e-06, "loss": 0.7037, "step": 8647 }, { "epoch": 0.9, "learning_rate": 5.181729555942283e-06, "loss": 0.7205, "step": 8648 }, { "epoch": 0.9, "learning_rate": 5.171022727804986e-06, "loss": 0.6842, "step": 8649 }, { "epoch": 0.9, "learning_rate": 5.160326679087735e-06, "loss": 0.6633, "step": 8650 }, { "epoch": 0.9, "learning_rate": 5.149641411006389e-06, "loss": 0.6731, "step": 8651 }, { "epoch": 0.9, "learning_rate": 5.138966924775546e-06, "loss": 0.6065, "step": 8652 }, { "epoch": 0.9, "learning_rate": 5.12830322160861e-06, "loss": 0.6145, "step": 8653 }, { "epoch": 0.9, "learning_rate": 5.1176503027177356e-06, "loss": 0.6666, "step": 8654 }, { "epoch": 0.9, "learning_rate": 5.107008169313887e-06, "loss": 0.667, "step": 8655 }, { "epoch": 0.9, "learning_rate": 5.096376822606752e-06, "loss": 0.6818, "step": 8656 }, { "epoch": 0.9, "learning_rate": 5.085756263804841e-06, "loss": 0.6526, "step": 8657 }, { "epoch": 0.9, "learning_rate": 5.075146494115424e-06, "loss": 0.6424, "step": 8658 }, { "epoch": 0.9, "learning_rate": 5.0645475147445e-06, "loss": 0.6761, "step": 8659 }, { "epoch": 0.9, "learning_rate": 5.0539593268968955e-06, "loss": 0.6774, "step": 8660 }, { "epoch": 0.9, "learning_rate": 5.043381931776226e-06, "loss": 0.6027, "step": 8661 }, { "epoch": 0.9, "learning_rate": 5.032815330584795e-06, "loss": 0.658, "step": 8662 }, { "epoch": 0.9, "learning_rate": 5.022259524523776e-06, "loss": 0.7417, "step": 8663 }, { "epoch": 0.9, "learning_rate": 5.011714514793053e-06, "loss": 0.6255, "step": 8664 }, { "epoch": 0.9, "learning_rate": 5.001180302591279e-06, "loss": 0.5993, "step": 8665 }, { "epoch": 0.9, "learning_rate": 4.990656889115941e-06, "loss": 0.5829, "step": 8666 }, { "epoch": 0.9, "learning_rate": 4.980144275563214e-06, "loss": 0.6511, "step": 8667 }, { "epoch": 0.9, "learning_rate": 4.969642463128122e-06, "loss": 0.6966, "step": 8668 }, { "epoch": 0.9, "learning_rate": 4.95915145300444e-06, "loss": 0.6909, "step": 8669 }, { "epoch": 0.9, "learning_rate": 4.948671246384662e-06, "loss": 0.6799, "step": 8670 }, { "epoch": 0.9, "learning_rate": 4.938201844460133e-06, "loss": 0.6741, "step": 8671 }, { "epoch": 0.9, "learning_rate": 4.927743248420924e-06, "loss": 0.6466, "step": 8672 }, { "epoch": 0.9, "learning_rate": 4.917295459455873e-06, "loss": 0.6717, "step": 8673 }, { "epoch": 0.9, "learning_rate": 4.906858478752618e-06, "loss": 0.6698, "step": 8674 }, { "epoch": 0.9, "learning_rate": 4.896432307497556e-06, "loss": 0.6643, "step": 8675 }, { "epoch": 0.9, "learning_rate": 4.886016946875838e-06, "loss": 0.7273, "step": 8676 }, { "epoch": 0.9, "learning_rate": 4.8756123980714276e-06, "loss": 0.6552, "step": 8677 }, { "epoch": 0.9, "learning_rate": 4.8652186622670125e-06, "loss": 0.588, "step": 8678 }, { "epoch": 0.9, "learning_rate": 4.8548357406440594e-06, "loss": 0.6697, "step": 8679 }, { "epoch": 0.9, "learning_rate": 4.844463634382823e-06, "loss": 0.6609, "step": 8680 }, { "epoch": 0.9, "learning_rate": 4.834102344662361e-06, "loss": 0.6517, "step": 8681 }, { "epoch": 0.9, "learning_rate": 4.82375187266042e-06, "loss": 0.72, "step": 8682 }, { "epoch": 0.9, "learning_rate": 4.813412219553593e-06, "loss": 0.6151, "step": 8683 }, { "epoch": 0.9, "learning_rate": 4.803083386517171e-06, "loss": 0.707, "step": 8684 }, { "epoch": 0.9, "learning_rate": 4.792765374725294e-06, "loss": 0.6306, "step": 8685 }, { "epoch": 0.9, "learning_rate": 4.782458185350825e-06, "loss": 0.6726, "step": 8686 }, { "epoch": 0.9, "learning_rate": 4.772161819565391e-06, "loss": 0.6352, "step": 8687 }, { "epoch": 0.9, "learning_rate": 4.761876278539412e-06, "loss": 0.6991, "step": 8688 }, { "epoch": 0.9, "learning_rate": 4.751601563442076e-06, "loss": 0.651, "step": 8689 }, { "epoch": 0.9, "learning_rate": 4.741337675441326e-06, "loss": 0.6264, "step": 8690 }, { "epoch": 0.9, "learning_rate": 4.7310846157038735e-06, "loss": 0.6626, "step": 8691 }, { "epoch": 0.9, "learning_rate": 4.7208423853952185e-06, "loss": 0.6145, "step": 8692 }, { "epoch": 0.9, "learning_rate": 4.710610985679598e-06, "loss": 0.6508, "step": 8693 }, { "epoch": 0.9, "learning_rate": 4.700390417720058e-06, "loss": 0.6121, "step": 8694 }, { "epoch": 0.91, "learning_rate": 4.690180682678391e-06, "loss": 0.5888, "step": 8695 }, { "epoch": 0.91, "learning_rate": 4.679981781715148e-06, "loss": 0.685, "step": 8696 }, { "epoch": 0.91, "learning_rate": 4.669793715989667e-06, "loss": 0.6838, "step": 8697 }, { "epoch": 0.91, "learning_rate": 4.6596164866600675e-06, "loss": 0.6509, "step": 8698 }, { "epoch": 0.91, "learning_rate": 4.649450094883179e-06, "loss": 0.677, "step": 8699 }, { "epoch": 0.91, "learning_rate": 4.639294541814665e-06, "loss": 0.6394, "step": 8700 }, { "epoch": 0.91, "learning_rate": 4.629149828608936e-06, "loss": 0.7007, "step": 8701 }, { "epoch": 0.91, "learning_rate": 4.619015956419148e-06, "loss": 0.6593, "step": 8702 }, { "epoch": 0.91, "learning_rate": 4.608892926397235e-06, "loss": 0.67, "step": 8703 }, { "epoch": 0.91, "learning_rate": 4.5987807396939305e-06, "loss": 0.6514, "step": 8704 }, { "epoch": 0.91, "learning_rate": 4.588679397458673e-06, "loss": 0.7355, "step": 8705 }, { "epoch": 0.91, "learning_rate": 4.578588900839731e-06, "loss": 0.6953, "step": 8706 }, { "epoch": 0.91, "learning_rate": 4.568509250984099e-06, "loss": 0.7114, "step": 8707 }, { "epoch": 0.91, "learning_rate": 4.55844044903756e-06, "loss": 0.6435, "step": 8708 }, { "epoch": 0.91, "learning_rate": 4.548382496144676e-06, "loss": 0.6199, "step": 8709 }, { "epoch": 0.91, "learning_rate": 4.538335393448723e-06, "loss": 0.699, "step": 8710 }, { "epoch": 0.91, "learning_rate": 4.528299142091785e-06, "loss": 0.6932, "step": 8711 }, { "epoch": 0.91, "learning_rate": 4.518273743214729e-06, "loss": 0.6394, "step": 8712 }, { "epoch": 0.91, "learning_rate": 4.508259197957143e-06, "loss": 0.6767, "step": 8713 }, { "epoch": 0.91, "learning_rate": 4.498255507457416e-06, "loss": 0.6183, "step": 8714 }, { "epoch": 0.91, "learning_rate": 4.4882626728526615e-06, "loss": 0.6682, "step": 8715 }, { "epoch": 0.91, "learning_rate": 4.4782806952788245e-06, "loss": 0.652, "step": 8716 }, { "epoch": 0.91, "learning_rate": 4.468309575870555e-06, "loss": 0.7402, "step": 8717 }, { "epoch": 0.91, "learning_rate": 4.458349315761301e-06, "loss": 0.6249, "step": 8718 }, { "epoch": 0.91, "learning_rate": 4.448399916083257e-06, "loss": 0.6165, "step": 8719 }, { "epoch": 0.91, "learning_rate": 4.438461377967395e-06, "loss": 0.5386, "step": 8720 }, { "epoch": 0.91, "learning_rate": 4.428533702543481e-06, "loss": 0.6491, "step": 8721 }, { "epoch": 0.91, "learning_rate": 4.418616890939964e-06, "loss": 0.6717, "step": 8722 }, { "epoch": 0.91, "learning_rate": 4.4087109442841555e-06, "loss": 0.6686, "step": 8723 }, { "epoch": 0.91, "learning_rate": 4.398815863702066e-06, "loss": 0.6855, "step": 8724 }, { "epoch": 0.91, "learning_rate": 4.388931650318484e-06, "loss": 0.6655, "step": 8725 }, { "epoch": 0.91, "learning_rate": 4.379058305256989e-06, "loss": 0.7186, "step": 8726 }, { "epoch": 0.91, "learning_rate": 4.369195829639883e-06, "loss": 0.6643, "step": 8727 }, { "epoch": 0.91, "learning_rate": 4.359344224588291e-06, "loss": 0.6541, "step": 8728 }, { "epoch": 0.91, "learning_rate": 4.34950349122204e-06, "loss": 0.6681, "step": 8729 }, { "epoch": 0.91, "learning_rate": 4.339673630659735e-06, "loss": 0.7024, "step": 8730 }, { "epoch": 0.91, "learning_rate": 4.329854644018783e-06, "loss": 0.6163, "step": 8731 }, { "epoch": 0.91, "learning_rate": 4.320046532415323e-06, "loss": 0.6654, "step": 8732 }, { "epoch": 0.91, "learning_rate": 4.310249296964264e-06, "loss": 0.5805, "step": 8733 }, { "epoch": 0.91, "learning_rate": 4.300462938779282e-06, "loss": 0.5881, "step": 8734 }, { "epoch": 0.91, "learning_rate": 4.290687458972808e-06, "loss": 0.6255, "step": 8735 }, { "epoch": 0.91, "learning_rate": 4.2809228586560445e-06, "loss": 0.6939, "step": 8736 }, { "epoch": 0.91, "learning_rate": 4.2711691389389576e-06, "loss": 0.6503, "step": 8737 }, { "epoch": 0.91, "learning_rate": 4.261426300930293e-06, "loss": 0.6807, "step": 8738 }, { "epoch": 0.91, "learning_rate": 4.2516943457375e-06, "loss": 0.6484, "step": 8739 }, { "epoch": 0.91, "learning_rate": 4.241973274466871e-06, "loss": 0.647, "step": 8740 }, { "epoch": 0.91, "learning_rate": 4.232263088223387e-06, "loss": 0.7202, "step": 8741 }, { "epoch": 0.91, "learning_rate": 4.222563788110856e-06, "loss": 0.62, "step": 8742 }, { "epoch": 0.91, "learning_rate": 4.212875375231806e-06, "loss": 0.6447, "step": 8743 }, { "epoch": 0.91, "learning_rate": 4.203197850687523e-06, "loss": 0.6154, "step": 8744 }, { "epoch": 0.91, "learning_rate": 4.193531215578095e-06, "loss": 0.5697, "step": 8745 }, { "epoch": 0.91, "learning_rate": 4.183875471002363e-06, "loss": 0.634, "step": 8746 }, { "epoch": 0.91, "learning_rate": 4.174230618057872e-06, "loss": 0.6164, "step": 8747 }, { "epoch": 0.91, "learning_rate": 4.164596657841013e-06, "loss": 0.6502, "step": 8748 }, { "epoch": 0.91, "learning_rate": 4.154973591446898e-06, "loss": 0.6924, "step": 8749 }, { "epoch": 0.91, "learning_rate": 4.145361419969373e-06, "loss": 0.6519, "step": 8750 }, { "epoch": 0.91, "learning_rate": 4.135760144501099e-06, "loss": 0.6518, "step": 8751 }, { "epoch": 0.91, "learning_rate": 4.126169766133481e-06, "loss": 0.6406, "step": 8752 }, { "epoch": 0.91, "learning_rate": 4.116590285956657e-06, "loss": 0.6844, "step": 8753 }, { "epoch": 0.91, "learning_rate": 4.107021705059566e-06, "loss": 0.7338, "step": 8754 }, { "epoch": 0.91, "learning_rate": 4.097464024529873e-06, "loss": 0.6917, "step": 8755 }, { "epoch": 0.91, "learning_rate": 4.087917245454021e-06, "loss": 0.7247, "step": 8756 }, { "epoch": 0.91, "learning_rate": 4.078381368917228e-06, "loss": 0.6682, "step": 8757 }, { "epoch": 0.91, "learning_rate": 4.068856396003462e-06, "loss": 0.6721, "step": 8758 }, { "epoch": 0.91, "learning_rate": 4.059342327795412e-06, "loss": 0.6315, "step": 8759 }, { "epoch": 0.91, "learning_rate": 4.049839165374602e-06, "loss": 0.6461, "step": 8760 }, { "epoch": 0.91, "learning_rate": 4.040346909821269e-06, "loss": 0.6243, "step": 8761 }, { "epoch": 0.91, "learning_rate": 4.0308655622144036e-06, "loss": 0.6762, "step": 8762 }, { "epoch": 0.91, "learning_rate": 4.021395123631799e-06, "loss": 0.5625, "step": 8763 }, { "epoch": 0.91, "learning_rate": 4.01193559514994e-06, "loss": 0.6915, "step": 8764 }, { "epoch": 0.91, "learning_rate": 4.0024869778441444e-06, "loss": 0.6809, "step": 8765 }, { "epoch": 0.91, "learning_rate": 3.993049272788452e-06, "loss": 0.7097, "step": 8766 }, { "epoch": 0.91, "learning_rate": 3.983622481055671e-06, "loss": 0.6208, "step": 8767 }, { "epoch": 0.91, "learning_rate": 3.974206603717345e-06, "loss": 0.7336, "step": 8768 }, { "epoch": 0.91, "learning_rate": 3.9648016418438295e-06, "loss": 0.6625, "step": 8769 }, { "epoch": 0.91, "learning_rate": 3.955407596504168e-06, "loss": 0.6776, "step": 8770 }, { "epoch": 0.91, "learning_rate": 3.94602446876623e-06, "loss": 0.6574, "step": 8771 }, { "epoch": 0.91, "learning_rate": 3.9366522596966275e-06, "loss": 0.7115, "step": 8772 }, { "epoch": 0.91, "learning_rate": 3.927290970360687e-06, "loss": 0.6838, "step": 8773 }, { "epoch": 0.91, "learning_rate": 3.917940601822534e-06, "loss": 0.6409, "step": 8774 }, { "epoch": 0.91, "learning_rate": 3.908601155145075e-06, "loss": 0.6172, "step": 8775 }, { "epoch": 0.91, "learning_rate": 3.899272631389916e-06, "loss": 0.5918, "step": 8776 }, { "epoch": 0.91, "learning_rate": 3.889955031617454e-06, "loss": 0.7018, "step": 8777 }, { "epoch": 0.91, "learning_rate": 3.880648356886862e-06, "loss": 0.6659, "step": 8778 }, { "epoch": 0.91, "learning_rate": 3.87135260825604e-06, "loss": 0.6481, "step": 8779 }, { "epoch": 0.91, "learning_rate": 3.8620677867816315e-06, "loss": 0.6436, "step": 8780 }, { "epoch": 0.91, "learning_rate": 3.852793893519102e-06, "loss": 0.6649, "step": 8781 }, { "epoch": 0.91, "learning_rate": 3.8435309295226096e-06, "loss": 0.6496, "step": 8782 }, { "epoch": 0.91, "learning_rate": 3.834278895845111e-06, "loss": 0.6073, "step": 8783 }, { "epoch": 0.91, "learning_rate": 3.8250377935382776e-06, "loss": 0.6224, "step": 8784 }, { "epoch": 0.91, "learning_rate": 3.815807623652601e-06, "loss": 0.67, "step": 8785 }, { "epoch": 0.91, "learning_rate": 3.8065883872372866e-06, "loss": 0.6903, "step": 8786 }, { "epoch": 0.91, "learning_rate": 3.7973800853402852e-06, "loss": 0.6861, "step": 8787 }, { "epoch": 0.91, "learning_rate": 3.7881827190083374e-06, "loss": 0.6036, "step": 8788 }, { "epoch": 0.91, "learning_rate": 3.77899628928694e-06, "loss": 0.621, "step": 8789 }, { "epoch": 0.91, "learning_rate": 3.7698207972203135e-06, "loss": 0.696, "step": 8790 }, { "epoch": 0.92, "learning_rate": 3.760656243851468e-06, "loss": 0.6976, "step": 8791 }, { "epoch": 0.92, "learning_rate": 3.751502630222181e-06, "loss": 0.647, "step": 8792 }, { "epoch": 0.92, "learning_rate": 3.742359957372932e-06, "loss": 0.6349, "step": 8793 }, { "epoch": 0.92, "learning_rate": 3.7332282263429774e-06, "loss": 0.6888, "step": 8794 }, { "epoch": 0.92, "learning_rate": 3.7241074381703876e-06, "loss": 0.6774, "step": 8795 }, { "epoch": 0.92, "learning_rate": 3.7149975938919003e-06, "loss": 0.6803, "step": 8796 }, { "epoch": 0.92, "learning_rate": 3.7058986945430643e-06, "loss": 0.6968, "step": 8797 }, { "epoch": 0.92, "learning_rate": 3.6968107411581963e-06, "loss": 0.6924, "step": 8798 }, { "epoch": 0.92, "learning_rate": 3.6877337347703045e-06, "loss": 0.6706, "step": 8799 }, { "epoch": 0.92, "learning_rate": 3.678667676411207e-06, "loss": 0.5971, "step": 8800 }, { "epoch": 0.92, "learning_rate": 3.669612567111491e-06, "loss": 0.625, "step": 8801 }, { "epoch": 0.92, "learning_rate": 3.6605684079004333e-06, "loss": 0.7324, "step": 8802 }, { "epoch": 0.92, "learning_rate": 3.651535199806122e-06, "loss": 0.6761, "step": 8803 }, { "epoch": 0.92, "learning_rate": 3.6425129438553698e-06, "loss": 0.6634, "step": 8804 }, { "epoch": 0.92, "learning_rate": 3.6335016410737778e-06, "loss": 0.7213, "step": 8805 }, { "epoch": 0.92, "learning_rate": 3.62450129248566e-06, "loss": 0.6313, "step": 8806 }, { "epoch": 0.92, "learning_rate": 3.615511899114099e-06, "loss": 0.6426, "step": 8807 }, { "epoch": 0.92, "learning_rate": 3.606533461980965e-06, "loss": 0.6521, "step": 8808 }, { "epoch": 0.92, "learning_rate": 3.597565982106843e-06, "loss": 0.6907, "step": 8809 }, { "epoch": 0.92, "learning_rate": 3.588609460511083e-06, "loss": 0.6162, "step": 8810 }, { "epoch": 0.92, "learning_rate": 3.5796638982118047e-06, "loss": 0.6835, "step": 8811 }, { "epoch": 0.92, "learning_rate": 3.570729296225872e-06, "loss": 0.6587, "step": 8812 }, { "epoch": 0.92, "learning_rate": 3.5618056555688726e-06, "loss": 0.7015, "step": 8813 }, { "epoch": 0.92, "learning_rate": 3.5528929772551955e-06, "loss": 0.6787, "step": 8814 }, { "epoch": 0.92, "learning_rate": 3.5439912622979855e-06, "loss": 0.6604, "step": 8815 }, { "epoch": 0.92, "learning_rate": 3.5351005117090772e-06, "loss": 0.6489, "step": 8816 }, { "epoch": 0.92, "learning_rate": 3.526220726499152e-06, "loss": 0.741, "step": 8817 }, { "epoch": 0.92, "learning_rate": 3.517351907677535e-06, "loss": 0.6869, "step": 8818 }, { "epoch": 0.92, "learning_rate": 3.5084940562524205e-06, "loss": 0.674, "step": 8819 }, { "epoch": 0.92, "learning_rate": 3.499647173230669e-06, "loss": 0.7065, "step": 8820 }, { "epoch": 0.92, "learning_rate": 3.490811259617932e-06, "loss": 0.7294, "step": 8821 }, { "epoch": 0.92, "learning_rate": 3.481986316418606e-06, "loss": 0.6559, "step": 8822 }, { "epoch": 0.92, "learning_rate": 3.4731723446358555e-06, "loss": 0.6181, "step": 8823 }, { "epoch": 0.92, "learning_rate": 3.4643693452715565e-06, "loss": 0.7079, "step": 8824 }, { "epoch": 0.92, "learning_rate": 3.4555773193263864e-06, "loss": 0.7093, "step": 8825 }, { "epoch": 0.92, "learning_rate": 3.4467962677997565e-06, "loss": 0.5822, "step": 8826 }, { "epoch": 0.92, "learning_rate": 3.4380261916898027e-06, "loss": 0.6086, "step": 8827 }, { "epoch": 0.92, "learning_rate": 3.429267091993471e-06, "loss": 0.6628, "step": 8828 }, { "epoch": 0.92, "learning_rate": 3.420518969706421e-06, "loss": 0.6385, "step": 8829 }, { "epoch": 0.92, "learning_rate": 3.411781825823046e-06, "loss": 0.6327, "step": 8830 }, { "epoch": 0.92, "learning_rate": 3.4030556613365627e-06, "loss": 0.6189, "step": 8831 }, { "epoch": 0.92, "learning_rate": 3.3943404772388553e-06, "loss": 0.6356, "step": 8832 }, { "epoch": 0.92, "learning_rate": 3.3856362745205982e-06, "loss": 0.6284, "step": 8833 }, { "epoch": 0.92, "learning_rate": 3.376943054171222e-06, "loss": 0.7031, "step": 8834 }, { "epoch": 0.92, "learning_rate": 3.368260817178925e-06, "loss": 0.608, "step": 8835 }, { "epoch": 0.92, "learning_rate": 3.3595895645306185e-06, "loss": 0.6617, "step": 8836 }, { "epoch": 0.92, "learning_rate": 3.350929297211969e-06, "loss": 0.7153, "step": 8837 }, { "epoch": 0.92, "learning_rate": 3.3422800162074554e-06, "loss": 0.6647, "step": 8838 }, { "epoch": 0.92, "learning_rate": 3.3336417225002027e-06, "loss": 0.6435, "step": 8839 }, { "epoch": 0.92, "learning_rate": 3.3250144170721808e-06, "loss": 0.6232, "step": 8840 }, { "epoch": 0.92, "learning_rate": 3.3163981009040836e-06, "loss": 0.7109, "step": 8841 }, { "epoch": 0.92, "learning_rate": 3.307792774975316e-06, "loss": 0.6672, "step": 8842 }, { "epoch": 0.92, "learning_rate": 3.299198440264084e-06, "loss": 0.6726, "step": 8843 }, { "epoch": 0.92, "learning_rate": 3.2906150977473184e-06, "loss": 0.7411, "step": 8844 }, { "epoch": 0.92, "learning_rate": 3.2820427484006933e-06, "loss": 0.6611, "step": 8845 }, { "epoch": 0.92, "learning_rate": 3.2734813931986854e-06, "loss": 0.5927, "step": 8846 }, { "epoch": 0.92, "learning_rate": 3.2649310331144376e-06, "loss": 0.617, "step": 8847 }, { "epoch": 0.92, "learning_rate": 3.256391669119907e-06, "loss": 0.6552, "step": 8848 }, { "epoch": 0.92, "learning_rate": 3.247863302185794e-06, "loss": 0.7091, "step": 8849 }, { "epoch": 0.92, "learning_rate": 3.2393459332815234e-06, "loss": 0.6863, "step": 8850 }, { "epoch": 0.92, "learning_rate": 3.2308395633752764e-06, "loss": 0.6844, "step": 8851 }, { "epoch": 0.92, "learning_rate": 3.2223441934340237e-06, "loss": 0.6558, "step": 8852 }, { "epoch": 0.92, "learning_rate": 3.2138598244234155e-06, "loss": 0.6067, "step": 8853 }, { "epoch": 0.92, "learning_rate": 3.2053864573079017e-06, "loss": 0.5795, "step": 8854 }, { "epoch": 0.92, "learning_rate": 3.1969240930506796e-06, "loss": 0.6838, "step": 8855 }, { "epoch": 0.92, "learning_rate": 3.18847273261369e-06, "loss": 0.7195, "step": 8856 }, { "epoch": 0.92, "learning_rate": 3.1800323769575756e-06, "loss": 0.6951, "step": 8857 }, { "epoch": 0.92, "learning_rate": 3.171603027041825e-06, "loss": 0.6646, "step": 8858 }, { "epoch": 0.92, "learning_rate": 3.1631846838245714e-06, "loss": 0.5914, "step": 8859 }, { "epoch": 0.92, "learning_rate": 3.154777348262772e-06, "loss": 0.6541, "step": 8860 }, { "epoch": 0.92, "learning_rate": 3.146381021312117e-06, "loss": 0.6184, "step": 8861 }, { "epoch": 0.92, "learning_rate": 3.1379957039270213e-06, "loss": 0.6751, "step": 8862 }, { "epoch": 0.92, "learning_rate": 3.129621397060667e-06, "loss": 0.6719, "step": 8863 }, { "epoch": 0.92, "learning_rate": 3.12125810166497e-06, "loss": 0.6636, "step": 8864 }, { "epoch": 0.92, "learning_rate": 3.1129058186906033e-06, "loss": 0.6444, "step": 8865 }, { "epoch": 0.92, "learning_rate": 3.104564549087019e-06, "loss": 0.6626, "step": 8866 }, { "epoch": 0.92, "learning_rate": 3.096234293802358e-06, "loss": 0.6875, "step": 8867 }, { "epoch": 0.92, "learning_rate": 3.087915053783541e-06, "loss": 0.7161, "step": 8868 }, { "epoch": 0.92, "learning_rate": 3.079606829976267e-06, "loss": 0.6809, "step": 8869 }, { "epoch": 0.92, "learning_rate": 3.071309623324914e-06, "loss": 0.6822, "step": 8870 }, { "epoch": 0.92, "learning_rate": 3.0630234347726383e-06, "loss": 0.6748, "step": 8871 }, { "epoch": 0.92, "learning_rate": 3.054748265261387e-06, "loss": 0.6583, "step": 8872 }, { "epoch": 0.92, "learning_rate": 3.046484115731785e-06, "loss": 0.6937, "step": 8873 }, { "epoch": 0.92, "learning_rate": 3.0382309871232364e-06, "loss": 0.6727, "step": 8874 }, { "epoch": 0.92, "learning_rate": 3.029988880373924e-06, "loss": 0.7291, "step": 8875 }, { "epoch": 0.92, "learning_rate": 3.021757796420721e-06, "loss": 0.6148, "step": 8876 }, { "epoch": 0.92, "learning_rate": 3.013537736199268e-06, "loss": 0.738, "step": 8877 }, { "epoch": 0.92, "learning_rate": 3.0053287006439832e-06, "loss": 0.6818, "step": 8878 }, { "epoch": 0.92, "learning_rate": 2.997130690687977e-06, "loss": 0.6546, "step": 8879 }, { "epoch": 0.92, "learning_rate": 2.988943707263148e-06, "loss": 0.6727, "step": 8880 }, { "epoch": 0.92, "learning_rate": 2.9807677513001397e-06, "loss": 0.6649, "step": 8881 }, { "epoch": 0.92, "learning_rate": 2.9726028237283097e-06, "loss": 0.6813, "step": 8882 }, { "epoch": 0.92, "learning_rate": 2.9644489254758045e-06, "loss": 0.6889, "step": 8883 }, { "epoch": 0.92, "learning_rate": 2.9563060574694822e-06, "loss": 0.6816, "step": 8884 }, { "epoch": 0.92, "learning_rate": 2.9481742206349584e-06, "loss": 0.6679, "step": 8885 }, { "epoch": 0.92, "learning_rate": 2.9400534158966154e-06, "loss": 0.6283, "step": 8886 }, { "epoch": 0.93, "learning_rate": 2.931943644177537e-06, "loss": 0.6885, "step": 8887 }, { "epoch": 0.93, "learning_rate": 2.9238449063995864e-06, "loss": 0.6684, "step": 8888 }, { "epoch": 0.93, "learning_rate": 2.9157572034833936e-06, "loss": 0.6568, "step": 8889 }, { "epoch": 0.93, "learning_rate": 2.907680536348256e-06, "loss": 0.6535, "step": 8890 }, { "epoch": 0.93, "learning_rate": 2.899614905912307e-06, "loss": 0.7125, "step": 8891 }, { "epoch": 0.93, "learning_rate": 2.8915603130923786e-06, "loss": 0.6, "step": 8892 }, { "epoch": 0.93, "learning_rate": 2.883516758804039e-06, "loss": 0.6617, "step": 8893 }, { "epoch": 0.93, "learning_rate": 2.8754842439616237e-06, "loss": 0.6278, "step": 8894 }, { "epoch": 0.93, "learning_rate": 2.8674627694782132e-06, "loss": 0.6106, "step": 8895 }, { "epoch": 0.93, "learning_rate": 2.859452336265622e-06, "loss": 0.6764, "step": 8896 }, { "epoch": 0.93, "learning_rate": 2.8514529452344007e-06, "loss": 0.6836, "step": 8897 }, { "epoch": 0.93, "learning_rate": 2.8434645972938766e-06, "loss": 0.7339, "step": 8898 }, { "epoch": 0.93, "learning_rate": 2.8354872933520906e-06, "loss": 0.6887, "step": 8899 }, { "epoch": 0.93, "learning_rate": 2.8275210343158386e-06, "loss": 0.6446, "step": 8900 }, { "epoch": 0.93, "learning_rate": 2.819565821090686e-06, "loss": 0.6697, "step": 8901 }, { "epoch": 0.93, "learning_rate": 2.811621654580898e-06, "loss": 0.6082, "step": 8902 }, { "epoch": 0.93, "learning_rate": 2.803688535689519e-06, "loss": 0.6534, "step": 8903 }, { "epoch": 0.93, "learning_rate": 2.795766465318295e-06, "loss": 0.6519, "step": 8904 }, { "epoch": 0.93, "learning_rate": 2.787855444367782e-06, "loss": 0.6704, "step": 8905 }, { "epoch": 0.93, "learning_rate": 2.779955473737228e-06, "loss": 0.5759, "step": 8906 }, { "epoch": 0.93, "learning_rate": 2.772066554324626e-06, "loss": 0.7112, "step": 8907 }, { "epoch": 0.93, "learning_rate": 2.7641886870267585e-06, "loss": 0.709, "step": 8908 }, { "epoch": 0.93, "learning_rate": 2.7563218727391094e-06, "loss": 0.6568, "step": 8909 }, { "epoch": 0.93, "learning_rate": 2.748466112355885e-06, "loss": 0.6228, "step": 8910 }, { "epoch": 0.93, "learning_rate": 2.7406214067701054e-06, "loss": 0.7042, "step": 8911 }, { "epoch": 0.93, "learning_rate": 2.732787756873478e-06, "loss": 0.6218, "step": 8912 }, { "epoch": 0.93, "learning_rate": 2.72496516355647e-06, "loss": 0.6853, "step": 8913 }, { "epoch": 0.93, "learning_rate": 2.717153627708302e-06, "loss": 0.7101, "step": 8914 }, { "epoch": 0.93, "learning_rate": 2.7093531502169424e-06, "loss": 0.6378, "step": 8915 }, { "epoch": 0.93, "learning_rate": 2.701563731969048e-06, "loss": 0.6896, "step": 8916 }, { "epoch": 0.93, "learning_rate": 2.6937853738500883e-06, "loss": 0.7256, "step": 8917 }, { "epoch": 0.93, "learning_rate": 2.6860180767442456e-06, "loss": 0.6745, "step": 8918 }, { "epoch": 0.93, "learning_rate": 2.6782618415344352e-06, "loss": 0.6448, "step": 8919 }, { "epoch": 0.93, "learning_rate": 2.670516669102352e-06, "loss": 0.6624, "step": 8920 }, { "epoch": 0.93, "learning_rate": 2.6627825603283697e-06, "loss": 0.6801, "step": 8921 }, { "epoch": 0.93, "learning_rate": 2.6550595160916514e-06, "loss": 0.6402, "step": 8922 }, { "epoch": 0.93, "learning_rate": 2.647347537270117e-06, "loss": 0.6377, "step": 8923 }, { "epoch": 0.93, "learning_rate": 2.6396466247403663e-06, "loss": 0.6413, "step": 8924 }, { "epoch": 0.93, "learning_rate": 2.631956779377809e-06, "loss": 0.6474, "step": 8925 }, { "epoch": 0.93, "learning_rate": 2.6242780020565683e-06, "loss": 0.6759, "step": 8926 }, { "epoch": 0.93, "learning_rate": 2.6166102936494795e-06, "loss": 0.6461, "step": 8927 }, { "epoch": 0.93, "learning_rate": 2.6089536550281677e-06, "loss": 0.6597, "step": 8928 }, { "epoch": 0.93, "learning_rate": 2.6013080870629813e-06, "loss": 0.6267, "step": 8929 }, { "epoch": 0.93, "learning_rate": 2.5936735906230024e-06, "loss": 0.5862, "step": 8930 }, { "epoch": 0.93, "learning_rate": 2.5860501665760705e-06, "loss": 0.6636, "step": 8931 }, { "epoch": 0.93, "learning_rate": 2.578437815788748e-06, "loss": 0.6864, "step": 8932 }, { "epoch": 0.93, "learning_rate": 2.5708365391263423e-06, "loss": 0.6528, "step": 8933 }, { "epoch": 0.93, "learning_rate": 2.563246337452929e-06, "loss": 0.6672, "step": 8934 }, { "epoch": 0.93, "learning_rate": 2.5556672116312963e-06, "loss": 0.6731, "step": 8935 }, { "epoch": 0.93, "learning_rate": 2.5480991625229543e-06, "loss": 0.7107, "step": 8936 }, { "epoch": 0.93, "learning_rate": 2.540542190988193e-06, "loss": 0.7135, "step": 8937 }, { "epoch": 0.93, "learning_rate": 2.532996297886059e-06, "loss": 0.6388, "step": 8938 }, { "epoch": 0.93, "learning_rate": 2.525461484074276e-06, "loss": 0.6703, "step": 8939 }, { "epoch": 0.93, "learning_rate": 2.5179377504093494e-06, "loss": 0.6249, "step": 8940 }, { "epoch": 0.93, "learning_rate": 2.5104250977465384e-06, "loss": 0.5946, "step": 8941 }, { "epoch": 0.93, "learning_rate": 2.5029235269397934e-06, "loss": 0.5913, "step": 8942 }, { "epoch": 0.93, "learning_rate": 2.4954330388418657e-06, "loss": 0.7094, "step": 8943 }, { "epoch": 0.93, "learning_rate": 2.4879536343041855e-06, "loss": 0.658, "step": 8944 }, { "epoch": 0.93, "learning_rate": 2.4804853141769724e-06, "loss": 0.6748, "step": 8945 }, { "epoch": 0.93, "learning_rate": 2.4730280793091587e-06, "loss": 0.6495, "step": 8946 }, { "epoch": 0.93, "learning_rate": 2.465581930548444e-06, "loss": 0.6905, "step": 8947 }, { "epoch": 0.93, "learning_rate": 2.4581468687412178e-06, "loss": 0.6533, "step": 8948 }, { "epoch": 0.93, "learning_rate": 2.45072289473266e-06, "loss": 0.6158, "step": 8949 }, { "epoch": 0.93, "learning_rate": 2.4433100093666617e-06, "loss": 0.7012, "step": 8950 }, { "epoch": 0.93, "learning_rate": 2.43590821348586e-06, "loss": 0.6061, "step": 8951 }, { "epoch": 0.93, "learning_rate": 2.4285175079316602e-06, "loss": 0.671, "step": 8952 }, { "epoch": 0.93, "learning_rate": 2.421137893544134e-06, "loss": 0.7027, "step": 8953 }, { "epoch": 0.93, "learning_rate": 2.4137693711621776e-06, "loss": 0.6261, "step": 8954 }, { "epoch": 0.93, "learning_rate": 2.4064119416233654e-06, "loss": 0.6475, "step": 8955 }, { "epoch": 0.93, "learning_rate": 2.3990656057640505e-06, "loss": 0.6206, "step": 8956 }, { "epoch": 0.93, "learning_rate": 2.3917303644192867e-06, "loss": 0.662, "step": 8957 }, { "epoch": 0.93, "learning_rate": 2.3844062184229078e-06, "loss": 0.6822, "step": 8958 }, { "epoch": 0.93, "learning_rate": 2.377093168607447e-06, "loss": 0.6475, "step": 8959 }, { "epoch": 0.93, "learning_rate": 2.3697912158042067e-06, "loss": 0.6175, "step": 8960 }, { "epoch": 0.93, "learning_rate": 2.362500360843223e-06, "loss": 0.6473, "step": 8961 }, { "epoch": 0.93, "learning_rate": 2.355220604553232e-06, "loss": 0.6096, "step": 8962 }, { "epoch": 0.93, "learning_rate": 2.347951947761784e-06, "loss": 0.6469, "step": 8963 }, { "epoch": 0.93, "learning_rate": 2.3406943912950842e-06, "loss": 0.6823, "step": 8964 }, { "epoch": 0.93, "learning_rate": 2.333447935978128e-06, "loss": 0.7006, "step": 8965 }, { "epoch": 0.93, "learning_rate": 2.3262125826346458e-06, "loss": 0.6982, "step": 8966 }, { "epoch": 0.93, "learning_rate": 2.318988332087091e-06, "loss": 0.6572, "step": 8967 }, { "epoch": 0.93, "learning_rate": 2.3117751851566504e-06, "loss": 0.6374, "step": 8968 }, { "epoch": 0.93, "learning_rate": 2.30457314266328e-06, "loss": 0.6901, "step": 8969 }, { "epoch": 0.93, "learning_rate": 2.2973822054256357e-06, "loss": 0.6614, "step": 8970 }, { "epoch": 0.93, "learning_rate": 2.29020237426113e-06, "loss": 0.5894, "step": 8971 }, { "epoch": 0.93, "learning_rate": 2.2830336499859108e-06, "loss": 0.6196, "step": 8972 }, { "epoch": 0.93, "learning_rate": 2.275876033414859e-06, "loss": 0.6387, "step": 8973 }, { "epoch": 0.93, "learning_rate": 2.2687295253616016e-06, "loss": 0.6988, "step": 8974 }, { "epoch": 0.93, "learning_rate": 2.2615941266385e-06, "loss": 0.6096, "step": 8975 }, { "epoch": 0.93, "learning_rate": 2.254469838056639e-06, "loss": 0.6511, "step": 8976 }, { "epoch": 0.93, "learning_rate": 2.24735666042587e-06, "loss": 0.666, "step": 8977 }, { "epoch": 0.93, "learning_rate": 2.240254594554758e-06, "loss": 0.6503, "step": 8978 }, { "epoch": 0.93, "learning_rate": 2.2331636412505907e-06, "loss": 0.6156, "step": 8979 }, { "epoch": 0.93, "learning_rate": 2.226083801319445e-06, "loss": 0.6905, "step": 8980 }, { "epoch": 0.93, "learning_rate": 2.2190150755660776e-06, "loss": 0.6962, "step": 8981 }, { "epoch": 0.93, "learning_rate": 2.211957464794012e-06, "loss": 0.6659, "step": 8982 }, { "epoch": 0.94, "learning_rate": 2.2049109698055183e-06, "loss": 0.6127, "step": 8983 }, { "epoch": 0.94, "learning_rate": 2.197875591401566e-06, "loss": 0.7134, "step": 8984 }, { "epoch": 0.94, "learning_rate": 2.190851330381893e-06, "loss": 0.6424, "step": 8985 }, { "epoch": 0.94, "learning_rate": 2.1838381875449622e-06, "loss": 0.6667, "step": 8986 }, { "epoch": 0.94, "learning_rate": 2.1768361636879564e-06, "loss": 0.7217, "step": 8987 }, { "epoch": 0.94, "learning_rate": 2.1698452596068397e-06, "loss": 0.7311, "step": 8988 }, { "epoch": 0.94, "learning_rate": 2.162865476096265e-06, "loss": 0.6465, "step": 8989 }, { "epoch": 0.94, "learning_rate": 2.1558968139496427e-06, "loss": 0.582, "step": 8990 }, { "epoch": 0.94, "learning_rate": 2.148939273959105e-06, "loss": 0.7062, "step": 8991 }, { "epoch": 0.94, "learning_rate": 2.1419928569155646e-06, "loss": 0.5851, "step": 8992 }, { "epoch": 0.94, "learning_rate": 2.1350575636086e-06, "loss": 0.5849, "step": 8993 }, { "epoch": 0.94, "learning_rate": 2.1281333948265816e-06, "loss": 0.6853, "step": 8994 }, { "epoch": 0.94, "learning_rate": 2.121220351356601e-06, "loss": 0.6843, "step": 8995 }, { "epoch": 0.94, "learning_rate": 2.1143184339844523e-06, "loss": 0.6599, "step": 8996 }, { "epoch": 0.94, "learning_rate": 2.1074276434947193e-06, "loss": 0.6879, "step": 8997 }, { "epoch": 0.94, "learning_rate": 2.1005479806706752e-06, "loss": 0.6804, "step": 8998 }, { "epoch": 0.94, "learning_rate": 2.09367944629435e-06, "loss": 0.6317, "step": 8999 }, { "epoch": 0.94, "learning_rate": 2.086822041146519e-06, "loss": 0.6802, "step": 9000 }, { "epoch": 0.94, "learning_rate": 2.0799757660066475e-06, "loss": 0.6111, "step": 9001 }, { "epoch": 0.94, "learning_rate": 2.0731406216530027e-06, "loss": 0.691, "step": 9002 }, { "epoch": 0.94, "learning_rate": 2.0663166088625287e-06, "loss": 0.6749, "step": 9003 }, { "epoch": 0.94, "learning_rate": 2.0595037284109388e-06, "loss": 0.6996, "step": 9004 }, { "epoch": 0.94, "learning_rate": 2.0527019810726468e-06, "loss": 0.66, "step": 9005 }, { "epoch": 0.94, "learning_rate": 2.0459113676208565e-06, "loss": 0.6579, "step": 9006 }, { "epoch": 0.94, "learning_rate": 2.039131888827439e-06, "loss": 0.6494, "step": 9007 }, { "epoch": 0.94, "learning_rate": 2.0323635454630454e-06, "loss": 0.646, "step": 9008 }, { "epoch": 0.94, "learning_rate": 2.025606338297059e-06, "loss": 0.6552, "step": 9009 }, { "epoch": 0.94, "learning_rate": 2.0188602680975775e-06, "loss": 0.6758, "step": 9010 }, { "epoch": 0.94, "learning_rate": 2.012125335631443e-06, "loss": 0.6219, "step": 9011 }, { "epoch": 0.94, "learning_rate": 2.0054015416642202e-06, "loss": 0.7223, "step": 9012 }, { "epoch": 0.94, "learning_rate": 1.9986888869602204e-06, "loss": 0.6327, "step": 9013 }, { "epoch": 0.94, "learning_rate": 1.9919873722825e-06, "loss": 0.7367, "step": 9014 }, { "epoch": 0.94, "learning_rate": 1.985296998392827e-06, "loss": 0.5667, "step": 9015 }, { "epoch": 0.94, "learning_rate": 1.978617766051705e-06, "loss": 0.6305, "step": 9016 }, { "epoch": 0.94, "learning_rate": 1.971949676018381e-06, "loss": 0.69, "step": 9017 }, { "epoch": 0.94, "learning_rate": 1.9652927290508493e-06, "loss": 0.6429, "step": 9018 }, { "epoch": 0.94, "learning_rate": 1.9586469259057828e-06, "loss": 0.701, "step": 9019 }, { "epoch": 0.94, "learning_rate": 1.952012267338665e-06, "loss": 0.7021, "step": 9020 }, { "epoch": 0.94, "learning_rate": 1.945388754103639e-06, "loss": 0.6633, "step": 9021 }, { "epoch": 0.94, "learning_rate": 1.9387763869536224e-06, "loss": 0.6596, "step": 9022 }, { "epoch": 0.94, "learning_rate": 1.932175166640271e-06, "loss": 0.6812, "step": 9023 }, { "epoch": 0.94, "learning_rate": 1.925585093913962e-06, "loss": 0.6774, "step": 9024 }, { "epoch": 0.94, "learning_rate": 1.919006169523785e-06, "loss": 0.6997, "step": 9025 }, { "epoch": 0.94, "learning_rate": 1.912438394217586e-06, "loss": 0.6787, "step": 9026 }, { "epoch": 0.94, "learning_rate": 1.9058817687419462e-06, "loss": 0.6588, "step": 9027 }, { "epoch": 0.94, "learning_rate": 1.8993362938421689e-06, "loss": 0.6493, "step": 9028 }, { "epoch": 0.94, "learning_rate": 1.8928019702622923e-06, "loss": 0.7311, "step": 9029 }, { "epoch": 0.94, "learning_rate": 1.8862787987450781e-06, "loss": 0.6657, "step": 9030 }, { "epoch": 0.94, "learning_rate": 1.879766780032044e-06, "loss": 0.6316, "step": 9031 }, { "epoch": 0.94, "learning_rate": 1.8732659148634202e-06, "loss": 0.6914, "step": 9032 }, { "epoch": 0.94, "learning_rate": 1.866776203978171e-06, "loss": 0.5707, "step": 9033 }, { "epoch": 0.94, "learning_rate": 1.8602976481140066e-06, "loss": 0.6609, "step": 9034 }, { "epoch": 0.94, "learning_rate": 1.8538302480073488e-06, "loss": 0.6283, "step": 9035 }, { "epoch": 0.94, "learning_rate": 1.8473740043933763e-06, "loss": 0.6878, "step": 9036 }, { "epoch": 0.94, "learning_rate": 1.8409289180059575e-06, "loss": 0.698, "step": 9037 }, { "epoch": 0.94, "learning_rate": 1.8344949895777397e-06, "loss": 0.6316, "step": 9038 }, { "epoch": 0.94, "learning_rate": 1.8280722198400712e-06, "loss": 0.682, "step": 9039 }, { "epoch": 0.94, "learning_rate": 1.821660609523057e-06, "loss": 0.6659, "step": 9040 }, { "epoch": 0.94, "learning_rate": 1.815260159355503e-06, "loss": 0.6151, "step": 9041 }, { "epoch": 0.94, "learning_rate": 1.8088708700649714e-06, "loss": 0.6825, "step": 9042 }, { "epoch": 0.94, "learning_rate": 1.8024927423777481e-06, "loss": 0.6815, "step": 9043 }, { "epoch": 0.94, "learning_rate": 1.7961257770188423e-06, "loss": 0.6766, "step": 9044 }, { "epoch": 0.94, "learning_rate": 1.7897699747119968e-06, "loss": 0.6812, "step": 9045 }, { "epoch": 0.94, "learning_rate": 1.7834253361797115e-06, "loss": 0.6077, "step": 9046 }, { "epoch": 0.94, "learning_rate": 1.7770918621431765e-06, "loss": 0.6764, "step": 9047 }, { "epoch": 0.94, "learning_rate": 1.7707695533223378e-06, "loss": 0.6438, "step": 9048 }, { "epoch": 0.94, "learning_rate": 1.7644584104358653e-06, "loss": 0.6559, "step": 9049 }, { "epoch": 0.94, "learning_rate": 1.7581584342011626e-06, "loss": 0.6876, "step": 9050 }, { "epoch": 0.94, "learning_rate": 1.7518696253343569e-06, "loss": 0.6652, "step": 9051 }, { "epoch": 0.94, "learning_rate": 1.7455919845503211e-06, "loss": 0.6404, "step": 9052 }, { "epoch": 0.94, "learning_rate": 1.7393255125626395e-06, "loss": 0.6737, "step": 9053 }, { "epoch": 0.94, "learning_rate": 1.7330702100836315e-06, "loss": 0.6802, "step": 9054 }, { "epoch": 0.94, "learning_rate": 1.7268260778243617e-06, "loss": 0.6381, "step": 9055 }, { "epoch": 0.94, "learning_rate": 1.7205931164946176e-06, "loss": 0.6657, "step": 9056 }, { "epoch": 0.94, "learning_rate": 1.7143713268028884e-06, "loss": 0.6629, "step": 9057 }, { "epoch": 0.94, "learning_rate": 1.7081607094564522e-06, "loss": 0.6573, "step": 9058 }, { "epoch": 0.94, "learning_rate": 1.701961265161267e-06, "loss": 0.6892, "step": 9059 }, { "epoch": 0.94, "learning_rate": 1.6957729946220468e-06, "loss": 0.6093, "step": 9060 }, { "epoch": 0.94, "learning_rate": 1.6895958985422066e-06, "loss": 0.6359, "step": 9061 }, { "epoch": 0.94, "learning_rate": 1.6834299776239292e-06, "loss": 0.6841, "step": 9062 }, { "epoch": 0.94, "learning_rate": 1.6772752325680984e-06, "loss": 0.6175, "step": 9063 }, { "epoch": 0.94, "learning_rate": 1.6711316640743325e-06, "loss": 0.6389, "step": 9064 }, { "epoch": 0.94, "learning_rate": 1.6649992728409947e-06, "loss": 0.6769, "step": 9065 }, { "epoch": 0.94, "learning_rate": 1.6588780595651832e-06, "loss": 0.7234, "step": 9066 }, { "epoch": 0.94, "learning_rate": 1.6527680249426747e-06, "loss": 0.7046, "step": 9067 }, { "epoch": 0.94, "learning_rate": 1.6466691696680247e-06, "loss": 0.6538, "step": 9068 }, { "epoch": 0.94, "learning_rate": 1.6405814944345233e-06, "loss": 0.6773, "step": 9069 }, { "epoch": 0.94, "learning_rate": 1.6345049999341389e-06, "loss": 0.6714, "step": 9070 }, { "epoch": 0.94, "learning_rate": 1.628439686857619e-06, "loss": 0.7061, "step": 9071 }, { "epoch": 0.94, "learning_rate": 1.6223855558944235e-06, "loss": 0.6894, "step": 9072 }, { "epoch": 0.94, "learning_rate": 1.616342607732735e-06, "loss": 0.7342, "step": 9073 }, { "epoch": 0.94, "learning_rate": 1.6103108430594593e-06, "loss": 0.6357, "step": 9074 }, { "epoch": 0.94, "learning_rate": 1.6042902625602484e-06, "loss": 0.6501, "step": 9075 }, { "epoch": 0.94, "learning_rate": 1.5982808669194772e-06, "loss": 0.6495, "step": 9076 }, { "epoch": 0.94, "learning_rate": 1.592282656820232e-06, "loss": 0.6835, "step": 9077 }, { "epoch": 0.94, "learning_rate": 1.5862956329443678e-06, "loss": 0.6343, "step": 9078 }, { "epoch": 0.95, "learning_rate": 1.5803197959724292e-06, "loss": 0.7794, "step": 9079 }, { "epoch": 0.95, "learning_rate": 1.5743551465836947e-06, "loss": 0.6858, "step": 9080 }, { "epoch": 0.95, "learning_rate": 1.5684016854561888e-06, "loss": 0.6846, "step": 9081 }, { "epoch": 0.95, "learning_rate": 1.5624594132666592e-06, "loss": 0.7036, "step": 9082 }, { "epoch": 0.95, "learning_rate": 1.5565283306905653e-06, "loss": 0.6834, "step": 9083 }, { "epoch": 0.95, "learning_rate": 1.5506084384021125e-06, "loss": 0.6957, "step": 9084 }, { "epoch": 0.95, "learning_rate": 1.5446997370742289e-06, "loss": 0.6336, "step": 9085 }, { "epoch": 0.95, "learning_rate": 1.5388022273785775e-06, "loss": 0.6576, "step": 9086 }, { "epoch": 0.95, "learning_rate": 1.5329159099855217e-06, "loss": 0.6385, "step": 9087 }, { "epoch": 0.95, "learning_rate": 1.5270407855641934e-06, "loss": 0.6444, "step": 9088 }, { "epoch": 0.95, "learning_rate": 1.5211768547824245e-06, "loss": 0.6805, "step": 9089 }, { "epoch": 0.95, "learning_rate": 1.5153241183067711e-06, "loss": 0.7182, "step": 9090 }, { "epoch": 0.95, "learning_rate": 1.5094825768025233e-06, "loss": 0.6118, "step": 9091 }, { "epoch": 0.95, "learning_rate": 1.5036522309337274e-06, "loss": 0.6476, "step": 9092 }, { "epoch": 0.95, "learning_rate": 1.4978330813630982e-06, "loss": 0.6152, "step": 9093 }, { "epoch": 0.95, "learning_rate": 1.4920251287521392e-06, "loss": 0.675, "step": 9094 }, { "epoch": 0.95, "learning_rate": 1.4862283737610449e-06, "loss": 0.7037, "step": 9095 }, { "epoch": 0.95, "learning_rate": 1.4804428170487438e-06, "loss": 0.6348, "step": 9096 }, { "epoch": 0.95, "learning_rate": 1.4746684592728876e-06, "loss": 0.6623, "step": 9097 }, { "epoch": 0.95, "learning_rate": 1.4689053010898735e-06, "loss": 0.6823, "step": 9098 }, { "epoch": 0.95, "learning_rate": 1.4631533431547994e-06, "loss": 0.6881, "step": 9099 }, { "epoch": 0.95, "learning_rate": 1.4574125861215093e-06, "loss": 0.6181, "step": 9100 }, { "epoch": 0.95, "learning_rate": 1.4516830306425699e-06, "loss": 0.6502, "step": 9101 }, { "epoch": 0.95, "learning_rate": 1.4459646773692603e-06, "loss": 0.6417, "step": 9102 }, { "epoch": 0.95, "learning_rate": 1.4402575269516272e-06, "loss": 0.6643, "step": 9103 }, { "epoch": 0.95, "learning_rate": 1.4345615800383737e-06, "loss": 0.7056, "step": 9104 }, { "epoch": 0.95, "learning_rate": 1.4288768372769935e-06, "loss": 0.6758, "step": 9105 }, { "epoch": 0.95, "learning_rate": 1.4232032993137022e-06, "loss": 0.6683, "step": 9106 }, { "epoch": 0.95, "learning_rate": 1.4175409667933848e-06, "loss": 0.7293, "step": 9107 }, { "epoch": 0.95, "learning_rate": 1.4118898403597147e-06, "loss": 0.6123, "step": 9108 }, { "epoch": 0.95, "learning_rate": 1.4062499206550671e-06, "loss": 0.6722, "step": 9109 }, { "epoch": 0.95, "learning_rate": 1.4006212083205406e-06, "loss": 0.7414, "step": 9110 }, { "epoch": 0.95, "learning_rate": 1.3950037039959563e-06, "loss": 0.7, "step": 9111 }, { "epoch": 0.95, "learning_rate": 1.3893974083198813e-06, "loss": 0.6433, "step": 9112 }, { "epoch": 0.95, "learning_rate": 1.3838023219295948e-06, "loss": 0.6853, "step": 9113 }, { "epoch": 0.95, "learning_rate": 1.378218445461088e-06, "loss": 0.6428, "step": 9114 }, { "epoch": 0.95, "learning_rate": 1.37264577954912e-06, "loss": 0.6346, "step": 9115 }, { "epoch": 0.95, "learning_rate": 1.367084324827106e-06, "loss": 0.6534, "step": 9116 }, { "epoch": 0.95, "learning_rate": 1.3615340819272627e-06, "loss": 0.6551, "step": 9117 }, { "epoch": 0.95, "learning_rate": 1.3559950514804963e-06, "loss": 0.719, "step": 9118 }, { "epoch": 0.95, "learning_rate": 1.350467234116426e-06, "loss": 0.6857, "step": 9119 }, { "epoch": 0.95, "learning_rate": 1.3449506304634262e-06, "loss": 0.7508, "step": 9120 }, { "epoch": 0.95, "learning_rate": 1.3394452411485625e-06, "loss": 0.6946, "step": 9121 }, { "epoch": 0.95, "learning_rate": 1.3339510667976562e-06, "loss": 0.7018, "step": 9122 }, { "epoch": 0.95, "learning_rate": 1.3284681080352522e-06, "loss": 0.6711, "step": 9123 }, { "epoch": 0.95, "learning_rate": 1.3229963654845968e-06, "loss": 0.6629, "step": 9124 }, { "epoch": 0.95, "learning_rate": 1.3175358397676808e-06, "loss": 0.6917, "step": 9125 }, { "epoch": 0.95, "learning_rate": 1.3120865315052078e-06, "loss": 0.5971, "step": 9126 }, { "epoch": 0.95, "learning_rate": 1.3066484413166268e-06, "loss": 0.6658, "step": 9127 }, { "epoch": 0.95, "learning_rate": 1.3012215698200769e-06, "loss": 0.7186, "step": 9128 }, { "epoch": 0.95, "learning_rate": 1.2958059176324534e-06, "loss": 0.6265, "step": 9129 }, { "epoch": 0.95, "learning_rate": 1.2904014853693747e-06, "loss": 0.6304, "step": 9130 }, { "epoch": 0.95, "learning_rate": 1.2850082736451497e-06, "loss": 0.67, "step": 9131 }, { "epoch": 0.95, "learning_rate": 1.2796262830728655e-06, "loss": 0.6442, "step": 9132 }, { "epoch": 0.95, "learning_rate": 1.2742555142642887e-06, "loss": 0.6723, "step": 9133 }, { "epoch": 0.95, "learning_rate": 1.2688959678299306e-06, "loss": 0.6892, "step": 9134 }, { "epoch": 0.95, "learning_rate": 1.2635476443790262e-06, "loss": 0.7305, "step": 9135 }, { "epoch": 0.95, "learning_rate": 1.2582105445195224e-06, "loss": 0.6988, "step": 9136 }, { "epoch": 0.95, "learning_rate": 1.2528846688581009e-06, "loss": 0.5967, "step": 9137 }, { "epoch": 0.95, "learning_rate": 1.247570018000177e-06, "loss": 0.7137, "step": 9138 }, { "epoch": 0.95, "learning_rate": 1.2422665925498678e-06, "loss": 0.6052, "step": 9139 }, { "epoch": 0.95, "learning_rate": 1.2369743931100242e-06, "loss": 0.6264, "step": 9140 }, { "epoch": 0.95, "learning_rate": 1.2316934202822316e-06, "loss": 0.7053, "step": 9141 }, { "epoch": 0.95, "learning_rate": 1.2264236746667769e-06, "loss": 0.6817, "step": 9142 }, { "epoch": 0.95, "learning_rate": 1.2211651568626915e-06, "loss": 0.6985, "step": 9143 }, { "epoch": 0.95, "learning_rate": 1.2159178674677307e-06, "loss": 0.6975, "step": 9144 }, { "epoch": 0.95, "learning_rate": 1.210681807078351e-06, "loss": 0.6321, "step": 9145 }, { "epoch": 0.95, "learning_rate": 1.2054569762897538e-06, "loss": 0.6424, "step": 9146 }, { "epoch": 0.95, "learning_rate": 1.200243375695853e-06, "loss": 0.7173, "step": 9147 }, { "epoch": 0.95, "learning_rate": 1.195041005889297e-06, "loss": 0.6394, "step": 9148 }, { "epoch": 0.95, "learning_rate": 1.1898498674614567e-06, "loss": 0.6774, "step": 9149 }, { "epoch": 0.95, "learning_rate": 1.1846699610024048e-06, "loss": 0.6381, "step": 9150 }, { "epoch": 0.95, "learning_rate": 1.1795012871009591e-06, "loss": 0.6637, "step": 9151 }, { "epoch": 0.95, "learning_rate": 1.174343846344661e-06, "loss": 0.6505, "step": 9152 }, { "epoch": 0.95, "learning_rate": 1.1691976393197524e-06, "loss": 0.643, "step": 9153 }, { "epoch": 0.95, "learning_rate": 1.164062666611221e-06, "loss": 0.6571, "step": 9154 }, { "epoch": 0.95, "learning_rate": 1.1589389288027886e-06, "loss": 0.6975, "step": 9155 }, { "epoch": 0.95, "learning_rate": 1.153826426476845e-06, "loss": 0.694, "step": 9156 }, { "epoch": 0.95, "learning_rate": 1.1487251602145699e-06, "loss": 0.645, "step": 9157 }, { "epoch": 0.95, "learning_rate": 1.1436351305958325e-06, "loss": 0.6435, "step": 9158 }, { "epoch": 0.95, "learning_rate": 1.1385563381992147e-06, "loss": 0.6823, "step": 9159 }, { "epoch": 0.95, "learning_rate": 1.1334887836020436e-06, "loss": 0.6425, "step": 9160 }, { "epoch": 0.95, "learning_rate": 1.128432467380358e-06, "loss": 0.6898, "step": 9161 }, { "epoch": 0.95, "learning_rate": 1.1233873901089097e-06, "loss": 0.6724, "step": 9162 }, { "epoch": 0.95, "learning_rate": 1.1183535523612066e-06, "loss": 0.6395, "step": 9163 }, { "epoch": 0.95, "learning_rate": 1.113330954709435e-06, "loss": 0.6233, "step": 9164 }, { "epoch": 0.95, "learning_rate": 1.1083195977245387e-06, "loss": 0.6257, "step": 9165 }, { "epoch": 0.95, "learning_rate": 1.1033194819761728e-06, "loss": 0.6529, "step": 9166 }, { "epoch": 0.95, "learning_rate": 1.0983306080326828e-06, "loss": 0.6554, "step": 9167 }, { "epoch": 0.95, "learning_rate": 1.0933529764611928e-06, "loss": 0.6217, "step": 9168 }, { "epoch": 0.95, "learning_rate": 1.0883865878275169e-06, "loss": 0.6686, "step": 9169 }, { "epoch": 0.95, "learning_rate": 1.083431442696181e-06, "loss": 0.6464, "step": 9170 }, { "epoch": 0.95, "learning_rate": 1.0784875416304574e-06, "loss": 0.6838, "step": 9171 }, { "epoch": 0.95, "learning_rate": 1.0735548851923516e-06, "loss": 0.633, "step": 9172 }, { "epoch": 0.95, "learning_rate": 1.0686334739425264e-06, "loss": 0.6846, "step": 9173 }, { "epoch": 0.95, "learning_rate": 1.0637233084404452e-06, "loss": 0.6894, "step": 9174 }, { "epoch": 0.96, "learning_rate": 1.0588243892442396e-06, "loss": 0.5706, "step": 9175 }, { "epoch": 0.96, "learning_rate": 1.0539367169107861e-06, "loss": 0.7135, "step": 9176 }, { "epoch": 0.96, "learning_rate": 1.049060291995685e-06, "loss": 0.6033, "step": 9177 }, { "epoch": 0.96, "learning_rate": 1.044195115053237e-06, "loss": 0.6095, "step": 9178 }, { "epoch": 0.96, "learning_rate": 1.0393411866364778e-06, "loss": 0.6433, "step": 9179 }, { "epoch": 0.96, "learning_rate": 1.0344985072971658e-06, "loss": 0.7098, "step": 9180 }, { "epoch": 0.96, "learning_rate": 1.0296670775857942e-06, "loss": 0.6237, "step": 9181 }, { "epoch": 0.96, "learning_rate": 1.0248468980515347e-06, "loss": 0.6508, "step": 9182 }, { "epoch": 0.96, "learning_rate": 1.0200379692423378e-06, "loss": 0.7456, "step": 9183 }, { "epoch": 0.96, "learning_rate": 1.015240291704822e-06, "loss": 0.6658, "step": 9184 }, { "epoch": 0.96, "learning_rate": 1.0104538659843621e-06, "loss": 0.7158, "step": 9185 }, { "epoch": 0.96, "learning_rate": 1.005678692625045e-06, "loss": 0.6784, "step": 9186 }, { "epoch": 0.96, "learning_rate": 1.0009147721696588e-06, "loss": 0.6813, "step": 9187 }, { "epoch": 0.96, "learning_rate": 9.96162105159737e-07, "loss": 0.6514, "step": 9188 }, { "epoch": 0.96, "learning_rate": 9.914206921355363e-07, "loss": 0.736, "step": 9189 }, { "epoch": 0.96, "learning_rate": 9.866905336360145e-07, "loss": 0.6562, "step": 9190 }, { "epoch": 0.96, "learning_rate": 9.819716301988413e-07, "loss": 0.7537, "step": 9191 }, { "epoch": 0.96, "learning_rate": 9.772639823604656e-07, "loss": 0.7047, "step": 9192 }, { "epoch": 0.96, "learning_rate": 9.725675906559817e-07, "loss": 0.6342, "step": 9193 }, { "epoch": 0.96, "learning_rate": 9.678824556192512e-07, "loss": 0.7287, "step": 9194 }, { "epoch": 0.96, "learning_rate": 9.632085777828482e-07, "loss": 0.6564, "step": 9195 }, { "epoch": 0.96, "learning_rate": 9.585459576780587e-07, "loss": 0.6782, "step": 9196 }, { "epoch": 0.96, "learning_rate": 9.53894595834881e-07, "loss": 0.6723, "step": 9197 }, { "epoch": 0.96, "learning_rate": 9.492544927820701e-07, "loss": 0.6814, "step": 9198 }, { "epoch": 0.96, "learning_rate": 9.446256490470596e-07, "loss": 0.623, "step": 9199 }, { "epoch": 0.96, "learning_rate": 9.400080651560284e-07, "loss": 0.6889, "step": 9200 }, { "epoch": 0.96, "learning_rate": 9.354017416338567e-07, "loss": 0.6967, "step": 9201 }, { "epoch": 0.96, "learning_rate": 9.308066790041592e-07, "loss": 0.697, "step": 9202 }, { "epoch": 0.96, "learning_rate": 9.262228777892735e-07, "loss": 0.6456, "step": 9203 }, { "epoch": 0.96, "learning_rate": 9.216503385102604e-07, "loss": 0.6967, "step": 9204 }, { "epoch": 0.96, "learning_rate": 9.1708906168686e-07, "loss": 0.6836, "step": 9205 }, { "epoch": 0.96, "learning_rate": 9.125390478375906e-07, "loss": 0.6842, "step": 9206 }, { "epoch": 0.96, "learning_rate": 9.080002974796387e-07, "loss": 0.6418, "step": 9207 }, { "epoch": 0.96, "learning_rate": 9.034728111289581e-07, "loss": 0.703, "step": 9208 }, { "epoch": 0.96, "learning_rate": 8.989565893001817e-07, "loss": 0.6459, "step": 9209 }, { "epoch": 0.96, "learning_rate": 8.944516325066877e-07, "loss": 0.7049, "step": 9210 }, { "epoch": 0.96, "learning_rate": 8.899579412605552e-07, "loss": 0.731, "step": 9211 }, { "epoch": 0.96, "learning_rate": 8.854755160726092e-07, "loss": 0.6811, "step": 9212 }, { "epoch": 0.96, "learning_rate": 8.81004357452353e-07, "loss": 0.6232, "step": 9213 }, { "epoch": 0.96, "learning_rate": 8.765444659080469e-07, "loss": 0.6681, "step": 9214 }, { "epoch": 0.96, "learning_rate": 8.720958419466629e-07, "loss": 0.6509, "step": 9215 }, { "epoch": 0.96, "learning_rate": 8.676584860738745e-07, "loss": 0.6891, "step": 9216 }, { "epoch": 0.96, "learning_rate": 8.632323987940893e-07, "loss": 0.6716, "step": 9217 }, { "epoch": 0.96, "learning_rate": 8.588175806104382e-07, "loss": 0.6467, "step": 9218 }, { "epoch": 0.96, "learning_rate": 8.544140320247418e-07, "loss": 0.6212, "step": 9219 }, { "epoch": 0.96, "learning_rate": 8.500217535375888e-07, "loss": 0.6806, "step": 9220 }, { "epoch": 0.96, "learning_rate": 8.456407456482352e-07, "loss": 0.6583, "step": 9221 }, { "epoch": 0.96, "learning_rate": 8.412710088546938e-07, "loss": 0.6843, "step": 9222 }, { "epoch": 0.96, "learning_rate": 8.369125436536785e-07, "loss": 0.6867, "step": 9223 }, { "epoch": 0.96, "learning_rate": 8.325653505406262e-07, "loss": 0.6201, "step": 9224 }, { "epoch": 0.96, "learning_rate": 8.28229430009686e-07, "loss": 0.6444, "step": 9225 }, { "epoch": 0.96, "learning_rate": 8.239047825537527e-07, "loss": 0.6368, "step": 9226 }, { "epoch": 0.96, "learning_rate": 8.195914086643885e-07, "loss": 0.6248, "step": 9227 }, { "epoch": 0.96, "learning_rate": 8.152893088319236e-07, "loss": 0.6649, "step": 9228 }, { "epoch": 0.96, "learning_rate": 8.109984835453888e-07, "loss": 0.6417, "step": 9229 }, { "epoch": 0.96, "learning_rate": 8.067189332925163e-07, "loss": 0.6942, "step": 9230 }, { "epoch": 0.96, "learning_rate": 8.024506585597835e-07, "loss": 0.6928, "step": 9231 }, { "epoch": 0.96, "learning_rate": 7.981936598323802e-07, "loss": 0.7141, "step": 9232 }, { "epoch": 0.96, "learning_rate": 7.939479375941972e-07, "loss": 0.7166, "step": 9233 }, { "epoch": 0.96, "learning_rate": 7.897134923278482e-07, "loss": 0.6683, "step": 9234 }, { "epoch": 0.96, "learning_rate": 7.854903245146928e-07, "loss": 0.6934, "step": 9235 }, { "epoch": 0.96, "learning_rate": 7.812784346347801e-07, "loss": 0.6944, "step": 9236 }, { "epoch": 0.96, "learning_rate": 7.770778231668718e-07, "loss": 0.6411, "step": 9237 }, { "epoch": 0.96, "learning_rate": 7.728884905884859e-07, "loss": 0.6237, "step": 9238 }, { "epoch": 0.96, "learning_rate": 7.687104373758081e-07, "loss": 0.6791, "step": 9239 }, { "epoch": 0.96, "learning_rate": 7.645436640037918e-07, "loss": 0.6744, "step": 9240 }, { "epoch": 0.96, "learning_rate": 7.603881709460581e-07, "loss": 0.6823, "step": 9241 }, { "epoch": 0.96, "learning_rate": 7.562439586749847e-07, "loss": 0.666, "step": 9242 }, { "epoch": 0.96, "learning_rate": 7.521110276616505e-07, "loss": 0.6433, "step": 9243 }, { "epoch": 0.96, "learning_rate": 7.479893783758574e-07, "loss": 0.6658, "step": 9244 }, { "epoch": 0.96, "learning_rate": 7.438790112861082e-07, "loss": 0.6922, "step": 9245 }, { "epoch": 0.96, "learning_rate": 7.397799268596628e-07, "loss": 0.6765, "step": 9246 }, { "epoch": 0.96, "learning_rate": 7.356921255624593e-07, "loss": 0.6948, "step": 9247 }, { "epoch": 0.96, "learning_rate": 7.316156078591596e-07, "loss": 0.5792, "step": 9248 }, { "epoch": 0.96, "learning_rate": 7.275503742131707e-07, "loss": 0.7015, "step": 9249 }, { "epoch": 0.96, "learning_rate": 7.234964250865783e-07, "loss": 0.6206, "step": 9250 }, { "epoch": 0.96, "learning_rate": 7.19453760940203e-07, "loss": 0.6625, "step": 9251 }, { "epoch": 0.96, "learning_rate": 7.154223822335992e-07, "loss": 0.6065, "step": 9252 }, { "epoch": 0.96, "learning_rate": 7.114022894250116e-07, "loss": 0.712, "step": 9253 }, { "epoch": 0.96, "learning_rate": 7.073934829714302e-07, "loss": 0.6531, "step": 9254 }, { "epoch": 0.96, "learning_rate": 7.033959633285125e-07, "loss": 0.669, "step": 9255 }, { "epoch": 0.96, "learning_rate": 6.994097309506952e-07, "loss": 0.6708, "step": 9256 }, { "epoch": 0.96, "learning_rate": 6.954347862910715e-07, "loss": 0.6827, "step": 9257 }, { "epoch": 0.96, "learning_rate": 6.914711298015241e-07, "loss": 0.6157, "step": 9258 }, { "epoch": 0.96, "learning_rate": 6.875187619325707e-07, "loss": 0.6394, "step": 9259 }, { "epoch": 0.96, "learning_rate": 6.835776831335184e-07, "loss": 0.632, "step": 9260 }, { "epoch": 0.96, "learning_rate": 6.796478938523198e-07, "loss": 0.6473, "step": 9261 }, { "epoch": 0.96, "learning_rate": 6.757293945357179e-07, "loss": 0.6986, "step": 9262 }, { "epoch": 0.96, "learning_rate": 6.71822185629134e-07, "loss": 0.6984, "step": 9263 }, { "epoch": 0.96, "learning_rate": 6.679262675766906e-07, "loss": 0.6284, "step": 9264 }, { "epoch": 0.96, "learning_rate": 6.640416408212447e-07, "loss": 0.678, "step": 9265 }, { "epoch": 0.96, "learning_rate": 6.601683058043983e-07, "loss": 0.6769, "step": 9266 }, { "epoch": 0.96, "learning_rate": 6.563062629664218e-07, "loss": 0.655, "step": 9267 }, { "epoch": 0.96, "learning_rate": 6.524555127463083e-07, "loss": 0.6462, "step": 9268 }, { "epoch": 0.96, "learning_rate": 6.486160555818188e-07, "loss": 0.6624, "step": 9269 }, { "epoch": 0.96, "learning_rate": 6.447878919093486e-07, "loss": 0.6217, "step": 9270 }, { "epoch": 0.97, "learning_rate": 6.409710221640941e-07, "loss": 0.6311, "step": 9271 }, { "epoch": 0.97, "learning_rate": 6.371654467799082e-07, "loss": 0.715, "step": 9272 }, { "epoch": 0.97, "learning_rate": 6.333711661893671e-07, "loss": 0.7206, "step": 9273 }, { "epoch": 0.97, "learning_rate": 6.295881808237925e-07, "loss": 0.6651, "step": 9274 }, { "epoch": 0.97, "learning_rate": 6.25816491113218e-07, "loss": 0.5973, "step": 9275 }, { "epoch": 0.97, "learning_rate": 6.220560974863454e-07, "loss": 0.5995, "step": 9276 }, { "epoch": 0.97, "learning_rate": 6.183070003706437e-07, "loss": 0.703, "step": 9277 }, { "epoch": 0.97, "learning_rate": 6.145692001922943e-07, "loss": 0.5964, "step": 9278 }, { "epoch": 0.97, "learning_rate": 6.108426973761572e-07, "loss": 0.6916, "step": 9279 }, { "epoch": 0.97, "learning_rate": 6.071274923458492e-07, "loss": 0.6732, "step": 9280 }, { "epoch": 0.97, "learning_rate": 6.03423585523677e-07, "loss": 0.6375, "step": 9281 }, { "epoch": 0.97, "learning_rate": 5.997309773306703e-07, "loss": 0.6805, "step": 9282 }, { "epoch": 0.97, "learning_rate": 5.960496681865935e-07, "loss": 0.6678, "step": 9283 }, { "epoch": 0.97, "learning_rate": 5.923796585098895e-07, "loss": 0.64, "step": 9284 }, { "epoch": 0.97, "learning_rate": 5.887209487177358e-07, "loss": 0.6559, "step": 9285 }, { "epoch": 0.97, "learning_rate": 5.850735392260443e-07, "loss": 0.6771, "step": 9286 }, { "epoch": 0.97, "learning_rate": 5.814374304494163e-07, "loss": 0.6379, "step": 9287 }, { "epoch": 0.97, "learning_rate": 5.778126228011659e-07, "loss": 0.6734, "step": 9288 }, { "epoch": 0.97, "learning_rate": 5.741991166933414e-07, "loss": 0.7449, "step": 9289 }, { "epoch": 0.97, "learning_rate": 5.705969125366916e-07, "loss": 0.6391, "step": 9290 }, { "epoch": 0.97, "learning_rate": 5.670060107407005e-07, "loss": 0.701, "step": 9291 }, { "epoch": 0.97, "learning_rate": 5.634264117135524e-07, "loss": 0.6395, "step": 9292 }, { "epoch": 0.97, "learning_rate": 5.59858115862133e-07, "loss": 0.6319, "step": 9293 }, { "epoch": 0.97, "learning_rate": 5.563011235920734e-07, "loss": 0.6772, "step": 9294 }, { "epoch": 0.97, "learning_rate": 5.527554353076947e-07, "loss": 0.6739, "step": 9295 }, { "epoch": 0.97, "learning_rate": 5.492210514120411e-07, "loss": 0.625, "step": 9296 }, { "epoch": 0.97, "learning_rate": 5.456979723068911e-07, "loss": 0.7012, "step": 9297 }, { "epoch": 0.97, "learning_rate": 5.421861983927024e-07, "loss": 0.6867, "step": 9298 }, { "epoch": 0.97, "learning_rate": 5.386857300686776e-07, "loss": 0.635, "step": 9299 }, { "epoch": 0.97, "learning_rate": 5.351965677327209e-07, "loss": 0.629, "step": 9300 }, { "epoch": 0.97, "learning_rate": 5.317187117814482e-07, "loss": 0.7014, "step": 9301 }, { "epoch": 0.97, "learning_rate": 5.282521626101877e-07, "loss": 0.6296, "step": 9302 }, { "epoch": 0.97, "learning_rate": 5.247969206130132e-07, "loss": 0.6486, "step": 9303 }, { "epoch": 0.97, "learning_rate": 5.213529861826661e-07, "loss": 0.7078, "step": 9304 }, { "epoch": 0.97, "learning_rate": 5.179203597106441e-07, "loss": 0.6959, "step": 9305 }, { "epoch": 0.97, "learning_rate": 5.144990415871353e-07, "loss": 0.6792, "step": 9306 }, { "epoch": 0.97, "learning_rate": 5.110890322010398e-07, "loss": 0.7018, "step": 9307 }, { "epoch": 0.97, "learning_rate": 5.076903319399917e-07, "loss": 0.6212, "step": 9308 }, { "epoch": 0.97, "learning_rate": 5.043029411903266e-07, "loss": 0.6713, "step": 9309 }, { "epoch": 0.97, "learning_rate": 5.00926860337092e-07, "loss": 0.6747, "step": 9310 }, { "epoch": 0.97, "learning_rate": 4.975620897640587e-07, "loss": 0.6279, "step": 9311 }, { "epoch": 0.97, "learning_rate": 4.942086298537096e-07, "loss": 0.6745, "step": 9312 }, { "epoch": 0.97, "learning_rate": 4.908664809872287e-07, "loss": 0.6694, "step": 9313 }, { "epoch": 0.97, "learning_rate": 4.875356435445344e-07, "loss": 0.7434, "step": 9314 }, { "epoch": 0.97, "learning_rate": 4.84216117904257e-07, "loss": 0.6784, "step": 9315 }, { "epoch": 0.97, "learning_rate": 4.809079044437282e-07, "loss": 0.6487, "step": 9316 }, { "epoch": 0.97, "learning_rate": 4.776110035389914e-07, "loss": 0.6496, "step": 9317 }, { "epoch": 0.97, "learning_rate": 4.743254155648247e-07, "loss": 0.6116, "step": 9318 }, { "epoch": 0.97, "learning_rate": 4.7105114089470717e-07, "loss": 0.6555, "step": 9319 }, { "epoch": 0.97, "learning_rate": 4.677881799008188e-07, "loss": 0.6401, "step": 9320 }, { "epoch": 0.97, "learning_rate": 4.645365329540852e-07, "loss": 0.6168, "step": 9321 }, { "epoch": 0.97, "learning_rate": 4.612962004241217e-07, "loss": 0.6835, "step": 9322 }, { "epoch": 0.97, "learning_rate": 4.5806718267925596e-07, "loss": 0.6546, "step": 9323 }, { "epoch": 0.97, "learning_rate": 4.548494800865499e-07, "loss": 0.6621, "step": 9324 }, { "epoch": 0.97, "learning_rate": 4.516430930117554e-07, "loss": 0.6147, "step": 9325 }, { "epoch": 0.97, "learning_rate": 4.4844802181936985e-07, "loss": 0.6392, "step": 9326 }, { "epoch": 0.97, "learning_rate": 4.452642668725582e-07, "loss": 0.6659, "step": 9327 }, { "epoch": 0.97, "learning_rate": 4.4209182853324205e-07, "loss": 0.6822, "step": 9328 }, { "epoch": 0.97, "learning_rate": 4.3893070716204407e-07, "loss": 0.658, "step": 9329 }, { "epoch": 0.97, "learning_rate": 4.357809031182658e-07, "loss": 0.5891, "step": 9330 }, { "epoch": 0.97, "learning_rate": 4.326424167599874e-07, "loss": 0.6909, "step": 9331 }, { "epoch": 0.97, "learning_rate": 4.295152484439569e-07, "loss": 0.6792, "step": 9332 }, { "epoch": 0.97, "learning_rate": 4.263993985256343e-07, "loss": 0.6589, "step": 9333 }, { "epoch": 0.97, "learning_rate": 4.2329486735921407e-07, "loss": 0.6753, "step": 9334 }, { "epoch": 0.97, "learning_rate": 4.202016552976029e-07, "loss": 0.6468, "step": 9335 }, { "epoch": 0.97, "learning_rate": 4.171197626923973e-07, "loss": 0.7079, "step": 9336 }, { "epoch": 0.97, "learning_rate": 4.1404918989392803e-07, "loss": 0.6334, "step": 9337 }, { "epoch": 0.97, "learning_rate": 4.1098993725123827e-07, "loss": 0.6194, "step": 9338 }, { "epoch": 0.97, "learning_rate": 4.07942005112083e-07, "loss": 0.6722, "step": 9339 }, { "epoch": 0.97, "learning_rate": 4.0490539382291856e-07, "loss": 0.6377, "step": 9340 }, { "epoch": 0.97, "learning_rate": 4.0188010372892437e-07, "loss": 0.622, "step": 9341 }, { "epoch": 0.97, "learning_rate": 3.9886613517400305e-07, "loss": 0.6677, "step": 9342 }, { "epoch": 0.97, "learning_rate": 3.958634885007473e-07, "loss": 0.6957, "step": 9343 }, { "epoch": 0.97, "learning_rate": 3.928721640504729e-07, "loss": 0.6538, "step": 9344 }, { "epoch": 0.97, "learning_rate": 3.898921621632301e-07, "loss": 0.6962, "step": 9345 }, { "epoch": 0.97, "learning_rate": 3.8692348317773685e-07, "loss": 0.6689, "step": 9346 }, { "epoch": 0.97, "learning_rate": 3.8396612743145656e-07, "loss": 0.6325, "step": 9347 }, { "epoch": 0.97, "learning_rate": 3.810200952605647e-07, "loss": 0.6023, "step": 9348 }, { "epoch": 0.97, "learning_rate": 3.78085386999949e-07, "loss": 0.681, "step": 9349 }, { "epoch": 0.97, "learning_rate": 3.75162002983187e-07, "loss": 0.6255, "step": 9350 }, { "epoch": 0.97, "learning_rate": 3.722499435426019e-07, "loss": 0.6282, "step": 9351 }, { "epoch": 0.97, "learning_rate": 3.6934920900920656e-07, "loss": 0.7518, "step": 9352 }, { "epoch": 0.97, "learning_rate": 3.6645979971272616e-07, "loss": 0.7036, "step": 9353 }, { "epoch": 0.97, "learning_rate": 3.635817159816202e-07, "loss": 0.6546, "step": 9354 }, { "epoch": 0.97, "learning_rate": 3.6071495814304914e-07, "loss": 0.6248, "step": 9355 }, { "epoch": 0.97, "learning_rate": 3.5785952652286346e-07, "loss": 0.6404, "step": 9356 }, { "epoch": 0.97, "learning_rate": 3.550154214456702e-07, "loss": 0.6166, "step": 9357 }, { "epoch": 0.97, "learning_rate": 3.5218264323474414e-07, "loss": 0.7149, "step": 9358 }, { "epoch": 0.97, "learning_rate": 3.493611922121054e-07, "loss": 0.6735, "step": 9359 }, { "epoch": 0.97, "learning_rate": 3.465510686984863e-07, "loss": 0.6663, "step": 9360 }, { "epoch": 0.97, "learning_rate": 3.4375227301328696e-07, "loss": 0.68, "step": 9361 }, { "epoch": 0.97, "learning_rate": 3.40964805474675e-07, "loss": 0.6768, "step": 9362 }, { "epoch": 0.97, "learning_rate": 3.381886663995193e-07, "loss": 0.6869, "step": 9363 }, { "epoch": 0.97, "learning_rate": 3.3542385610335626e-07, "loss": 0.6465, "step": 9364 }, { "epoch": 0.97, "learning_rate": 3.3267037490049e-07, "loss": 0.6717, "step": 9365 }, { "epoch": 0.97, "learning_rate": 3.299282231039258e-07, "loss": 0.6596, "step": 9366 }, { "epoch": 0.98, "learning_rate": 3.271974010253476e-07, "loss": 0.6209, "step": 9367 }, { "epoch": 0.98, "learning_rate": 3.244779089751737e-07, "loss": 0.5683, "step": 9368 }, { "epoch": 0.98, "learning_rate": 3.217697472625569e-07, "loss": 0.6971, "step": 9369 }, { "epoch": 0.98, "learning_rate": 3.1907291619531765e-07, "loss": 0.6997, "step": 9370 }, { "epoch": 0.98, "learning_rate": 3.163874160800218e-07, "loss": 0.659, "step": 9371 }, { "epoch": 0.98, "learning_rate": 3.137132472219362e-07, "loss": 0.6568, "step": 9372 }, { "epoch": 0.98, "learning_rate": 3.1105040992504e-07, "loss": 0.7005, "step": 9373 }, { "epoch": 0.98, "learning_rate": 3.0839890449201325e-07, "loss": 0.6643, "step": 9374 }, { "epoch": 0.98, "learning_rate": 3.0575873122427046e-07, "loss": 0.6023, "step": 9375 }, { "epoch": 0.98, "learning_rate": 3.031298904219271e-07, "loss": 0.6146, "step": 9376 }, { "epoch": 0.98, "learning_rate": 3.0051238238378856e-07, "loss": 0.6736, "step": 9377 }, { "epoch": 0.98, "learning_rate": 2.9790620740742793e-07, "loss": 0.6997, "step": 9378 }, { "epoch": 0.98, "learning_rate": 2.953113657890638e-07, "loss": 0.6771, "step": 9379 }, { "epoch": 0.98, "learning_rate": 2.927278578236714e-07, "loss": 0.6665, "step": 9380 }, { "epoch": 0.98, "learning_rate": 2.901556838049158e-07, "loss": 0.7012, "step": 9381 }, { "epoch": 0.98, "learning_rate": 2.875948440251963e-07, "loss": 0.6467, "step": 9382 }, { "epoch": 0.98, "learning_rate": 2.850453387755914e-07, "loss": 0.6665, "step": 9383 }, { "epoch": 0.98, "learning_rate": 2.825071683459246e-07, "loss": 0.6167, "step": 9384 }, { "epoch": 0.98, "learning_rate": 2.7998033302470974e-07, "loss": 0.6861, "step": 9385 }, { "epoch": 0.98, "learning_rate": 2.774648330991725e-07, "loss": 0.661, "step": 9386 }, { "epoch": 0.98, "learning_rate": 2.7496066885526193e-07, "loss": 0.6533, "step": 9387 }, { "epoch": 0.98, "learning_rate": 2.724678405776171e-07, "loss": 0.6315, "step": 9388 }, { "epoch": 0.98, "learning_rate": 2.6998634854963347e-07, "loss": 0.693, "step": 9389 }, { "epoch": 0.98, "learning_rate": 2.675161930533632e-07, "loss": 0.6504, "step": 9390 }, { "epoch": 0.98, "learning_rate": 2.650573743695928e-07, "loss": 0.6446, "step": 9391 }, { "epoch": 0.98, "learning_rate": 2.626098927778431e-07, "loss": 0.6098, "step": 9392 }, { "epoch": 0.98, "learning_rate": 2.6017374855630273e-07, "loss": 0.6366, "step": 9393 }, { "epoch": 0.98, "learning_rate": 2.577489419819057e-07, "loss": 0.6895, "step": 9394 }, { "epoch": 0.98, "learning_rate": 2.5533547333028705e-07, "loss": 0.6839, "step": 9395 }, { "epoch": 0.98, "learning_rate": 2.5293334287578297e-07, "loss": 0.5921, "step": 9396 }, { "epoch": 0.98, "learning_rate": 2.5054255089145274e-07, "loss": 0.5575, "step": 9397 }, { "epoch": 0.98, "learning_rate": 2.4816309764905676e-07, "loss": 0.6179, "step": 9398 }, { "epoch": 0.98, "learning_rate": 2.457949834190787e-07, "loss": 0.6692, "step": 9399 }, { "epoch": 0.98, "learning_rate": 2.434382084707143e-07, "loss": 0.7538, "step": 9400 }, { "epoch": 0.98, "learning_rate": 2.410927730718493e-07, "loss": 0.6384, "step": 9401 }, { "epoch": 0.98, "learning_rate": 2.3875867748910374e-07, "loss": 0.7078, "step": 9402 }, { "epoch": 0.98, "learning_rate": 2.3643592198779872e-07, "loss": 0.7183, "step": 9403 }, { "epoch": 0.98, "learning_rate": 2.3412450683195642e-07, "loss": 0.6643, "step": 9404 }, { "epoch": 0.98, "learning_rate": 2.3182443228433327e-07, "loss": 0.7079, "step": 9405 }, { "epoch": 0.98, "learning_rate": 2.295356986063868e-07, "loss": 0.6779, "step": 9406 }, { "epoch": 0.98, "learning_rate": 2.2725830605827558e-07, "loss": 0.5988, "step": 9407 }, { "epoch": 0.98, "learning_rate": 2.2499225489887033e-07, "loss": 0.6235, "step": 9408 }, { "epoch": 0.98, "learning_rate": 2.2273754538576497e-07, "loss": 0.5698, "step": 9409 }, { "epoch": 0.98, "learning_rate": 2.204941777752545e-07, "loss": 0.6721, "step": 9410 }, { "epoch": 0.98, "learning_rate": 2.1826215232234603e-07, "loss": 0.6545, "step": 9411 }, { "epoch": 0.98, "learning_rate": 2.1604146928076996e-07, "loss": 0.6068, "step": 9412 }, { "epoch": 0.98, "learning_rate": 2.1383212890294656e-07, "loss": 0.6863, "step": 9413 }, { "epoch": 0.98, "learning_rate": 2.116341314400083e-07, "loss": 0.6554, "step": 9414 }, { "epoch": 0.98, "learning_rate": 2.09447477141822e-07, "loss": 0.6513, "step": 9415 }, { "epoch": 0.98, "learning_rate": 2.0727216625694435e-07, "loss": 0.6668, "step": 9416 }, { "epoch": 0.98, "learning_rate": 2.0510819903264422e-07, "loss": 0.6337, "step": 9417 }, { "epoch": 0.98, "learning_rate": 2.0295557571491376e-07, "loss": 0.6019, "step": 9418 }, { "epoch": 0.98, "learning_rate": 2.00814296548435e-07, "loss": 0.713, "step": 9419 }, { "epoch": 0.98, "learning_rate": 1.986843617766243e-07, "loss": 0.6407, "step": 9420 }, { "epoch": 0.98, "learning_rate": 1.9656577164157696e-07, "loss": 0.7104, "step": 9421 }, { "epoch": 0.98, "learning_rate": 1.9445852638413363e-07, "loss": 0.7053, "step": 9422 }, { "epoch": 0.98, "learning_rate": 1.9236262624383604e-07, "loss": 0.6508, "step": 9423 }, { "epoch": 0.98, "learning_rate": 1.9027807145890474e-07, "loss": 0.6797, "step": 9424 }, { "epoch": 0.98, "learning_rate": 1.8820486226631683e-07, "loss": 0.6556, "step": 9425 }, { "epoch": 0.98, "learning_rate": 1.8614299890172827e-07, "loss": 0.6706, "step": 9426 }, { "epoch": 0.98, "learning_rate": 1.840924815995182e-07, "loss": 0.7369, "step": 9427 }, { "epoch": 0.98, "learning_rate": 1.8205331059277796e-07, "loss": 0.705, "step": 9428 }, { "epoch": 0.98, "learning_rate": 1.8002548611329994e-07, "loss": 0.6527, "step": 9429 }, { "epoch": 0.98, "learning_rate": 1.7800900839159973e-07, "loss": 0.6639, "step": 9430 }, { "epoch": 0.98, "learning_rate": 1.7600387765688286e-07, "loss": 0.6436, "step": 9431 }, { "epoch": 0.98, "learning_rate": 1.7401009413707815e-07, "loss": 0.6267, "step": 9432 }, { "epoch": 0.98, "learning_rate": 1.7202765805882648e-07, "loss": 0.6756, "step": 9433 }, { "epoch": 0.98, "learning_rate": 1.7005656964748096e-07, "loss": 0.7028, "step": 9434 }, { "epoch": 0.98, "learning_rate": 1.6809682912709567e-07, "loss": 0.6202, "step": 9435 }, { "epoch": 0.98, "learning_rate": 1.661484367204369e-07, "loss": 0.6916, "step": 9436 }, { "epoch": 0.98, "learning_rate": 1.64211392648983e-07, "loss": 0.7245, "step": 9437 }, { "epoch": 0.98, "learning_rate": 1.6228569713292452e-07, "loss": 0.6527, "step": 9438 }, { "epoch": 0.98, "learning_rate": 1.6037135039115304e-07, "loss": 0.6696, "step": 9439 }, { "epoch": 0.98, "learning_rate": 1.5846835264128334e-07, "loss": 0.6873, "step": 9440 }, { "epoch": 0.98, "learning_rate": 1.565767040996424e-07, "loss": 0.7487, "step": 9441 }, { "epoch": 0.98, "learning_rate": 1.5469640498123606e-07, "loss": 0.653, "step": 9442 }, { "epoch": 0.98, "learning_rate": 1.5282745549981549e-07, "loss": 0.6611, "step": 9443 }, { "epoch": 0.98, "learning_rate": 1.5096985586782187e-07, "loss": 0.6792, "step": 9444 }, { "epoch": 0.98, "learning_rate": 1.4912360629641964e-07, "loss": 0.734, "step": 9445 }, { "epoch": 0.98, "learning_rate": 1.4728870699547426e-07, "loss": 0.6026, "step": 9446 }, { "epoch": 0.98, "learning_rate": 1.4546515817356333e-07, "loss": 0.6618, "step": 9447 }, { "epoch": 0.98, "learning_rate": 1.4365296003797657e-07, "loss": 0.5991, "step": 9448 }, { "epoch": 0.98, "learning_rate": 1.418521127947048e-07, "loss": 0.6147, "step": 9449 }, { "epoch": 0.98, "learning_rate": 1.4006261664845088e-07, "loss": 0.6995, "step": 9450 }, { "epoch": 0.98, "learning_rate": 1.3828447180262993e-07, "loss": 0.6608, "step": 9451 }, { "epoch": 0.98, "learning_rate": 1.3651767845938025e-07, "loss": 0.6749, "step": 9452 }, { "epoch": 0.98, "learning_rate": 1.3476223681953003e-07, "loss": 0.6644, "step": 9453 }, { "epoch": 0.98, "learning_rate": 1.3301814708263083e-07, "loss": 0.6933, "step": 9454 }, { "epoch": 0.98, "learning_rate": 1.3128540944692402e-07, "loss": 0.7052, "step": 9455 }, { "epoch": 0.98, "learning_rate": 1.2956402410937428e-07, "loss": 0.6609, "step": 9456 }, { "epoch": 0.98, "learning_rate": 1.2785399126566955e-07, "loss": 0.6793, "step": 9457 }, { "epoch": 0.98, "learning_rate": 1.2615531111018763e-07, "loss": 0.5938, "step": 9458 }, { "epoch": 0.98, "learning_rate": 1.2446798383601855e-07, "loss": 0.6681, "step": 9459 }, { "epoch": 0.98, "learning_rate": 1.227920096349644e-07, "loss": 0.7086, "step": 9460 }, { "epoch": 0.98, "learning_rate": 1.2112738869752838e-07, "loss": 0.6664, "step": 9461 }, { "epoch": 0.98, "learning_rate": 1.19474121212948e-07, "loss": 0.6604, "step": 9462 }, { "epoch": 0.99, "learning_rate": 1.1783220736913958e-07, "loss": 0.6181, "step": 9463 }, { "epoch": 0.99, "learning_rate": 1.1620164735275385e-07, "loss": 0.6384, "step": 9464 }, { "epoch": 0.99, "learning_rate": 1.1458244134914253e-07, "loss": 0.6997, "step": 9465 }, { "epoch": 0.99, "learning_rate": 1.129745895423584e-07, "loss": 0.6477, "step": 9466 }, { "epoch": 0.99, "learning_rate": 1.1137809211515526e-07, "loss": 0.7133, "step": 9467 }, { "epoch": 0.99, "learning_rate": 1.0979294924903238e-07, "loss": 0.6635, "step": 9468 }, { "epoch": 0.99, "learning_rate": 1.0821916112416786e-07, "loss": 0.6485, "step": 9469 }, { "epoch": 0.99, "learning_rate": 1.0665672791946301e-07, "loss": 0.6852, "step": 9470 }, { "epoch": 0.99, "learning_rate": 1.0510564981250914e-07, "loss": 0.6802, "step": 9471 }, { "epoch": 0.99, "learning_rate": 1.0356592697964296e-07, "loss": 0.609, "step": 9472 }, { "epoch": 0.99, "learning_rate": 1.0203755959585781e-07, "loss": 0.6698, "step": 9473 }, { "epoch": 0.99, "learning_rate": 1.0052054783491471e-07, "loss": 0.7276, "step": 9474 }, { "epoch": 0.99, "learning_rate": 9.90148918692424e-08, "loss": 0.7203, "step": 9475 }, { "epoch": 0.99, "learning_rate": 9.752059187000395e-08, "loss": 0.6682, "step": 9476 }, { "epoch": 0.99, "learning_rate": 9.603764800704129e-08, "loss": 0.6778, "step": 9477 }, { "epoch": 0.99, "learning_rate": 9.456606044893069e-08, "loss": 0.6361, "step": 9478 }, { "epoch": 0.99, "learning_rate": 9.310582936296053e-08, "loss": 0.6331, "step": 9479 }, { "epoch": 0.99, "learning_rate": 9.165695491510917e-08, "loss": 0.6824, "step": 9480 }, { "epoch": 0.99, "learning_rate": 9.02194372700671e-08, "loss": 0.6798, "step": 9481 }, { "epoch": 0.99, "learning_rate": 8.879327659125913e-08, "loss": 0.7, "step": 9482 }, { "epoch": 0.99, "learning_rate": 8.737847304077785e-08, "loss": 0.6324, "step": 9483 }, { "epoch": 0.99, "learning_rate": 8.597502677947233e-08, "loss": 0.6763, "step": 9484 }, { "epoch": 0.99, "learning_rate": 8.458293796685945e-08, "loss": 0.6271, "step": 9485 }, { "epoch": 0.99, "learning_rate": 8.320220676116818e-08, "loss": 0.6988, "step": 9486 }, { "epoch": 0.99, "learning_rate": 8.183283331938407e-08, "loss": 0.677, "step": 9487 }, { "epoch": 0.99, "learning_rate": 8.047481779713816e-08, "loss": 0.6564, "step": 9488 }, { "epoch": 0.99, "learning_rate": 7.912816034880699e-08, "loss": 0.6538, "step": 9489 }, { "epoch": 0.99, "learning_rate": 7.779286112746808e-08, "loss": 0.6489, "step": 9490 }, { "epoch": 0.99, "learning_rate": 7.646892028491115e-08, "loss": 0.6743, "step": 9491 }, { "epoch": 0.99, "learning_rate": 7.515633797163801e-08, "loss": 0.71, "step": 9492 }, { "epoch": 0.99, "learning_rate": 7.385511433682935e-08, "loss": 0.6538, "step": 9493 }, { "epoch": 0.99, "learning_rate": 7.256524952842237e-08, "loss": 0.7017, "step": 9494 }, { "epoch": 0.99, "learning_rate": 7.128674369303312e-08, "loss": 0.6652, "step": 9495 }, { "epoch": 0.99, "learning_rate": 7.001959697597871e-08, "loss": 0.7004, "step": 9496 }, { "epoch": 0.99, "learning_rate": 6.876380952131056e-08, "loss": 0.7261, "step": 9497 }, { "epoch": 0.99, "learning_rate": 6.751938147178117e-08, "loss": 0.6255, "step": 9498 }, { "epoch": 0.99, "learning_rate": 6.628631296883292e-08, "loss": 0.6551, "step": 9499 }, { "epoch": 0.99, "learning_rate": 6.506460415264259e-08, "loss": 0.5898, "step": 9500 }, { "epoch": 0.99, "learning_rate": 6.385425516208798e-08, "loss": 0.7092, "step": 9501 }, { "epoch": 0.99, "learning_rate": 6.265526613473683e-08, "loss": 0.7055, "step": 9502 }, { "epoch": 0.99, "learning_rate": 6.14676372068912e-08, "loss": 0.6714, "step": 9503 }, { "epoch": 0.99, "learning_rate": 6.029136851355421e-08, "loss": 0.6302, "step": 9504 }, { "epoch": 0.99, "learning_rate": 5.912646018841894e-08, "loss": 0.6529, "step": 9505 }, { "epoch": 0.99, "learning_rate": 5.797291236392388e-08, "loss": 0.6937, "step": 9506 }, { "epoch": 0.99, "learning_rate": 5.6830725171186374e-08, "loss": 0.6932, "step": 9507 }, { "epoch": 0.99, "learning_rate": 5.5699898740035894e-08, "loss": 0.7102, "step": 9508 }, { "epoch": 0.99, "learning_rate": 5.458043319902517e-08, "loss": 0.6727, "step": 9509 }, { "epoch": 0.99, "learning_rate": 5.347232867540797e-08, "loss": 0.6818, "step": 9510 }, { "epoch": 0.99, "learning_rate": 5.237558529512798e-08, "loss": 0.6614, "step": 9511 }, { "epoch": 0.99, "learning_rate": 5.129020318287436e-08, "loss": 0.6601, "step": 9512 }, { "epoch": 0.99, "learning_rate": 5.021618246201509e-08, "loss": 0.6647, "step": 9513 }, { "epoch": 0.99, "learning_rate": 4.91535232546414e-08, "loss": 0.6493, "step": 9514 }, { "epoch": 0.99, "learning_rate": 4.810222568153444e-08, "loss": 0.6921, "step": 9515 }, { "epoch": 0.99, "learning_rate": 4.706228986220973e-08, "loss": 0.649, "step": 9516 }, { "epoch": 0.99, "learning_rate": 4.603371591488381e-08, "loss": 0.65, "step": 9517 }, { "epoch": 0.99, "learning_rate": 4.5016503956463174e-08, "loss": 0.7071, "step": 9518 }, { "epoch": 0.99, "learning_rate": 4.4010654102588645e-08, "loss": 0.6659, "step": 9519 }, { "epoch": 0.99, "learning_rate": 4.301616646759099e-08, "loss": 0.7508, "step": 9520 }, { "epoch": 0.99, "learning_rate": 4.2033041164524225e-08, "loss": 0.69, "step": 9521 }, { "epoch": 0.99, "learning_rate": 4.106127830512119e-08, "loss": 0.7257, "step": 9522 }, { "epoch": 0.99, "learning_rate": 4.010087799987128e-08, "loss": 0.7134, "step": 9523 }, { "epoch": 0.99, "learning_rate": 3.9151840357931626e-08, "loss": 0.6572, "step": 9524 }, { "epoch": 0.99, "learning_rate": 3.821416548717149e-08, "loss": 0.7145, "step": 9525 }, { "epoch": 0.99, "learning_rate": 3.72878534941945e-08, "loss": 0.7151, "step": 9526 }, { "epoch": 0.99, "learning_rate": 3.6372904484294204e-08, "loss": 0.7346, "step": 9527 }, { "epoch": 0.99, "learning_rate": 3.546931856146518e-08, "loss": 0.6561, "step": 9528 }, { "epoch": 0.99, "learning_rate": 3.457709582843638e-08, "loss": 0.6922, "step": 9529 }, { "epoch": 0.99, "learning_rate": 3.3696236386615565e-08, "loss": 0.7074, "step": 9530 }, { "epoch": 0.99, "learning_rate": 3.282674033613375e-08, "loss": 0.6748, "step": 9531 }, { "epoch": 0.99, "learning_rate": 3.19686077758341e-08, "loss": 0.6429, "step": 9532 }, { "epoch": 0.99, "learning_rate": 3.1121838803260806e-08, "loss": 0.6817, "step": 9533 }, { "epoch": 0.99, "learning_rate": 3.02864335146591e-08, "loss": 0.6019, "step": 9534 }, { "epoch": 0.99, "learning_rate": 2.9462392004997453e-08, "loss": 0.617, "step": 9535 }, { "epoch": 0.99, "learning_rate": 2.8649714367956492e-08, "loss": 0.6733, "step": 9536 }, { "epoch": 0.99, "learning_rate": 2.784840069589567e-08, "loss": 0.6136, "step": 9537 }, { "epoch": 0.99, "learning_rate": 2.705845107991989e-08, "loss": 0.6068, "step": 9538 }, { "epoch": 0.99, "learning_rate": 2.627986560981288e-08, "loss": 0.6653, "step": 9539 }, { "epoch": 0.99, "learning_rate": 2.551264437408163e-08, "loss": 0.668, "step": 9540 }, { "epoch": 0.99, "learning_rate": 2.475678745993415e-08, "loss": 0.62, "step": 9541 }, { "epoch": 0.99, "learning_rate": 2.4012294953301705e-08, "loss": 0.5547, "step": 9542 }, { "epoch": 0.99, "learning_rate": 2.3279166938805496e-08, "loss": 0.6285, "step": 9543 }, { "epoch": 0.99, "learning_rate": 2.255740349977886e-08, "loss": 0.6234, "step": 9544 }, { "epoch": 0.99, "learning_rate": 2.1847004718267285e-08, "loss": 0.652, "step": 9545 }, { "epoch": 0.99, "learning_rate": 2.1147970675028384e-08, "loss": 0.6829, "step": 9546 }, { "epoch": 0.99, "learning_rate": 2.0460301449520824e-08, "loss": 0.6075, "step": 9547 }, { "epoch": 0.99, "learning_rate": 1.978399711991541e-08, "loss": 0.6706, "step": 9548 }, { "epoch": 0.99, "learning_rate": 1.911905776307288e-08, "loss": 0.5884, "step": 9549 }, { "epoch": 0.99, "learning_rate": 1.8465483454610522e-08, "loss": 0.6318, "step": 9550 }, { "epoch": 0.99, "learning_rate": 1.7823274268791157e-08, "loss": 0.6835, "step": 9551 }, { "epoch": 0.99, "learning_rate": 1.719243027862305e-08, "loss": 0.6565, "step": 9552 }, { "epoch": 0.99, "learning_rate": 1.657295155582661e-08, "loss": 0.6761, "step": 9553 }, { "epoch": 0.99, "learning_rate": 1.596483817081218e-08, "loss": 0.6068, "step": 9554 }, { "epoch": 0.99, "learning_rate": 1.5368090192702243e-08, "loss": 0.5882, "step": 9555 }, { "epoch": 0.99, "learning_rate": 1.4782707689342534e-08, "loss": 0.6242, "step": 9556 }, { "epoch": 0.99, "learning_rate": 1.4208690727257612e-08, "loss": 0.7206, "step": 9557 }, { "epoch": 0.99, "learning_rate": 1.3646039371706388e-08, "loss": 0.6129, "step": 9558 }, { "epoch": 1.0, "learning_rate": 1.3094753686648809e-08, "loss": 0.748, "step": 9559 }, { "epoch": 1.0, "learning_rate": 1.2554833734756965e-08, "loss": 0.6729, "step": 9560 }, { "epoch": 1.0, "learning_rate": 1.2026279577381783e-08, "loss": 0.747, "step": 9561 }, { "epoch": 1.0, "learning_rate": 1.1509091274630735e-08, "loss": 0.669, "step": 9562 }, { "epoch": 1.0, "learning_rate": 1.1003268885279028e-08, "loss": 0.6591, "step": 9563 }, { "epoch": 1.0, "learning_rate": 1.0508812466825112e-08, "loss": 0.6705, "step": 9564 }, { "epoch": 1.0, "learning_rate": 1.0025722075479583e-08, "loss": 0.6642, "step": 9565 }, { "epoch": 1.0, "learning_rate": 9.553997766165168e-09, "loss": 0.5728, "step": 9566 }, { "epoch": 1.0, "learning_rate": 9.093639592483439e-09, "loss": 0.6682, "step": 9567 }, { "epoch": 1.0, "learning_rate": 8.644647606770307e-09, "loss": 0.6687, "step": 9568 }, { "epoch": 1.0, "learning_rate": 8.207021860073827e-09, "loss": 0.6263, "step": 9569 }, { "epoch": 1.0, "learning_rate": 7.780762402131991e-09, "loss": 0.6505, "step": 9570 }, { "epoch": 1.0, "learning_rate": 7.365869281406035e-09, "loss": 0.6777, "step": 9571 }, { "epoch": 1.0, "learning_rate": 6.962342545047129e-09, "loss": 0.6794, "step": 9572 }, { "epoch": 1.0, "learning_rate": 6.570182238929689e-09, "loss": 0.5929, "step": 9573 }, { "epoch": 1.0, "learning_rate": 6.189388407629171e-09, "loss": 0.6814, "step": 9574 }, { "epoch": 1.0, "learning_rate": 5.819961094433168e-09, "loss": 0.723, "step": 9575 }, { "epoch": 1.0, "learning_rate": 5.461900341341419e-09, "loss": 0.6309, "step": 9576 }, { "epoch": 1.0, "learning_rate": 5.1152061890547e-09, "loss": 0.5747, "step": 9577 }, { "epoch": 1.0, "learning_rate": 4.779878676974825e-09, "loss": 0.6523, "step": 9578 }, { "epoch": 1.0, "learning_rate": 4.4559178432157514e-09, "loss": 0.6159, "step": 9579 }, { "epoch": 1.0, "learning_rate": 4.143323724614678e-09, "loss": 0.6756, "step": 9580 }, { "epoch": 1.0, "learning_rate": 3.842096356698743e-09, "loss": 0.6822, "step": 9581 }, { "epoch": 1.0, "learning_rate": 3.5522357737072243e-09, "loss": 0.6457, "step": 9582 }, { "epoch": 1.0, "learning_rate": 3.2737420086026425e-09, "loss": 0.7219, "step": 9583 }, { "epoch": 1.0, "learning_rate": 3.0066150930152524e-09, "loss": 0.6506, "step": 9584 }, { "epoch": 1.0, "learning_rate": 2.7508550573318583e-09, "loss": 0.6174, "step": 9585 }, { "epoch": 1.0, "learning_rate": 2.5064619306292005e-09, "loss": 0.7331, "step": 9586 }, { "epoch": 1.0, "learning_rate": 2.273435740673957e-09, "loss": 0.715, "step": 9587 }, { "epoch": 1.0, "learning_rate": 2.0517765139560497e-09, "loss": 0.5992, "step": 9588 }, { "epoch": 1.0, "learning_rate": 1.8414842756775408e-09, "loss": 0.6738, "step": 9589 }, { "epoch": 1.0, "learning_rate": 1.64255904973043e-09, "loss": 0.6459, "step": 9590 }, { "epoch": 1.0, "learning_rate": 1.4550008587521647e-09, "loss": 0.6493, "step": 9591 }, { "epoch": 1.0, "learning_rate": 1.2788097240368224e-09, "loss": 0.599, "step": 9592 }, { "epoch": 1.0, "learning_rate": 1.113985665623929e-09, "loss": 0.7196, "step": 9593 }, { "epoch": 1.0, "learning_rate": 9.605287022540488e-10, "loss": 0.6364, "step": 9594 }, { "epoch": 1.0, "learning_rate": 8.184388513576835e-10, "loss": 0.6683, "step": 9595 }, { "epoch": 1.0, "learning_rate": 6.877161290996803e-10, "loss": 0.6552, "step": 9596 }, { "epoch": 1.0, "learning_rate": 5.683605503348232e-10, "loss": 0.6066, "step": 9597 }, { "epoch": 1.0, "learning_rate": 4.6037212863003775e-10, "loss": 0.6859, "step": 9598 }, { "epoch": 1.0, "learning_rate": 3.637508762643904e-10, "loss": 0.605, "step": 9599 }, { "epoch": 1.0, "learning_rate": 2.784968042068847e-10, "loss": 0.6389, "step": 9600 }, { "epoch": 1.0, "learning_rate": 2.0460992216086993e-10, "loss": 0.7023, "step": 9601 }, { "epoch": 1.0, "learning_rate": 1.4209023853073432e-10, "loss": 0.6473, "step": 9602 }, { "epoch": 1.0, "learning_rate": 9.093776041080304e-11, "loss": 0.6474, "step": 9603 }, { "epoch": 1.0, "learning_rate": 5.1152493629746944e-11, "loss": 0.6888, "step": 9604 }, { "epoch": 1.0, "learning_rate": 2.2734442683969292e-11, "loss": 0.6564, "step": 9605 }, { "epoch": 1.0, "learning_rate": 5.683610837525777e-12, "loss": 0.6433, "step": 9606 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 0.649, "step": 9607 }, { "epoch": 1.0, "step": 9607, "total_flos": 2548396022218752.0, "train_loss": 0.6906294351352716, "train_runtime": 75940.5246, "train_samples_per_second": 16.192, "train_steps_per_second": 0.127 } ], "logging_steps": 1.0, "max_steps": 9607, "num_input_tokens_seen": 0, "num_train_epochs": 1, "save_steps": 100000, "total_flos": 2548396022218752.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }