{"current_steps": 10, "total_steps": 4632, "loss": 1.0408, "learning_rate": 2.1551724137931036e-07, "epoch": 0.008629989212513484, "percentage": 0.22, "elapsed_time": "0:01:35", "remaining_time": "12:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 4632, "loss": 1.047, "learning_rate": 4.3103448275862073e-07, "epoch": 0.017259978425026967, "percentage": 0.43, "elapsed_time": "0:02:44", "remaining_time": "10:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 4632, "loss": 1.0718, "learning_rate": 6.465517241379311e-07, "epoch": 0.025889967637540454, "percentage": 0.65, "elapsed_time": "0:04:07", "remaining_time": "10:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 4632, "loss": 1.0488, "learning_rate": 8.620689655172415e-07, "epoch": 0.034519956850053934, "percentage": 0.86, "elapsed_time": "0:05:32", "remaining_time": "10:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 4632, "loss": 1.075, "learning_rate": 1.0775862068965518e-06, "epoch": 0.043149946062567425, "percentage": 1.08, "elapsed_time": "0:06:50", "remaining_time": "10:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 4632, "eval_loss": 1.018173336982727, "epoch": 0.043149946062567425, "percentage": 1.08, "elapsed_time": "0:12:13", "remaining_time": "18:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 4632, "loss": 1.1389, "learning_rate": 1.2931034482758623e-06, "epoch": 0.05177993527508091, "percentage": 1.3, "elapsed_time": "0:13:09", "remaining_time": "16:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 4632, "loss": 1.1116, "learning_rate": 1.5086206896551726e-06, "epoch": 0.06040992448759439, "percentage": 1.51, "elapsed_time": "0:14:12", "remaining_time": "15:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 4632, "loss": 1.0697, "learning_rate": 1.724137931034483e-06, "epoch": 0.06903991370010787, "percentage": 1.73, "elapsed_time": "0:15:42", "remaining_time": "14:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 4632, "loss": 1.0242, "learning_rate": 1.9396551724137932e-06, "epoch": 0.07766990291262135, "percentage": 1.94, "elapsed_time": "0:16:47", "remaining_time": "14:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 4632, "loss": 1.0505, "learning_rate": 2.1551724137931035e-06, "epoch": 0.08629989212513485, "percentage": 2.16, "elapsed_time": "0:18:03", "remaining_time": "13:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 4632, "eval_loss": 0.9943639039993286, "epoch": 0.08629989212513485, "percentage": 2.16, "elapsed_time": "0:23:25", "remaining_time": "17:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 4632, "loss": 1.0073, "learning_rate": 2.370689655172414e-06, "epoch": 0.09492988133764833, "percentage": 2.37, "elapsed_time": "0:24:47", "remaining_time": "16:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 4632, "loss": 0.9802, "learning_rate": 2.5862068965517246e-06, "epoch": 0.10355987055016182, "percentage": 2.59, "elapsed_time": "0:26:00", "remaining_time": "16:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 4632, "loss": 0.9827, "learning_rate": 2.8017241379310345e-06, "epoch": 0.1121898597626753, "percentage": 2.81, "elapsed_time": "0:27:41", "remaining_time": "15:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 4632, "loss": 1.0015, "learning_rate": 3.017241379310345e-06, "epoch": 0.12081984897518878, "percentage": 3.02, "elapsed_time": "0:28:57", "remaining_time": "15:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 4632, "loss": 0.9387, "learning_rate": 3.2327586206896555e-06, "epoch": 0.12944983818770225, "percentage": 3.24, "elapsed_time": "0:30:18", "remaining_time": "15:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 4632, "eval_loss": 0.9101472496986389, "epoch": 0.12944983818770225, "percentage": 3.24, "elapsed_time": "0:35:40", "remaining_time": "17:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 4632, "loss": 0.9255, "learning_rate": 3.448275862068966e-06, "epoch": 0.13807982740021574, "percentage": 3.45, "elapsed_time": "0:37:16", "remaining_time": "17:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 4632, "loss": 0.8775, "learning_rate": 3.663793103448276e-06, "epoch": 0.14670981661272922, "percentage": 3.67, "elapsed_time": "0:38:44", "remaining_time": "16:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 4632, "loss": 0.8675, "learning_rate": 3.8793103448275865e-06, "epoch": 0.1553398058252427, "percentage": 3.89, "elapsed_time": "0:40:20", "remaining_time": "16:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 4632, "loss": 0.9728, "learning_rate": 4.094827586206897e-06, "epoch": 0.16396979503775622, "percentage": 4.1, "elapsed_time": "0:41:23", "remaining_time": "16:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 4632, "loss": 0.92, "learning_rate": 4.310344827586207e-06, "epoch": 0.1725997842502697, "percentage": 4.32, "elapsed_time": "0:42:39", "remaining_time": "15:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 4632, "eval_loss": 0.9019931554794312, "epoch": 0.1725997842502697, "percentage": 4.32, "elapsed_time": "0:48:01", "remaining_time": "17:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 4632, "loss": 0.9633, "learning_rate": 4.525862068965518e-06, "epoch": 0.18122977346278318, "percentage": 4.53, "elapsed_time": "0:49:16", "remaining_time": "17:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 4632, "loss": 0.9646, "learning_rate": 4.741379310344828e-06, "epoch": 0.18985976267529667, "percentage": 4.75, "elapsed_time": "0:50:23", "remaining_time": "16:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 4632, "loss": 0.9956, "learning_rate": 4.9568965517241384e-06, "epoch": 0.19848975188781015, "percentage": 4.97, "elapsed_time": "0:51:39", "remaining_time": "16:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 4632, "loss": 0.8929, "learning_rate": 5.172413793103449e-06, "epoch": 0.20711974110032363, "percentage": 5.18, "elapsed_time": "0:53:11", "remaining_time": "16:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 4632, "loss": 0.9531, "learning_rate": 5.38793103448276e-06, "epoch": 0.21574973031283712, "percentage": 5.4, "elapsed_time": "0:54:35", "remaining_time": "15:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 4632, "eval_loss": 0.886761486530304, "epoch": 0.21574973031283712, "percentage": 5.4, "elapsed_time": "0:59:57", "remaining_time": "17:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 4632, "loss": 0.9716, "learning_rate": 5.603448275862069e-06, "epoch": 0.2243797195253506, "percentage": 5.61, "elapsed_time": "1:01:26", "remaining_time": "17:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 4632, "loss": 0.9407, "learning_rate": 5.81896551724138e-06, "epoch": 0.23300970873786409, "percentage": 5.83, "elapsed_time": "1:02:39", "remaining_time": "16:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 4632, "loss": 0.9464, "learning_rate": 6.03448275862069e-06, "epoch": 0.24163969795037757, "percentage": 6.04, "elapsed_time": "1:03:42", "remaining_time": "16:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 4632, "loss": 0.9151, "learning_rate": 6.25e-06, "epoch": 0.25026968716289105, "percentage": 6.26, "elapsed_time": "1:05:19", "remaining_time": "16:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 4632, "loss": 0.849, "learning_rate": 6.465517241379311e-06, "epoch": 0.2588996763754045, "percentage": 6.48, "elapsed_time": "1:06:42", "remaining_time": "16:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 4632, "eval_loss": 0.856666088104248, "epoch": 0.2588996763754045, "percentage": 6.48, "elapsed_time": "1:12:03", "remaining_time": "17:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 4632, "loss": 1.0237, "learning_rate": 6.681034482758622e-06, "epoch": 0.267529665587918, "percentage": 6.69, "elapsed_time": "1:13:17", "remaining_time": "17:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 4632, "loss": 0.8401, "learning_rate": 6.896551724137932e-06, "epoch": 0.2761596548004315, "percentage": 6.91, "elapsed_time": "1:14:34", "remaining_time": "16:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 4632, "loss": 0.9366, "learning_rate": 7.1120689655172415e-06, "epoch": 0.284789644012945, "percentage": 7.12, "elapsed_time": "1:16:02", "remaining_time": "16:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 4632, "loss": 0.8198, "learning_rate": 7.327586206896552e-06, "epoch": 0.29341963322545844, "percentage": 7.34, "elapsed_time": "1:17:26", "remaining_time": "16:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 4632, "loss": 0.8897, "learning_rate": 7.543103448275862e-06, "epoch": 0.30204962243797195, "percentage": 7.56, "elapsed_time": "1:18:42", "remaining_time": "16:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 4632, "eval_loss": 0.8523032069206238, "epoch": 0.30204962243797195, "percentage": 7.56, "elapsed_time": "1:24:04", "remaining_time": "17:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 4632, "loss": 0.8352, "learning_rate": 7.758620689655173e-06, "epoch": 0.3106796116504854, "percentage": 7.77, "elapsed_time": "1:25:28", "remaining_time": "16:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 4632, "loss": 0.7918, "learning_rate": 7.974137931034484e-06, "epoch": 0.3193096008629989, "percentage": 7.99, "elapsed_time": "1:26:52", "remaining_time": "16:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 4632, "loss": 0.9004, "learning_rate": 8.189655172413794e-06, "epoch": 0.32793959007551243, "percentage": 8.2, "elapsed_time": "1:28:01", "remaining_time": "16:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 4632, "loss": 0.8079, "learning_rate": 8.405172413793105e-06, "epoch": 0.3365695792880259, "percentage": 8.42, "elapsed_time": "1:29:28", "remaining_time": "16:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 4632, "loss": 0.8512, "learning_rate": 8.620689655172414e-06, "epoch": 0.3451995685005394, "percentage": 8.64, "elapsed_time": "1:30:41", "remaining_time": "15:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 4632, "eval_loss": 0.8104857206344604, "epoch": 0.3451995685005394, "percentage": 8.64, "elapsed_time": "1:36:03", "remaining_time": "16:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 4632, "loss": 0.8049, "learning_rate": 8.836206896551725e-06, "epoch": 0.35382955771305286, "percentage": 8.85, "elapsed_time": "1:37:17", "remaining_time": "16:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 4632, "loss": 0.7887, "learning_rate": 9.051724137931036e-06, "epoch": 0.36245954692556637, "percentage": 9.07, "elapsed_time": "1:38:26", "remaining_time": "16:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 4632, "loss": 0.8286, "learning_rate": 9.267241379310346e-06, "epoch": 0.3710895361380798, "percentage": 9.28, "elapsed_time": "1:39:50", "remaining_time": "16:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 4632, "loss": 0.8201, "learning_rate": 9.482758620689655e-06, "epoch": 0.37971952535059333, "percentage": 9.5, "elapsed_time": "1:41:04", "remaining_time": "16:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 4632, "loss": 0.7854, "learning_rate": 9.698275862068966e-06, "epoch": 0.3883495145631068, "percentage": 9.72, "elapsed_time": "1:42:19", "remaining_time": "15:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 4632, "eval_loss": 0.7994323372840881, "epoch": 0.3883495145631068, "percentage": 9.72, "elapsed_time": "1:47:41", "remaining_time": "16:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 4632, "loss": 0.8339, "learning_rate": 9.913793103448277e-06, "epoch": 0.3969795037756203, "percentage": 9.93, "elapsed_time": "1:48:42", "remaining_time": "16:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 4632, "loss": 0.8063, "learning_rate": 9.9999488687872e-06, "epoch": 0.40560949298813376, "percentage": 10.15, "elapsed_time": "1:49:59", "remaining_time": "16:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 4632, "loss": 0.8554, "learning_rate": 9.999636404051638e-06, "epoch": 0.41423948220064727, "percentage": 10.36, "elapsed_time": "1:51:13", "remaining_time": "16:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 4632, "loss": 0.9297, "learning_rate": 9.999039898540166e-06, "epoch": 0.4228694714131607, "percentage": 10.58, "elapsed_time": "1:52:29", "remaining_time": "15:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 4632, "loss": 0.8147, "learning_rate": 9.998159386141626e-06, "epoch": 0.43149946062567424, "percentage": 10.79, "elapsed_time": "1:53:46", "remaining_time": "15:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 4632, "eval_loss": 0.7859384417533875, "epoch": 0.43149946062567424, "percentage": 10.79, "elapsed_time": "1:59:08", "remaining_time": "16:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 4632, "loss": 0.8449, "learning_rate": 9.996994916879941e-06, "epoch": 0.4401294498381877, "percentage": 11.01, "elapsed_time": "2:00:32", "remaining_time": "16:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 4632, "loss": 0.779, "learning_rate": 9.995546556911271e-06, "epoch": 0.4487594390507012, "percentage": 11.23, "elapsed_time": "2:01:38", "remaining_time": "16:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 4632, "loss": 0.7262, "learning_rate": 9.99381438852026e-06, "epoch": 0.45738942826321466, "percentage": 11.44, "elapsed_time": "2:02:53", "remaining_time": "15:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 4632, "loss": 0.8282, "learning_rate": 9.991798510115351e-06, "epoch": 0.46601941747572817, "percentage": 11.66, "elapsed_time": "2:04:08", "remaining_time": "15:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 4632, "loss": 0.8075, "learning_rate": 9.989499036223209e-06, "epoch": 0.4746494066882416, "percentage": 11.87, "elapsed_time": "2:05:40", "remaining_time": "15:32:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 4632, "eval_loss": 0.7565743923187256, "epoch": 0.4746494066882416, "percentage": 11.87, "elapsed_time": "2:11:02", "remaining_time": "16:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 4632, "loss": 0.7747, "learning_rate": 9.986916097482204e-06, "epoch": 0.48327939590075514, "percentage": 12.09, "elapsed_time": "2:12:08", "remaining_time": "16:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 4632, "loss": 0.7563, "learning_rate": 9.98404984063499e-06, "epoch": 0.4919093851132686, "percentage": 12.31, "elapsed_time": "2:13:28", "remaining_time": "15:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 4632, "loss": 0.7819, "learning_rate": 9.980900428520171e-06, "epoch": 0.5005393743257821, "percentage": 12.52, "elapsed_time": "2:14:35", "remaining_time": "15:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 4632, "loss": 0.7777, "learning_rate": 9.977468040063054e-06, "epoch": 0.5091693635382956, "percentage": 12.74, "elapsed_time": "2:15:58", "remaining_time": "15:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 4632, "loss": 0.8282, "learning_rate": 9.973752870265473e-06, "epoch": 0.517799352750809, "percentage": 12.95, "elapsed_time": "2:17:15", "remaining_time": "15:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 4632, "eval_loss": 0.7454360127449036, "epoch": 0.517799352750809, "percentage": 12.95, "elapsed_time": "2:22:36", "remaining_time": "15:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 4632, "loss": 0.7907, "learning_rate": 9.96975513019472e-06, "epoch": 0.5264293419633226, "percentage": 13.17, "elapsed_time": "2:23:51", "remaining_time": "15:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 4632, "loss": 0.8475, "learning_rate": 9.965475046971548e-06, "epoch": 0.535059331175836, "percentage": 13.39, "elapsed_time": "2:25:08", "remaining_time": "15:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 4632, "loss": 0.7363, "learning_rate": 9.960912863757273e-06, "epoch": 0.5436893203883495, "percentage": 13.6, "elapsed_time": "2:26:40", "remaining_time": "15:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 4632, "loss": 0.8291, "learning_rate": 9.956068839739955e-06, "epoch": 0.552319309600863, "percentage": 13.82, "elapsed_time": "2:27:48", "remaining_time": "15:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 4632, "loss": 0.7524, "learning_rate": 9.950943250119674e-06, "epoch": 0.5609492988133765, "percentage": 14.03, "elapsed_time": "2:29:03", "remaining_time": "15:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 4632, "eval_loss": 0.7317044138908386, "epoch": 0.5609492988133765, "percentage": 14.03, "elapsed_time": "2:34:24", "remaining_time": "15:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 4632, "loss": 0.7319, "learning_rate": 9.945536386092893e-06, "epoch": 0.56957928802589, "percentage": 14.25, "elapsed_time": "2:36:00", "remaining_time": "15:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 4632, "loss": 0.6644, "learning_rate": 9.939848554835927e-06, "epoch": 0.5782092772384034, "percentage": 14.46, "elapsed_time": "2:37:13", "remaining_time": "15:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 4632, "loss": 0.8749, "learning_rate": 9.93388007948747e-06, "epoch": 0.5868392664509169, "percentage": 14.68, "elapsed_time": "2:38:19", "remaining_time": "15:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 4632, "loss": 0.8157, "learning_rate": 9.927631299130254e-06, "epoch": 0.5954692556634305, "percentage": 14.9, "elapsed_time": "2:39:47", "remaining_time": "15:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 4632, "loss": 0.7338, "learning_rate": 9.921102568771781e-06, "epoch": 0.6040992448759439, "percentage": 15.11, "elapsed_time": "2:40:59", "remaining_time": "15:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 4632, "eval_loss": 0.7266865968704224, "epoch": 0.6040992448759439, "percentage": 15.11, "elapsed_time": "2:46:21", "remaining_time": "15:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 4632, "loss": 0.7609, "learning_rate": 9.914294259324149e-06, "epoch": 0.6127292340884574, "percentage": 15.33, "elapsed_time": "2:47:49", "remaining_time": "15:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 4632, "loss": 0.7681, "learning_rate": 9.907206757582987e-06, "epoch": 0.6213592233009708, "percentage": 15.54, "elapsed_time": "2:48:56", "remaining_time": "15:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 4632, "loss": 0.8052, "learning_rate": 9.899840466205473e-06, "epoch": 0.6299892125134844, "percentage": 15.76, "elapsed_time": "2:50:22", "remaining_time": "15:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 4632, "loss": 0.739, "learning_rate": 9.892195803687464e-06, "epoch": 0.6386192017259978, "percentage": 15.98, "elapsed_time": "2:51:39", "remaining_time": "15:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 4632, "loss": 0.7909, "learning_rate": 9.884273204339716e-06, "epoch": 0.6472491909385113, "percentage": 16.19, "elapsed_time": "2:53:11", "remaining_time": "14:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 4632, "eval_loss": 0.7110950350761414, "epoch": 0.6472491909385113, "percentage": 16.19, "elapsed_time": "2:58:32", "remaining_time": "15:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 4632, "loss": 0.8172, "learning_rate": 9.876073118263216e-06, "epoch": 0.6558791801510249, "percentage": 16.41, "elapsed_time": "3:00:02", "remaining_time": "15:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 4632, "loss": 0.7901, "learning_rate": 9.867596011323602e-06, "epoch": 0.6645091693635383, "percentage": 16.62, "elapsed_time": "3:01:29", "remaining_time": "15:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 4632, "loss": 0.7284, "learning_rate": 9.858842365124702e-06, "epoch": 0.6731391585760518, "percentage": 16.84, "elapsed_time": "3:03:07", "remaining_time": "15:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 4632, "loss": 0.7501, "learning_rate": 9.849812676981172e-06, "epoch": 0.6817691477885652, "percentage": 17.06, "elapsed_time": "3:04:16", "remaining_time": "14:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 4632, "loss": 0.7783, "learning_rate": 9.840507459890244e-06, "epoch": 0.6903991370010788, "percentage": 17.27, "elapsed_time": "3:05:16", "remaining_time": "14:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 4632, "eval_loss": 0.7211207151412964, "epoch": 0.6903991370010788, "percentage": 17.27, "elapsed_time": "3:10:37", "remaining_time": "15:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 4632, "loss": 0.6965, "learning_rate": 9.830927242502575e-06, "epoch": 0.6990291262135923, "percentage": 17.49, "elapsed_time": "3:11:46", "remaining_time": "15:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 4632, "loss": 0.77, "learning_rate": 9.821072569092223e-06, "epoch": 0.7076591154261057, "percentage": 17.7, "elapsed_time": "3:13:09", "remaining_time": "14:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 4632, "loss": 0.7158, "learning_rate": 9.810943999525714e-06, "epoch": 0.7162891046386192, "percentage": 17.92, "elapsed_time": "3:14:19", "remaining_time": "14:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 4632, "loss": 0.6938, "learning_rate": 9.800542109230247e-06, "epoch": 0.7249190938511327, "percentage": 18.13, "elapsed_time": "3:15:30", "remaining_time": "14:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 4632, "loss": 0.7895, "learning_rate": 9.78986748916099e-06, "epoch": 0.7335490830636462, "percentage": 18.35, "elapsed_time": "3:16:44", "remaining_time": "14:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 4632, "eval_loss": 0.7069711685180664, "epoch": 0.7335490830636462, "percentage": 18.35, "elapsed_time": "3:22:06", "remaining_time": "14:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 4632, "loss": 0.6717, "learning_rate": 9.778920745767524e-06, "epoch": 0.7421790722761596, "percentage": 18.57, "elapsed_time": "3:23:30", "remaining_time": "14:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 4632, "loss": 0.7353, "learning_rate": 9.767702500959365e-06, "epoch": 0.7508090614886731, "percentage": 18.78, "elapsed_time": "3:24:51", "remaining_time": "14:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 4632, "loss": 0.7315, "learning_rate": 9.756213392070654e-06, "epoch": 0.7594390507011867, "percentage": 19.0, "elapsed_time": "3:26:08", "remaining_time": "14:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 4632, "loss": 0.6777, "learning_rate": 9.744454071823936e-06, "epoch": 0.7680690399137001, "percentage": 19.21, "elapsed_time": "3:27:41", "remaining_time": "14:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 4632, "loss": 0.6881, "learning_rate": 9.732425208293083e-06, "epoch": 0.7766990291262136, "percentage": 19.43, "elapsed_time": "3:28:47", "remaining_time": "14:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 4632, "eval_loss": 0.7709933519363403, "epoch": 0.7766990291262136, "percentage": 19.43, "elapsed_time": "3:34:08", "remaining_time": "14:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 4632, "loss": 0.7973, "learning_rate": 9.720127484865336e-06, "epoch": 0.785329018338727, "percentage": 19.65, "elapsed_time": "3:35:10", "remaining_time": "14:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 4632, "loss": 0.6946, "learning_rate": 9.707561600202481e-06, "epoch": 0.7939590075512406, "percentage": 19.86, "elapsed_time": "3:36:21", "remaining_time": "14:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 4632, "loss": 0.7697, "learning_rate": 9.694728268201162e-06, "epoch": 0.8025889967637541, "percentage": 20.08, "elapsed_time": "3:37:58", "remaining_time": "14:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 4632, "loss": 0.7183, "learning_rate": 9.681628217952308e-06, "epoch": 0.8112189859762675, "percentage": 20.29, "elapsed_time": "3:39:25", "remaining_time": "14:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 4632, "loss": 0.7137, "learning_rate": 9.668262193699731e-06, "epoch": 0.819848975188781, "percentage": 20.51, "elapsed_time": "3:40:49", "remaining_time": "14:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 4632, "eval_loss": 0.6908486485481262, "epoch": 0.819848975188781, "percentage": 20.51, "elapsed_time": "3:46:10", "remaining_time": "14:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 4632, "loss": 0.7166, "learning_rate": 9.65463095479783e-06, "epoch": 0.8284789644012945, "percentage": 20.73, "elapsed_time": "3:47:15", "remaining_time": "14:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 4632, "loss": 0.7713, "learning_rate": 9.640735275668453e-06, "epoch": 0.837108953613808, "percentage": 20.94, "elapsed_time": "3:48:25", "remaining_time": "14:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 4632, "loss": 0.7101, "learning_rate": 9.62657594575691e-06, "epoch": 0.8457389428263214, "percentage": 21.16, "elapsed_time": "3:49:37", "remaining_time": "14:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 4632, "loss": 0.741, "learning_rate": 9.6121537694871e-06, "epoch": 0.8543689320388349, "percentage": 21.37, "elapsed_time": "3:50:57", "remaining_time": "14:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 4632, "loss": 0.6924, "learning_rate": 9.597469566215841e-06, "epoch": 0.8629989212513485, "percentage": 21.59, "elapsed_time": "3:52:27", "remaining_time": "14:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 4632, "eval_loss": 0.6857309341430664, "epoch": 0.8629989212513485, "percentage": 21.59, "elapsed_time": "3:57:48", "remaining_time": "14:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 4632, "loss": 0.6936, "learning_rate": 9.582524170186294e-06, "epoch": 0.8716289104638619, "percentage": 21.8, "elapsed_time": "3:59:16", "remaining_time": "14:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 4632, "loss": 0.6853, "learning_rate": 9.567318430480579e-06, "epoch": 0.8802588996763754, "percentage": 22.02, "elapsed_time": "4:00:54", "remaining_time": "14:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 4632, "loss": 0.6846, "learning_rate": 9.55185321097154e-06, "epoch": 0.8888888888888888, "percentage": 22.24, "elapsed_time": "4:02:18", "remaining_time": "14:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 4632, "loss": 0.7125, "learning_rate": 9.536129390273659e-06, "epoch": 0.8975188781014024, "percentage": 22.45, "elapsed_time": "4:03:51", "remaining_time": "14:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 4632, "loss": 0.7275, "learning_rate": 9.520147861693138e-06, "epoch": 0.9061488673139159, "percentage": 22.67, "elapsed_time": "4:05:18", "remaining_time": "13:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 4632, "eval_loss": 0.6835415959358215, "epoch": 0.9061488673139159, "percentage": 22.67, "elapsed_time": "4:10:39", "remaining_time": "14:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 4632, "loss": 0.7286, "learning_rate": 9.503909533177162e-06, "epoch": 0.9147788565264293, "percentage": 22.88, "elapsed_time": "4:11:54", "remaining_time": "14:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 4632, "loss": 0.7012, "learning_rate": 9.487415327262303e-06, "epoch": 0.9234088457389428, "percentage": 23.1, "elapsed_time": "4:13:16", "remaining_time": "14:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 4632, "loss": 0.7057, "learning_rate": 9.470666181022114e-06, "epoch": 0.9320388349514563, "percentage": 23.32, "elapsed_time": "4:14:41", "remaining_time": "13:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 4632, "loss": 0.7165, "learning_rate": 9.453663046013889e-06, "epoch": 0.9406688241639698, "percentage": 23.53, "elapsed_time": "4:16:03", "remaining_time": "13:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 4632, "loss": 0.67, "learning_rate": 9.436406888224603e-06, "epoch": 0.9492988133764833, "percentage": 23.75, "elapsed_time": "4:17:24", "remaining_time": "13:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 4632, "eval_loss": 0.6888366341590881, "epoch": 0.9492988133764833, "percentage": 23.75, "elapsed_time": "4:22:45", "remaining_time": "14:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 4632, "loss": 0.7177, "learning_rate": 9.418898688016042e-06, "epoch": 0.9579288025889967, "percentage": 23.96, "elapsed_time": "4:24:01", "remaining_time": "13:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 4632, "loss": 0.6841, "learning_rate": 9.40113944006909e-06, "epoch": 0.9665587918015103, "percentage": 24.18, "elapsed_time": "4:25:27", "remaining_time": "13:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 4632, "loss": 0.6808, "learning_rate": 9.383130153327231e-06, "epoch": 0.9751887810140237, "percentage": 24.4, "elapsed_time": "4:26:44", "remaining_time": "13:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 4632, "loss": 0.7059, "learning_rate": 9.36487185093922e-06, "epoch": 0.9838187702265372, "percentage": 24.61, "elapsed_time": "4:27:57", "remaining_time": "13:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 4632, "loss": 0.6787, "learning_rate": 9.34636557020097e-06, "epoch": 0.9924487594390508, "percentage": 24.83, "elapsed_time": "4:29:24", "remaining_time": "13:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 4632, "eval_loss": 0.6860348582267761, "epoch": 0.9924487594390508, "percentage": 24.83, "elapsed_time": "4:34:45", "remaining_time": "13:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 4632, "loss": 0.6904, "learning_rate": 9.327612362496601e-06, "epoch": 1.0010787486515642, "percentage": 25.04, "elapsed_time": "4:35:53", "remaining_time": "13:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 4632, "loss": 0.7516, "learning_rate": 9.308613293238722e-06, "epoch": 1.0097087378640777, "percentage": 25.26, "elapsed_time": "4:37:22", "remaining_time": "13:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 4632, "loss": 0.7105, "learning_rate": 9.2893694418079e-06, "epoch": 1.0183387270765911, "percentage": 25.47, "elapsed_time": "4:38:34", "remaining_time": "13:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 4632, "loss": 0.67, "learning_rate": 9.269881901491335e-06, "epoch": 1.0269687162891046, "percentage": 25.69, "elapsed_time": "4:40:01", "remaining_time": "13:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 4632, "loss": 0.7012, "learning_rate": 9.250151779420756e-06, "epoch": 1.035598705501618, "percentage": 25.91, "elapsed_time": "4:41:23", "remaining_time": "13:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 4632, "eval_loss": 0.6847370266914368, "epoch": 1.035598705501618, "percentage": 25.91, "elapsed_time": "4:46:44", "remaining_time": "13:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 4632, "loss": 0.6726, "learning_rate": 9.230180196509506e-06, "epoch": 1.0442286947141317, "percentage": 26.12, "elapsed_time": "4:48:15", "remaining_time": "13:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 4632, "loss": 0.6737, "learning_rate": 9.209968287388878e-06, "epoch": 1.0528586839266452, "percentage": 26.34, "elapsed_time": "4:49:53", "remaining_time": "13:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 4632, "loss": 0.6421, "learning_rate": 9.189517200343643e-06, "epoch": 1.0614886731391586, "percentage": 26.55, "elapsed_time": "4:51:19", "remaining_time": "13:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 4632, "loss": 0.7709, "learning_rate": 9.168828097246819e-06, "epoch": 1.070118662351672, "percentage": 26.77, "elapsed_time": "4:52:22", "remaining_time": "13:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 4632, "loss": 0.6765, "learning_rate": 9.147902153493659e-06, "epoch": 1.0787486515641855, "percentage": 26.99, "elapsed_time": "4:53:24", "remaining_time": "13:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 4632, "eval_loss": 0.6961000561714172, "epoch": 1.0787486515641855, "percentage": 26.99, "elapsed_time": "4:58:45", "remaining_time": "13:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 4632, "loss": 0.6551, "learning_rate": 9.126740557934874e-06, "epoch": 1.087378640776699, "percentage": 27.2, "elapsed_time": "4:59:51", "remaining_time": "13:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 4632, "loss": 0.6606, "learning_rate": 9.105344512809097e-06, "epoch": 1.0960086299892124, "percentage": 27.42, "elapsed_time": "5:01:20", "remaining_time": "13:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 4632, "loss": 0.7058, "learning_rate": 9.083715233674572e-06, "epoch": 1.104638619201726, "percentage": 27.63, "elapsed_time": "5:02:33", "remaining_time": "13:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 4632, "loss": 0.6577, "learning_rate": 9.061853949340104e-06, "epoch": 1.1132686084142396, "percentage": 27.85, "elapsed_time": "5:03:41", "remaining_time": "13:06:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 4632, "loss": 0.7052, "learning_rate": 9.039761901795241e-06, "epoch": 1.121898597626753, "percentage": 28.07, "elapsed_time": "5:04:52", "remaining_time": "13:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 4632, "eval_loss": 0.6881099939346313, "epoch": 1.121898597626753, "percentage": 28.07, "elapsed_time": "5:10:13", "remaining_time": "13:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 4632, "loss": 0.681, "learning_rate": 9.017440346139718e-06, "epoch": 1.1305285868392665, "percentage": 28.28, "elapsed_time": "5:11:18", "remaining_time": "13:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 4632, "loss": 0.7117, "learning_rate": 8.994890550512152e-06, "epoch": 1.13915857605178, "percentage": 28.5, "elapsed_time": "5:12:41", "remaining_time": "13:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 4632, "loss": 0.7058, "learning_rate": 8.972113796017992e-06, "epoch": 1.1477885652642934, "percentage": 28.71, "elapsed_time": "5:14:04", "remaining_time": "12:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 4632, "loss": 0.6867, "learning_rate": 8.949111376656741e-06, "epoch": 1.1564185544768069, "percentage": 28.93, "elapsed_time": "5:15:31", "remaining_time": "12:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 4632, "loss": 0.6804, "learning_rate": 8.925884599248437e-06, "epoch": 1.1650485436893203, "percentage": 29.15, "elapsed_time": "5:16:48", "remaining_time": "12:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 4632, "eval_loss": 0.6778111457824707, "epoch": 1.1650485436893203, "percentage": 29.15, "elapsed_time": "5:22:09", "remaining_time": "13:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 4632, "loss": 0.6812, "learning_rate": 8.902434783359417e-06, "epoch": 1.173678532901834, "percentage": 29.36, "elapsed_time": "5:23:12", "remaining_time": "12:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 4632, "loss": 0.7111, "learning_rate": 8.878763261227337e-06, "epoch": 1.1823085221143474, "percentage": 29.58, "elapsed_time": "5:24:31", "remaining_time": "12:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 4632, "loss": 0.6762, "learning_rate": 8.854871377685496e-06, "epoch": 1.190938511326861, "percentage": 29.79, "elapsed_time": "5:25:38", "remaining_time": "12:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 4632, "loss": 0.6817, "learning_rate": 8.830760490086427e-06, "epoch": 1.1995685005393744, "percentage": 30.01, "elapsed_time": "5:26:54", "remaining_time": "12:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 4632, "loss": 0.6644, "learning_rate": 8.806431968224784e-06, "epoch": 1.2081984897518878, "percentage": 30.22, "elapsed_time": "5:28:09", "remaining_time": "12:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 4632, "eval_loss": 0.6810408234596252, "epoch": 1.2081984897518878, "percentage": 30.22, "elapsed_time": "5:33:30", "remaining_time": "12:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 4632, "loss": 0.6684, "learning_rate": 8.781887194259523e-06, "epoch": 1.2168284789644013, "percentage": 30.44, "elapsed_time": "5:35:05", "remaining_time": "12:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 4632, "loss": 0.6802, "learning_rate": 8.757127562635374e-06, "epoch": 1.2254584681769147, "percentage": 30.66, "elapsed_time": "5:36:34", "remaining_time": "12:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 4632, "loss": 0.7045, "learning_rate": 8.732154480003625e-06, "epoch": 1.2340884573894282, "percentage": 30.87, "elapsed_time": "5:38:05", "remaining_time": "12:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 4632, "loss": 0.6916, "learning_rate": 8.706969365142202e-06, "epoch": 1.2427184466019416, "percentage": 31.09, "elapsed_time": "5:39:05", "remaining_time": "12:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 4632, "loss": 0.6566, "learning_rate": 8.681573648875064e-06, "epoch": 1.2513484358144553, "percentage": 31.3, "elapsed_time": "5:40:09", "remaining_time": "12:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 4632, "eval_loss": 0.6820415258407593, "epoch": 1.2513484358144553, "percentage": 31.3, "elapsed_time": "5:45:30", "remaining_time": "12:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 4632, "loss": 0.6696, "learning_rate": 8.655968773990922e-06, "epoch": 1.2599784250269688, "percentage": 31.52, "elapsed_time": "5:46:51", "remaining_time": "12:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 4632, "loss": 0.6407, "learning_rate": 8.630156195161264e-06, "epoch": 1.2686084142394822, "percentage": 31.74, "elapsed_time": "5:47:49", "remaining_time": "12:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 4632, "loss": 0.6507, "learning_rate": 8.604137378857713e-06, "epoch": 1.2772384034519957, "percentage": 31.95, "elapsed_time": "5:49:07", "remaining_time": "12:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 4632, "loss": 0.7229, "learning_rate": 8.577913803268719e-06, "epoch": 1.2858683926645091, "percentage": 32.17, "elapsed_time": "5:50:34", "remaining_time": "12:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 4632, "loss": 0.7024, "learning_rate": 8.551486958215569e-06, "epoch": 1.2944983818770226, "percentage": 32.38, "elapsed_time": "5:51:56", "remaining_time": "12:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 4632, "eval_loss": 0.6744683384895325, "epoch": 1.2944983818770226, "percentage": 32.38, "elapsed_time": "5:57:17", "remaining_time": "12:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 4632, "loss": 0.6842, "learning_rate": 8.524858345067757e-06, "epoch": 1.303128371089536, "percentage": 32.6, "elapsed_time": "5:58:39", "remaining_time": "12:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 4632, "loss": 0.6904, "learning_rate": 8.498029476657686e-06, "epoch": 1.3117583603020497, "percentage": 32.82, "elapsed_time": "6:00:13", "remaining_time": "12:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 4632, "loss": 0.6733, "learning_rate": 8.471001877194708e-06, "epoch": 1.3203883495145632, "percentage": 33.03, "elapsed_time": "6:01:22", "remaining_time": "12:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 4632, "loss": 0.6767, "learning_rate": 8.443777082178556e-06, "epoch": 1.3290183387270766, "percentage": 33.25, "elapsed_time": "6:02:33", "remaining_time": "12:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 4632, "loss": 0.7241, "learning_rate": 8.416356638312082e-06, "epoch": 1.33764832793959, "percentage": 33.46, "elapsed_time": "6:03:41", "remaining_time": "12:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 4632, "eval_loss": 0.6697773933410645, "epoch": 1.33764832793959, "percentage": 33.46, "elapsed_time": "6:09:02", "remaining_time": "12:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 4632, "loss": 0.6738, "learning_rate": 8.388742103413397e-06, "epoch": 1.3462783171521036, "percentage": 33.68, "elapsed_time": "6:10:19", "remaining_time": "12:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 4632, "loss": 0.671, "learning_rate": 8.360935046327373e-06, "epoch": 1.354908306364617, "percentage": 33.89, "elapsed_time": "6:11:37", "remaining_time": "12:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 4632, "loss": 0.69, "learning_rate": 8.332937046836503e-06, "epoch": 1.3635382955771305, "percentage": 34.11, "elapsed_time": "6:13:02", "remaining_time": "12:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 4632, "loss": 0.6583, "learning_rate": 8.304749695571157e-06, "epoch": 1.3721682847896441, "percentage": 34.33, "elapsed_time": "6:14:22", "remaining_time": "11:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 4632, "loss": 0.7378, "learning_rate": 8.276374593919213e-06, "epoch": 1.3807982740021574, "percentage": 34.54, "elapsed_time": "6:15:56", "remaining_time": "11:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 4632, "eval_loss": 0.6734395027160645, "epoch": 1.3807982740021574, "percentage": 34.54, "elapsed_time": "6:21:17", "remaining_time": "12:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 4632, "loss": 0.664, "learning_rate": 8.247813353935073e-06, "epoch": 1.389428263214671, "percentage": 34.76, "elapsed_time": "6:22:53", "remaining_time": "11:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 4632, "loss": 0.6718, "learning_rate": 8.219067598248087e-06, "epoch": 1.3980582524271845, "percentage": 34.97, "elapsed_time": "6:23:59", "remaining_time": "11:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 4632, "loss": 0.6476, "learning_rate": 8.190138959970366e-06, "epoch": 1.406688241639698, "percentage": 35.19, "elapsed_time": "6:25:35", "remaining_time": "11:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 4632, "loss": 0.642, "learning_rate": 8.161029082603994e-06, "epoch": 1.4153182308522114, "percentage": 35.41, "elapsed_time": "6:26:57", "remaining_time": "11:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 4632, "loss": 0.6584, "learning_rate": 8.131739619947667e-06, "epoch": 1.4239482200647249, "percentage": 35.62, "elapsed_time": "6:28:06", "remaining_time": "11:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 4632, "eval_loss": 0.6994197964668274, "epoch": 1.4239482200647249, "percentage": 35.62, "elapsed_time": "6:33:27", "remaining_time": "11:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 4632, "loss": 0.7239, "learning_rate": 8.102272236002729e-06, "epoch": 1.4325782092772383, "percentage": 35.84, "elapsed_time": "6:34:31", "remaining_time": "11:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 4632, "loss": 0.7182, "learning_rate": 8.072628604878638e-06, "epoch": 1.4412081984897518, "percentage": 36.05, "elapsed_time": "6:36:03", "remaining_time": "11:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 4632, "loss": 0.717, "learning_rate": 8.042810410697861e-06, "epoch": 1.4498381877022655, "percentage": 36.27, "elapsed_time": "6:37:14", "remaining_time": "11:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 4632, "loss": 0.6567, "learning_rate": 8.012819347500189e-06, "epoch": 1.458468176914779, "percentage": 36.49, "elapsed_time": "6:38:34", "remaining_time": "11:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 4632, "loss": 0.6724, "learning_rate": 7.982657119146495e-06, "epoch": 1.4670981661272924, "percentage": 36.7, "elapsed_time": "6:39:54", "remaining_time": "11:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 4632, "eval_loss": 0.6715120077133179, "epoch": 1.4670981661272924, "percentage": 36.7, "elapsed_time": "6:45:15", "remaining_time": "11:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 4632, "loss": 0.6653, "learning_rate": 7.952325439221944e-06, "epoch": 1.4757281553398058, "percentage": 36.92, "elapsed_time": "6:46:25", "remaining_time": "11:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 4632, "loss": 0.722, "learning_rate": 7.921826030938623e-06, "epoch": 1.4843581445523193, "percentage": 37.13, "elapsed_time": "6:47:33", "remaining_time": "11:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 4632, "loss": 0.7034, "learning_rate": 7.891160627037653e-06, "epoch": 1.4929881337648327, "percentage": 37.35, "elapsed_time": "6:48:54", "remaining_time": "11:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1740, "total_steps": 4632, "loss": 0.6338, "learning_rate": 7.860330969690749e-06, "epoch": 1.5016181229773462, "percentage": 37.56, "elapsed_time": "6:49:53", "remaining_time": "11:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 4632, "loss": 0.6774, "learning_rate": 7.829338810401238e-06, "epoch": 1.5102481121898599, "percentage": 37.78, "elapsed_time": "6:51:21", "remaining_time": "11:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 4632, "eval_loss": 0.669984757900238, "epoch": 1.5102481121898599, "percentage": 37.78, "elapsed_time": "6:56:43", "remaining_time": "11:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1760, "total_steps": 4632, "loss": 0.6813, "learning_rate": 7.798185909904552e-06, "epoch": 1.5188781014023731, "percentage": 38.0, "elapsed_time": "6:58:02", "remaining_time": "11:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1770, "total_steps": 4632, "loss": 0.7138, "learning_rate": 7.766874038068202e-06, "epoch": 1.5275080906148868, "percentage": 38.21, "elapsed_time": "6:59:52", "remaining_time": "11:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1780, "total_steps": 4632, "loss": 0.7025, "learning_rate": 7.735404973791223e-06, "epoch": 1.5361380798274002, "percentage": 38.43, "elapsed_time": "7:01:03", "remaining_time": "11:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1790, "total_steps": 4632, "loss": 0.6643, "learning_rate": 7.703780504903107e-06, "epoch": 1.5447680690399137, "percentage": 38.64, "elapsed_time": "7:02:19", "remaining_time": "11:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 4632, "loss": 0.6653, "learning_rate": 7.672002428062245e-06, "epoch": 1.5533980582524272, "percentage": 38.86, "elapsed_time": "7:03:43", "remaining_time": "11:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 4632, "eval_loss": 0.6695827841758728, "epoch": 1.5533980582524272, "percentage": 38.86, "elapsed_time": "7:09:05", "remaining_time": "11:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1810, "total_steps": 4632, "loss": 0.6681, "learning_rate": 7.640072548653843e-06, "epoch": 1.5620280474649406, "percentage": 39.08, "elapsed_time": "7:10:27", "remaining_time": "11:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1820, "total_steps": 4632, "loss": 0.6297, "learning_rate": 7.607992680687362e-06, "epoch": 1.5706580366774543, "percentage": 39.29, "elapsed_time": "7:11:37", "remaining_time": "11:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1830, "total_steps": 4632, "loss": 0.706, "learning_rate": 7.575764646693447e-06, "epoch": 1.5792880258899675, "percentage": 39.51, "elapsed_time": "7:13:09", "remaining_time": "11:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1840, "total_steps": 4632, "loss": 0.6669, "learning_rate": 7.5433902776204015e-06, "epoch": 1.5879180151024812, "percentage": 39.72, "elapsed_time": "7:14:15", "remaining_time": "10:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 4632, "loss": 0.6641, "learning_rate": 7.510871412730157e-06, "epoch": 1.5965480043149944, "percentage": 39.94, "elapsed_time": "7:15:34", "remaining_time": "10:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 4632, "eval_loss": 0.6732643246650696, "epoch": 1.5965480043149944, "percentage": 39.94, "elapsed_time": "7:20:55", "remaining_time": "11:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1860, "total_steps": 4632, "loss": 0.6345, "learning_rate": 7.478209899493787e-06, "epoch": 1.6051779935275081, "percentage": 40.16, "elapsed_time": "7:22:09", "remaining_time": "10:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1870, "total_steps": 4632, "loss": 0.6899, "learning_rate": 7.445407593486535e-06, "epoch": 1.6138079827400216, "percentage": 40.37, "elapsed_time": "7:23:16", "remaining_time": "10:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1880, "total_steps": 4632, "loss": 0.6848, "learning_rate": 7.41246635828241e-06, "epoch": 1.622437971952535, "percentage": 40.59, "elapsed_time": "7:24:44", "remaining_time": "10:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1890, "total_steps": 4632, "loss": 0.6829, "learning_rate": 7.379388065348305e-06, "epoch": 1.6310679611650487, "percentage": 40.8, "elapsed_time": "7:26:35", "remaining_time": "10:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 4632, "loss": 0.7241, "learning_rate": 7.346174593937676e-06, "epoch": 1.639697950377562, "percentage": 41.02, "elapsed_time": "7:27:55", "remaining_time": "10:44:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 4632, "eval_loss": 0.6652901768684387, "epoch": 1.639697950377562, "percentage": 41.02, "elapsed_time": "7:33:16", "remaining_time": "10:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1910, "total_steps": 4632, "loss": 0.6428, "learning_rate": 7.31282783098378e-06, "epoch": 1.6483279395900756, "percentage": 41.23, "elapsed_time": "7:34:45", "remaining_time": "10:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1920, "total_steps": 4632, "loss": 0.6494, "learning_rate": 7.279349670992464e-06, "epoch": 1.6569579288025889, "percentage": 41.45, "elapsed_time": "7:36:04", "remaining_time": "10:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1930, "total_steps": 4632, "loss": 0.5778, "learning_rate": 7.245742015934547e-06, "epoch": 1.6655879180151025, "percentage": 41.67, "elapsed_time": "7:37:16", "remaining_time": "10:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1940, "total_steps": 4632, "loss": 0.6912, "learning_rate": 7.212006775137761e-06, "epoch": 1.674217907227616, "percentage": 41.88, "elapsed_time": "7:38:32", "remaining_time": "10:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 4632, "loss": 0.6496, "learning_rate": 7.178145865178268e-06, "epoch": 1.6828478964401294, "percentage": 42.1, "elapsed_time": "7:39:55", "remaining_time": "10:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 4632, "eval_loss": 0.6761239767074585, "epoch": 1.6828478964401294, "percentage": 42.1, "elapsed_time": "7:45:16", "remaining_time": "10:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1960, "total_steps": 4632, "loss": 0.6757, "learning_rate": 7.144161209771788e-06, "epoch": 1.691477885652643, "percentage": 42.31, "elapsed_time": "7:46:38", "remaining_time": "10:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1970, "total_steps": 4632, "loss": 0.6111, "learning_rate": 7.110054739664303e-06, "epoch": 1.7001078748651564, "percentage": 42.53, "elapsed_time": "7:47:52", "remaining_time": "10:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1980, "total_steps": 4632, "loss": 0.5998, "learning_rate": 7.075828392522362e-06, "epoch": 1.70873786407767, "percentage": 42.75, "elapsed_time": "7:49:06", "remaining_time": "10:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1990, "total_steps": 4632, "loss": 0.655, "learning_rate": 7.04148411282301e-06, "epoch": 1.7173678532901833, "percentage": 42.96, "elapsed_time": "7:50:08", "remaining_time": "10:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 4632, "loss": 0.662, "learning_rate": 7.0070238517433e-06, "epoch": 1.725997842502697, "percentage": 43.18, "elapsed_time": "7:51:29", "remaining_time": "10:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 4632, "eval_loss": 0.6728688478469849, "epoch": 1.725997842502697, "percentage": 43.18, "elapsed_time": "7:56:50", "remaining_time": "10:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2010, "total_steps": 4632, "loss": 0.6923, "learning_rate": 6.972449567049463e-06, "epoch": 1.7346278317152104, "percentage": 43.39, "elapsed_time": "7:58:08", "remaining_time": "10:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2020, "total_steps": 4632, "loss": 0.6625, "learning_rate": 6.9377632229856665e-06, "epoch": 1.7432578209277239, "percentage": 43.61, "elapsed_time": "7:59:48", "remaining_time": "10:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2030, "total_steps": 4632, "loss": 0.6919, "learning_rate": 6.902966790162425e-06, "epoch": 1.7518878101402373, "percentage": 43.83, "elapsed_time": "8:01:10", "remaining_time": "10:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2040, "total_steps": 4632, "loss": 0.6468, "learning_rate": 6.868062245444655e-06, "epoch": 1.7605177993527508, "percentage": 44.04, "elapsed_time": "8:02:32", "remaining_time": "10:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 4632, "loss": 0.7049, "learning_rate": 6.833051571839347e-06, "epoch": 1.7691477885652644, "percentage": 44.26, "elapsed_time": "8:03:25", "remaining_time": "10:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 4632, "eval_loss": 0.6757835149765015, "epoch": 1.7691477885652644, "percentage": 44.26, "elapsed_time": "8:08:46", "remaining_time": "10:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2060, "total_steps": 4632, "loss": 0.6384, "learning_rate": 6.797936758382924e-06, "epoch": 1.7777777777777777, "percentage": 44.47, "elapsed_time": "8:09:56", "remaining_time": "10:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2070, "total_steps": 4632, "loss": 0.6169, "learning_rate": 6.762719800028231e-06, "epoch": 1.7864077669902914, "percentage": 44.69, "elapsed_time": "8:11:29", "remaining_time": "10:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2080, "total_steps": 4632, "loss": 0.6596, "learning_rate": 6.727402697531193e-06, "epoch": 1.7950377562028046, "percentage": 44.91, "elapsed_time": "8:12:24", "remaining_time": "10:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2090, "total_steps": 4632, "loss": 0.6964, "learning_rate": 6.69198745733716e-06, "epoch": 1.8036677454153183, "percentage": 45.12, "elapsed_time": "8:13:52", "remaining_time": "10:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 4632, "loss": 0.6483, "learning_rate": 6.656476091466901e-06, "epoch": 1.8122977346278317, "percentage": 45.34, "elapsed_time": "8:15:17", "remaining_time": "9:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 4632, "eval_loss": 0.6741885542869568, "epoch": 1.8122977346278317, "percentage": 45.34, "elapsed_time": "8:20:38", "remaining_time": "10:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2110, "total_steps": 4632, "loss": 0.6732, "learning_rate": 6.620870617402312e-06, "epoch": 1.8209277238403452, "percentage": 45.55, "elapsed_time": "8:21:45", "remaining_time": "9:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2120, "total_steps": 4632, "loss": 0.6674, "learning_rate": 6.585173057971787e-06, "epoch": 1.8295577130528586, "percentage": 45.77, "elapsed_time": "8:23:04", "remaining_time": "9:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2130, "total_steps": 4632, "loss": 0.6807, "learning_rate": 6.5493854412352985e-06, "epoch": 1.838187702265372, "percentage": 45.98, "elapsed_time": "8:24:39", "remaining_time": "9:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2140, "total_steps": 4632, "loss": 0.6637, "learning_rate": 6.5135098003691865e-06, "epoch": 1.8468176914778858, "percentage": 46.2, "elapsed_time": "8:26:29", "remaining_time": "9:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 4632, "loss": 0.678, "learning_rate": 6.477548173550635e-06, "epoch": 1.855447680690399, "percentage": 46.42, "elapsed_time": "8:27:45", "remaining_time": "9:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 4632, "eval_loss": 0.6695934534072876, "epoch": 1.855447680690399, "percentage": 46.42, "elapsed_time": "8:33:06", "remaining_time": "9:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2160, "total_steps": 4632, "loss": 0.6592, "learning_rate": 6.441502603841892e-06, "epoch": 1.8640776699029127, "percentage": 46.63, "elapsed_time": "8:34:35", "remaining_time": "9:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2170, "total_steps": 4632, "loss": 0.6413, "learning_rate": 6.405375139074194e-06, "epoch": 1.8727076591154261, "percentage": 46.85, "elapsed_time": "8:35:45", "remaining_time": "9:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2180, "total_steps": 4632, "loss": 0.6304, "learning_rate": 6.369167831731419e-06, "epoch": 1.8813376483279396, "percentage": 47.06, "elapsed_time": "8:37:18", "remaining_time": "9:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2190, "total_steps": 4632, "loss": 0.6144, "learning_rate": 6.332882738833485e-06, "epoch": 1.889967637540453, "percentage": 47.28, "elapsed_time": "8:38:28", "remaining_time": "9:38:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 4632, "loss": 0.678, "learning_rate": 6.296521921819489e-06, "epoch": 1.8985976267529665, "percentage": 47.5, "elapsed_time": "8:39:42", "remaining_time": "9:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 4632, "eval_loss": 0.6689735054969788, "epoch": 1.8985976267529665, "percentage": 47.5, "elapsed_time": "8:45:02", "remaining_time": "9:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2210, "total_steps": 4632, "loss": 0.6622, "learning_rate": 6.260087446430582e-06, "epoch": 1.9072276159654802, "percentage": 47.71, "elapsed_time": "8:46:13", "remaining_time": "9:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2220, "total_steps": 4632, "loss": 0.6567, "learning_rate": 6.223581382592625e-06, "epoch": 1.9158576051779934, "percentage": 47.93, "elapsed_time": "8:47:25", "remaining_time": "9:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2230, "total_steps": 4632, "loss": 0.6634, "learning_rate": 6.18700580429857e-06, "epoch": 1.924487594390507, "percentage": 48.14, "elapsed_time": "8:48:51", "remaining_time": "9:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2240, "total_steps": 4632, "loss": 0.6532, "learning_rate": 6.150362789490654e-06, "epoch": 1.9331175836030206, "percentage": 48.36, "elapsed_time": "8:50:10", "remaining_time": "9:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 4632, "loss": 0.6953, "learning_rate": 6.113654419942334e-06, "epoch": 1.941747572815534, "percentage": 48.58, "elapsed_time": "8:51:06", "remaining_time": "9:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 4632, "eval_loss": 0.6624494791030884, "epoch": 1.941747572815534, "percentage": 48.58, "elapsed_time": "8:56:27", "remaining_time": "9:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2260, "total_steps": 4632, "loss": 0.71, "learning_rate": 6.0768827811400166e-06, "epoch": 1.9503775620280475, "percentage": 48.79, "elapsed_time": "8:57:48", "remaining_time": "9:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2270, "total_steps": 4632, "loss": 0.6464, "learning_rate": 6.040049962164585e-06, "epoch": 1.959007551240561, "percentage": 49.01, "elapsed_time": "8:59:14", "remaining_time": "9:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2280, "total_steps": 4632, "loss": 0.6598, "learning_rate": 6.0031580555727005e-06, "epoch": 1.9676375404530746, "percentage": 49.22, "elapsed_time": "9:00:15", "remaining_time": "9:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2290, "total_steps": 4632, "loss": 0.6292, "learning_rate": 5.9662091572779325e-06, "epoch": 1.9762675296655878, "percentage": 49.44, "elapsed_time": "9:01:33", "remaining_time": "9:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 4632, "loss": 0.6969, "learning_rate": 5.929205366431679e-06, "epoch": 1.9848975188781015, "percentage": 49.65, "elapsed_time": "9:02:56", "remaining_time": "9:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 4632, "eval_loss": 0.6725260019302368, "epoch": 1.9848975188781015, "percentage": 49.65, "elapsed_time": "9:08:16", "remaining_time": "9:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2310, "total_steps": 4632, "loss": 0.6386, "learning_rate": 5.892148785303905e-06, "epoch": 1.9935275080906147, "percentage": 49.87, "elapsed_time": "9:09:36", "remaining_time": "9:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2320, "total_steps": 4632, "loss": 0.5936, "learning_rate": 5.855041519163718e-06, "epoch": 2.0021574973031284, "percentage": 50.09, "elapsed_time": "9:10:54", "remaining_time": "9:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2330, "total_steps": 4632, "loss": 0.7021, "learning_rate": 5.817885676159754e-06, "epoch": 2.0107874865156417, "percentage": 50.3, "elapsed_time": "9:12:16", "remaining_time": "9:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2340, "total_steps": 4632, "loss": 0.62, "learning_rate": 5.78068336720041e-06, "epoch": 2.0194174757281553, "percentage": 50.52, "elapsed_time": "9:13:27", "remaining_time": "9:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 4632, "loss": 0.6492, "learning_rate": 5.743436705833922e-06, "epoch": 2.028047464940669, "percentage": 50.73, "elapsed_time": "9:14:49", "remaining_time": "8:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 4632, "eval_loss": 0.656815767288208, "epoch": 2.028047464940669, "percentage": 50.73, "elapsed_time": "9:20:10", "remaining_time": "9:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2360, "total_steps": 4632, "loss": 0.6385, "learning_rate": 5.706147808128288e-06, "epoch": 2.0366774541531822, "percentage": 50.95, "elapsed_time": "9:21:24", "remaining_time": "9:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2370, "total_steps": 4632, "loss": 0.5838, "learning_rate": 5.668818792551052e-06, "epoch": 2.045307443365696, "percentage": 51.17, "elapsed_time": "9:22:50", "remaining_time": "8:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2380, "total_steps": 4632, "loss": 0.655, "learning_rate": 5.6314517798489395e-06, "epoch": 2.053937432578209, "percentage": 51.38, "elapsed_time": "9:24:19", "remaining_time": "8:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2390, "total_steps": 4632, "loss": 0.7095, "learning_rate": 5.594048892927382e-06, "epoch": 2.062567421790723, "percentage": 51.6, "elapsed_time": "9:25:32", "remaining_time": "8:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 4632, "loss": 0.6572, "learning_rate": 5.556612256729909e-06, "epoch": 2.071197411003236, "percentage": 51.81, "elapsed_time": "9:26:45", "remaining_time": "8:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 4632, "eval_loss": 0.669795036315918, "epoch": 2.071197411003236, "percentage": 51.81, "elapsed_time": "9:32:05", "remaining_time": "8:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2410, "total_steps": 4632, "loss": 0.6518, "learning_rate": 5.519143998117424e-06, "epoch": 2.0798274002157497, "percentage": 52.03, "elapsed_time": "9:33:13", "remaining_time": "8:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2420, "total_steps": 4632, "loss": 0.6492, "learning_rate": 5.48164624574737e-06, "epoch": 2.0884573894282634, "percentage": 52.25, "elapsed_time": "9:34:21", "remaining_time": "8:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2430, "total_steps": 4632, "loss": 0.648, "learning_rate": 5.444121129952799e-06, "epoch": 2.0970873786407767, "percentage": 52.46, "elapsed_time": "9:35:33", "remaining_time": "8:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2440, "total_steps": 4632, "loss": 0.6533, "learning_rate": 5.406570782621341e-06, "epoch": 2.1057173678532903, "percentage": 52.68, "elapsed_time": "9:36:51", "remaining_time": "8:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 4632, "loss": 0.6204, "learning_rate": 5.368997337074088e-06, "epoch": 2.1143473570658036, "percentage": 52.89, "elapsed_time": "9:38:15", "remaining_time": "8:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 4632, "eval_loss": 0.6549546122550964, "epoch": 2.1143473570658036, "percentage": 52.89, "elapsed_time": "9:43:36", "remaining_time": "8:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2460, "total_steps": 4632, "loss": 0.5746, "learning_rate": 5.331402927944392e-06, "epoch": 2.1229773462783172, "percentage": 53.11, "elapsed_time": "9:44:49", "remaining_time": "8:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2470, "total_steps": 4632, "loss": 0.6352, "learning_rate": 5.293789691056601e-06, "epoch": 2.1316073354908305, "percentage": 53.32, "elapsed_time": "9:46:01", "remaining_time": "8:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2480, "total_steps": 4632, "loss": 0.6815, "learning_rate": 5.256159763304703e-06, "epoch": 2.140237324703344, "percentage": 53.54, "elapsed_time": "9:47:33", "remaining_time": "8:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2490, "total_steps": 4632, "loss": 0.5849, "learning_rate": 5.218515282530934e-06, "epoch": 2.148867313915858, "percentage": 53.76, "elapsed_time": "9:48:49", "remaining_time": "8:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 4632, "loss": 0.6479, "learning_rate": 5.180858387404325e-06, "epoch": 2.157497303128371, "percentage": 53.97, "elapsed_time": "9:50:10", "remaining_time": "8:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 4632, "eval_loss": 0.6610180735588074, "epoch": 2.157497303128371, "percentage": 53.97, "elapsed_time": "9:55:31", "remaining_time": "8:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2510, "total_steps": 4632, "loss": 0.5588, "learning_rate": 5.143191217299189e-06, "epoch": 2.1661272923408847, "percentage": 54.19, "elapsed_time": "9:57:03", "remaining_time": "8:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2520, "total_steps": 4632, "loss": 0.6862, "learning_rate": 5.10551591217359e-06, "epoch": 2.174757281553398, "percentage": 54.4, "elapsed_time": "9:58:12", "remaining_time": "8:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2530, "total_steps": 4632, "loss": 0.6218, "learning_rate": 5.067834612447755e-06, "epoch": 2.1833872707659117, "percentage": 54.62, "elapsed_time": "9:59:23", "remaining_time": "8:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2540, "total_steps": 4632, "loss": 0.5711, "learning_rate": 5.0301494588824795e-06, "epoch": 2.192017259978425, "percentage": 54.84, "elapsed_time": "10:00:50", "remaining_time": "8:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 4632, "loss": 0.6954, "learning_rate": 4.9924625924575095e-06, "epoch": 2.2006472491909386, "percentage": 55.05, "elapsed_time": "10:01:55", "remaining_time": "8:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 4632, "eval_loss": 0.6637104153633118, "epoch": 2.2006472491909386, "percentage": 55.05, "elapsed_time": "10:07:16", "remaining_time": "8:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2560, "total_steps": 4632, "loss": 0.6567, "learning_rate": 4.954776154249896e-06, "epoch": 2.209277238403452, "percentage": 55.27, "elapsed_time": "10:08:24", "remaining_time": "8:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2570, "total_steps": 4632, "loss": 0.6283, "learning_rate": 4.9170922853123635e-06, "epoch": 2.2179072276159655, "percentage": 55.48, "elapsed_time": "10:10:06", "remaining_time": "8:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2580, "total_steps": 4632, "loss": 0.6072, "learning_rate": 4.879413126551675e-06, "epoch": 2.226537216828479, "percentage": 55.7, "elapsed_time": "10:11:30", "remaining_time": "8:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2590, "total_steps": 4632, "loss": 0.5966, "learning_rate": 4.84174081860699e-06, "epoch": 2.2351672060409924, "percentage": 55.92, "elapsed_time": "10:12:56", "remaining_time": "8:03:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 4632, "loss": 0.5668, "learning_rate": 4.8040775017282644e-06, "epoch": 2.243797195253506, "percentage": 56.13, "elapsed_time": "10:14:10", "remaining_time": "8:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 4632, "eval_loss": 0.6660070419311523, "epoch": 2.243797195253506, "percentage": 56.13, "elapsed_time": "10:19:31", "remaining_time": "8:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2610, "total_steps": 4632, "loss": 0.5675, "learning_rate": 4.766425315654648e-06, "epoch": 2.2524271844660193, "percentage": 56.35, "elapsed_time": "10:21:02", "remaining_time": "8:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2620, "total_steps": 4632, "loss": 0.6543, "learning_rate": 4.728786399492923e-06, "epoch": 2.261057173678533, "percentage": 56.56, "elapsed_time": "10:22:09", "remaining_time": "7:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2630, "total_steps": 4632, "loss": 0.5984, "learning_rate": 4.69116289159598e-06, "epoch": 2.269687162891046, "percentage": 56.78, "elapsed_time": "10:23:19", "remaining_time": "7:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2640, "total_steps": 4632, "loss": 0.5777, "learning_rate": 4.653556929441332e-06, "epoch": 2.27831715210356, "percentage": 56.99, "elapsed_time": "10:24:32", "remaining_time": "7:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 4632, "loss": 0.6185, "learning_rate": 4.61597064950967e-06, "epoch": 2.286947141316073, "percentage": 57.21, "elapsed_time": "10:25:36", "remaining_time": "7:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 4632, "eval_loss": 0.6793263554573059, "epoch": 2.286947141316073, "percentage": 57.21, "elapsed_time": "10:30:57", "remaining_time": "7:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2660, "total_steps": 4632, "loss": 0.5651, "learning_rate": 4.578406187163503e-06, "epoch": 2.295577130528587, "percentage": 57.43, "elapsed_time": "10:32:22", "remaining_time": "7:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2670, "total_steps": 4632, "loss": 0.6087, "learning_rate": 4.540865676525828e-06, "epoch": 2.3042071197411005, "percentage": 57.64, "elapsed_time": "10:33:24", "remaining_time": "7:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2680, "total_steps": 4632, "loss": 0.6153, "learning_rate": 4.503351250358893e-06, "epoch": 2.3128371089536137, "percentage": 57.86, "elapsed_time": "10:34:34", "remaining_time": "7:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2690, "total_steps": 4632, "loss": 0.5765, "learning_rate": 4.465865039943023e-06, "epoch": 2.3214670981661274, "percentage": 58.07, "elapsed_time": "10:35:50", "remaining_time": "7:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 4632, "loss": 0.5314, "learning_rate": 4.428409174955548e-06, "epoch": 2.3300970873786406, "percentage": 58.29, "elapsed_time": "10:36:50", "remaining_time": "7:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 4632, "eval_loss": 0.6751753091812134, "epoch": 2.3300970873786406, "percentage": 58.29, "elapsed_time": "10:42:11", "remaining_time": "7:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2710, "total_steps": 4632, "loss": 0.6288, "learning_rate": 4.3909857833498015e-06, "epoch": 2.3387270765911543, "percentage": 58.51, "elapsed_time": "10:43:26", "remaining_time": "7:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2720, "total_steps": 4632, "loss": 0.6502, "learning_rate": 4.353596991234228e-06, "epoch": 2.347357065803668, "percentage": 58.72, "elapsed_time": "10:44:35", "remaining_time": "7:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2730, "total_steps": 4632, "loss": 0.6461, "learning_rate": 4.3162449227516015e-06, "epoch": 2.355987055016181, "percentage": 58.94, "elapsed_time": "10:46:17", "remaining_time": "7:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2740, "total_steps": 4632, "loss": 0.5786, "learning_rate": 4.278931699958337e-06, "epoch": 2.364617044228695, "percentage": 59.15, "elapsed_time": "10:47:32", "remaining_time": "7:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 4632, "loss": 0.6406, "learning_rate": 4.241659442703937e-06, "epoch": 2.373247033441208, "percentage": 59.37, "elapsed_time": "10:48:41", "remaining_time": "7:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 4632, "eval_loss": 0.6680858731269836, "epoch": 2.373247033441208, "percentage": 59.37, "elapsed_time": "10:54:02", "remaining_time": "7:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2760, "total_steps": 4632, "loss": 0.6201, "learning_rate": 4.2044302685105635e-06, "epoch": 2.381877022653722, "percentage": 59.59, "elapsed_time": "10:55:28", "remaining_time": "7:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2770, "total_steps": 4632, "loss": 0.5944, "learning_rate": 4.167246292452724e-06, "epoch": 2.390507011866235, "percentage": 59.8, "elapsed_time": "10:57:01", "remaining_time": "7:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2780, "total_steps": 4632, "loss": 0.5883, "learning_rate": 4.130109627037124e-06, "epoch": 2.3991370010787487, "percentage": 60.02, "elapsed_time": "10:58:17", "remaining_time": "7:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2790, "total_steps": 4632, "loss": 0.6618, "learning_rate": 4.093022382082639e-06, "epoch": 2.407766990291262, "percentage": 60.23, "elapsed_time": "10:59:41", "remaining_time": "7:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 4632, "loss": 0.7011, "learning_rate": 4.0559866646004546e-06, "epoch": 2.4163969795037756, "percentage": 60.45, "elapsed_time": "11:01:19", "remaining_time": "7:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 4632, "eval_loss": 0.6721732020378113, "epoch": 2.4163969795037756, "percentage": 60.45, "elapsed_time": "11:06:40", "remaining_time": "7:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2810, "total_steps": 4632, "loss": 0.5454, "learning_rate": 4.0190045786743656e-06, "epoch": 2.4250269687162893, "percentage": 60.66, "elapsed_time": "11:07:49", "remaining_time": "7:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2820, "total_steps": 4632, "loss": 0.5114, "learning_rate": 3.982078225341232e-06, "epoch": 2.4336569579288025, "percentage": 60.88, "elapsed_time": "11:09:15", "remaining_time": "7:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2830, "total_steps": 4632, "loss": 0.712, "learning_rate": 3.945209702471622e-06, "epoch": 2.4422869471413162, "percentage": 61.1, "elapsed_time": "11:10:49", "remaining_time": "7:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2840, "total_steps": 4632, "loss": 0.6119, "learning_rate": 3.908401104650621e-06, "epoch": 2.4509169363538295, "percentage": 61.31, "elapsed_time": "11:12:13", "remaining_time": "7:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 4632, "loss": 0.6195, "learning_rate": 3.871654523058831e-06, "epoch": 2.459546925566343, "percentage": 61.53, "elapsed_time": "11:13:31", "remaining_time": "7:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 4632, "eval_loss": 0.6643590927124023, "epoch": 2.459546925566343, "percentage": 61.53, "elapsed_time": "11:18:51", "remaining_time": "7:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2860, "total_steps": 4632, "loss": 0.6087, "learning_rate": 3.834972045353575e-06, "epoch": 2.4681769147788564, "percentage": 61.74, "elapsed_time": "11:20:05", "remaining_time": "7:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2870, "total_steps": 4632, "loss": 0.6224, "learning_rate": 3.798355755550292e-06, "epoch": 2.47680690399137, "percentage": 61.96, "elapsed_time": "11:21:19", "remaining_time": "6:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2880, "total_steps": 4632, "loss": 0.6495, "learning_rate": 3.7618077339041244e-06, "epoch": 2.4854368932038833, "percentage": 62.18, "elapsed_time": "11:22:55", "remaining_time": "6:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2890, "total_steps": 4632, "loss": 0.627, "learning_rate": 3.725330056791753e-06, "epoch": 2.494066882416397, "percentage": 62.39, "elapsed_time": "11:24:13", "remaining_time": "6:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 4632, "loss": 0.6675, "learning_rate": 3.6889247965934195e-06, "epoch": 2.5026968716289106, "percentage": 62.61, "elapsed_time": "11:25:52", "remaining_time": "6:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 4632, "eval_loss": 0.6530495285987854, "epoch": 2.5026968716289106, "percentage": 62.61, "elapsed_time": "11:31:13", "remaining_time": "6:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2910, "total_steps": 4632, "loss": 0.6522, "learning_rate": 3.6525940215751987e-06, "epoch": 2.511326860841424, "percentage": 62.82, "elapsed_time": "11:32:23", "remaining_time": "6:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2920, "total_steps": 4632, "loss": 0.6759, "learning_rate": 3.6163397957714895e-06, "epoch": 2.5199568500539375, "percentage": 63.04, "elapsed_time": "11:33:34", "remaining_time": "6:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2930, "total_steps": 4632, "loss": 0.6035, "learning_rate": 3.5801641788677576e-06, "epoch": 2.528586839266451, "percentage": 63.26, "elapsed_time": "11:34:37", "remaining_time": "6:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2940, "total_steps": 4632, "loss": 0.6256, "learning_rate": 3.5440692260835162e-06, "epoch": 2.5372168284789645, "percentage": 63.47, "elapsed_time": "11:35:48", "remaining_time": "6:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 4632, "loss": 0.5796, "learning_rate": 3.508056988055564e-06, "epoch": 2.545846817691478, "percentage": 63.69, "elapsed_time": "11:37:13", "remaining_time": "6:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 4632, "eval_loss": 0.6489056348800659, "epoch": 2.545846817691478, "percentage": 63.69, "elapsed_time": "11:42:34", "remaining_time": "6:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2960, "total_steps": 4632, "loss": 0.4864, "learning_rate": 3.4721295107214835e-06, "epoch": 2.5544768069039914, "percentage": 63.9, "elapsed_time": "11:44:04", "remaining_time": "6:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2970, "total_steps": 4632, "loss": 0.6728, "learning_rate": 3.4362888352034153e-06, "epoch": 2.5631067961165046, "percentage": 64.12, "elapsed_time": "11:45:32", "remaining_time": "6:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2980, "total_steps": 4632, "loss": 0.6055, "learning_rate": 3.4005369976920837e-06, "epoch": 2.5717367853290183, "percentage": 64.34, "elapsed_time": "11:46:42", "remaining_time": "6:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2990, "total_steps": 4632, "loss": 0.6123, "learning_rate": 3.3648760293311267e-06, "epoch": 2.580366774541532, "percentage": 64.55, "elapsed_time": "11:48:20", "remaining_time": "6:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 4632, "loss": 0.6148, "learning_rate": 3.3293079561016957e-06, "epoch": 2.588996763754045, "percentage": 64.77, "elapsed_time": "11:49:58", "remaining_time": "6:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 4632, "eval_loss": 0.6675190329551697, "epoch": 2.588996763754045, "percentage": 64.77, "elapsed_time": "11:55:18", "remaining_time": "6:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3010, "total_steps": 4632, "loss": 0.6054, "learning_rate": 3.2938347987073576e-06, "epoch": 2.597626752966559, "percentage": 64.98, "elapsed_time": "11:56:38", "remaining_time": "6:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3020, "total_steps": 4632, "loss": 0.5767, "learning_rate": 3.2584585724592967e-06, "epoch": 2.606256742179072, "percentage": 65.2, "elapsed_time": "11:57:42", "remaining_time": "6:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3030, "total_steps": 4632, "loss": 0.5214, "learning_rate": 3.223181287161812e-06, "epoch": 2.614886731391586, "percentage": 65.41, "elapsed_time": "11:59:14", "remaining_time": "6:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3040, "total_steps": 4632, "loss": 0.5823, "learning_rate": 3.1880049469981468e-06, "epoch": 2.6235167206040995, "percentage": 65.63, "elapsed_time": "12:00:24", "remaining_time": "6:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 4632, "loss": 0.6293, "learning_rate": 3.1529315504166147e-06, "epoch": 2.6321467098166127, "percentage": 65.85, "elapsed_time": "12:01:24", "remaining_time": "6:14:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 4632, "eval_loss": 0.6685478091239929, "epoch": 2.6321467098166127, "percentage": 65.85, "elapsed_time": "12:06:45", "remaining_time": "6:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3060, "total_steps": 4632, "loss": 0.5728, "learning_rate": 3.117963090017071e-06, "epoch": 2.6407766990291264, "percentage": 66.06, "elapsed_time": "12:08:13", "remaining_time": "6:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3070, "total_steps": 4632, "loss": 0.7621, "learning_rate": 3.08310155243771e-06, "epoch": 2.6494066882416396, "percentage": 66.28, "elapsed_time": "12:09:34", "remaining_time": "6:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3080, "total_steps": 4632, "loss": 0.5567, "learning_rate": 3.048348918242191e-06, "epoch": 2.6580366774541533, "percentage": 66.49, "elapsed_time": "12:11:05", "remaining_time": "6:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3090, "total_steps": 4632, "loss": 0.6592, "learning_rate": 3.013707161807128e-06, "epoch": 2.6666666666666665, "percentage": 66.71, "elapsed_time": "12:12:12", "remaining_time": "6:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 4632, "loss": 0.6095, "learning_rate": 2.9791782512099098e-06, "epoch": 2.67529665587918, "percentage": 66.93, "elapsed_time": "12:13:19", "remaining_time": "6:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 4632, "eval_loss": 0.6717608571052551, "epoch": 2.67529665587918, "percentage": 66.93, "elapsed_time": "12:18:40", "remaining_time": "6:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3110, "total_steps": 4632, "loss": 0.4862, "learning_rate": 2.944764148116902e-06, "epoch": 2.6839266450916934, "percentage": 67.14, "elapsed_time": "12:20:16", "remaining_time": "6:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3120, "total_steps": 4632, "loss": 0.5833, "learning_rate": 2.9104668076719876e-06, "epoch": 2.692556634304207, "percentage": 67.36, "elapsed_time": "12:21:39", "remaining_time": "5:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3130, "total_steps": 4632, "loss": 0.5887, "learning_rate": 2.8762881783855025e-06, "epoch": 2.701186623516721, "percentage": 67.57, "elapsed_time": "12:22:52", "remaining_time": "5:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3140, "total_steps": 4632, "loss": 0.6644, "learning_rate": 2.8422302020235252e-06, "epoch": 2.709816612729234, "percentage": 67.79, "elapsed_time": "12:24:08", "remaining_time": "5:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 4632, "loss": 0.5422, "learning_rate": 2.808294813497563e-06, "epoch": 2.7184466019417477, "percentage": 68.01, "elapsed_time": "12:25:21", "remaining_time": "5:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 4632, "eval_loss": 0.6904874444007874, "epoch": 2.7184466019417477, "percentage": 68.01, "elapsed_time": "12:30:42", "remaining_time": "5:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3160, "total_steps": 4632, "loss": 0.6523, "learning_rate": 2.7744839407546374e-06, "epoch": 2.727076591154261, "percentage": 68.22, "elapsed_time": "12:32:01", "remaining_time": "5:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3170, "total_steps": 4632, "loss": 0.5283, "learning_rate": 2.7407995046677377e-06, "epoch": 2.7357065803667746, "percentage": 68.44, "elapsed_time": "12:33:17", "remaining_time": "5:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3180, "total_steps": 4632, "loss": 0.5934, "learning_rate": 2.7072434189266945e-06, "epoch": 2.7443365695792883, "percentage": 68.65, "elapsed_time": "12:34:25", "remaining_time": "5:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3190, "total_steps": 4632, "loss": 0.6699, "learning_rate": 2.6738175899294703e-06, "epoch": 2.7529665587918015, "percentage": 68.87, "elapsed_time": "12:35:53", "remaining_time": "5:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 4632, "loss": 0.6089, "learning_rate": 2.640523916673838e-06, "epoch": 2.7615965480043148, "percentage": 69.08, "elapsed_time": "12:37:21", "remaining_time": "5:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 4632, "eval_loss": 0.6814106106758118, "epoch": 2.7615965480043148, "percentage": 69.08, "elapsed_time": "12:42:43", "remaining_time": "5:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3210, "total_steps": 4632, "loss": 0.6884, "learning_rate": 2.607364290649501e-06, "epoch": 2.7702265372168284, "percentage": 69.3, "elapsed_time": "12:44:01", "remaining_time": "5:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3220, "total_steps": 4632, "loss": 0.6264, "learning_rate": 2.574340595730633e-06, "epoch": 2.778856526429342, "percentage": 69.52, "elapsed_time": "12:45:11", "remaining_time": "5:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3230, "total_steps": 4632, "loss": 0.5552, "learning_rate": 2.541454708068855e-06, "epoch": 2.7874865156418553, "percentage": 69.73, "elapsed_time": "12:46:23", "remaining_time": "5:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3240, "total_steps": 4632, "loss": 0.596, "learning_rate": 2.5087084959866403e-06, "epoch": 2.796116504854369, "percentage": 69.95, "elapsed_time": "12:47:45", "remaining_time": "5:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 4632, "loss": 0.6238, "learning_rate": 2.476103819871166e-06, "epoch": 2.8047464940668823, "percentage": 70.16, "elapsed_time": "12:48:57", "remaining_time": "5:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 4632, "eval_loss": 0.6738768815994263, "epoch": 2.8047464940668823, "percentage": 70.16, "elapsed_time": "12:54:18", "remaining_time": "5:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3260, "total_steps": 4632, "loss": 0.6472, "learning_rate": 2.44364253206864e-06, "epoch": 2.813376483279396, "percentage": 70.38, "elapsed_time": "12:55:50", "remaining_time": "5:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3270, "total_steps": 4632, "loss": 0.6375, "learning_rate": 2.4113264767790433e-06, "epoch": 2.8220064724919096, "percentage": 70.6, "elapsed_time": "12:56:51", "remaining_time": "5:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3280, "total_steps": 4632, "loss": 0.6185, "learning_rate": 2.379157489951367e-06, "epoch": 2.830636461704423, "percentage": 70.81, "elapsed_time": "12:58:38", "remaining_time": "5:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3290, "total_steps": 4632, "loss": 0.6608, "learning_rate": 2.3471373991793116e-06, "epoch": 2.839266450916936, "percentage": 71.03, "elapsed_time": "13:00:03", "remaining_time": "5:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 4632, "loss": 0.7386, "learning_rate": 2.315268023597447e-06, "epoch": 2.8478964401294498, "percentage": 71.24, "elapsed_time": "13:01:37", "remaining_time": "5:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 4632, "eval_loss": 0.6621807813644409, "epoch": 2.8478964401294498, "percentage": 71.24, "elapsed_time": "13:06:58", "remaining_time": "5:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3310, "total_steps": 4632, "loss": 0.5386, "learning_rate": 2.2835511737778687e-06, "epoch": 2.8565264293419634, "percentage": 71.46, "elapsed_time": "13:08:16", "remaining_time": "5:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3320, "total_steps": 4632, "loss": 0.6754, "learning_rate": 2.2519886516273365e-06, "epoch": 2.8651564185544767, "percentage": 71.68, "elapsed_time": "13:09:31", "remaining_time": "5:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3330, "total_steps": 4632, "loss": 0.6129, "learning_rate": 2.220582250284905e-06, "epoch": 2.8737864077669903, "percentage": 71.89, "elapsed_time": "13:11:04", "remaining_time": "5:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3340, "total_steps": 4632, "loss": 0.6185, "learning_rate": 2.189333754020046e-06, "epoch": 2.8824163969795036, "percentage": 72.11, "elapsed_time": "13:12:24", "remaining_time": "5:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 4632, "loss": 0.6166, "learning_rate": 2.158244938131277e-06, "epoch": 2.8910463861920173, "percentage": 72.32, "elapsed_time": "13:13:42", "remaining_time": "5:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 4632, "eval_loss": 0.6567447781562805, "epoch": 2.8910463861920173, "percentage": 72.32, "elapsed_time": "13:19:03", "remaining_time": "5:05:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3360, "total_steps": 4632, "loss": 0.6601, "learning_rate": 2.12731756884532e-06, "epoch": 2.899676375404531, "percentage": 72.54, "elapsed_time": "13:20:21", "remaining_time": "5:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3370, "total_steps": 4632, "loss": 0.7397, "learning_rate": 2.096553403216739e-06, "epoch": 2.908306364617044, "percentage": 72.75, "elapsed_time": "13:21:43", "remaining_time": "5:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3380, "total_steps": 4632, "loss": 0.5167, "learning_rate": 2.0659541890281236e-06, "epoch": 2.916936353829558, "percentage": 72.97, "elapsed_time": "13:22:56", "remaining_time": "4:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3390, "total_steps": 4632, "loss": 0.6497, "learning_rate": 2.0355216646908016e-06, "epoch": 2.925566343042071, "percentage": 73.19, "elapsed_time": "13:24:03", "remaining_time": "4:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 4632, "loss": 0.5866, "learning_rate": 2.0052575591460636e-06, "epoch": 2.9341963322545848, "percentage": 73.4, "elapsed_time": "13:25:18", "remaining_time": "4:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 4632, "eval_loss": 0.6615984439849854, "epoch": 2.9341963322545848, "percentage": 73.4, "elapsed_time": "13:30:38", "remaining_time": "4:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3410, "total_steps": 4632, "loss": 0.6723, "learning_rate": 1.975163591766946e-06, "epoch": 2.9428263214670984, "percentage": 73.62, "elapsed_time": "13:31:43", "remaining_time": "4:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3420, "total_steps": 4632, "loss": 0.592, "learning_rate": 1.9452414722605432e-06, "epoch": 2.9514563106796117, "percentage": 73.83, "elapsed_time": "13:33:13", "remaining_time": "4:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3430, "total_steps": 4632, "loss": 0.6623, "learning_rate": 1.915492900570887e-06, "epoch": 2.960086299892125, "percentage": 74.05, "elapsed_time": "13:34:53", "remaining_time": "4:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3440, "total_steps": 4632, "loss": 0.6295, "learning_rate": 1.885919566782352e-06, "epoch": 2.9687162891046386, "percentage": 74.27, "elapsed_time": "13:36:12", "remaining_time": "4:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3450, "total_steps": 4632, "loss": 0.6348, "learning_rate": 1.8565231510236531e-06, "epoch": 2.9773462783171523, "percentage": 74.48, "elapsed_time": "13:37:15", "remaining_time": "4:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3450, "total_steps": 4632, "eval_loss": 0.6633828282356262, "epoch": 2.9773462783171523, "percentage": 74.48, "elapsed_time": "13:42:35", "remaining_time": "4:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3460, "total_steps": 4632, "loss": 0.5338, "learning_rate": 1.8273053233723843e-06, "epoch": 2.9859762675296655, "percentage": 74.7, "elapsed_time": "13:43:47", "remaining_time": "4:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3470, "total_steps": 4632, "loss": 0.633, "learning_rate": 1.798267743760142e-06, "epoch": 2.994606256742179, "percentage": 74.91, "elapsed_time": "13:44:54", "remaining_time": "4:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3480, "total_steps": 4632, "loss": 0.5085, "learning_rate": 1.7694120618782169e-06, "epoch": 3.0032362459546924, "percentage": 75.13, "elapsed_time": "13:45:58", "remaining_time": "4:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3490, "total_steps": 4632, "loss": 0.5477, "learning_rate": 1.7407399170838802e-06, "epoch": 3.011866235167206, "percentage": 75.35, "elapsed_time": "13:47:00", "remaining_time": "4:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 4632, "loss": 0.5907, "learning_rate": 1.7122529383072346e-06, "epoch": 3.0204962243797193, "percentage": 75.56, "elapsed_time": "13:48:15", "remaining_time": "4:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 4632, "eval_loss": 0.6642096042633057, "epoch": 3.0204962243797193, "percentage": 75.56, "elapsed_time": "13:53:35", "remaining_time": "4:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3510, "total_steps": 4632, "loss": 0.5256, "learning_rate": 1.68395274395868e-06, "epoch": 3.029126213592233, "percentage": 75.78, "elapsed_time": "13:54:46", "remaining_time": "4:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3520, "total_steps": 4632, "loss": 0.4449, "learning_rate": 1.6558409418369686e-06, "epoch": 3.0377562028047467, "percentage": 75.99, "elapsed_time": "13:56:16", "remaining_time": "4:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3530, "total_steps": 4632, "loss": 0.449, "learning_rate": 1.6279191290378566e-06, "epoch": 3.04638619201726, "percentage": 76.21, "elapsed_time": "13:57:34", "remaining_time": "4:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3540, "total_steps": 4632, "loss": 0.4746, "learning_rate": 1.6001888918633728e-06, "epoch": 3.0550161812297736, "percentage": 76.42, "elapsed_time": "13:58:32", "remaining_time": "4:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3550, "total_steps": 4632, "loss": 0.4985, "learning_rate": 1.5726518057316969e-06, "epoch": 3.063646170442287, "percentage": 76.64, "elapsed_time": "14:00:04", "remaining_time": "4:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3550, "total_steps": 4632, "eval_loss": 0.6903661489486694, "epoch": 3.063646170442287, "percentage": 76.64, "elapsed_time": "14:05:24", "remaining_time": "4:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3560, "total_steps": 4632, "loss": 0.5309, "learning_rate": 1.5453094350876563e-06, "epoch": 3.0722761596548005, "percentage": 76.86, "elapsed_time": "14:06:44", "remaining_time": "4:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3570, "total_steps": 4632, "loss": 0.5263, "learning_rate": 1.5181633333138456e-06, "epoch": 3.0809061488673137, "percentage": 77.07, "elapsed_time": "14:07:54", "remaining_time": "4:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3580, "total_steps": 4632, "loss": 0.5077, "learning_rate": 1.4912150426423766e-06, "epoch": 3.0895361380798274, "percentage": 77.29, "elapsed_time": "14:09:18", "remaining_time": "4:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3590, "total_steps": 4632, "loss": 0.5556, "learning_rate": 1.4644660940672628e-06, "epoch": 3.098166127292341, "percentage": 77.5, "elapsed_time": "14:10:25", "remaining_time": "4:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3600, "total_steps": 4632, "loss": 0.53, "learning_rate": 1.4379180072574335e-06, "epoch": 3.1067961165048543, "percentage": 77.72, "elapsed_time": "14:11:58", "remaining_time": "4:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3600, "total_steps": 4632, "eval_loss": 0.6925872564315796, "epoch": 3.1067961165048543, "percentage": 77.72, "elapsed_time": "14:17:19", "remaining_time": "4:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3610, "total_steps": 4632, "loss": 0.5956, "learning_rate": 1.411572290470401e-06, "epoch": 3.115426105717368, "percentage": 77.94, "elapsed_time": "14:18:32", "remaining_time": "4:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3620, "total_steps": 4632, "loss": 0.5019, "learning_rate": 1.3854304404665796e-06, "epoch": 3.1240560949298812, "percentage": 78.15, "elapsed_time": "14:19:53", "remaining_time": "4:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3630, "total_steps": 4632, "loss": 0.5761, "learning_rate": 1.359493942424241e-06, "epoch": 3.132686084142395, "percentage": 78.37, "elapsed_time": "14:21:01", "remaining_time": "3:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3640, "total_steps": 4632, "loss": 0.4957, "learning_rate": 1.3337642698551428e-06, "epoch": 3.141316073354908, "percentage": 78.58, "elapsed_time": "14:22:15", "remaining_time": "3:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3650, "total_steps": 4632, "loss": 0.5728, "learning_rate": 1.3082428845208155e-06, "epoch": 3.149946062567422, "percentage": 78.8, "elapsed_time": "14:23:30", "remaining_time": "3:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3650, "total_steps": 4632, "eval_loss": 0.6939272880554199, "epoch": 3.149946062567422, "percentage": 78.8, "elapsed_time": "14:28:51", "remaining_time": "3:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3660, "total_steps": 4632, "loss": 0.5602, "learning_rate": 1.2829312363495155e-06, "epoch": 3.158576051779935, "percentage": 79.02, "elapsed_time": "14:30:19", "remaining_time": "3:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3670, "total_steps": 4632, "loss": 0.6031, "learning_rate": 1.2578307633538505e-06, "epoch": 3.1672060409924487, "percentage": 79.23, "elapsed_time": "14:31:40", "remaining_time": "3:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3680, "total_steps": 4632, "loss": 0.6053, "learning_rate": 1.232942891549083e-06, "epoch": 3.1758360302049624, "percentage": 79.45, "elapsed_time": "14:32:58", "remaining_time": "3:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3690, "total_steps": 4632, "loss": 0.5024, "learning_rate": 1.2082690348721204e-06, "epoch": 3.1844660194174756, "percentage": 79.66, "elapsed_time": "14:34:03", "remaining_time": "3:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3700, "total_steps": 4632, "loss": 0.5011, "learning_rate": 1.1838105951011758e-06, "epoch": 3.1930960086299893, "percentage": 79.88, "elapsed_time": "14:35:18", "remaining_time": "3:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3700, "total_steps": 4632, "eval_loss": 0.6916132569313049, "epoch": 3.1930960086299893, "percentage": 79.88, "elapsed_time": "14:40:38", "remaining_time": "3:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3710, "total_steps": 4632, "loss": 0.4906, "learning_rate": 1.1595689617761363e-06, "epoch": 3.2017259978425026, "percentage": 80.09, "elapsed_time": "14:42:08", "remaining_time": "3:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3720, "total_steps": 4632, "loss": 0.5705, "learning_rate": 1.1355455121196234e-06, "epoch": 3.2103559870550162, "percentage": 80.31, "elapsed_time": "14:43:25", "remaining_time": "3:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3730, "total_steps": 4632, "loss": 0.6581, "learning_rate": 1.1117416109587403e-06, "epoch": 3.2189859762675295, "percentage": 80.53, "elapsed_time": "14:44:34", "remaining_time": "3:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3740, "total_steps": 4632, "loss": 0.6133, "learning_rate": 1.0881586106475406e-06, "epoch": 3.227615965480043, "percentage": 80.74, "elapsed_time": "14:45:48", "remaining_time": "3:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3750, "total_steps": 4632, "loss": 0.4987, "learning_rate": 1.0647978509901946e-06, "epoch": 3.236245954692557, "percentage": 80.96, "elapsed_time": "14:47:10", "remaining_time": "3:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3750, "total_steps": 4632, "eval_loss": 0.6906397938728333, "epoch": 3.236245954692557, "percentage": 80.96, "elapsed_time": "14:52:31", "remaining_time": "3:29:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3760, "total_steps": 4632, "loss": 0.6638, "learning_rate": 1.0416606591648737e-06, "epoch": 3.24487594390507, "percentage": 81.17, "elapsed_time": "14:53:35", "remaining_time": "3:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3770, "total_steps": 4632, "loss": 0.5556, "learning_rate": 1.018748349648348e-06, "epoch": 3.2535059331175837, "percentage": 81.39, "elapsed_time": "14:54:54", "remaining_time": "3:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3780, "total_steps": 4632, "loss": 0.5817, "learning_rate": 9.960622241413137e-07, "epoch": 3.262135922330097, "percentage": 81.61, "elapsed_time": "14:56:09", "remaining_time": "3:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3790, "total_steps": 4632, "loss": 0.5237, "learning_rate": 9.736035714944314e-07, "epoch": 3.2707659115426106, "percentage": 81.82, "elapsed_time": "14:57:32", "remaining_time": "3:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3800, "total_steps": 4632, "loss": 0.5909, "learning_rate": 9.513736676351104e-07, "epoch": 3.279395900755124, "percentage": 82.04, "elapsed_time": "14:58:41", "remaining_time": "3:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3800, "total_steps": 4632, "eval_loss": 0.6882277727127075, "epoch": 3.279395900755124, "percentage": 82.04, "elapsed_time": "15:04:02", "remaining_time": "3:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3810, "total_steps": 4632, "loss": 0.5828, "learning_rate": 9.293737754950166e-07, "epoch": 3.2880258899676376, "percentage": 82.25, "elapsed_time": "15:05:36", "remaining_time": "3:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3820, "total_steps": 4632, "loss": 0.6515, "learning_rate": 9.076051449383294e-07, "epoch": 3.2966558791801512, "percentage": 82.47, "elapsed_time": "15:06:56", "remaining_time": "3:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3830, "total_steps": 4632, "loss": 0.5751, "learning_rate": 8.860690126907229e-07, "epoch": 3.3052858683926645, "percentage": 82.69, "elapsed_time": "15:08:03", "remaining_time": "3:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3840, "total_steps": 4632, "loss": 0.6061, "learning_rate": 8.64766602269112e-07, "epoch": 3.313915857605178, "percentage": 82.9, "elapsed_time": "15:09:20", "remaining_time": "3:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3850, "total_steps": 4632, "loss": 0.5194, "learning_rate": 8.436991239121451e-07, "epoch": 3.3225458468176914, "percentage": 83.12, "elapsed_time": "15:10:51", "remaining_time": "3:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3850, "total_steps": 4632, "eval_loss": 0.6874131560325623, "epoch": 3.3225458468176914, "percentage": 83.12, "elapsed_time": "15:16:12", "remaining_time": "3:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3860, "total_steps": 4632, "loss": 0.5395, "learning_rate": 8.22867774511435e-07, "epoch": 3.331175836030205, "percentage": 83.33, "elapsed_time": "15:17:49", "remaining_time": "3:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3870, "total_steps": 4632, "loss": 0.566, "learning_rate": 8.022737375435735e-07, "epoch": 3.3398058252427183, "percentage": 83.55, "elapsed_time": "15:19:33", "remaining_time": "3:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3880, "total_steps": 4632, "loss": 0.5703, "learning_rate": 7.81918183002891e-07, "epoch": 3.348435814455232, "percentage": 83.77, "elapsed_time": "15:20:35", "remaining_time": "2:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3890, "total_steps": 4632, "loss": 0.5318, "learning_rate": 7.618022673349834e-07, "epoch": 3.357065803667745, "percentage": 83.98, "elapsed_time": "15:22:06", "remaining_time": "2:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3900, "total_steps": 4632, "loss": 0.5925, "learning_rate": 7.419271333710154e-07, "epoch": 3.365695792880259, "percentage": 84.2, "elapsed_time": "15:23:49", "remaining_time": "2:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3900, "total_steps": 4632, "eval_loss": 0.685357391834259, "epoch": 3.365695792880259, "percentage": 84.2, "elapsed_time": "15:29:10", "remaining_time": "2:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3910, "total_steps": 4632, "loss": 0.6622, "learning_rate": 7.222939102627919e-07, "epoch": 3.3743257820927726, "percentage": 84.41, "elapsed_time": "15:30:31", "remaining_time": "2:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3920, "total_steps": 4632, "loss": 0.4916, "learning_rate": 7.029037134186112e-07, "epoch": 3.382955771305286, "percentage": 84.63, "elapsed_time": "15:31:28", "remaining_time": "2:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3930, "total_steps": 4632, "loss": 0.5409, "learning_rate": 6.837576444398913e-07, "epoch": 3.3915857605177995, "percentage": 84.84, "elapsed_time": "15:33:03", "remaining_time": "2:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3940, "total_steps": 4632, "loss": 0.6555, "learning_rate": 6.648567910585874e-07, "epoch": 3.4002157497303127, "percentage": 85.06, "elapsed_time": "15:34:26", "remaining_time": "2:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3950, "total_steps": 4632, "loss": 0.4709, "learning_rate": 6.46202227075401e-07, "epoch": 3.4088457389428264, "percentage": 85.28, "elapsed_time": "15:35:49", "remaining_time": "2:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3950, "total_steps": 4632, "eval_loss": 0.6879016160964966, "epoch": 3.4088457389428264, "percentage": 85.28, "elapsed_time": "15:41:10", "remaining_time": "2:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3960, "total_steps": 4632, "loss": 0.542, "learning_rate": 6.277950122987631e-07, "epoch": 3.4174757281553396, "percentage": 85.49, "elapsed_time": "15:42:40", "remaining_time": "2:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3970, "total_steps": 4632, "loss": 0.6621, "learning_rate": 6.096361924846333e-07, "epoch": 3.4261057173678533, "percentage": 85.71, "elapsed_time": "15:44:02", "remaining_time": "2:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3980, "total_steps": 4632, "loss": 0.5217, "learning_rate": 5.917267992770881e-07, "epoch": 3.4347357065803665, "percentage": 85.92, "elapsed_time": "15:45:19", "remaining_time": "2:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3990, "total_steps": 4632, "loss": 0.669, "learning_rate": 5.740678501497049e-07, "epoch": 3.44336569579288, "percentage": 86.14, "elapsed_time": "15:46:42", "remaining_time": "2:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 4632, "loss": 0.5317, "learning_rate": 5.566603483477607e-07, "epoch": 3.451995685005394, "percentage": 86.36, "elapsed_time": "15:48:16", "remaining_time": "2:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 4632, "eval_loss": 0.6886419057846069, "epoch": 3.451995685005394, "percentage": 86.36, "elapsed_time": "15:53:37", "remaining_time": "2:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4010, "total_steps": 4632, "loss": 0.5363, "learning_rate": 5.395052828312359e-07, "epoch": 3.460625674217907, "percentage": 86.57, "elapsed_time": "15:55:01", "remaining_time": "2:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4020, "total_steps": 4632, "loss": 0.6681, "learning_rate": 5.226036282186286e-07, "epoch": 3.469255663430421, "percentage": 86.79, "elapsed_time": "15:56:13", "remaining_time": "2:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4030, "total_steps": 4632, "loss": 0.5089, "learning_rate": 5.059563447315829e-07, "epoch": 3.477885652642934, "percentage": 87.0, "elapsed_time": "15:57:30", "remaining_time": "2:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4040, "total_steps": 4632, "loss": 0.4644, "learning_rate": 4.895643781403375e-07, "epoch": 3.4865156418554477, "percentage": 87.22, "elapsed_time": "15:58:43", "remaining_time": "2:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4050, "total_steps": 4632, "loss": 0.5821, "learning_rate": 4.73428659709998e-07, "epoch": 3.4951456310679614, "percentage": 87.44, "elapsed_time": "16:00:01", "remaining_time": "2:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4050, "total_steps": 4632, "eval_loss": 0.6889378428459167, "epoch": 3.4951456310679614, "percentage": 87.44, "elapsed_time": "16:05:22", "remaining_time": "2:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4060, "total_steps": 4632, "loss": 0.5951, "learning_rate": 4.575501061476195e-07, "epoch": 3.5037756202804746, "percentage": 87.65, "elapsed_time": "16:06:51", "remaining_time": "2:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4070, "total_steps": 4632, "loss": 0.5985, "learning_rate": 4.4192961955013766e-07, "epoch": 3.512405609492988, "percentage": 87.87, "elapsed_time": "16:08:17", "remaining_time": "2:13:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4080, "total_steps": 4632, "loss": 0.5232, "learning_rate": 4.265680873531136e-07, "epoch": 3.5210355987055015, "percentage": 88.08, "elapsed_time": "16:09:25", "remaining_time": "2:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4090, "total_steps": 4632, "loss": 0.5554, "learning_rate": 4.1146638228031557e-07, "epoch": 3.529665587918015, "percentage": 88.3, "elapsed_time": "16:10:28", "remaining_time": "2:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4100, "total_steps": 4632, "loss": 0.5887, "learning_rate": 3.966253622941385e-07, "epoch": 3.5382955771305284, "percentage": 88.51, "elapsed_time": "16:11:41", "remaining_time": "2:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4100, "total_steps": 4632, "eval_loss": 0.6890589594841003, "epoch": 3.5382955771305284, "percentage": 88.51, "elapsed_time": "16:17:02", "remaining_time": "2:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4110, "total_steps": 4632, "loss": 0.5101, "learning_rate": 3.820458705468633e-07, "epoch": 3.546925566343042, "percentage": 88.73, "elapsed_time": "16:18:30", "remaining_time": "2:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4120, "total_steps": 4632, "loss": 0.6162, "learning_rate": 3.677287353327519e-07, "epoch": 3.5555555555555554, "percentage": 88.95, "elapsed_time": "16:19:39", "remaining_time": "2:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4130, "total_steps": 4632, "loss": 0.6591, "learning_rate": 3.536747700409932e-07, "epoch": 3.564185544768069, "percentage": 89.16, "elapsed_time": "16:21:05", "remaining_time": "1:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4140, "total_steps": 4632, "loss": 0.5749, "learning_rate": 3.3988477310948785e-07, "epoch": 3.5728155339805827, "percentage": 89.38, "elapsed_time": "16:22:23", "remaining_time": "1:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4150, "total_steps": 4632, "loss": 0.5362, "learning_rate": 3.2635952797949566e-07, "epoch": 3.581445523193096, "percentage": 89.59, "elapsed_time": "16:23:43", "remaining_time": "1:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4150, "total_steps": 4632, "eval_loss": 0.6879053711891174, "epoch": 3.581445523193096, "percentage": 89.59, "elapsed_time": "16:29:04", "remaining_time": "1:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4160, "total_steps": 4632, "loss": 0.5753, "learning_rate": 3.1309980305111674e-07, "epoch": 3.5900755124056096, "percentage": 89.81, "elapsed_time": "16:30:27", "remaining_time": "1:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4170, "total_steps": 4632, "loss": 0.5671, "learning_rate": 3.0010635163964186e-07, "epoch": 3.598705501618123, "percentage": 90.03, "elapsed_time": "16:31:24", "remaining_time": "1:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4180, "total_steps": 4632, "loss": 0.525, "learning_rate": 2.8737991193275805e-07, "epoch": 3.6073354908306365, "percentage": 90.24, "elapsed_time": "16:32:41", "remaining_time": "1:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4190, "total_steps": 4632, "loss": 0.5276, "learning_rate": 2.7492120694860237e-07, "epoch": 3.61596548004315, "percentage": 90.46, "elapsed_time": "16:34:03", "remaining_time": "1:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4200, "total_steps": 4632, "loss": 0.4971, "learning_rate": 2.627309444946929e-07, "epoch": 3.6245954692556634, "percentage": 90.67, "elapsed_time": "16:35:35", "remaining_time": "1:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4200, "total_steps": 4632, "eval_loss": 0.6887635588645935, "epoch": 3.6245954692556634, "percentage": 90.67, "elapsed_time": "16:40:56", "remaining_time": "1:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4210, "total_steps": 4632, "loss": 0.4793, "learning_rate": 2.5080981712771344e-07, "epoch": 3.6332254584681767, "percentage": 90.89, "elapsed_time": "16:42:22", "remaining_time": "1:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4220, "total_steps": 4632, "loss": 0.4916, "learning_rate": 2.391585021141668e-07, "epoch": 3.6418554476806904, "percentage": 91.11, "elapsed_time": "16:43:44", "remaining_time": "1:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4230, "total_steps": 4632, "loss": 0.54, "learning_rate": 2.2777766139190084e-07, "epoch": 3.650485436893204, "percentage": 91.32, "elapsed_time": "16:45:03", "remaining_time": "1:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4240, "total_steps": 4632, "loss": 0.6402, "learning_rate": 2.1666794153249792e-07, "epoch": 3.6591154261057173, "percentage": 91.54, "elapsed_time": "16:46:16", "remaining_time": "1:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4250, "total_steps": 4632, "loss": 0.5009, "learning_rate": 2.0582997370454882e-07, "epoch": 3.667745415318231, "percentage": 91.75, "elapsed_time": "16:47:43", "remaining_time": "1:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4250, "total_steps": 4632, "eval_loss": 0.6899433732032776, "epoch": 3.667745415318231, "percentage": 91.75, "elapsed_time": "16:53:04", "remaining_time": "1:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4260, "total_steps": 4632, "loss": 0.7073, "learning_rate": 1.9526437363778404e-07, "epoch": 3.676375404530744, "percentage": 91.97, "elapsed_time": "16:54:19", "remaining_time": "1:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4270, "total_steps": 4632, "loss": 0.6589, "learning_rate": 1.8497174158810361e-07, "epoch": 3.685005393743258, "percentage": 92.18, "elapsed_time": "16:55:43", "remaining_time": "1:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4280, "total_steps": 4632, "loss": 0.6127, "learning_rate": 1.749526623034681e-07, "epoch": 3.6936353829557715, "percentage": 92.4, "elapsed_time": "16:57:03", "remaining_time": "1:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4290, "total_steps": 4632, "loss": 0.4761, "learning_rate": 1.6520770499068083e-07, "epoch": 3.7022653721682848, "percentage": 92.62, "elapsed_time": "16:58:30", "remaining_time": "1:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4300, "total_steps": 4632, "loss": 0.5813, "learning_rate": 1.557374232830483e-07, "epoch": 3.710895361380798, "percentage": 92.83, "elapsed_time": "16:59:53", "remaining_time": "1:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4300, "total_steps": 4632, "eval_loss": 0.6886661648750305, "epoch": 3.710895361380798, "percentage": 92.83, "elapsed_time": "17:05:14", "remaining_time": "1:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4310, "total_steps": 4632, "loss": 0.5689, "learning_rate": 1.4654235520892958e-07, "epoch": 3.7195253505933117, "percentage": 93.05, "elapsed_time": "17:06:26", "remaining_time": "1:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4320, "total_steps": 4632, "loss": 0.4723, "learning_rate": 1.3762302316116527e-07, "epoch": 3.7281553398058254, "percentage": 93.26, "elapsed_time": "17:07:50", "remaining_time": "1:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4330, "total_steps": 4632, "loss": 0.6008, "learning_rate": 1.289799338674036e-07, "epoch": 3.7367853290183386, "percentage": 93.48, "elapsed_time": "17:09:00", "remaining_time": "1:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4340, "total_steps": 4632, "loss": 0.5452, "learning_rate": 1.2061357836131104e-07, "epoch": 3.7454153182308523, "percentage": 93.7, "elapsed_time": "17:10:41", "remaining_time": "1:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4350, "total_steps": 4632, "loss": 0.6147, "learning_rate": 1.1252443195467311e-07, "epoch": 3.7540453074433655, "percentage": 93.91, "elapsed_time": "17:11:47", "remaining_time": "1:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4350, "total_steps": 4632, "eval_loss": 0.6891469955444336, "epoch": 3.7540453074433655, "percentage": 93.91, "elapsed_time": "17:17:08", "remaining_time": "1:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4360, "total_steps": 4632, "loss": 0.5173, "learning_rate": 1.0471295421039251e-07, "epoch": 3.762675296655879, "percentage": 94.13, "elapsed_time": "17:18:22", "remaining_time": "1:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4370, "total_steps": 4632, "loss": 0.6093, "learning_rate": 9.71795889163818e-08, "epoch": 3.771305285868393, "percentage": 94.34, "elapsed_time": "17:19:39", "remaining_time": "1:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4380, "total_steps": 4632, "loss": 0.5655, "learning_rate": 8.992476406034845e-08, "epoch": 3.779935275080906, "percentage": 94.56, "elapsed_time": "17:21:09", "remaining_time": "0:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4390, "total_steps": 4632, "loss": 0.7, "learning_rate": 8.294889180548104e-08, "epoch": 3.7885652642934198, "percentage": 94.78, "elapsed_time": "17:22:23", "remaining_time": "0:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4400, "total_steps": 4632, "loss": 0.6033, "learning_rate": 7.625236846703243e-08, "epoch": 3.797195253505933, "percentage": 94.99, "elapsed_time": "17:23:43", "remaining_time": "0:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4400, "total_steps": 4632, "eval_loss": 0.6890521049499512, "epoch": 3.797195253505933, "percentage": 94.99, "elapsed_time": "17:29:04", "remaining_time": "0:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4410, "total_steps": 4632, "loss": 0.5508, "learning_rate": 6.983557448980549e-08, "epoch": 3.8058252427184467, "percentage": 95.21, "elapsed_time": "17:30:29", "remaining_time": "0:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4420, "total_steps": 4632, "loss": 0.5819, "learning_rate": 6.369887442653877e-08, "epoch": 3.81445523193096, "percentage": 95.42, "elapsed_time": "17:31:32", "remaining_time": "0:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4430, "total_steps": 4632, "loss": 0.4267, "learning_rate": 5.7842616917193064e-08, "epoch": 3.8230852211434736, "percentage": 95.64, "elapsed_time": "17:32:42", "remaining_time": "0:48:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4440, "total_steps": 4632, "loss": 0.5266, "learning_rate": 5.226713466915001e-08, "epoch": 3.831715210355987, "percentage": 95.85, "elapsed_time": "17:34:03", "remaining_time": "0:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4450, "total_steps": 4632, "loss": 0.565, "learning_rate": 4.697274443830335e-08, "epoch": 3.8403451995685005, "percentage": 96.07, "elapsed_time": "17:35:24", "remaining_time": "0:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4450, "total_steps": 4632, "eval_loss": 0.6890508532524109, "epoch": 3.8403451995685005, "percentage": 96.07, "elapsed_time": "17:40:45", "remaining_time": "0:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4460, "total_steps": 4632, "loss": 0.5493, "learning_rate": 4.195974701106775e-08, "epoch": 3.848975188781014, "percentage": 96.29, "elapsed_time": "17:42:03", "remaining_time": "0:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4470, "total_steps": 4632, "loss": 0.5646, "learning_rate": 3.722842718728969e-08, "epoch": 3.8576051779935274, "percentage": 96.5, "elapsed_time": "17:43:40", "remaining_time": "0:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4480, "total_steps": 4632, "loss": 0.5774, "learning_rate": 3.277905376406654e-08, "epoch": 3.866235167206041, "percentage": 96.72, "elapsed_time": "17:44:53", "remaining_time": "0:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4490, "total_steps": 4632, "loss": 0.6114, "learning_rate": 2.8611879520476503e-08, "epoch": 3.8748651564185543, "percentage": 96.93, "elapsed_time": "17:46:13", "remaining_time": "0:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4500, "total_steps": 4632, "loss": 0.5044, "learning_rate": 2.4727141203216286e-08, "epoch": 3.883495145631068, "percentage": 97.15, "elapsed_time": "17:47:26", "remaining_time": "0:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4500, "total_steps": 4632, "eval_loss": 0.6893202662467957, "epoch": 3.883495145631068, "percentage": 97.15, "elapsed_time": "17:52:47", "remaining_time": "0:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4510, "total_steps": 4632, "loss": 0.5512, "learning_rate": 2.1125059513152357e-08, "epoch": 3.8921251348435817, "percentage": 97.37, "elapsed_time": "17:54:04", "remaining_time": "0:29:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4520, "total_steps": 4632, "loss": 0.633, "learning_rate": 1.7805839092781553e-08, "epoch": 3.900755124056095, "percentage": 97.58, "elapsed_time": "17:55:19", "remaining_time": "0:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4530, "total_steps": 4632, "loss": 0.5216, "learning_rate": 1.4769668514605374e-08, "epoch": 3.909385113268608, "percentage": 97.8, "elapsed_time": "17:56:33", "remaining_time": "0:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4540, "total_steps": 4632, "loss": 0.5502, "learning_rate": 1.2016720270417448e-08, "epoch": 3.918015102481122, "percentage": 98.01, "elapsed_time": "17:57:54", "remaining_time": "0:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4550, "total_steps": 4632, "loss": 0.613, "learning_rate": 9.547150761501922e-09, "epoch": 3.9266450916936355, "percentage": 98.23, "elapsed_time": "17:59:00", "remaining_time": "0:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4550, "total_steps": 4632, "eval_loss": 0.68938148021698, "epoch": 3.9266450916936355, "percentage": 98.23, "elapsed_time": "18:04:21", "remaining_time": "0:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4560, "total_steps": 4632, "loss": 0.5943, "learning_rate": 7.3611002897489015e-09, "epoch": 3.9352750809061487, "percentage": 98.45, "elapsed_time": "18:05:48", "remaining_time": "0:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4570, "total_steps": 4632, "loss": 0.5628, "learning_rate": 5.458693049684161e-09, "epoch": 3.9439050701186624, "percentage": 98.66, "elapsed_time": "18:07:01", "remaining_time": "0:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4580, "total_steps": 4632, "loss": 0.5538, "learning_rate": 3.8400371214131205e-09, "epoch": 3.9525350593311757, "percentage": 98.88, "elapsed_time": "18:08:38", "remaining_time": "0:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4590, "total_steps": 4632, "loss": 0.64, "learning_rate": 2.5052244644802048e-09, "epoch": 3.9611650485436893, "percentage": 99.09, "elapsed_time": "18:09:41", "remaining_time": "0:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4600, "total_steps": 4632, "loss": 0.4614, "learning_rate": 1.4543309126446858e-09, "epoch": 3.969795037756203, "percentage": 99.31, "elapsed_time": "18:10:49", "remaining_time": "0:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4600, "total_steps": 4632, "eval_loss": 0.6896011829376221, "epoch": 3.969795037756203, "percentage": 99.31, "elapsed_time": "18:16:10", "remaining_time": "0:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4610, "total_steps": 4632, "loss": 0.5865, "learning_rate": 6.874161695719084e-10, "epoch": 3.9784250269687162, "percentage": 99.53, "elapsed_time": "18:17:24", "remaining_time": "0:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4620, "total_steps": 4632, "loss": 0.5533, "learning_rate": 2.045238054415588e-10, "epoch": 3.98705501618123, "percentage": 99.74, "elapsed_time": "18:18:50", "remaining_time": "0:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4630, "total_steps": 4632, "loss": 0.6292, "learning_rate": 5.681254474088072e-12, "epoch": 3.995685005393743, "percentage": 99.96, "elapsed_time": "18:19:54", "remaining_time": "0:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4632, "total_steps": 4632, "epoch": 3.997411003236246, "percentage": 100.0, "elapsed_time": "18:20:08", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}