{"current_steps": 1, "total_steps": 3836, "loss": 0.3892, "learning_rate": 2.6041666666666667e-08, "epoch": 0.0002606457498452416, "percentage": 0.03, "elapsed_time": "0:00:12", "remaining_time": "13:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 3836, "loss": 0.3909, "learning_rate": 5.208333333333333e-08, "epoch": 0.0005212914996904832, "percentage": 0.05, "elapsed_time": "0:00:17", "remaining_time": "9:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 3836, "loss": 0.38, "learning_rate": 7.8125e-08, "epoch": 0.0007819372495357248, "percentage": 0.08, "elapsed_time": "0:00:23", "remaining_time": "8:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 3836, "loss": 0.4106, "learning_rate": 1.0416666666666667e-07, "epoch": 0.0010425829993809665, "percentage": 0.1, "elapsed_time": "0:00:28", "remaining_time": "7:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 3836, "loss": 0.3933, "learning_rate": 1.3020833333333334e-07, "epoch": 0.001303228749226208, "percentage": 0.13, "elapsed_time": "0:00:34", "remaining_time": "7:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 3836, "loss": 0.3758, "learning_rate": 1.5625e-07, "epoch": 0.0015638744990714496, "percentage": 0.16, "elapsed_time": "0:00:40", "remaining_time": "7:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 3836, "loss": 0.3852, "learning_rate": 1.8229166666666669e-07, "epoch": 0.0018245202489166911, "percentage": 0.18, "elapsed_time": "0:00:45", "remaining_time": "6:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 3836, "loss": 0.3831, "learning_rate": 2.0833333333333333e-07, "epoch": 0.002085165998761933, "percentage": 0.21, "elapsed_time": "0:00:50", "remaining_time": "6:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 3836, "loss": 0.3993, "learning_rate": 2.3437500000000003e-07, "epoch": 0.0023458117486071742, "percentage": 0.23, "elapsed_time": "0:00:55", "remaining_time": "6:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 3836, "loss": 0.3958, "learning_rate": 2.604166666666667e-07, "epoch": 0.002606457498452416, "percentage": 0.26, "elapsed_time": "0:01:00", "remaining_time": "6:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 3836, "loss": 0.3971, "learning_rate": 2.864583333333333e-07, "epoch": 0.0028671032482976574, "percentage": 0.29, "elapsed_time": "0:01:06", "remaining_time": "6:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 3836, "loss": 0.3812, "learning_rate": 3.125e-07, "epoch": 0.003127748998142899, "percentage": 0.31, "elapsed_time": "0:01:11", "remaining_time": "6:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 3836, "loss": 0.3907, "learning_rate": 3.3854166666666667e-07, "epoch": 0.0033883947479881405, "percentage": 0.34, "elapsed_time": "0:01:17", "remaining_time": "6:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 3836, "loss": 0.3893, "learning_rate": 3.6458333333333337e-07, "epoch": 0.0036490404978333823, "percentage": 0.36, "elapsed_time": "0:01:22", "remaining_time": "6:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 3836, "loss": 0.381, "learning_rate": 3.90625e-07, "epoch": 0.003909686247678624, "percentage": 0.39, "elapsed_time": "0:01:28", "remaining_time": "6:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 3836, "loss": 0.3852, "learning_rate": 4.1666666666666667e-07, "epoch": 0.004170331997523866, "percentage": 0.42, "elapsed_time": "0:01:33", "remaining_time": "6:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 3836, "loss": 0.3885, "learning_rate": 4.427083333333334e-07, "epoch": 0.004430977747369107, "percentage": 0.44, "elapsed_time": "0:01:39", "remaining_time": "6:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 3836, "loss": 0.3737, "learning_rate": 4.6875000000000006e-07, "epoch": 0.0046916234972143485, "percentage": 0.47, "elapsed_time": "0:01:44", "remaining_time": "6:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 3836, "loss": 0.3847, "learning_rate": 4.947916666666667e-07, "epoch": 0.00495226924705959, "percentage": 0.5, "elapsed_time": "0:01:50", "remaining_time": "6:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 3836, "loss": 0.3455, "learning_rate": 5.208333333333334e-07, "epoch": 0.005212914996904832, "percentage": 0.52, "elapsed_time": "0:01:55", "remaining_time": "6:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 3836, "loss": 0.3394, "learning_rate": 5.468750000000001e-07, "epoch": 0.005473560746750073, "percentage": 0.55, "elapsed_time": "0:02:00", "remaining_time": "6:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 3836, "loss": 0.3604, "learning_rate": 5.729166666666667e-07, "epoch": 0.005734206496595315, "percentage": 0.57, "elapsed_time": "0:02:05", "remaining_time": "6:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 3836, "loss": 0.3386, "learning_rate": 5.989583333333335e-07, "epoch": 0.0059948522464405565, "percentage": 0.6, "elapsed_time": "0:02:11", "remaining_time": "6:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 3836, "loss": 0.3491, "learning_rate": 6.25e-07, "epoch": 0.006255497996285798, "percentage": 0.63, "elapsed_time": "0:02:16", "remaining_time": "6:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 3836, "loss": 0.346, "learning_rate": 6.510416666666668e-07, "epoch": 0.00651614374613104, "percentage": 0.65, "elapsed_time": "0:02:21", "remaining_time": "6:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 3836, "loss": 0.3408, "learning_rate": 6.770833333333333e-07, "epoch": 0.006776789495976281, "percentage": 0.68, "elapsed_time": "0:02:27", "remaining_time": "6:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 3836, "loss": 0.3384, "learning_rate": 7.03125e-07, "epoch": 0.007037435245821523, "percentage": 0.7, "elapsed_time": "0:02:32", "remaining_time": "5:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 3836, "loss": 0.3117, "learning_rate": 7.291666666666667e-07, "epoch": 0.0072980809956667645, "percentage": 0.73, "elapsed_time": "0:02:38", "remaining_time": "5:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 3836, "loss": 0.3349, "learning_rate": 7.552083333333333e-07, "epoch": 0.007558726745512006, "percentage": 0.76, "elapsed_time": "0:02:43", "remaining_time": "5:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 3836, "loss": 0.3201, "learning_rate": 7.8125e-07, "epoch": 0.007819372495357248, "percentage": 0.78, "elapsed_time": "0:02:49", "remaining_time": "5:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 3836, "loss": 0.3233, "learning_rate": 8.072916666666667e-07, "epoch": 0.00808001824520249, "percentage": 0.81, "elapsed_time": "0:02:54", "remaining_time": "5:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 3836, "loss": 0.3241, "learning_rate": 8.333333333333333e-07, "epoch": 0.008340663995047732, "percentage": 0.83, "elapsed_time": "0:03:00", "remaining_time": "5:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 3836, "loss": 0.3163, "learning_rate": 8.59375e-07, "epoch": 0.008601309744892972, "percentage": 0.86, "elapsed_time": "0:03:06", "remaining_time": "5:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 3836, "loss": 0.3259, "learning_rate": 8.854166666666668e-07, "epoch": 0.008861955494738213, "percentage": 0.89, "elapsed_time": "0:03:11", "remaining_time": "5:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 3836, "loss": 0.3385, "learning_rate": 9.114583333333333e-07, "epoch": 0.009122601244583455, "percentage": 0.91, "elapsed_time": "0:03:17", "remaining_time": "5:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 3836, "loss": 0.3223, "learning_rate": 9.375000000000001e-07, "epoch": 0.009383246994428697, "percentage": 0.94, "elapsed_time": "0:03:23", "remaining_time": "5:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 3836, "loss": 0.3078, "learning_rate": 9.635416666666667e-07, "epoch": 0.009643892744273939, "percentage": 0.96, "elapsed_time": "0:03:28", "remaining_time": "5:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 3836, "loss": 0.3, "learning_rate": 9.895833333333333e-07, "epoch": 0.00990453849411918, "percentage": 0.99, "elapsed_time": "0:03:34", "remaining_time": "5:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 3836, "loss": 0.2862, "learning_rate": 1.0156250000000001e-06, "epoch": 0.010165184243964422, "percentage": 1.02, "elapsed_time": "0:03:40", "remaining_time": "5:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 3836, "loss": 0.3004, "learning_rate": 1.0416666666666667e-06, "epoch": 0.010425829993809664, "percentage": 1.04, "elapsed_time": "0:03:45", "remaining_time": "5:55:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 3836, "loss": 0.2767, "learning_rate": 1.0677083333333333e-06, "epoch": 0.010686475743654906, "percentage": 1.07, "elapsed_time": "0:03:50", "remaining_time": "5:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 3836, "loss": 0.2938, "learning_rate": 1.0937500000000001e-06, "epoch": 0.010947121493500146, "percentage": 1.09, "elapsed_time": "0:03:56", "remaining_time": "5:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 3836, "loss": 0.2998, "learning_rate": 1.1197916666666667e-06, "epoch": 0.011207767243345388, "percentage": 1.12, "elapsed_time": "0:04:02", "remaining_time": "5:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 3836, "loss": 0.2925, "learning_rate": 1.1458333333333333e-06, "epoch": 0.01146841299319063, "percentage": 1.15, "elapsed_time": "0:04:07", "remaining_time": "5:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 3836, "loss": 0.2748, "learning_rate": 1.1718750000000001e-06, "epoch": 0.011729058743035871, "percentage": 1.17, "elapsed_time": "0:04:13", "remaining_time": "5:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 3836, "loss": 0.2856, "learning_rate": 1.197916666666667e-06, "epoch": 0.011989704492881113, "percentage": 1.2, "elapsed_time": "0:04:19", "remaining_time": "5:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 3836, "loss": 0.2885, "learning_rate": 1.2239583333333333e-06, "epoch": 0.012250350242726355, "percentage": 1.23, "elapsed_time": "0:04:24", "remaining_time": "5:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 3836, "loss": 0.2785, "learning_rate": 1.25e-06, "epoch": 0.012510995992571597, "percentage": 1.25, "elapsed_time": "0:04:30", "remaining_time": "5:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 3836, "loss": 0.2715, "learning_rate": 1.2760416666666667e-06, "epoch": 0.012771641742416838, "percentage": 1.28, "elapsed_time": "0:04:35", "remaining_time": "5:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 3836, "loss": 0.2804, "learning_rate": 1.3020833333333335e-06, "epoch": 0.01303228749226208, "percentage": 1.3, "elapsed_time": "0:04:41", "remaining_time": "5:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 3836, "loss": 0.2753, "learning_rate": 1.328125e-06, "epoch": 0.01329293324210732, "percentage": 1.33, "elapsed_time": "0:04:46", "remaining_time": "5:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 3836, "loss": 0.2566, "learning_rate": 1.3541666666666667e-06, "epoch": 0.013553578991952562, "percentage": 1.36, "elapsed_time": "0:04:52", "remaining_time": "5:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 3836, "loss": 0.2695, "learning_rate": 1.3802083333333335e-06, "epoch": 0.013814224741797804, "percentage": 1.38, "elapsed_time": "0:04:57", "remaining_time": "5:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 3836, "loss": 0.2722, "learning_rate": 1.40625e-06, "epoch": 0.014074870491643045, "percentage": 1.41, "elapsed_time": "0:05:03", "remaining_time": "5:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 3836, "loss": 0.261, "learning_rate": 1.4322916666666667e-06, "epoch": 0.014335516241488287, "percentage": 1.43, "elapsed_time": "0:05:08", "remaining_time": "5:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 3836, "loss": 0.2626, "learning_rate": 1.4583333333333335e-06, "epoch": 0.014596161991333529, "percentage": 1.46, "elapsed_time": "0:05:13", "remaining_time": "5:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 3836, "loss": 0.2694, "learning_rate": 1.484375e-06, "epoch": 0.01485680774117877, "percentage": 1.49, "elapsed_time": "0:05:19", "remaining_time": "5:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 3836, "loss": 0.2716, "learning_rate": 1.5104166666666667e-06, "epoch": 0.015117453491024013, "percentage": 1.51, "elapsed_time": "0:05:24", "remaining_time": "5:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 3836, "loss": 0.2851, "learning_rate": 1.5364583333333335e-06, "epoch": 0.015378099240869254, "percentage": 1.54, "elapsed_time": "0:05:30", "remaining_time": "5:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 3836, "loss": 0.2701, "learning_rate": 1.5625e-06, "epoch": 0.015638744990714496, "percentage": 1.56, "elapsed_time": "0:05:35", "remaining_time": "5:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 3836, "loss": 0.2711, "learning_rate": 1.5885416666666667e-06, "epoch": 0.015899390740559738, "percentage": 1.59, "elapsed_time": "0:05:42", "remaining_time": "5:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 3836, "loss": 0.2486, "learning_rate": 1.6145833333333335e-06, "epoch": 0.01616003649040498, "percentage": 1.62, "elapsed_time": "0:05:47", "remaining_time": "5:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 3836, "loss": 0.2569, "learning_rate": 1.640625e-06, "epoch": 0.01642068224025022, "percentage": 1.64, "elapsed_time": "0:05:52", "remaining_time": "5:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 3836, "loss": 0.2282, "learning_rate": 1.6666666666666667e-06, "epoch": 0.016681327990095463, "percentage": 1.67, "elapsed_time": "0:05:58", "remaining_time": "5:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 3836, "loss": 0.2447, "learning_rate": 1.6927083333333335e-06, "epoch": 0.0169419737399407, "percentage": 1.69, "elapsed_time": "0:06:03", "remaining_time": "5:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 3836, "loss": 0.272, "learning_rate": 1.71875e-06, "epoch": 0.017202619489785943, "percentage": 1.72, "elapsed_time": "0:06:08", "remaining_time": "5:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 3836, "loss": 0.2546, "learning_rate": 1.7447916666666667e-06, "epoch": 0.017463265239631185, "percentage": 1.75, "elapsed_time": "0:06:14", "remaining_time": "5:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 3836, "loss": 0.28, "learning_rate": 1.7708333333333337e-06, "epoch": 0.017723910989476427, "percentage": 1.77, "elapsed_time": "0:06:19", "remaining_time": "5:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 3836, "loss": 0.2644, "learning_rate": 1.796875e-06, "epoch": 0.01798455673932167, "percentage": 1.8, "elapsed_time": "0:06:24", "remaining_time": "5:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 3836, "loss": 0.2581, "learning_rate": 1.8229166666666666e-06, "epoch": 0.01824520248916691, "percentage": 1.82, "elapsed_time": "0:06:30", "remaining_time": "5:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 3836, "loss": 0.2502, "learning_rate": 1.8489583333333337e-06, "epoch": 0.018505848239012152, "percentage": 1.85, "elapsed_time": "0:06:36", "remaining_time": "5:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 3836, "loss": 0.2636, "learning_rate": 1.8750000000000003e-06, "epoch": 0.018766493988857394, "percentage": 1.88, "elapsed_time": "0:06:42", "remaining_time": "5:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 3836, "loss": 0.2318, "learning_rate": 1.9010416666666666e-06, "epoch": 0.019027139738702636, "percentage": 1.9, "elapsed_time": "0:06:47", "remaining_time": "5:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 3836, "loss": 0.2466, "learning_rate": 1.9270833333333334e-06, "epoch": 0.019287785488547877, "percentage": 1.93, "elapsed_time": "0:06:53", "remaining_time": "5:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 3836, "loss": 0.2537, "learning_rate": 1.953125e-06, "epoch": 0.01954843123839312, "percentage": 1.96, "elapsed_time": "0:06:59", "remaining_time": "5:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 3836, "loss": 0.2588, "learning_rate": 1.9791666666666666e-06, "epoch": 0.01980907698823836, "percentage": 1.98, "elapsed_time": "0:07:04", "remaining_time": "5:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 3836, "loss": 0.2631, "learning_rate": 2.0052083333333337e-06, "epoch": 0.020069722738083603, "percentage": 2.01, "elapsed_time": "0:07:10", "remaining_time": "5:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 3836, "loss": 0.2588, "learning_rate": 2.0312500000000002e-06, "epoch": 0.020330368487928845, "percentage": 2.03, "elapsed_time": "0:07:15", "remaining_time": "5:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 3836, "loss": 0.236, "learning_rate": 2.057291666666667e-06, "epoch": 0.020591014237774086, "percentage": 2.06, "elapsed_time": "0:07:20", "remaining_time": "5:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 3836, "loss": 0.2384, "learning_rate": 2.0833333333333334e-06, "epoch": 0.020851659987619328, "percentage": 2.09, "elapsed_time": "0:07:26", "remaining_time": "5:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 3836, "loss": 0.2415, "learning_rate": 2.109375e-06, "epoch": 0.02111230573746457, "percentage": 2.11, "elapsed_time": "0:07:31", "remaining_time": "5:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 3836, "loss": 0.2286, "learning_rate": 2.1354166666666666e-06, "epoch": 0.02137295148730981, "percentage": 2.14, "elapsed_time": "0:07:36", "remaining_time": "5:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 3836, "loss": 0.2391, "learning_rate": 2.1614583333333336e-06, "epoch": 0.02163359723715505, "percentage": 2.16, "elapsed_time": "0:07:42", "remaining_time": "5:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 3836, "loss": 0.257, "learning_rate": 2.1875000000000002e-06, "epoch": 0.021894242987000292, "percentage": 2.19, "elapsed_time": "0:07:47", "remaining_time": "5:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 3836, "loss": 0.238, "learning_rate": 2.213541666666667e-06, "epoch": 0.022154888736845534, "percentage": 2.22, "elapsed_time": "0:07:52", "remaining_time": "5:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 3836, "loss": 0.2477, "learning_rate": 2.2395833333333334e-06, "epoch": 0.022415534486690775, "percentage": 2.24, "elapsed_time": "0:07:58", "remaining_time": "5:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 3836, "loss": 0.2504, "learning_rate": 2.265625e-06, "epoch": 0.022676180236536017, "percentage": 2.27, "elapsed_time": "0:08:03", "remaining_time": "5:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 3836, "loss": 0.2442, "learning_rate": 2.2916666666666666e-06, "epoch": 0.02293682598638126, "percentage": 2.29, "elapsed_time": "0:08:09", "remaining_time": "5:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 3836, "loss": 0.2435, "learning_rate": 2.3177083333333336e-06, "epoch": 0.0231974717362265, "percentage": 2.32, "elapsed_time": "0:08:15", "remaining_time": "5:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 3836, "loss": 0.2592, "learning_rate": 2.3437500000000002e-06, "epoch": 0.023458117486071742, "percentage": 2.35, "elapsed_time": "0:08:21", "remaining_time": "5:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 3836, "loss": 0.2672, "learning_rate": 2.369791666666667e-06, "epoch": 0.023718763235916984, "percentage": 2.37, "elapsed_time": "0:08:27", "remaining_time": "5:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 3836, "loss": 0.249, "learning_rate": 2.395833333333334e-06, "epoch": 0.023979408985762226, "percentage": 2.4, "elapsed_time": "0:08:32", "remaining_time": "5:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 3836, "loss": 0.2275, "learning_rate": 2.421875e-06, "epoch": 0.024240054735607468, "percentage": 2.42, "elapsed_time": "0:08:38", "remaining_time": "5:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 3836, "loss": 0.2338, "learning_rate": 2.4479166666666666e-06, "epoch": 0.02450070048545271, "percentage": 2.45, "elapsed_time": "0:08:43", "remaining_time": "5:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 3836, "loss": 0.2232, "learning_rate": 2.4739583333333336e-06, "epoch": 0.02476134623529795, "percentage": 2.48, "elapsed_time": "0:08:48", "remaining_time": "5:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 3836, "loss": 0.2635, "learning_rate": 2.5e-06, "epoch": 0.025021991985143193, "percentage": 2.5, "elapsed_time": "0:08:54", "remaining_time": "5:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 3836, "loss": 0.2349, "learning_rate": 2.5260416666666672e-06, "epoch": 0.025282637734988435, "percentage": 2.53, "elapsed_time": "0:09:00", "remaining_time": "5:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 3836, "loss": 0.2417, "learning_rate": 2.5520833333333334e-06, "epoch": 0.025543283484833677, "percentage": 2.55, "elapsed_time": "0:09:05", "remaining_time": "5:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 3836, "loss": 0.2447, "learning_rate": 2.5781250000000004e-06, "epoch": 0.02580392923467892, "percentage": 2.58, "elapsed_time": "0:09:10", "remaining_time": "5:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 3836, "loss": 0.2177, "learning_rate": 2.604166666666667e-06, "epoch": 0.02606457498452416, "percentage": 2.61, "elapsed_time": "0:09:16", "remaining_time": "5:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 3836, "loss": 0.2375, "learning_rate": 2.630208333333333e-06, "epoch": 0.0263252207343694, "percentage": 2.63, "elapsed_time": "0:09:22", "remaining_time": "5:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 3836, "loss": 0.2596, "learning_rate": 2.65625e-06, "epoch": 0.02658586648421464, "percentage": 2.66, "elapsed_time": "0:09:28", "remaining_time": "5:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 3836, "loss": 0.224, "learning_rate": 2.682291666666667e-06, "epoch": 0.026846512234059882, "percentage": 2.69, "elapsed_time": "0:09:33", "remaining_time": "5:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 3836, "loss": 0.2334, "learning_rate": 2.7083333333333334e-06, "epoch": 0.027107157983905124, "percentage": 2.71, "elapsed_time": "0:09:38", "remaining_time": "5:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 3836, "loss": 0.2483, "learning_rate": 2.7343750000000004e-06, "epoch": 0.027367803733750366, "percentage": 2.74, "elapsed_time": "0:09:43", "remaining_time": "5:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 3836, "loss": 0.2403, "learning_rate": 2.760416666666667e-06, "epoch": 0.027628449483595607, "percentage": 2.76, "elapsed_time": "0:09:49", "remaining_time": "5:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 3836, "loss": 0.2426, "learning_rate": 2.7864583333333336e-06, "epoch": 0.02788909523344085, "percentage": 2.79, "elapsed_time": "0:09:55", "remaining_time": "5:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 3836, "loss": 0.2145, "learning_rate": 2.8125e-06, "epoch": 0.02814974098328609, "percentage": 2.82, "elapsed_time": "0:09:59", "remaining_time": "5:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 3836, "loss": 0.2391, "learning_rate": 2.838541666666667e-06, "epoch": 0.028410386733131333, "percentage": 2.84, "elapsed_time": "0:10:05", "remaining_time": "5:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 3836, "loss": 0.2215, "learning_rate": 2.8645833333333334e-06, "epoch": 0.028671032482976574, "percentage": 2.87, "elapsed_time": "0:10:11", "remaining_time": "5:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 3836, "loss": 0.2434, "learning_rate": 2.8906250000000004e-06, "epoch": 0.028931678232821816, "percentage": 2.89, "elapsed_time": "0:10:16", "remaining_time": "5:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 3836, "loss": 0.2334, "learning_rate": 2.916666666666667e-06, "epoch": 0.029192323982667058, "percentage": 2.92, "elapsed_time": "0:10:22", "remaining_time": "5:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 3836, "loss": 0.2223, "learning_rate": 2.9427083333333336e-06, "epoch": 0.0294529697325123, "percentage": 2.95, "elapsed_time": "0:10:27", "remaining_time": "5:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 3836, "loss": 0.2394, "learning_rate": 2.96875e-06, "epoch": 0.02971361548235754, "percentage": 2.97, "elapsed_time": "0:10:33", "remaining_time": "5:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 3836, "loss": 0.2446, "learning_rate": 2.994791666666667e-06, "epoch": 0.029974261232202783, "percentage": 3.0, "elapsed_time": "0:10:39", "remaining_time": "5:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 3836, "loss": 0.2381, "learning_rate": 3.0208333333333334e-06, "epoch": 0.030234906982048025, "percentage": 3.02, "elapsed_time": "0:10:45", "remaining_time": "5:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 3836, "loss": 0.2466, "learning_rate": 3.0468750000000004e-06, "epoch": 0.030495552731893267, "percentage": 3.05, "elapsed_time": "0:10:50", "remaining_time": "5:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 3836, "loss": 0.2436, "learning_rate": 3.072916666666667e-06, "epoch": 0.03075619848173851, "percentage": 3.08, "elapsed_time": "0:10:55", "remaining_time": "5:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 3836, "loss": 0.2512, "learning_rate": 3.0989583333333336e-06, "epoch": 0.03101684423158375, "percentage": 3.1, "elapsed_time": "0:11:01", "remaining_time": "5:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 3836, "loss": 0.2421, "learning_rate": 3.125e-06, "epoch": 0.03127748998142899, "percentage": 3.13, "elapsed_time": "0:11:06", "remaining_time": "5:44:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 3836, "loss": 0.2377, "learning_rate": 3.151041666666667e-06, "epoch": 0.03153813573127423, "percentage": 3.15, "elapsed_time": "0:11:11", "remaining_time": "5:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 3836, "loss": 0.2333, "learning_rate": 3.1770833333333333e-06, "epoch": 0.031798781481119476, "percentage": 3.18, "elapsed_time": "0:11:17", "remaining_time": "5:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 3836, "loss": 0.2281, "learning_rate": 3.2031250000000004e-06, "epoch": 0.032059427230964714, "percentage": 3.21, "elapsed_time": "0:11:22", "remaining_time": "5:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 3836, "loss": 0.2531, "learning_rate": 3.229166666666667e-06, "epoch": 0.03232007298080996, "percentage": 3.23, "elapsed_time": "0:11:27", "remaining_time": "5:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 3836, "loss": 0.2496, "learning_rate": 3.2552083333333335e-06, "epoch": 0.0325807187306552, "percentage": 3.26, "elapsed_time": "0:11:33", "remaining_time": "5:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 3836, "loss": 0.2279, "learning_rate": 3.28125e-06, "epoch": 0.03284136448050044, "percentage": 3.28, "elapsed_time": "0:11:38", "remaining_time": "5:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 3836, "loss": 0.2404, "learning_rate": 3.307291666666667e-06, "epoch": 0.03310201023034568, "percentage": 3.31, "elapsed_time": "0:11:43", "remaining_time": "5:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 3836, "loss": 0.2559, "learning_rate": 3.3333333333333333e-06, "epoch": 0.033362655980190926, "percentage": 3.34, "elapsed_time": "0:11:49", "remaining_time": "5:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 3836, "loss": 0.2436, "learning_rate": 3.3593750000000003e-06, "epoch": 0.033623301730036165, "percentage": 3.36, "elapsed_time": "0:11:54", "remaining_time": "5:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 3836, "loss": 0.2345, "learning_rate": 3.385416666666667e-06, "epoch": 0.0338839474798814, "percentage": 3.39, "elapsed_time": "0:12:00", "remaining_time": "5:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 3836, "loss": 0.2364, "learning_rate": 3.4114583333333335e-06, "epoch": 0.03414459322972665, "percentage": 3.42, "elapsed_time": "0:12:06", "remaining_time": "5:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 3836, "loss": 0.2362, "learning_rate": 3.4375e-06, "epoch": 0.03440523897957189, "percentage": 3.44, "elapsed_time": "0:12:11", "remaining_time": "5:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 3836, "loss": 0.2353, "learning_rate": 3.463541666666667e-06, "epoch": 0.03466588472941713, "percentage": 3.47, "elapsed_time": "0:12:17", "remaining_time": "5:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 3836, "loss": 0.225, "learning_rate": 3.4895833333333333e-06, "epoch": 0.03492653047926237, "percentage": 3.49, "elapsed_time": "0:12:22", "remaining_time": "5:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 3836, "loss": 0.2177, "learning_rate": 3.5156250000000003e-06, "epoch": 0.035187176229107615, "percentage": 3.52, "elapsed_time": "0:12:28", "remaining_time": "5:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 3836, "loss": 0.2291, "learning_rate": 3.5416666666666673e-06, "epoch": 0.035447821978952854, "percentage": 3.55, "elapsed_time": "0:12:34", "remaining_time": "5:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 3836, "loss": 0.2211, "learning_rate": 3.5677083333333335e-06, "epoch": 0.0357084677287981, "percentage": 3.57, "elapsed_time": "0:12:39", "remaining_time": "5:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 3836, "loss": 0.2276, "learning_rate": 3.59375e-06, "epoch": 0.03596911347864334, "percentage": 3.6, "elapsed_time": "0:12:45", "remaining_time": "5:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 3836, "loss": 0.2256, "learning_rate": 3.619791666666667e-06, "epoch": 0.03622975922848858, "percentage": 3.62, "elapsed_time": "0:12:50", "remaining_time": "5:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 3836, "loss": 0.2322, "learning_rate": 3.6458333333333333e-06, "epoch": 0.03649040497833382, "percentage": 3.65, "elapsed_time": "0:12:56", "remaining_time": "5:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 3836, "loss": 0.2533, "learning_rate": 3.6718750000000003e-06, "epoch": 0.036751050728179066, "percentage": 3.68, "elapsed_time": "0:13:01", "remaining_time": "5:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 3836, "loss": 0.2198, "learning_rate": 3.6979166666666673e-06, "epoch": 0.037011696478024304, "percentage": 3.7, "elapsed_time": "0:13:07", "remaining_time": "5:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 3836, "loss": 0.2236, "learning_rate": 3.7239583333333335e-06, "epoch": 0.03727234222786955, "percentage": 3.73, "elapsed_time": "0:13:12", "remaining_time": "5:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 3836, "loss": 0.2217, "learning_rate": 3.7500000000000005e-06, "epoch": 0.03753298797771479, "percentage": 3.75, "elapsed_time": "0:13:17", "remaining_time": "5:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 3836, "loss": 0.2305, "learning_rate": 3.776041666666667e-06, "epoch": 0.03779363372756003, "percentage": 3.78, "elapsed_time": "0:13:22", "remaining_time": "5:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 3836, "loss": 0.223, "learning_rate": 3.8020833333333333e-06, "epoch": 0.03805427947740527, "percentage": 3.81, "elapsed_time": "0:13:28", "remaining_time": "5:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 3836, "loss": 0.2425, "learning_rate": 3.828125000000001e-06, "epoch": 0.03831492522725051, "percentage": 3.83, "elapsed_time": "0:13:33", "remaining_time": "5:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 3836, "loss": 0.2139, "learning_rate": 3.854166666666667e-06, "epoch": 0.038575570977095755, "percentage": 3.86, "elapsed_time": "0:13:39", "remaining_time": "5:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 3836, "loss": 0.2337, "learning_rate": 3.880208333333333e-06, "epoch": 0.03883621672694099, "percentage": 3.88, "elapsed_time": "0:13:44", "remaining_time": "5:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 3836, "loss": 0.227, "learning_rate": 3.90625e-06, "epoch": 0.03909686247678624, "percentage": 3.91, "elapsed_time": "0:13:49", "remaining_time": "5:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 3836, "loss": 0.243, "learning_rate": 3.932291666666667e-06, "epoch": 0.03935750822663148, "percentage": 3.94, "elapsed_time": "0:13:54", "remaining_time": "5:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 3836, "loss": 0.2137, "learning_rate": 3.958333333333333e-06, "epoch": 0.03961815397647672, "percentage": 3.96, "elapsed_time": "0:14:00", "remaining_time": "5:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 3836, "loss": 0.2439, "learning_rate": 3.984375e-06, "epoch": 0.03987879972632196, "percentage": 3.99, "elapsed_time": "0:14:06", "remaining_time": "5:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 3836, "loss": 0.2321, "learning_rate": 4.010416666666667e-06, "epoch": 0.040139445476167206, "percentage": 4.01, "elapsed_time": "0:14:11", "remaining_time": "5:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 3836, "loss": 0.2205, "learning_rate": 4.0364583333333335e-06, "epoch": 0.040400091226012444, "percentage": 4.04, "elapsed_time": "0:14:17", "remaining_time": "5:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 3836, "loss": 0.2445, "learning_rate": 4.0625000000000005e-06, "epoch": 0.04066073697585769, "percentage": 4.07, "elapsed_time": "0:14:22", "remaining_time": "5:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 3836, "loss": 0.2215, "learning_rate": 4.0885416666666675e-06, "epoch": 0.04092138272570293, "percentage": 4.09, "elapsed_time": "0:14:28", "remaining_time": "5:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 3836, "loss": 0.235, "learning_rate": 4.114583333333334e-06, "epoch": 0.04118202847554817, "percentage": 4.12, "elapsed_time": "0:14:33", "remaining_time": "5:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 3836, "loss": 0.2257, "learning_rate": 4.140625000000001e-06, "epoch": 0.04144267422539341, "percentage": 4.14, "elapsed_time": "0:14:39", "remaining_time": "5:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 3836, "loss": 0.2385, "learning_rate": 4.166666666666667e-06, "epoch": 0.041703319975238656, "percentage": 4.17, "elapsed_time": "0:14:44", "remaining_time": "5:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 3836, "loss": 0.2378, "learning_rate": 4.192708333333334e-06, "epoch": 0.041963965725083895, "percentage": 4.2, "elapsed_time": "0:14:49", "remaining_time": "5:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 3836, "loss": 0.2097, "learning_rate": 4.21875e-06, "epoch": 0.04222461147492914, "percentage": 4.22, "elapsed_time": "0:14:55", "remaining_time": "5:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 3836, "loss": 0.2296, "learning_rate": 4.244791666666667e-06, "epoch": 0.04248525722477438, "percentage": 4.25, "elapsed_time": "0:15:01", "remaining_time": "5:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 3836, "loss": 0.219, "learning_rate": 4.270833333333333e-06, "epoch": 0.04274590297461962, "percentage": 4.28, "elapsed_time": "0:15:06", "remaining_time": "5:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 3836, "loss": 0.2307, "learning_rate": 4.296875e-06, "epoch": 0.04300654872446486, "percentage": 4.3, "elapsed_time": "0:15:11", "remaining_time": "5:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 3836, "loss": 0.2042, "learning_rate": 4.322916666666667e-06, "epoch": 0.0432671944743101, "percentage": 4.33, "elapsed_time": "0:15:17", "remaining_time": "5:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 3836, "loss": 0.231, "learning_rate": 4.3489583333333334e-06, "epoch": 0.043527840224155345, "percentage": 4.35, "elapsed_time": "0:15:22", "remaining_time": "5:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 3836, "loss": 0.225, "learning_rate": 4.3750000000000005e-06, "epoch": 0.043788485974000584, "percentage": 4.38, "elapsed_time": "0:15:28", "remaining_time": "5:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 3836, "loss": 0.2211, "learning_rate": 4.4010416666666675e-06, "epoch": 0.04404913172384583, "percentage": 4.41, "elapsed_time": "0:15:33", "remaining_time": "5:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 3836, "loss": 0.2117, "learning_rate": 4.427083333333334e-06, "epoch": 0.04430977747369107, "percentage": 4.43, "elapsed_time": "0:15:38", "remaining_time": "5:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 3836, "loss": 0.2116, "learning_rate": 4.453125000000001e-06, "epoch": 0.04457042322353631, "percentage": 4.46, "elapsed_time": "0:15:43", "remaining_time": "5:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 3836, "loss": 0.2222, "learning_rate": 4.479166666666667e-06, "epoch": 0.04483106897338155, "percentage": 4.48, "elapsed_time": "0:15:48", "remaining_time": "5:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 3836, "loss": 0.2347, "learning_rate": 4.505208333333334e-06, "epoch": 0.045091714723226796, "percentage": 4.51, "elapsed_time": "0:15:53", "remaining_time": "5:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 3836, "loss": 0.2287, "learning_rate": 4.53125e-06, "epoch": 0.045352360473072034, "percentage": 4.54, "elapsed_time": "0:15:59", "remaining_time": "5:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 3836, "loss": 0.2216, "learning_rate": 4.557291666666667e-06, "epoch": 0.04561300622291728, "percentage": 4.56, "elapsed_time": "0:16:05", "remaining_time": "5:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 3836, "loss": 0.2607, "learning_rate": 4.583333333333333e-06, "epoch": 0.04587365197276252, "percentage": 4.59, "elapsed_time": "0:16:10", "remaining_time": "5:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 3836, "loss": 0.2337, "learning_rate": 4.609375e-06, "epoch": 0.04613429772260776, "percentage": 4.61, "elapsed_time": "0:16:16", "remaining_time": "5:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 3836, "loss": 0.2361, "learning_rate": 4.635416666666667e-06, "epoch": 0.046394943472453, "percentage": 4.64, "elapsed_time": "0:16:22", "remaining_time": "5:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 3836, "loss": 0.2242, "learning_rate": 4.661458333333333e-06, "epoch": 0.04665558922229825, "percentage": 4.67, "elapsed_time": "0:16:27", "remaining_time": "5:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 3836, "loss": 0.2255, "learning_rate": 4.6875000000000004e-06, "epoch": 0.046916234972143485, "percentage": 4.69, "elapsed_time": "0:16:33", "remaining_time": "5:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 3836, "loss": 0.2092, "learning_rate": 4.7135416666666675e-06, "epoch": 0.04717688072198873, "percentage": 4.72, "elapsed_time": "0:16:39", "remaining_time": "5:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 3836, "loss": 0.2054, "learning_rate": 4.739583333333334e-06, "epoch": 0.04743752647183397, "percentage": 4.74, "elapsed_time": "0:16:44", "remaining_time": "5:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 3836, "loss": 0.2395, "learning_rate": 4.765625000000001e-06, "epoch": 0.047698172221679214, "percentage": 4.77, "elapsed_time": "0:16:50", "remaining_time": "5:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 3836, "loss": 0.2131, "learning_rate": 4.791666666666668e-06, "epoch": 0.04795881797152445, "percentage": 4.8, "elapsed_time": "0:16:56", "remaining_time": "5:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 3836, "loss": 0.2334, "learning_rate": 4.817708333333334e-06, "epoch": 0.04821946372136969, "percentage": 4.82, "elapsed_time": "0:17:01", "remaining_time": "5:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 3836, "loss": 0.2081, "learning_rate": 4.84375e-06, "epoch": 0.048480109471214936, "percentage": 4.85, "elapsed_time": "0:17:07", "remaining_time": "5:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 3836, "loss": 0.2379, "learning_rate": 4.869791666666667e-06, "epoch": 0.048740755221060174, "percentage": 4.87, "elapsed_time": "0:17:12", "remaining_time": "5:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 3836, "loss": 0.2323, "learning_rate": 4.895833333333333e-06, "epoch": 0.04900140097090542, "percentage": 4.9, "elapsed_time": "0:17:18", "remaining_time": "5:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 3836, "loss": 0.1977, "learning_rate": 4.921875e-06, "epoch": 0.04926204672075066, "percentage": 4.93, "elapsed_time": "0:17:23", "remaining_time": "5:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 3836, "loss": 0.2045, "learning_rate": 4.947916666666667e-06, "epoch": 0.0495226924705959, "percentage": 4.95, "elapsed_time": "0:17:28", "remaining_time": "5:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 3836, "loss": 0.2206, "learning_rate": 4.973958333333333e-06, "epoch": 0.04978333822044114, "percentage": 4.98, "elapsed_time": "0:17:34", "remaining_time": "5:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 3836, "loss": 0.2155, "learning_rate": 5e-06, "epoch": 0.050043983970286386, "percentage": 5.01, "elapsed_time": "0:17:39", "remaining_time": "5:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 3836, "loss": 0.2161, "learning_rate": 4.999999070920249e-06, "epoch": 0.050304629720131624, "percentage": 5.03, "elapsed_time": "0:17:44", "remaining_time": "5:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 3836, "loss": 0.2314, "learning_rate": 4.999996283681687e-06, "epoch": 0.05056527546997687, "percentage": 5.06, "elapsed_time": "0:17:50", "remaining_time": "5:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 3836, "loss": 0.2298, "learning_rate": 4.999991638286384e-06, "epoch": 0.05082592121982211, "percentage": 5.08, "elapsed_time": "0:17:56", "remaining_time": "5:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 3836, "loss": 0.237, "learning_rate": 4.9999851347377946e-06, "epoch": 0.05108656696966735, "percentage": 5.11, "elapsed_time": "0:18:02", "remaining_time": "5:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 3836, "loss": 0.219, "learning_rate": 4.9999767730407515e-06, "epoch": 0.05134721271951259, "percentage": 5.14, "elapsed_time": "0:18:07", "remaining_time": "5:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 3836, "loss": 0.2182, "learning_rate": 4.99996655320147e-06, "epoch": 0.05160785846935784, "percentage": 5.16, "elapsed_time": "0:18:12", "remaining_time": "5:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 3836, "loss": 0.2408, "learning_rate": 4.999954475227547e-06, "epoch": 0.051868504219203075, "percentage": 5.19, "elapsed_time": "0:18:18", "remaining_time": "5:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 3836, "loss": 0.2222, "learning_rate": 4.999940539127958e-06, "epoch": 0.05212914996904832, "percentage": 5.21, "elapsed_time": "0:18:23", "remaining_time": "5:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 3836, "loss": 0.2183, "learning_rate": 4.999924744913062e-06, "epoch": 0.05238979571889356, "percentage": 5.24, "elapsed_time": "0:18:29", "remaining_time": "5:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 3836, "loss": 0.2413, "learning_rate": 4.999907092594598e-06, "epoch": 0.0526504414687388, "percentage": 5.27, "elapsed_time": "0:18:35", "remaining_time": "5:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 3836, "loss": 0.2485, "learning_rate": 4.999887582185688e-06, "epoch": 0.05291108721858404, "percentage": 5.29, "elapsed_time": "0:18:41", "remaining_time": "5:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 3836, "loss": 0.2171, "learning_rate": 4.99986621370083e-06, "epoch": 0.05317173296842928, "percentage": 5.32, "elapsed_time": "0:18:46", "remaining_time": "5:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 3836, "loss": 0.2281, "learning_rate": 4.999842987155909e-06, "epoch": 0.053432378718274526, "percentage": 5.34, "elapsed_time": "0:18:52", "remaining_time": "5:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 3836, "loss": 0.247, "learning_rate": 4.99981790256819e-06, "epoch": 0.053693024468119764, "percentage": 5.37, "elapsed_time": "0:18:58", "remaining_time": "5:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 3836, "loss": 0.2179, "learning_rate": 4.999790959956312e-06, "epoch": 0.05395367021796501, "percentage": 5.4, "elapsed_time": "0:19:05", "remaining_time": "5:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 3836, "loss": 0.2291, "learning_rate": 4.999762159340305e-06, "epoch": 0.05421431596781025, "percentage": 5.42, "elapsed_time": "0:19:10", "remaining_time": "5:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 3836, "loss": 0.2214, "learning_rate": 4.999731500741575e-06, "epoch": 0.05447496171765549, "percentage": 5.45, "elapsed_time": "0:19:16", "remaining_time": "5:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 3836, "loss": 0.2243, "learning_rate": 4.999698984182909e-06, "epoch": 0.05473560746750073, "percentage": 5.47, "elapsed_time": "0:19:22", "remaining_time": "5:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 3836, "loss": 0.219, "learning_rate": 4.999664609688474e-06, "epoch": 0.054996253217345976, "percentage": 5.5, "elapsed_time": "0:19:28", "remaining_time": "5:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 3836, "loss": 0.2228, "learning_rate": 4.999628377283821e-06, "epoch": 0.055256898967191215, "percentage": 5.53, "elapsed_time": "0:19:33", "remaining_time": "5:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 3836, "loss": 0.2331, "learning_rate": 4.999590286995879e-06, "epoch": 0.05551754471703646, "percentage": 5.55, "elapsed_time": "0:19:39", "remaining_time": "5:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 3836, "loss": 0.2305, "learning_rate": 4.99955033885296e-06, "epoch": 0.0557781904668817, "percentage": 5.58, "elapsed_time": "0:19:44", "remaining_time": "5:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 3836, "loss": 0.2386, "learning_rate": 4.999508532884756e-06, "epoch": 0.056038836216726944, "percentage": 5.6, "elapsed_time": "0:19:50", "remaining_time": "5:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 3836, "loss": 0.2377, "learning_rate": 4.999464869122339e-06, "epoch": 0.05629948196657218, "percentage": 5.63, "elapsed_time": "0:19:56", "remaining_time": "5:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 3836, "loss": 0.2322, "learning_rate": 4.999419347598164e-06, "epoch": 0.05656012771641743, "percentage": 5.66, "elapsed_time": "0:20:02", "remaining_time": "5:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 3836, "loss": 0.236, "learning_rate": 4.999371968346064e-06, "epoch": 0.056820773466262665, "percentage": 5.68, "elapsed_time": "0:20:07", "remaining_time": "5:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 3836, "loss": 0.2181, "learning_rate": 4.999322731401256e-06, "epoch": 0.05708141921610791, "percentage": 5.71, "elapsed_time": "0:20:13", "remaining_time": "5:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 3836, "loss": 0.2268, "learning_rate": 4.999271636800334e-06, "epoch": 0.05734206496595315, "percentage": 5.74, "elapsed_time": "0:20:18", "remaining_time": "5:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 3836, "loss": 0.2269, "learning_rate": 4.999218684581277e-06, "epoch": 0.05760271071579839, "percentage": 5.76, "elapsed_time": "0:20:24", "remaining_time": "5:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 3836, "loss": 0.2356, "learning_rate": 4.999163874783441e-06, "epoch": 0.05786335646564363, "percentage": 5.79, "elapsed_time": "0:20:29", "remaining_time": "5:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 3836, "loss": 0.2314, "learning_rate": 4.999107207447564e-06, "epoch": 0.05812400221548887, "percentage": 5.81, "elapsed_time": "0:20:35", "remaining_time": "5:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 3836, "loss": 0.2158, "learning_rate": 4.999048682615766e-06, "epoch": 0.058384647965334116, "percentage": 5.84, "elapsed_time": "0:20:41", "remaining_time": "5:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 3836, "loss": 0.2248, "learning_rate": 4.998988300331545e-06, "epoch": 0.058645293715179354, "percentage": 5.87, "elapsed_time": "0:20:46", "remaining_time": "5:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 3836, "loss": 0.2175, "learning_rate": 4.9989260606397816e-06, "epoch": 0.0589059394650246, "percentage": 5.89, "elapsed_time": "0:20:52", "remaining_time": "5:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 3836, "loss": 0.2319, "learning_rate": 4.998861963586737e-06, "epoch": 0.05916658521486984, "percentage": 5.92, "elapsed_time": "0:20:57", "remaining_time": "5:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 3836, "loss": 0.2079, "learning_rate": 4.998796009220051e-06, "epoch": 0.05942723096471508, "percentage": 5.94, "elapsed_time": "0:21:03", "remaining_time": "5:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 3836, "loss": 0.2034, "learning_rate": 4.998728197588746e-06, "epoch": 0.05968787671456032, "percentage": 5.97, "elapsed_time": "0:21:09", "remaining_time": "5:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 3836, "loss": 0.2166, "learning_rate": 4.9986585287432236e-06, "epoch": 0.05994852246440557, "percentage": 6.0, "elapsed_time": "0:21:15", "remaining_time": "5:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 3836, "loss": 0.2246, "learning_rate": 4.998587002735266e-06, "epoch": 0.060209168214250805, "percentage": 6.02, "elapsed_time": "0:21:20", "remaining_time": "5:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 3836, "loss": 0.2356, "learning_rate": 4.998513619618036e-06, "epoch": 0.06046981396409605, "percentage": 6.05, "elapsed_time": "0:21:26", "remaining_time": "5:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 3836, "loss": 0.2357, "learning_rate": 4.998438379446077e-06, "epoch": 0.06073045971394129, "percentage": 6.07, "elapsed_time": "0:21:31", "remaining_time": "5:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 3836, "loss": 0.2219, "learning_rate": 4.998361282275311e-06, "epoch": 0.060991105463786534, "percentage": 6.1, "elapsed_time": "0:21:37", "remaining_time": "5:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 3836, "loss": 0.231, "learning_rate": 4.998282328163043e-06, "epoch": 0.06125175121363177, "percentage": 6.13, "elapsed_time": "0:21:42", "remaining_time": "5:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 3836, "loss": 0.2348, "learning_rate": 4.998201517167956e-06, "epoch": 0.06151239696347702, "percentage": 6.15, "elapsed_time": "0:21:47", "remaining_time": "5:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 3836, "loss": 0.2194, "learning_rate": 4.998118849350114e-06, "epoch": 0.061773042713322256, "percentage": 6.18, "elapsed_time": "0:21:53", "remaining_time": "5:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 3836, "loss": 0.2274, "learning_rate": 4.998034324770962e-06, "epoch": 0.0620336884631675, "percentage": 6.2, "elapsed_time": "0:21:59", "remaining_time": "5:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 3836, "loss": 0.2152, "learning_rate": 4.997947943493322e-06, "epoch": 0.06229433421301274, "percentage": 6.23, "elapsed_time": "0:22:04", "remaining_time": "5:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 3836, "loss": 0.2286, "learning_rate": 4.997859705581399e-06, "epoch": 0.06255497996285798, "percentage": 6.26, "elapsed_time": "0:22:10", "remaining_time": "5:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 3836, "loss": 0.2203, "learning_rate": 4.997769611100779e-06, "epoch": 0.06281562571270322, "percentage": 6.28, "elapsed_time": "0:22:15", "remaining_time": "5:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 3836, "loss": 0.2223, "learning_rate": 4.997677660118423e-06, "epoch": 0.06307627146254846, "percentage": 6.31, "elapsed_time": "0:22:21", "remaining_time": "5:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 3836, "loss": 0.2093, "learning_rate": 4.997583852702675e-06, "epoch": 0.0633369172123937, "percentage": 6.33, "elapsed_time": "0:22:27", "remaining_time": "5:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 3836, "loss": 0.2198, "learning_rate": 4.997488188923262e-06, "epoch": 0.06359756296223895, "percentage": 6.36, "elapsed_time": "0:22:32", "remaining_time": "5:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 3836, "loss": 0.2409, "learning_rate": 4.997390668851284e-06, "epoch": 0.06385820871208418, "percentage": 6.39, "elapsed_time": "0:22:38", "remaining_time": "5:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 3836, "loss": 0.228, "learning_rate": 4.9972912925592245e-06, "epoch": 0.06411885446192943, "percentage": 6.41, "elapsed_time": "0:22:44", "remaining_time": "5:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 3836, "loss": 0.2089, "learning_rate": 4.997190060120948e-06, "epoch": 0.06437950021177467, "percentage": 6.44, "elapsed_time": "0:22:49", "remaining_time": "5:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 3836, "loss": 0.2118, "learning_rate": 4.997086971611696e-06, "epoch": 0.06464014596161992, "percentage": 6.47, "elapsed_time": "0:22:55", "remaining_time": "5:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 3836, "loss": 0.2239, "learning_rate": 4.996982027108091e-06, "epoch": 0.06490079171146515, "percentage": 6.49, "elapsed_time": "0:23:00", "remaining_time": "5:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 3836, "loss": 0.2221, "learning_rate": 4.996875226688133e-06, "epoch": 0.0651614374613104, "percentage": 6.52, "elapsed_time": "0:23:06", "remaining_time": "5:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 3836, "loss": 0.2286, "learning_rate": 4.996766570431203e-06, "epoch": 0.06542208321115564, "percentage": 6.54, "elapsed_time": "0:23:12", "remaining_time": "5:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 3836, "loss": 0.2319, "learning_rate": 4.996656058418064e-06, "epoch": 0.06568272896100089, "percentage": 6.57, "elapsed_time": "0:23:18", "remaining_time": "5:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 3836, "loss": 0.2212, "learning_rate": 4.996543690730852e-06, "epoch": 0.06594337471084612, "percentage": 6.6, "elapsed_time": "0:23:23", "remaining_time": "5:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 3836, "loss": 0.2091, "learning_rate": 4.996429467453088e-06, "epoch": 0.06620402046069136, "percentage": 6.62, "elapsed_time": "0:23:29", "remaining_time": "5:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 3836, "loss": 0.2087, "learning_rate": 4.99631338866967e-06, "epoch": 0.06646466621053661, "percentage": 6.65, "elapsed_time": "0:23:34", "remaining_time": "5:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 3836, "loss": 0.2176, "learning_rate": 4.996195454466873e-06, "epoch": 0.06672531196038185, "percentage": 6.67, "elapsed_time": "0:23:40", "remaining_time": "5:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 3836, "loss": 0.2296, "learning_rate": 4.996075664932356e-06, "epoch": 0.06698595771022708, "percentage": 6.7, "elapsed_time": "0:23:46", "remaining_time": "5:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 3836, "loss": 0.2225, "learning_rate": 4.995954020155153e-06, "epoch": 0.06724660346007233, "percentage": 6.73, "elapsed_time": "0:23:51", "remaining_time": "5:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 3836, "loss": 0.2309, "learning_rate": 4.9958305202256795e-06, "epoch": 0.06750724920991757, "percentage": 6.75, "elapsed_time": "0:23:57", "remaining_time": "5:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 3836, "loss": 0.2101, "learning_rate": 4.995705165235726e-06, "epoch": 0.0677678949597628, "percentage": 6.78, "elapsed_time": "0:24:02", "remaining_time": "5:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 3836, "loss": 0.2319, "learning_rate": 4.995577955278465e-06, "epoch": 0.06802854070960805, "percentage": 6.8, "elapsed_time": "0:24:08", "remaining_time": "5:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 3836, "loss": 0.2095, "learning_rate": 4.995448890448449e-06, "epoch": 0.0682891864594533, "percentage": 6.83, "elapsed_time": "0:24:13", "remaining_time": "5:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 3836, "loss": 0.2313, "learning_rate": 4.995317970841605e-06, "epoch": 0.06854983220929854, "percentage": 6.86, "elapsed_time": "0:24:19", "remaining_time": "5:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 3836, "loss": 0.2168, "learning_rate": 4.995185196555242e-06, "epoch": 0.06881047795914377, "percentage": 6.88, "elapsed_time": "0:24:24", "remaining_time": "5:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 3836, "loss": 0.2205, "learning_rate": 4.9950505676880455e-06, "epoch": 0.06907112370898902, "percentage": 6.91, "elapsed_time": "0:24:30", "remaining_time": "5:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 3836, "loss": 0.2032, "learning_rate": 4.994914084340082e-06, "epoch": 0.06933176945883426, "percentage": 6.93, "elapsed_time": "0:24:36", "remaining_time": "5:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 3836, "loss": 0.2342, "learning_rate": 4.994775746612792e-06, "epoch": 0.06959241520867951, "percentage": 6.96, "elapsed_time": "0:24:42", "remaining_time": "5:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 3836, "loss": 0.2225, "learning_rate": 4.994635554608999e-06, "epoch": 0.06985306095852474, "percentage": 6.99, "elapsed_time": "0:24:47", "remaining_time": "5:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 3836, "loss": 0.2272, "learning_rate": 4.9944935084329015e-06, "epoch": 0.07011370670836999, "percentage": 7.01, "elapsed_time": "0:24:53", "remaining_time": "5:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 3836, "loss": 0.2154, "learning_rate": 4.994349608190079e-06, "epoch": 0.07037435245821523, "percentage": 7.04, "elapsed_time": "0:24:58", "remaining_time": "5:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 3836, "loss": 0.2374, "learning_rate": 4.994203853987485e-06, "epoch": 0.07063499820806048, "percentage": 7.06, "elapsed_time": "0:25:04", "remaining_time": "5:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 3836, "loss": 0.2299, "learning_rate": 4.994056245933454e-06, "epoch": 0.07089564395790571, "percentage": 7.09, "elapsed_time": "0:25:08", "remaining_time": "5:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 3836, "loss": 0.2312, "learning_rate": 4.9939067841376985e-06, "epoch": 0.07115628970775095, "percentage": 7.12, "elapsed_time": "0:25:13", "remaining_time": "5:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 3836, "loss": 0.2071, "learning_rate": 4.993755468711308e-06, "epoch": 0.0714169354575962, "percentage": 7.14, "elapsed_time": "0:25:19", "remaining_time": "5:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 3836, "loss": 0.2113, "learning_rate": 4.99360229976675e-06, "epoch": 0.07167758120744143, "percentage": 7.17, "elapsed_time": "0:25:25", "remaining_time": "5:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 3836, "loss": 0.2137, "learning_rate": 4.993447277417867e-06, "epoch": 0.07193822695728667, "percentage": 7.19, "elapsed_time": "0:25:30", "remaining_time": "5:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 3836, "loss": 0.2287, "learning_rate": 4.993290401779886e-06, "epoch": 0.07219887270713192, "percentage": 7.22, "elapsed_time": "0:25:36", "remaining_time": "5:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 3836, "loss": 0.2228, "learning_rate": 4.993131672969402e-06, "epoch": 0.07245951845697716, "percentage": 7.25, "elapsed_time": "0:25:41", "remaining_time": "5:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 3836, "loss": 0.2157, "learning_rate": 4.992971091104396e-06, "epoch": 0.0727201642068224, "percentage": 7.27, "elapsed_time": "0:25:47", "remaining_time": "5:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 3836, "loss": 0.2291, "learning_rate": 4.992808656304221e-06, "epoch": 0.07298080995666764, "percentage": 7.3, "elapsed_time": "0:25:52", "remaining_time": "5:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 3836, "loss": 0.2257, "learning_rate": 4.99264436868961e-06, "epoch": 0.07324145570651289, "percentage": 7.33, "elapsed_time": "0:25:58", "remaining_time": "5:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 3836, "loss": 0.2344, "learning_rate": 4.99247822838267e-06, "epoch": 0.07350210145635813, "percentage": 7.35, "elapsed_time": "0:26:04", "remaining_time": "5:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 3836, "loss": 0.2205, "learning_rate": 4.9923102355068895e-06, "epoch": 0.07376274720620336, "percentage": 7.38, "elapsed_time": "0:26:10", "remaining_time": "5:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 3836, "loss": 0.2062, "learning_rate": 4.99214039018713e-06, "epoch": 0.07402339295604861, "percentage": 7.4, "elapsed_time": "0:26:15", "remaining_time": "5:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 3836, "loss": 0.2092, "learning_rate": 4.991968692549632e-06, "epoch": 0.07428403870589385, "percentage": 7.43, "elapsed_time": "0:26:21", "remaining_time": "5:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 3836, "loss": 0.2287, "learning_rate": 4.991795142722012e-06, "epoch": 0.0745446844557391, "percentage": 7.46, "elapsed_time": "0:26:27", "remaining_time": "5:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 3836, "loss": 0.2253, "learning_rate": 4.991619740833263e-06, "epoch": 0.07480533020558433, "percentage": 7.48, "elapsed_time": "0:26:33", "remaining_time": "5:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 3836, "loss": 0.2505, "learning_rate": 4.9914424870137565e-06, "epoch": 0.07506597595542958, "percentage": 7.51, "elapsed_time": "0:26:39", "remaining_time": "5:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 3836, "loss": 0.2171, "learning_rate": 4.991263381395236e-06, "epoch": 0.07532662170527482, "percentage": 7.53, "elapsed_time": "0:26:44", "remaining_time": "5:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 3836, "loss": 0.2082, "learning_rate": 4.991082424110826e-06, "epoch": 0.07558726745512007, "percentage": 7.56, "elapsed_time": "0:26:49", "remaining_time": "5:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 3836, "loss": 0.2198, "learning_rate": 4.9908996152950266e-06, "epoch": 0.0758479132049653, "percentage": 7.59, "elapsed_time": "0:26:55", "remaining_time": "5:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 3836, "loss": 0.2206, "learning_rate": 4.990714955083709e-06, "epoch": 0.07610855895481054, "percentage": 7.61, "elapsed_time": "0:27:01", "remaining_time": "5:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 3836, "loss": 0.2242, "learning_rate": 4.990528443614129e-06, "epoch": 0.07636920470465579, "percentage": 7.64, "elapsed_time": "0:27:07", "remaining_time": "5:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 3836, "loss": 0.2017, "learning_rate": 4.9903400810249116e-06, "epoch": 0.07662985045450102, "percentage": 7.66, "elapsed_time": "0:27:12", "remaining_time": "5:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 3836, "loss": 0.2288, "learning_rate": 4.99014986745606e-06, "epoch": 0.07689049620434626, "percentage": 7.69, "elapsed_time": "0:27:18", "remaining_time": "5:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 3836, "loss": 0.217, "learning_rate": 4.9899578030489534e-06, "epoch": 0.07715114195419151, "percentage": 7.72, "elapsed_time": "0:27:23", "remaining_time": "5:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 3836, "loss": 0.2251, "learning_rate": 4.989763887946346e-06, "epoch": 0.07741178770403676, "percentage": 7.74, "elapsed_time": "0:27:28", "remaining_time": "5:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 3836, "loss": 0.2143, "learning_rate": 4.9895681222923685e-06, "epoch": 0.07767243345388199, "percentage": 7.77, "elapsed_time": "0:27:34", "remaining_time": "5:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 3836, "loss": 0.2246, "learning_rate": 4.989370506232525e-06, "epoch": 0.07793307920372723, "percentage": 7.79, "elapsed_time": "0:27:40", "remaining_time": "5:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 3836, "loss": 0.2275, "learning_rate": 4.989171039913698e-06, "epoch": 0.07819372495357248, "percentage": 7.82, "elapsed_time": "0:27:46", "remaining_time": "5:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 3836, "loss": 0.222, "learning_rate": 4.988969723484142e-06, "epoch": 0.07845437070341772, "percentage": 7.85, "elapsed_time": "0:27:51", "remaining_time": "5:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 3836, "loss": 0.2263, "learning_rate": 4.9887665570934905e-06, "epoch": 0.07871501645326295, "percentage": 7.87, "elapsed_time": "0:27:57", "remaining_time": "5:27:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 3836, "loss": 0.2173, "learning_rate": 4.988561540892748e-06, "epoch": 0.0789756622031082, "percentage": 7.9, "elapsed_time": "0:28:03", "remaining_time": "5:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 3836, "loss": 0.2148, "learning_rate": 4.988354675034296e-06, "epoch": 0.07923630795295344, "percentage": 7.92, "elapsed_time": "0:28:08", "remaining_time": "5:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 3836, "loss": 0.2005, "learning_rate": 4.98814595967189e-06, "epoch": 0.07949695370279869, "percentage": 7.95, "elapsed_time": "0:28:14", "remaining_time": "5:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 3836, "loss": 0.2218, "learning_rate": 4.987935394960661e-06, "epoch": 0.07975759945264392, "percentage": 7.98, "elapsed_time": "0:28:19", "remaining_time": "5:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 3836, "loss": 0.2184, "learning_rate": 4.9877229810571145e-06, "epoch": 0.08001824520248917, "percentage": 8.0, "elapsed_time": "0:28:25", "remaining_time": "5:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 3836, "loss": 0.2191, "learning_rate": 4.98750871811913e-06, "epoch": 0.08027889095233441, "percentage": 8.03, "elapsed_time": "0:28:30", "remaining_time": "5:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 3836, "loss": 0.225, "learning_rate": 4.98729260630596e-06, "epoch": 0.08053953670217966, "percentage": 8.06, "elapsed_time": "0:28:35", "remaining_time": "5:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 3836, "loss": 0.2243, "learning_rate": 4.987074645778234e-06, "epoch": 0.08080018245202489, "percentage": 8.08, "elapsed_time": "0:28:41", "remaining_time": "5:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 3836, "loss": 0.2062, "learning_rate": 4.986854836697953e-06, "epoch": 0.08106082820187013, "percentage": 8.11, "elapsed_time": "0:28:47", "remaining_time": "5:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 3836, "loss": 0.2189, "learning_rate": 4.986633179228495e-06, "epoch": 0.08132147395171538, "percentage": 8.13, "elapsed_time": "0:28:52", "remaining_time": "5:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 3836, "loss": 0.2207, "learning_rate": 4.986409673534609e-06, "epoch": 0.08158211970156061, "percentage": 8.16, "elapsed_time": "0:28:58", "remaining_time": "5:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 3836, "loss": 0.2164, "learning_rate": 4.986184319782418e-06, "epoch": 0.08184276545140586, "percentage": 8.19, "elapsed_time": "0:29:04", "remaining_time": "5:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 3836, "loss": 0.2101, "learning_rate": 4.98595711813942e-06, "epoch": 0.0821034112012511, "percentage": 8.21, "elapsed_time": "0:29:09", "remaining_time": "5:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 3836, "loss": 0.2223, "learning_rate": 4.9857280687744856e-06, "epoch": 0.08236405695109635, "percentage": 8.24, "elapsed_time": "0:29:14", "remaining_time": "5:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 3836, "loss": 0.2219, "learning_rate": 4.98549717185786e-06, "epoch": 0.08262470270094158, "percentage": 8.26, "elapsed_time": "0:29:20", "remaining_time": "5:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 3836, "loss": 0.2183, "learning_rate": 4.985264427561158e-06, "epoch": 0.08288534845078682, "percentage": 8.29, "elapsed_time": "0:29:25", "remaining_time": "5:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 3836, "loss": 0.2303, "learning_rate": 4.985029836057372e-06, "epoch": 0.08314599420063207, "percentage": 8.32, "elapsed_time": "0:29:30", "remaining_time": "5:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 3836, "loss": 0.1969, "learning_rate": 4.984793397520865e-06, "epoch": 0.08340663995047731, "percentage": 8.34, "elapsed_time": "0:29:35", "remaining_time": "5:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 3836, "loss": 0.2051, "learning_rate": 4.984555112127373e-06, "epoch": 0.08366728570032254, "percentage": 8.37, "elapsed_time": "0:29:41", "remaining_time": "5:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 3836, "loss": 0.2136, "learning_rate": 4.984314980054005e-06, "epoch": 0.08392793145016779, "percentage": 8.39, "elapsed_time": "0:29:46", "remaining_time": "5:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 3836, "loss": 0.2058, "learning_rate": 4.984073001479241e-06, "epoch": 0.08418857720001303, "percentage": 8.42, "elapsed_time": "0:29:52", "remaining_time": "5:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 3836, "loss": 0.2195, "learning_rate": 4.983829176582939e-06, "epoch": 0.08444922294985828, "percentage": 8.45, "elapsed_time": "0:29:58", "remaining_time": "5:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 3836, "loss": 0.2179, "learning_rate": 4.98358350554632e-06, "epoch": 0.08470986869970351, "percentage": 8.47, "elapsed_time": "0:30:04", "remaining_time": "5:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 3836, "loss": 0.2114, "learning_rate": 4.983335988551986e-06, "epoch": 0.08497051444954876, "percentage": 8.5, "elapsed_time": "0:30:10", "remaining_time": "5:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 3836, "loss": 0.2045, "learning_rate": 4.983086625783907e-06, "epoch": 0.085231160199394, "percentage": 8.52, "elapsed_time": "0:30:15", "remaining_time": "5:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 3836, "loss": 0.2174, "learning_rate": 4.982835417427424e-06, "epoch": 0.08549180594923925, "percentage": 8.55, "elapsed_time": "0:30:20", "remaining_time": "5:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 3836, "loss": 0.2037, "learning_rate": 4.982582363669252e-06, "epoch": 0.08575245169908448, "percentage": 8.58, "elapsed_time": "0:30:25", "remaining_time": "5:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 3836, "loss": 0.2148, "learning_rate": 4.982327464697476e-06, "epoch": 0.08601309744892972, "percentage": 8.6, "elapsed_time": "0:30:31", "remaining_time": "5:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 3836, "loss": 0.2247, "learning_rate": 4.982070720701554e-06, "epoch": 0.08627374319877497, "percentage": 8.63, "elapsed_time": "0:30:36", "remaining_time": "5:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 3836, "loss": 0.2153, "learning_rate": 4.981812131872315e-06, "epoch": 0.0865343889486202, "percentage": 8.65, "elapsed_time": "0:30:42", "remaining_time": "5:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 3836, "loss": 0.2169, "learning_rate": 4.981551698401956e-06, "epoch": 0.08679503469846545, "percentage": 8.68, "elapsed_time": "0:30:47", "remaining_time": "5:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 3836, "loss": 0.2162, "learning_rate": 4.981289420484051e-06, "epoch": 0.08705568044831069, "percentage": 8.71, "elapsed_time": "0:30:53", "remaining_time": "5:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 3836, "loss": 0.2076, "learning_rate": 4.981025298313541e-06, "epoch": 0.08731632619815594, "percentage": 8.73, "elapsed_time": "0:30:58", "remaining_time": "5:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 3836, "loss": 0.2066, "learning_rate": 4.980759332086736e-06, "epoch": 0.08757697194800117, "percentage": 8.76, "elapsed_time": "0:31:04", "remaining_time": "5:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 3836, "loss": 0.2225, "learning_rate": 4.980491522001322e-06, "epoch": 0.08783761769784641, "percentage": 8.79, "elapsed_time": "0:31:09", "remaining_time": "5:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 3836, "loss": 0.2022, "learning_rate": 4.980221868256351e-06, "epoch": 0.08809826344769166, "percentage": 8.81, "elapsed_time": "0:31:16", "remaining_time": "5:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 3836, "loss": 0.203, "learning_rate": 4.979950371052248e-06, "epoch": 0.0883589091975369, "percentage": 8.84, "elapsed_time": "0:31:21", "remaining_time": "5:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 3836, "loss": 0.2206, "learning_rate": 4.9796770305908045e-06, "epoch": 0.08861955494738213, "percentage": 8.86, "elapsed_time": "0:31:28", "remaining_time": "5:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 3836, "loss": 0.2174, "learning_rate": 4.979401847075188e-06, "epoch": 0.08888020069722738, "percentage": 8.89, "elapsed_time": "0:31:33", "remaining_time": "5:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 3836, "loss": 0.2032, "learning_rate": 4.979124820709931e-06, "epoch": 0.08914084644707262, "percentage": 8.92, "elapsed_time": "0:31:38", "remaining_time": "5:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 3836, "loss": 0.1987, "learning_rate": 4.978845951700936e-06, "epoch": 0.08940149219691787, "percentage": 8.94, "elapsed_time": "0:31:44", "remaining_time": "5:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 3836, "loss": 0.2024, "learning_rate": 4.978565240255477e-06, "epoch": 0.0896621379467631, "percentage": 8.97, "elapsed_time": "0:31:50", "remaining_time": "5:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 3836, "loss": 0.2182, "learning_rate": 4.9782826865821974e-06, "epoch": 0.08992278369660835, "percentage": 8.99, "elapsed_time": "0:31:55", "remaining_time": "5:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 3836, "loss": 0.2202, "learning_rate": 4.977998290891109e-06, "epoch": 0.09018342944645359, "percentage": 9.02, "elapsed_time": "0:32:01", "remaining_time": "5:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 3836, "loss": 0.2212, "learning_rate": 4.977712053393593e-06, "epoch": 0.09044407519629884, "percentage": 9.05, "elapsed_time": "0:32:07", "remaining_time": "5:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 3836, "loss": 0.2236, "learning_rate": 4.9774239743023975e-06, "epoch": 0.09070472094614407, "percentage": 9.07, "elapsed_time": "0:32:12", "remaining_time": "5:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 3836, "loss": 0.2245, "learning_rate": 4.977134053831642e-06, "epoch": 0.09096536669598931, "percentage": 9.1, "elapsed_time": "0:32:18", "remaining_time": "5:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 3836, "loss": 0.216, "learning_rate": 4.976842292196817e-06, "epoch": 0.09122601244583456, "percentage": 9.12, "elapsed_time": "0:32:24", "remaining_time": "5:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 3836, "loss": 0.2207, "learning_rate": 4.976548689614773e-06, "epoch": 0.09148665819567979, "percentage": 9.15, "elapsed_time": "0:32:29", "remaining_time": "5:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 3836, "loss": 0.2094, "learning_rate": 4.9762532463037385e-06, "epoch": 0.09174730394552504, "percentage": 9.18, "elapsed_time": "0:32:35", "remaining_time": "5:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 3836, "loss": 0.1985, "learning_rate": 4.975955962483304e-06, "epoch": 0.09200794969537028, "percentage": 9.2, "elapsed_time": "0:32:40", "remaining_time": "5:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 3836, "loss": 0.2106, "learning_rate": 4.97565683837443e-06, "epoch": 0.09226859544521553, "percentage": 9.23, "elapsed_time": "0:32:46", "remaining_time": "5:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 3836, "loss": 0.2146, "learning_rate": 4.9753558741994446e-06, "epoch": 0.09252924119506076, "percentage": 9.25, "elapsed_time": "0:32:51", "remaining_time": "5:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 3836, "loss": 0.2082, "learning_rate": 4.9750530701820446e-06, "epoch": 0.092789886944906, "percentage": 9.28, "elapsed_time": "0:32:56", "remaining_time": "5:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 3836, "loss": 0.2021, "learning_rate": 4.974748426547291e-06, "epoch": 0.09305053269475125, "percentage": 9.31, "elapsed_time": "0:33:02", "remaining_time": "5:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 3836, "loss": 0.2081, "learning_rate": 4.974441943521616e-06, "epoch": 0.0933111784445965, "percentage": 9.33, "elapsed_time": "0:33:07", "remaining_time": "5:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 3836, "loss": 0.2225, "learning_rate": 4.974133621332818e-06, "epoch": 0.09357182419444172, "percentage": 9.36, "elapsed_time": "0:33:13", "remaining_time": "5:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 3836, "loss": 0.2299, "learning_rate": 4.9738234602100605e-06, "epoch": 0.09383246994428697, "percentage": 9.38, "elapsed_time": "0:33:19", "remaining_time": "5:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 3836, "loss": 0.2256, "learning_rate": 4.973511460383875e-06, "epoch": 0.09409311569413221, "percentage": 9.41, "elapsed_time": "0:33:24", "remaining_time": "5:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 3836, "loss": 0.2165, "learning_rate": 4.97319762208616e-06, "epoch": 0.09435376144397746, "percentage": 9.44, "elapsed_time": "0:33:29", "remaining_time": "5:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 3836, "loss": 0.2063, "learning_rate": 4.972881945550181e-06, "epoch": 0.09461440719382269, "percentage": 9.46, "elapsed_time": "0:33:34", "remaining_time": "5:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 3836, "loss": 0.2051, "learning_rate": 4.972564431010567e-06, "epoch": 0.09487505294366794, "percentage": 9.49, "elapsed_time": "0:33:40", "remaining_time": "5:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 3836, "loss": 0.2044, "learning_rate": 4.972245078703317e-06, "epoch": 0.09513569869351318, "percentage": 9.52, "elapsed_time": "0:33:46", "remaining_time": "5:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 3836, "loss": 0.2153, "learning_rate": 4.971923888865792e-06, "epoch": 0.09539634444335843, "percentage": 9.54, "elapsed_time": "0:33:51", "remaining_time": "5:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 3836, "loss": 0.2199, "learning_rate": 4.971600861736723e-06, "epoch": 0.09565699019320366, "percentage": 9.57, "elapsed_time": "0:33:57", "remaining_time": "5:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 3836, "loss": 0.2199, "learning_rate": 4.971275997556203e-06, "epoch": 0.0959176359430489, "percentage": 9.59, "elapsed_time": "0:34:01", "remaining_time": "5:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 3836, "loss": 0.2147, "learning_rate": 4.970949296565693e-06, "epoch": 0.09617828169289415, "percentage": 9.62, "elapsed_time": "0:34:07", "remaining_time": "5:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 3836, "loss": 0.2082, "learning_rate": 4.970620759008015e-06, "epoch": 0.09643892744273938, "percentage": 9.65, "elapsed_time": "0:34:12", "remaining_time": "5:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 3836, "loss": 0.232, "learning_rate": 4.970290385127363e-06, "epoch": 0.09669957319258463, "percentage": 9.67, "elapsed_time": "0:34:18", "remaining_time": "5:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 3836, "loss": 0.2226, "learning_rate": 4.969958175169291e-06, "epoch": 0.09696021894242987, "percentage": 9.7, "elapsed_time": "0:34:24", "remaining_time": "5:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 3836, "loss": 0.2153, "learning_rate": 4.9696241293807155e-06, "epoch": 0.09722086469227512, "percentage": 9.72, "elapsed_time": "0:34:30", "remaining_time": "5:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 3836, "loss": 0.2109, "learning_rate": 4.969288248009924e-06, "epoch": 0.09748151044212035, "percentage": 9.75, "elapsed_time": "0:34:35", "remaining_time": "5:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 3836, "loss": 0.1975, "learning_rate": 4.968950531306564e-06, "epoch": 0.09774215619196559, "percentage": 9.78, "elapsed_time": "0:34:41", "remaining_time": "5:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 3836, "loss": 0.2259, "learning_rate": 4.968610979521647e-06, "epoch": 0.09800280194181084, "percentage": 9.8, "elapsed_time": "0:34:47", "remaining_time": "5:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 3836, "loss": 0.2196, "learning_rate": 4.968269592907552e-06, "epoch": 0.09826344769165608, "percentage": 9.83, "elapsed_time": "0:34:52", "remaining_time": "5:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 3836, "loss": 0.2145, "learning_rate": 4.967926371718017e-06, "epoch": 0.09852409344150131, "percentage": 9.85, "elapsed_time": "0:34:58", "remaining_time": "5:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 3836, "loss": 0.2077, "learning_rate": 4.967581316208147e-06, "epoch": 0.09878473919134656, "percentage": 9.88, "elapsed_time": "0:35:03", "remaining_time": "5:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 3836, "loss": 0.1936, "learning_rate": 4.96723442663441e-06, "epoch": 0.0990453849411918, "percentage": 9.91, "elapsed_time": "0:35:09", "remaining_time": "5:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 3836, "loss": 0.2169, "learning_rate": 4.966885703254634e-06, "epoch": 0.09930603069103705, "percentage": 9.93, "elapsed_time": "0:35:14", "remaining_time": "5:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 3836, "loss": 0.2114, "learning_rate": 4.966535146328014e-06, "epoch": 0.09956667644088228, "percentage": 9.96, "elapsed_time": "0:35:20", "remaining_time": "5:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 3836, "loss": 0.2174, "learning_rate": 4.966182756115107e-06, "epoch": 0.09982732219072753, "percentage": 9.98, "elapsed_time": "0:35:26", "remaining_time": "5:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 3836, "loss": 0.1984, "learning_rate": 4.965828532877831e-06, "epoch": 0.10008796794057277, "percentage": 10.01, "elapsed_time": "0:35:31", "remaining_time": "5:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 3836, "loss": 0.1906, "learning_rate": 4.965472476879467e-06, "epoch": 0.100348613690418, "percentage": 10.04, "elapsed_time": "0:35:37", "remaining_time": "5:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 3836, "loss": 0.2148, "learning_rate": 4.96511458838466e-06, "epoch": 0.10060925944026325, "percentage": 10.06, "elapsed_time": "0:35:42", "remaining_time": "5:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 3836, "loss": 0.209, "learning_rate": 4.964754867659413e-06, "epoch": 0.1008699051901085, "percentage": 10.09, "elapsed_time": "0:35:47", "remaining_time": "5:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 3836, "loss": 0.2062, "learning_rate": 4.964393314971096e-06, "epoch": 0.10113055093995374, "percentage": 10.11, "elapsed_time": "0:35:53", "remaining_time": "5:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 3836, "loss": 0.2083, "learning_rate": 4.9640299305884365e-06, "epoch": 0.10139119668979897, "percentage": 10.14, "elapsed_time": "0:35:59", "remaining_time": "5:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 3836, "loss": 0.213, "learning_rate": 4.963664714781525e-06, "epoch": 0.10165184243964422, "percentage": 10.17, "elapsed_time": "0:36:05", "remaining_time": "5:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 3836, "loss": 0.216, "learning_rate": 4.963297667821814e-06, "epoch": 0.10191248818948946, "percentage": 10.19, "elapsed_time": "0:36:10", "remaining_time": "5:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 3836, "loss": 0.1879, "learning_rate": 4.962928789982117e-06, "epoch": 0.1021731339393347, "percentage": 10.22, "elapsed_time": "0:36:15", "remaining_time": "5:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 3836, "loss": 0.1978, "learning_rate": 4.962558081536604e-06, "epoch": 0.10243377968917994, "percentage": 10.25, "elapsed_time": "0:36:20", "remaining_time": "5:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 3836, "loss": 0.23, "learning_rate": 4.9621855427608134e-06, "epoch": 0.10269442543902518, "percentage": 10.27, "elapsed_time": "0:36:26", "remaining_time": "5:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 3836, "loss": 0.2152, "learning_rate": 4.9618111739316366e-06, "epoch": 0.10295507118887043, "percentage": 10.3, "elapsed_time": "0:36:32", "remaining_time": "5:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 3836, "loss": 0.2207, "learning_rate": 4.961434975327331e-06, "epoch": 0.10321571693871567, "percentage": 10.32, "elapsed_time": "0:36:37", "remaining_time": "5:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 3836, "loss": 0.2021, "learning_rate": 4.961056947227509e-06, "epoch": 0.1034763626885609, "percentage": 10.35, "elapsed_time": "0:36:42", "remaining_time": "5:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 3836, "loss": 0.2032, "learning_rate": 4.960677089913146e-06, "epoch": 0.10373700843840615, "percentage": 10.38, "elapsed_time": "0:36:48", "remaining_time": "5:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 3836, "loss": 0.2179, "learning_rate": 4.960295403666578e-06, "epoch": 0.1039976541882514, "percentage": 10.4, "elapsed_time": "0:36:54", "remaining_time": "5:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 3836, "loss": 0.1914, "learning_rate": 4.959911888771496e-06, "epoch": 0.10425829993809664, "percentage": 10.43, "elapsed_time": "0:36:59", "remaining_time": "5:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 3836, "loss": 0.1998, "learning_rate": 4.9595265455129544e-06, "epoch": 0.10451894568794187, "percentage": 10.45, "elapsed_time": "0:37:05", "remaining_time": "5:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 3836, "loss": 0.204, "learning_rate": 4.959139374177364e-06, "epoch": 0.10477959143778712, "percentage": 10.48, "elapsed_time": "0:37:11", "remaining_time": "5:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 3836, "loss": 0.201, "learning_rate": 4.958750375052496e-06, "epoch": 0.10504023718763236, "percentage": 10.51, "elapsed_time": "0:37:16", "remaining_time": "5:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 3836, "loss": 0.2235, "learning_rate": 4.958359548427478e-06, "epoch": 0.1053008829374776, "percentage": 10.53, "elapsed_time": "0:37:22", "remaining_time": "5:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 3836, "loss": 0.2249, "learning_rate": 4.957966894592799e-06, "epoch": 0.10556152868732284, "percentage": 10.56, "elapsed_time": "0:37:27", "remaining_time": "5:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 3836, "loss": 0.1905, "learning_rate": 4.957572413840303e-06, "epoch": 0.10582217443716808, "percentage": 10.58, "elapsed_time": "0:37:33", "remaining_time": "5:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 3836, "loss": 0.2248, "learning_rate": 4.957176106463194e-06, "epoch": 0.10608282018701333, "percentage": 10.61, "elapsed_time": "0:37:38", "remaining_time": "5:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 3836, "loss": 0.219, "learning_rate": 4.956777972756033e-06, "epoch": 0.10634346593685856, "percentage": 10.64, "elapsed_time": "0:37:43", "remaining_time": "5:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 3836, "loss": 0.1997, "learning_rate": 4.956378013014738e-06, "epoch": 0.1066041116867038, "percentage": 10.66, "elapsed_time": "0:37:49", "remaining_time": "5:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 3836, "loss": 0.2071, "learning_rate": 4.955976227536584e-06, "epoch": 0.10686475743654905, "percentage": 10.69, "elapsed_time": "0:37:55", "remaining_time": "5:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 3836, "loss": 0.2163, "learning_rate": 4.955572616620205e-06, "epoch": 0.1071254031863943, "percentage": 10.71, "elapsed_time": "0:38:00", "remaining_time": "5:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 3836, "loss": 0.2084, "learning_rate": 4.95516718056559e-06, "epoch": 0.10738604893623953, "percentage": 10.74, "elapsed_time": "0:38:06", "remaining_time": "5:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 3836, "loss": 0.2051, "learning_rate": 4.9547599196740844e-06, "epoch": 0.10764669468608477, "percentage": 10.77, "elapsed_time": "0:38:11", "remaining_time": "5:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 3836, "loss": 0.1955, "learning_rate": 4.95435083424839e-06, "epoch": 0.10790734043593002, "percentage": 10.79, "elapsed_time": "0:38:16", "remaining_time": "5:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 3836, "loss": 0.2011, "learning_rate": 4.953939924592567e-06, "epoch": 0.10816798618577526, "percentage": 10.82, "elapsed_time": "0:38:22", "remaining_time": "5:16:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 3836, "loss": 0.2064, "learning_rate": 4.953527191012029e-06, "epoch": 0.1084286319356205, "percentage": 10.84, "elapsed_time": "0:38:27", "remaining_time": "5:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 3836, "loss": 0.1937, "learning_rate": 4.953112633813544e-06, "epoch": 0.10868927768546574, "percentage": 10.87, "elapsed_time": "0:38:33", "remaining_time": "5:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 3836, "loss": 0.2068, "learning_rate": 4.95269625330524e-06, "epoch": 0.10894992343531099, "percentage": 10.9, "elapsed_time": "0:38:38", "remaining_time": "5:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 3836, "loss": 0.2372, "learning_rate": 4.952278049796596e-06, "epoch": 0.10921056918515623, "percentage": 10.92, "elapsed_time": "0:38:44", "remaining_time": "5:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 3836, "loss": 0.2166, "learning_rate": 4.951858023598448e-06, "epoch": 0.10947121493500146, "percentage": 10.95, "elapsed_time": "0:38:50", "remaining_time": "5:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 3836, "loss": 0.2091, "learning_rate": 4.951436175022987e-06, "epoch": 0.10973186068484671, "percentage": 10.97, "elapsed_time": "0:38:55", "remaining_time": "5:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 3836, "loss": 0.2125, "learning_rate": 4.951012504383756e-06, "epoch": 0.10999250643469195, "percentage": 11.0, "elapsed_time": "0:39:01", "remaining_time": "5:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 3836, "loss": 0.2214, "learning_rate": 4.950587011995656e-06, "epoch": 0.11025315218453718, "percentage": 11.03, "elapsed_time": "0:39:07", "remaining_time": "5:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 3836, "loss": 0.2092, "learning_rate": 4.9501596981749375e-06, "epoch": 0.11051379793438243, "percentage": 11.05, "elapsed_time": "0:39:12", "remaining_time": "5:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 3836, "loss": 0.2028, "learning_rate": 4.949730563239211e-06, "epoch": 0.11077444368422767, "percentage": 11.08, "elapsed_time": "0:39:17", "remaining_time": "5:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 3836, "loss": 0.2068, "learning_rate": 4.949299607507434e-06, "epoch": 0.11103508943407292, "percentage": 11.11, "elapsed_time": "0:39:23", "remaining_time": "5:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 3836, "loss": 0.2166, "learning_rate": 4.9488668312999215e-06, "epoch": 0.11129573518391815, "percentage": 11.13, "elapsed_time": "0:39:29", "remaining_time": "5:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 3836, "loss": 0.2242, "learning_rate": 4.94843223493834e-06, "epoch": 0.1115563809337634, "percentage": 11.16, "elapsed_time": "0:39:34", "remaining_time": "5:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 3836, "loss": 0.2052, "learning_rate": 4.94799581874571e-06, "epoch": 0.11181702668360864, "percentage": 11.18, "elapsed_time": "0:39:39", "remaining_time": "5:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 3836, "loss": 0.2172, "learning_rate": 4.947557583046403e-06, "epoch": 0.11207767243345389, "percentage": 11.21, "elapsed_time": "0:39:45", "remaining_time": "5:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 3836, "loss": 0.2052, "learning_rate": 4.947117528166144e-06, "epoch": 0.11233831818329912, "percentage": 11.24, "elapsed_time": "0:39:50", "remaining_time": "5:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 3836, "loss": 0.2156, "learning_rate": 4.94667565443201e-06, "epoch": 0.11259896393314436, "percentage": 11.26, "elapsed_time": "0:39:55", "remaining_time": "5:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 3836, "loss": 0.2228, "learning_rate": 4.9462319621724295e-06, "epoch": 0.11285960968298961, "percentage": 11.29, "elapsed_time": "0:40:01", "remaining_time": "5:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 3836, "loss": 0.2133, "learning_rate": 4.945786451717183e-06, "epoch": 0.11312025543283485, "percentage": 11.31, "elapsed_time": "0:40:06", "remaining_time": "5:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 3836, "loss": 0.1969, "learning_rate": 4.945339123397402e-06, "epoch": 0.11338090118268009, "percentage": 11.34, "elapsed_time": "0:40:11", "remaining_time": "5:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 3836, "loss": 0.2252, "learning_rate": 4.944889977545571e-06, "epoch": 0.11364154693252533, "percentage": 11.37, "elapsed_time": "0:40:17", "remaining_time": "5:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 3836, "loss": 0.2089, "learning_rate": 4.944439014495521e-06, "epoch": 0.11390219268237058, "percentage": 11.39, "elapsed_time": "0:40:23", "remaining_time": "5:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 3836, "loss": 0.2128, "learning_rate": 4.94398623458244e-06, "epoch": 0.11416283843221582, "percentage": 11.42, "elapsed_time": "0:40:28", "remaining_time": "5:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 3836, "loss": 0.2162, "learning_rate": 4.94353163814286e-06, "epoch": 0.11442348418206105, "percentage": 11.44, "elapsed_time": "0:40:34", "remaining_time": "5:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 3836, "loss": 0.2138, "learning_rate": 4.943075225514667e-06, "epoch": 0.1146841299319063, "percentage": 11.47, "elapsed_time": "0:40:40", "remaining_time": "5:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 3836, "loss": 0.2167, "learning_rate": 4.942616997037096e-06, "epoch": 0.11494477568175154, "percentage": 11.5, "elapsed_time": "0:40:45", "remaining_time": "5:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 3836, "loss": 0.1971, "learning_rate": 4.942156953050733e-06, "epoch": 0.11520542143159677, "percentage": 11.52, "elapsed_time": "0:40:51", "remaining_time": "5:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 3836, "loss": 0.2178, "learning_rate": 4.94169509389751e-06, "epoch": 0.11546606718144202, "percentage": 11.55, "elapsed_time": "0:40:57", "remaining_time": "5:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 3836, "loss": 0.1947, "learning_rate": 4.94123141992071e-06, "epoch": 0.11572671293128726, "percentage": 11.57, "elapsed_time": "0:41:02", "remaining_time": "5:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 3836, "loss": 0.214, "learning_rate": 4.940765931464967e-06, "epoch": 0.11598735868113251, "percentage": 11.6, "elapsed_time": "0:41:08", "remaining_time": "5:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 3836, "loss": 0.2057, "learning_rate": 4.940298628876261e-06, "epoch": 0.11624800443097774, "percentage": 11.63, "elapsed_time": "0:41:13", "remaining_time": "5:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 3836, "loss": 0.2237, "learning_rate": 4.939829512501921e-06, "epoch": 0.11650865018082299, "percentage": 11.65, "elapsed_time": "0:41:19", "remaining_time": "5:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 3836, "loss": 0.213, "learning_rate": 4.9393585826906245e-06, "epoch": 0.11676929593066823, "percentage": 11.68, "elapsed_time": "0:41:25", "remaining_time": "5:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 3836, "loss": 0.1913, "learning_rate": 4.938885839792395e-06, "epoch": 0.11702994168051348, "percentage": 11.7, "elapsed_time": "0:41:30", "remaining_time": "5:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 3836, "loss": 0.2036, "learning_rate": 4.938411284158608e-06, "epoch": 0.11729058743035871, "percentage": 11.73, "elapsed_time": "0:41:36", "remaining_time": "5:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 3836, "loss": 0.2285, "learning_rate": 4.9379349161419795e-06, "epoch": 0.11755123318020395, "percentage": 11.76, "elapsed_time": "0:41:41", "remaining_time": "5:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 3836, "loss": 0.2237, "learning_rate": 4.937456736096581e-06, "epoch": 0.1178118789300492, "percentage": 11.78, "elapsed_time": "0:41:46", "remaining_time": "5:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 3836, "loss": 0.2169, "learning_rate": 4.936976744377824e-06, "epoch": 0.11807252467989444, "percentage": 11.81, "elapsed_time": "0:41:52", "remaining_time": "5:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 3836, "loss": 0.2134, "learning_rate": 4.936494941342469e-06, "epoch": 0.11833317042973968, "percentage": 11.84, "elapsed_time": "0:41:57", "remaining_time": "5:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 3836, "loss": 0.2211, "learning_rate": 4.9360113273486235e-06, "epoch": 0.11859381617958492, "percentage": 11.86, "elapsed_time": "0:42:02", "remaining_time": "5:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 3836, "loss": 0.2095, "learning_rate": 4.93552590275574e-06, "epoch": 0.11885446192943017, "percentage": 11.89, "elapsed_time": "0:42:07", "remaining_time": "5:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 3836, "loss": 0.2076, "learning_rate": 4.935038667924617e-06, "epoch": 0.11911510767927541, "percentage": 11.91, "elapsed_time": "0:42:13", "remaining_time": "5:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 3836, "loss": 0.2288, "learning_rate": 4.934549623217399e-06, "epoch": 0.11937575342912064, "percentage": 11.94, "elapsed_time": "0:42:18", "remaining_time": "5:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 3836, "loss": 0.2058, "learning_rate": 4.934058768997573e-06, "epoch": 0.11963639917896589, "percentage": 11.97, "elapsed_time": "0:42:24", "remaining_time": "5:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 3836, "loss": 0.2091, "learning_rate": 4.9335661056299755e-06, "epoch": 0.11989704492881113, "percentage": 11.99, "elapsed_time": "0:42:29", "remaining_time": "5:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 3836, "loss": 0.2021, "learning_rate": 4.933071633480785e-06, "epoch": 0.12015769067865636, "percentage": 12.02, "elapsed_time": "0:42:35", "remaining_time": "5:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 3836, "loss": 0.1868, "learning_rate": 4.932575352917524e-06, "epoch": 0.12041833642850161, "percentage": 12.04, "elapsed_time": "0:42:40", "remaining_time": "5:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 3836, "loss": 0.2069, "learning_rate": 4.932077264309062e-06, "epoch": 0.12067898217834686, "percentage": 12.07, "elapsed_time": "0:42:46", "remaining_time": "5:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 3836, "loss": 0.2101, "learning_rate": 4.931577368025607e-06, "epoch": 0.1209396279281921, "percentage": 12.1, "elapsed_time": "0:42:51", "remaining_time": "5:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 3836, "loss": 0.2041, "learning_rate": 4.9310756644387155e-06, "epoch": 0.12120027367803733, "percentage": 12.12, "elapsed_time": "0:42:57", "remaining_time": "5:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 3836, "loss": 0.1973, "learning_rate": 4.930572153921287e-06, "epoch": 0.12146091942788258, "percentage": 12.15, "elapsed_time": "0:43:02", "remaining_time": "5:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 3836, "loss": 0.1925, "learning_rate": 4.93006683684756e-06, "epoch": 0.12172156517772782, "percentage": 12.17, "elapsed_time": "0:43:09", "remaining_time": "5:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 3836, "loss": 0.2032, "learning_rate": 4.92955971359312e-06, "epoch": 0.12198221092757307, "percentage": 12.2, "elapsed_time": "0:43:14", "remaining_time": "5:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 3836, "loss": 0.198, "learning_rate": 4.929050784534892e-06, "epoch": 0.1222428566774183, "percentage": 12.23, "elapsed_time": "0:43:19", "remaining_time": "5:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 3836, "loss": 0.1881, "learning_rate": 4.928540050051146e-06, "epoch": 0.12250350242726354, "percentage": 12.25, "elapsed_time": "0:43:24", "remaining_time": "5:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 3836, "loss": 0.1874, "learning_rate": 4.928027510521491e-06, "epoch": 0.12276414817710879, "percentage": 12.28, "elapsed_time": "0:43:31", "remaining_time": "5:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 3836, "loss": 0.2023, "learning_rate": 4.927513166326881e-06, "epoch": 0.12302479392695403, "percentage": 12.3, "elapsed_time": "0:43:36", "remaining_time": "5:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 3836, "loss": 0.2146, "learning_rate": 4.926997017849609e-06, "epoch": 0.12328543967679927, "percentage": 12.33, "elapsed_time": "0:43:42", "remaining_time": "5:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 3836, "loss": 0.1958, "learning_rate": 4.9264790654733076e-06, "epoch": 0.12354608542664451, "percentage": 12.36, "elapsed_time": "0:43:48", "remaining_time": "5:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 3836, "loss": 0.2018, "learning_rate": 4.925959309582954e-06, "epoch": 0.12380673117648976, "percentage": 12.38, "elapsed_time": "0:43:53", "remaining_time": "5:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 3836, "loss": 0.1938, "learning_rate": 4.925437750564863e-06, "epoch": 0.124067376926335, "percentage": 12.41, "elapsed_time": "0:43:59", "remaining_time": "5:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 3836, "loss": 0.2092, "learning_rate": 4.924914388806691e-06, "epoch": 0.12432802267618023, "percentage": 12.43, "elapsed_time": "0:44:05", "remaining_time": "5:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 3836, "loss": 0.2134, "learning_rate": 4.924389224697433e-06, "epoch": 0.12458866842602548, "percentage": 12.46, "elapsed_time": "0:44:10", "remaining_time": "5:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 3836, "loss": 0.1949, "learning_rate": 4.923862258627426e-06, "epoch": 0.12484931417587072, "percentage": 12.49, "elapsed_time": "0:44:15", "remaining_time": "5:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 3836, "loss": 0.2174, "learning_rate": 4.923333490988343e-06, "epoch": 0.12510995992571597, "percentage": 12.51, "elapsed_time": "0:44:21", "remaining_time": "5:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 3836, "loss": 0.2121, "learning_rate": 4.9228029221731995e-06, "epoch": 0.12537060567556121, "percentage": 12.54, "elapsed_time": "0:44:27", "remaining_time": "5:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 3836, "loss": 0.1985, "learning_rate": 4.922270552576347e-06, "epoch": 0.12563125142540643, "percentage": 12.57, "elapsed_time": "0:44:33", "remaining_time": "5:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 3836, "loss": 0.2162, "learning_rate": 4.921736382593477e-06, "epoch": 0.12589189717525168, "percentage": 12.59, "elapsed_time": "0:44:38", "remaining_time": "5:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 3836, "loss": 0.1971, "learning_rate": 4.921200412621619e-06, "epoch": 0.12615254292509692, "percentage": 12.62, "elapsed_time": "0:44:43", "remaining_time": "5:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 3836, "loss": 0.2041, "learning_rate": 4.920662643059139e-06, "epoch": 0.12641318867494217, "percentage": 12.64, "elapsed_time": "0:44:49", "remaining_time": "5:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 3836, "loss": 0.2055, "learning_rate": 4.920123074305743e-06, "epoch": 0.1266738344247874, "percentage": 12.67, "elapsed_time": "0:44:55", "remaining_time": "5:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 3836, "loss": 0.2, "learning_rate": 4.919581706762472e-06, "epoch": 0.12693448017463266, "percentage": 12.7, "elapsed_time": "0:45:00", "remaining_time": "5:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 3836, "loss": 0.2011, "learning_rate": 4.919038540831705e-06, "epoch": 0.1271951259244779, "percentage": 12.72, "elapsed_time": "0:45:05", "remaining_time": "5:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 3836, "loss": 0.1977, "learning_rate": 4.918493576917158e-06, "epoch": 0.12745577167432315, "percentage": 12.75, "elapsed_time": "0:45:11", "remaining_time": "5:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 3836, "loss": 0.2195, "learning_rate": 4.917946815423883e-06, "epoch": 0.12771641742416837, "percentage": 12.77, "elapsed_time": "0:45:17", "remaining_time": "5:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 3836, "loss": 0.2123, "learning_rate": 4.9173982567582674e-06, "epoch": 0.1279770631740136, "percentage": 12.8, "elapsed_time": "0:45:22", "remaining_time": "5:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 3836, "loss": 0.2134, "learning_rate": 4.916847901328035e-06, "epoch": 0.12823770892385886, "percentage": 12.83, "elapsed_time": "0:45:28", "remaining_time": "5:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 3836, "loss": 0.2171, "learning_rate": 4.9162957495422455e-06, "epoch": 0.1284983546737041, "percentage": 12.85, "elapsed_time": "0:45:34", "remaining_time": "5:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 3836, "loss": 0.2119, "learning_rate": 4.915741801811294e-06, "epoch": 0.12875900042354935, "percentage": 12.88, "elapsed_time": "0:45:40", "remaining_time": "5:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 3836, "loss": 0.1982, "learning_rate": 4.915186058546908e-06, "epoch": 0.1290196461733946, "percentage": 12.9, "elapsed_time": "0:45:45", "remaining_time": "5:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 3836, "loss": 0.2113, "learning_rate": 4.914628520162154e-06, "epoch": 0.12928029192323984, "percentage": 12.93, "elapsed_time": "0:45:51", "remaining_time": "5:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 3836, "loss": 0.218, "learning_rate": 4.914069187071426e-06, "epoch": 0.12954093767308505, "percentage": 12.96, "elapsed_time": "0:45:57", "remaining_time": "5:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 3836, "loss": 0.2021, "learning_rate": 4.913508059690461e-06, "epoch": 0.1298015834229303, "percentage": 12.98, "elapsed_time": "0:46:02", "remaining_time": "5:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 3836, "loss": 0.2161, "learning_rate": 4.91294513843632e-06, "epoch": 0.13006222917277555, "percentage": 13.01, "elapsed_time": "0:46:08", "remaining_time": "5:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 3836, "loss": 0.1845, "learning_rate": 4.912380423727405e-06, "epoch": 0.1303228749226208, "percentage": 13.03, "elapsed_time": "0:46:13", "remaining_time": "5:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 3836, "eval_loss": 0.20621350407600403, "epoch": 0.1303228749226208, "percentage": 13.03, "elapsed_time": "0:47:09", "remaining_time": "5:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 3836, "loss": 0.2171, "learning_rate": 4.9118139159834475e-06, "epoch": 0.13058352067246604, "percentage": 13.06, "elapsed_time": "0:47:15", "remaining_time": "5:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 3836, "loss": 0.2145, "learning_rate": 4.911245615625512e-06, "epoch": 0.13084416642231128, "percentage": 13.09, "elapsed_time": "0:47:20", "remaining_time": "5:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 3836, "loss": 0.2036, "learning_rate": 4.9106755230759955e-06, "epoch": 0.13110481217215653, "percentage": 13.11, "elapsed_time": "0:47:26", "remaining_time": "5:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 3836, "loss": 0.2083, "learning_rate": 4.910103638758627e-06, "epoch": 0.13136545792200177, "percentage": 13.14, "elapsed_time": "0:47:32", "remaining_time": "5:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 3836, "loss": 0.2124, "learning_rate": 4.909529963098467e-06, "epoch": 0.131626103671847, "percentage": 13.16, "elapsed_time": "0:47:37", "remaining_time": "5:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 3836, "loss": 0.1985, "learning_rate": 4.9089544965219095e-06, "epoch": 0.13188674942169223, "percentage": 13.19, "elapsed_time": "0:47:43", "remaining_time": "5:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 3836, "loss": 0.2146, "learning_rate": 4.908377239456676e-06, "epoch": 0.13214739517153748, "percentage": 13.22, "elapsed_time": "0:47:49", "remaining_time": "5:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 3836, "loss": 0.196, "learning_rate": 4.907798192331821e-06, "epoch": 0.13240804092138272, "percentage": 13.24, "elapsed_time": "0:47:54", "remaining_time": "5:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 3836, "loss": 0.2053, "learning_rate": 4.9072173555777304e-06, "epoch": 0.13266868667122797, "percentage": 13.27, "elapsed_time": "0:48:00", "remaining_time": "5:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 3836, "loss": 0.2041, "learning_rate": 4.90663472962612e-06, "epoch": 0.13292933242107322, "percentage": 13.3, "elapsed_time": "0:48:05", "remaining_time": "5:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 3836, "loss": 0.1976, "learning_rate": 4.906050314910031e-06, "epoch": 0.13318997817091846, "percentage": 13.32, "elapsed_time": "0:48:11", "remaining_time": "5:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 3836, "loss": 0.1969, "learning_rate": 4.905464111863841e-06, "epoch": 0.1334506239207637, "percentage": 13.35, "elapsed_time": "0:48:17", "remaining_time": "5:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 3836, "loss": 0.199, "learning_rate": 4.904876120923253e-06, "epoch": 0.13371126967060892, "percentage": 13.37, "elapsed_time": "0:48:23", "remaining_time": "5:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 3836, "loss": 0.1982, "learning_rate": 4.904286342525298e-06, "epoch": 0.13397191542045417, "percentage": 13.4, "elapsed_time": "0:48:28", "remaining_time": "5:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 3836, "loss": 0.1997, "learning_rate": 4.903694777108337e-06, "epoch": 0.1342325611702994, "percentage": 13.43, "elapsed_time": "0:48:34", "remaining_time": "5:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 3836, "loss": 0.2011, "learning_rate": 4.903101425112062e-06, "epoch": 0.13449320692014466, "percentage": 13.45, "elapsed_time": "0:48:39", "remaining_time": "5:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 3836, "loss": 0.2085, "learning_rate": 4.902506286977486e-06, "epoch": 0.1347538526699899, "percentage": 13.48, "elapsed_time": "0:48:45", "remaining_time": "5:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 3836, "loss": 0.199, "learning_rate": 4.9019093631469575e-06, "epoch": 0.13501449841983515, "percentage": 13.5, "elapsed_time": "0:48:50", "remaining_time": "5:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 3836, "loss": 0.2023, "learning_rate": 4.901310654064145e-06, "epoch": 0.1352751441696804, "percentage": 13.53, "elapsed_time": "0:48:55", "remaining_time": "5:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 3836, "loss": 0.2129, "learning_rate": 4.900710160174048e-06, "epoch": 0.1355357899195256, "percentage": 13.56, "elapsed_time": "0:49:01", "remaining_time": "5:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 3836, "loss": 0.2017, "learning_rate": 4.900107881922994e-06, "epoch": 0.13579643566937086, "percentage": 13.58, "elapsed_time": "0:49:06", "remaining_time": "5:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 3836, "loss": 0.2004, "learning_rate": 4.899503819758633e-06, "epoch": 0.1360570814192161, "percentage": 13.61, "elapsed_time": "0:49:12", "remaining_time": "5:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 3836, "loss": 0.2057, "learning_rate": 4.898897974129943e-06, "epoch": 0.13631772716906135, "percentage": 13.63, "elapsed_time": "0:49:18", "remaining_time": "5:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 3836, "loss": 0.1989, "learning_rate": 4.898290345487226e-06, "epoch": 0.1365783729189066, "percentage": 13.66, "elapsed_time": "0:49:23", "remaining_time": "5:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 3836, "loss": 0.2024, "learning_rate": 4.897680934282113e-06, "epoch": 0.13683901866875184, "percentage": 13.69, "elapsed_time": "0:49:28", "remaining_time": "5:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 3836, "loss": 0.1963, "learning_rate": 4.897069740967554e-06, "epoch": 0.13709966441859708, "percentage": 13.71, "elapsed_time": "0:49:34", "remaining_time": "5:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 3836, "loss": 0.1912, "learning_rate": 4.896456765997829e-06, "epoch": 0.13736031016844233, "percentage": 13.74, "elapsed_time": "0:49:40", "remaining_time": "5:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 3836, "loss": 0.1969, "learning_rate": 4.89584200982854e-06, "epoch": 0.13762095591828755, "percentage": 13.76, "elapsed_time": "0:49:45", "remaining_time": "5:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 3836, "loss": 0.188, "learning_rate": 4.895225472916612e-06, "epoch": 0.1378816016681328, "percentage": 13.79, "elapsed_time": "0:49:51", "remaining_time": "5:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 3836, "loss": 0.2207, "learning_rate": 4.894607155720294e-06, "epoch": 0.13814224741797804, "percentage": 13.82, "elapsed_time": "0:49:56", "remaining_time": "5:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 3836, "loss": 0.1956, "learning_rate": 4.893987058699162e-06, "epoch": 0.13840289316782328, "percentage": 13.84, "elapsed_time": "0:50:01", "remaining_time": "5:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 3836, "loss": 0.2023, "learning_rate": 4.893365182314108e-06, "epoch": 0.13866353891766853, "percentage": 13.87, "elapsed_time": "0:50:07", "remaining_time": "5:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 3836, "loss": 0.2117, "learning_rate": 4.8927415270273525e-06, "epoch": 0.13892418466751377, "percentage": 13.89, "elapsed_time": "0:50:13", "remaining_time": "5:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 3836, "loss": 0.2112, "learning_rate": 4.892116093302436e-06, "epoch": 0.13918483041735902, "percentage": 13.92, "elapsed_time": "0:50:19", "remaining_time": "5:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 3836, "loss": 0.2121, "learning_rate": 4.8914888816042186e-06, "epoch": 0.13944547616720424, "percentage": 13.95, "elapsed_time": "0:50:24", "remaining_time": "5:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 3836, "loss": 0.2054, "learning_rate": 4.890859892398886e-06, "epoch": 0.13970612191704948, "percentage": 13.97, "elapsed_time": "0:50:30", "remaining_time": "5:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 3836, "loss": 0.1934, "learning_rate": 4.890229126153942e-06, "epoch": 0.13996676766689473, "percentage": 14.0, "elapsed_time": "0:50:35", "remaining_time": "5:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 3836, "loss": 0.1976, "learning_rate": 4.889596583338213e-06, "epoch": 0.14022741341673997, "percentage": 14.03, "elapsed_time": "0:50:41", "remaining_time": "5:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 3836, "loss": 0.2, "learning_rate": 4.888962264421845e-06, "epoch": 0.14048805916658522, "percentage": 14.05, "elapsed_time": "0:50:46", "remaining_time": "5:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 3836, "loss": 0.2004, "learning_rate": 4.8883261698763045e-06, "epoch": 0.14074870491643046, "percentage": 14.08, "elapsed_time": "0:50:51", "remaining_time": "5:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 3836, "loss": 0.1994, "learning_rate": 4.887688300174377e-06, "epoch": 0.1410093506662757, "percentage": 14.1, "elapsed_time": "0:50:57", "remaining_time": "5:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 3836, "loss": 0.2079, "learning_rate": 4.887048655790169e-06, "epoch": 0.14126999641612095, "percentage": 14.13, "elapsed_time": "0:51:03", "remaining_time": "5:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 3836, "loss": 0.1977, "learning_rate": 4.886407237199103e-06, "epoch": 0.14153064216596617, "percentage": 14.16, "elapsed_time": "0:51:09", "remaining_time": "5:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 3836, "loss": 0.1972, "learning_rate": 4.8857640448779246e-06, "epoch": 0.14179128791581141, "percentage": 14.18, "elapsed_time": "0:51:14", "remaining_time": "5:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 3836, "loss": 0.1939, "learning_rate": 4.885119079304694e-06, "epoch": 0.14205193366565666, "percentage": 14.21, "elapsed_time": "0:51:20", "remaining_time": "5:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 3836, "loss": 0.2151, "learning_rate": 4.884472340958791e-06, "epoch": 0.1423125794155019, "percentage": 14.23, "elapsed_time": "0:51:25", "remaining_time": "5:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 3836, "loss": 0.2168, "learning_rate": 4.883823830320913e-06, "epoch": 0.14257322516534715, "percentage": 14.26, "elapsed_time": "0:51:30", "remaining_time": "5:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 3836, "loss": 0.1884, "learning_rate": 4.883173547873073e-06, "epoch": 0.1428338709151924, "percentage": 14.29, "elapsed_time": "0:51:36", "remaining_time": "5:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 3836, "loss": 0.2061, "learning_rate": 4.882521494098605e-06, "epoch": 0.14309451666503764, "percentage": 14.31, "elapsed_time": "0:51:42", "remaining_time": "5:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 3836, "loss": 0.2098, "learning_rate": 4.881867669482157e-06, "epoch": 0.14335516241488286, "percentage": 14.34, "elapsed_time": "0:51:47", "remaining_time": "5:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 3836, "loss": 0.2073, "learning_rate": 4.8812120745096906e-06, "epoch": 0.1436158081647281, "percentage": 14.36, "elapsed_time": "0:51:53", "remaining_time": "5:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 3836, "loss": 0.2063, "learning_rate": 4.880554709668486e-06, "epoch": 0.14387645391457335, "percentage": 14.39, "elapsed_time": "0:51:58", "remaining_time": "5:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 3836, "loss": 0.2184, "learning_rate": 4.879895575447141e-06, "epoch": 0.1441370996644186, "percentage": 14.42, "elapsed_time": "0:52:04", "remaining_time": "5:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 3836, "loss": 0.1945, "learning_rate": 4.879234672335564e-06, "epoch": 0.14439774541426384, "percentage": 14.44, "elapsed_time": "0:52:10", "remaining_time": "5:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 3836, "loss": 0.1979, "learning_rate": 4.878572000824982e-06, "epoch": 0.14465839116410908, "percentage": 14.47, "elapsed_time": "0:52:15", "remaining_time": "5:08:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 3836, "loss": 0.2033, "learning_rate": 4.8779075614079354e-06, "epoch": 0.14491903691395433, "percentage": 14.49, "elapsed_time": "0:52:20", "remaining_time": "5:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 3836, "loss": 0.196, "learning_rate": 4.877241354578275e-06, "epoch": 0.14517968266379958, "percentage": 14.52, "elapsed_time": "0:52:27", "remaining_time": "5:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 3836, "loss": 0.2125, "learning_rate": 4.87657338083117e-06, "epoch": 0.1454403284136448, "percentage": 14.55, "elapsed_time": "0:52:32", "remaining_time": "5:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 3836, "loss": 0.2008, "learning_rate": 4.875903640663101e-06, "epoch": 0.14570097416349004, "percentage": 14.57, "elapsed_time": "0:52:39", "remaining_time": "5:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 3836, "loss": 0.199, "learning_rate": 4.875232134571863e-06, "epoch": 0.14596161991333528, "percentage": 14.6, "elapsed_time": "0:52:44", "remaining_time": "5:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 561, "total_steps": 3836, "loss": 0.1984, "learning_rate": 4.874558863056559e-06, "epoch": 0.14622226566318053, "percentage": 14.62, "elapsed_time": "0:52:50", "remaining_time": "5:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 3836, "loss": 0.1825, "learning_rate": 4.8738838266176094e-06, "epoch": 0.14648291141302577, "percentage": 14.65, "elapsed_time": "0:52:55", "remaining_time": "5:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 563, "total_steps": 3836, "loss": 0.2112, "learning_rate": 4.873207025756744e-06, "epoch": 0.14674355716287102, "percentage": 14.68, "elapsed_time": "0:53:00", "remaining_time": "5:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 3836, "loss": 0.2014, "learning_rate": 4.872528460977005e-06, "epoch": 0.14700420291271626, "percentage": 14.7, "elapsed_time": "0:53:06", "remaining_time": "5:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 3836, "loss": 0.1847, "learning_rate": 4.871848132782744e-06, "epoch": 0.1472648486625615, "percentage": 14.73, "elapsed_time": "0:53:11", "remaining_time": "5:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 3836, "loss": 0.1991, "learning_rate": 4.871166041679626e-06, "epoch": 0.14752549441240673, "percentage": 14.75, "elapsed_time": "0:53:16", "remaining_time": "5:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 567, "total_steps": 3836, "loss": 0.1999, "learning_rate": 4.870482188174622e-06, "epoch": 0.14778614016225197, "percentage": 14.78, "elapsed_time": "0:53:22", "remaining_time": "5:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 3836, "loss": 0.1952, "learning_rate": 4.869796572776018e-06, "epoch": 0.14804678591209722, "percentage": 14.81, "elapsed_time": "0:53:27", "remaining_time": "5:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 569, "total_steps": 3836, "loss": 0.1982, "learning_rate": 4.8691091959934054e-06, "epoch": 0.14830743166194246, "percentage": 14.83, "elapsed_time": "0:53:33", "remaining_time": "5:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 3836, "loss": 0.2092, "learning_rate": 4.868420058337687e-06, "epoch": 0.1485680774117877, "percentage": 14.86, "elapsed_time": "0:53:38", "remaining_time": "5:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 571, "total_steps": 3836, "loss": 0.2003, "learning_rate": 4.8677291603210745e-06, "epoch": 0.14882872316163295, "percentage": 14.89, "elapsed_time": "0:53:44", "remaining_time": "5:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 3836, "loss": 0.2145, "learning_rate": 4.867036502457087e-06, "epoch": 0.1490893689114782, "percentage": 14.91, "elapsed_time": "0:53:50", "remaining_time": "5:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 573, "total_steps": 3836, "loss": 0.2109, "learning_rate": 4.866342085260551e-06, "epoch": 0.14935001466132342, "percentage": 14.94, "elapsed_time": "0:53:55", "remaining_time": "5:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 3836, "loss": 0.2048, "learning_rate": 4.865645909247604e-06, "epoch": 0.14961066041116866, "percentage": 14.96, "elapsed_time": "0:54:01", "remaining_time": "5:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 3836, "loss": 0.2075, "learning_rate": 4.864947974935686e-06, "epoch": 0.1498713061610139, "percentage": 14.99, "elapsed_time": "0:54:07", "remaining_time": "5:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 3836, "loss": 0.2055, "learning_rate": 4.864248282843548e-06, "epoch": 0.15013195191085915, "percentage": 15.02, "elapsed_time": "0:54:12", "remaining_time": "5:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 577, "total_steps": 3836, "loss": 0.2109, "learning_rate": 4.863546833491245e-06, "epoch": 0.1503925976607044, "percentage": 15.04, "elapsed_time": "0:54:18", "remaining_time": "5:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 3836, "loss": 0.1901, "learning_rate": 4.862843627400139e-06, "epoch": 0.15065324341054964, "percentage": 15.07, "elapsed_time": "0:54:23", "remaining_time": "5:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 579, "total_steps": 3836, "loss": 0.2069, "learning_rate": 4.862138665092898e-06, "epoch": 0.1509138891603949, "percentage": 15.09, "elapsed_time": "0:54:28", "remaining_time": "5:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 3836, "loss": 0.1924, "learning_rate": 4.861431947093494e-06, "epoch": 0.15117453491024013, "percentage": 15.12, "elapsed_time": "0:54:34", "remaining_time": "5:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 581, "total_steps": 3836, "loss": 0.2028, "learning_rate": 4.860723473927206e-06, "epoch": 0.15143518066008535, "percentage": 15.15, "elapsed_time": "0:54:39", "remaining_time": "5:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 3836, "loss": 0.2047, "learning_rate": 4.860013246120616e-06, "epoch": 0.1516958264099306, "percentage": 15.17, "elapsed_time": "0:54:45", "remaining_time": "5:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 583, "total_steps": 3836, "loss": 0.2118, "learning_rate": 4.8593012642016105e-06, "epoch": 0.15195647215977584, "percentage": 15.2, "elapsed_time": "0:54:50", "remaining_time": "5:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 3836, "loss": 0.2081, "learning_rate": 4.85858752869938e-06, "epoch": 0.15221711790962109, "percentage": 15.22, "elapsed_time": "0:54:56", "remaining_time": "5:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 3836, "loss": 0.1927, "learning_rate": 4.857872040144418e-06, "epoch": 0.15247776365946633, "percentage": 15.25, "elapsed_time": "0:55:01", "remaining_time": "5:05:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 3836, "loss": 0.2069, "learning_rate": 4.857154799068522e-06, "epoch": 0.15273840940931158, "percentage": 15.28, "elapsed_time": "0:55:07", "remaining_time": "5:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 587, "total_steps": 3836, "loss": 0.1952, "learning_rate": 4.856435806004791e-06, "epoch": 0.15299905515915682, "percentage": 15.3, "elapsed_time": "0:55:13", "remaining_time": "5:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 3836, "loss": 0.206, "learning_rate": 4.855715061487626e-06, "epoch": 0.15325970090900204, "percentage": 15.33, "elapsed_time": "0:55:18", "remaining_time": "5:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 589, "total_steps": 3836, "loss": 0.1949, "learning_rate": 4.854992566052731e-06, "epoch": 0.15352034665884728, "percentage": 15.35, "elapsed_time": "0:55:25", "remaining_time": "5:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 3836, "loss": 0.1994, "learning_rate": 4.8542683202371105e-06, "epoch": 0.15378099240869253, "percentage": 15.38, "elapsed_time": "0:55:30", "remaining_time": "5:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 591, "total_steps": 3836, "loss": 0.1983, "learning_rate": 4.85354232457907e-06, "epoch": 0.15404163815853777, "percentage": 15.41, "elapsed_time": "0:55:36", "remaining_time": "5:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 3836, "loss": 0.1956, "learning_rate": 4.8528145796182155e-06, "epoch": 0.15430228390838302, "percentage": 15.43, "elapsed_time": "0:55:41", "remaining_time": "5:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 593, "total_steps": 3836, "loss": 0.2133, "learning_rate": 4.852085085895454e-06, "epoch": 0.15456292965822827, "percentage": 15.46, "elapsed_time": "0:55:46", "remaining_time": "5:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 3836, "loss": 0.1981, "learning_rate": 4.851353843952992e-06, "epoch": 0.1548235754080735, "percentage": 15.48, "elapsed_time": "0:55:51", "remaining_time": "5:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 3836, "loss": 0.1892, "learning_rate": 4.850620854334334e-06, "epoch": 0.15508422115791876, "percentage": 15.51, "elapsed_time": "0:55:57", "remaining_time": "5:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 3836, "loss": 0.2087, "learning_rate": 4.849886117584286e-06, "epoch": 0.15534486690776397, "percentage": 15.54, "elapsed_time": "0:56:03", "remaining_time": "5:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 597, "total_steps": 3836, "loss": 0.2008, "learning_rate": 4.849149634248951e-06, "epoch": 0.15560551265760922, "percentage": 15.56, "elapsed_time": "0:56:08", "remaining_time": "5:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 3836, "loss": 0.2021, "learning_rate": 4.84841140487573e-06, "epoch": 0.15586615840745446, "percentage": 15.59, "elapsed_time": "0:56:14", "remaining_time": "5:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 599, "total_steps": 3836, "loss": 0.1873, "learning_rate": 4.847671430013322e-06, "epoch": 0.1561268041572997, "percentage": 15.62, "elapsed_time": "0:56:20", "remaining_time": "5:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 3836, "loss": 0.2094, "learning_rate": 4.846929710211724e-06, "epoch": 0.15638744990714495, "percentage": 15.64, "elapsed_time": "0:56:26", "remaining_time": "5:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 601, "total_steps": 3836, "loss": 0.1973, "learning_rate": 4.846186246022228e-06, "epoch": 0.1566480956569902, "percentage": 15.67, "elapsed_time": "0:56:31", "remaining_time": "5:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 3836, "loss": 0.2007, "learning_rate": 4.845441037997428e-06, "epoch": 0.15690874140683544, "percentage": 15.69, "elapsed_time": "0:56:37", "remaining_time": "5:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 603, "total_steps": 3836, "loss": 0.1849, "learning_rate": 4.8446940866912055e-06, "epoch": 0.1571693871566807, "percentage": 15.72, "elapsed_time": "0:56:42", "remaining_time": "5:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 3836, "loss": 0.2019, "learning_rate": 4.843945392658744e-06, "epoch": 0.1574300329065259, "percentage": 15.75, "elapsed_time": "0:56:48", "remaining_time": "5:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 3836, "loss": 0.2105, "learning_rate": 4.843194956456522e-06, "epoch": 0.15769067865637115, "percentage": 15.77, "elapsed_time": "0:56:54", "remaining_time": "5:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 3836, "loss": 0.1888, "learning_rate": 4.84244277864231e-06, "epoch": 0.1579513244062164, "percentage": 15.8, "elapsed_time": "0:56:59", "remaining_time": "5:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 607, "total_steps": 3836, "loss": 0.2056, "learning_rate": 4.841688859775176e-06, "epoch": 0.15821197015606164, "percentage": 15.82, "elapsed_time": "0:57:05", "remaining_time": "5:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 3836, "loss": 0.1996, "learning_rate": 4.840933200415479e-06, "epoch": 0.1584726159059069, "percentage": 15.85, "elapsed_time": "0:57:10", "remaining_time": "5:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 609, "total_steps": 3836, "loss": 0.2004, "learning_rate": 4.8401758011248735e-06, "epoch": 0.15873326165575213, "percentage": 15.88, "elapsed_time": "0:57:16", "remaining_time": "5:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 3836, "loss": 0.2157, "learning_rate": 4.839416662466307e-06, "epoch": 0.15899390740559738, "percentage": 15.9, "elapsed_time": "0:57:22", "remaining_time": "5:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 611, "total_steps": 3836, "loss": 0.2046, "learning_rate": 4.838655785004022e-06, "epoch": 0.1592545531554426, "percentage": 15.93, "elapsed_time": "0:57:28", "remaining_time": "5:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 3836, "loss": 0.1948, "learning_rate": 4.837893169303548e-06, "epoch": 0.15951519890528784, "percentage": 15.95, "elapsed_time": "0:57:33", "remaining_time": "5:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 613, "total_steps": 3836, "loss": 0.2035, "learning_rate": 4.837128815931712e-06, "epoch": 0.1597758446551331, "percentage": 15.98, "elapsed_time": "0:57:39", "remaining_time": "5:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 3836, "loss": 0.212, "learning_rate": 4.836362725456628e-06, "epoch": 0.16003649040497833, "percentage": 16.01, "elapsed_time": "0:57:45", "remaining_time": "5:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 3836, "loss": 0.1998, "learning_rate": 4.835594898447705e-06, "epoch": 0.16029713615482358, "percentage": 16.03, "elapsed_time": "0:57:51", "remaining_time": "5:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 3836, "loss": 0.2039, "learning_rate": 4.834825335475641e-06, "epoch": 0.16055778190466882, "percentage": 16.06, "elapsed_time": "0:57:57", "remaining_time": "5:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 617, "total_steps": 3836, "loss": 0.1888, "learning_rate": 4.834054037112423e-06, "epoch": 0.16081842765451407, "percentage": 16.08, "elapsed_time": "0:58:02", "remaining_time": "5:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 3836, "loss": 0.2136, "learning_rate": 4.833281003931331e-06, "epoch": 0.1610790734043593, "percentage": 16.11, "elapsed_time": "0:58:08", "remaining_time": "5:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 619, "total_steps": 3836, "loss": 0.1948, "learning_rate": 4.832506236506931e-06, "epoch": 0.16133971915420453, "percentage": 16.14, "elapsed_time": "0:58:13", "remaining_time": "5:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 3836, "loss": 0.2045, "learning_rate": 4.831729735415081e-06, "epoch": 0.16160036490404978, "percentage": 16.16, "elapsed_time": "0:58:19", "remaining_time": "5:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 621, "total_steps": 3836, "loss": 0.1935, "learning_rate": 4.830951501232924e-06, "epoch": 0.16186101065389502, "percentage": 16.19, "elapsed_time": "0:58:25", "remaining_time": "5:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 3836, "loss": 0.1901, "learning_rate": 4.830171534538895e-06, "epoch": 0.16212165640374027, "percentage": 16.21, "elapsed_time": "0:58:31", "remaining_time": "5:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 623, "total_steps": 3836, "loss": 0.1957, "learning_rate": 4.829389835912715e-06, "epoch": 0.1623823021535855, "percentage": 16.24, "elapsed_time": "0:58:36", "remaining_time": "5:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 3836, "loss": 0.194, "learning_rate": 4.828606405935391e-06, "epoch": 0.16264294790343076, "percentage": 16.27, "elapsed_time": "0:58:42", "remaining_time": "5:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 3836, "loss": 0.2038, "learning_rate": 4.82782124518922e-06, "epoch": 0.162903593653276, "percentage": 16.29, "elapsed_time": "0:58:48", "remaining_time": "5:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 3836, "loss": 0.2175, "learning_rate": 4.827034354257782e-06, "epoch": 0.16316423940312122, "percentage": 16.32, "elapsed_time": "0:58:54", "remaining_time": "5:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 627, "total_steps": 3836, "loss": 0.2045, "learning_rate": 4.8262457337259465e-06, "epoch": 0.16342488515296646, "percentage": 16.35, "elapsed_time": "0:59:00", "remaining_time": "5:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 3836, "loss": 0.1896, "learning_rate": 4.825455384179864e-06, "epoch": 0.1636855309028117, "percentage": 16.37, "elapsed_time": "0:59:06", "remaining_time": "5:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 629, "total_steps": 3836, "loss": 0.1928, "learning_rate": 4.8246633062069744e-06, "epoch": 0.16394617665265696, "percentage": 16.4, "elapsed_time": "0:59:11", "remaining_time": "5:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 3836, "loss": 0.1944, "learning_rate": 4.823869500395999e-06, "epoch": 0.1642068224025022, "percentage": 16.42, "elapsed_time": "0:59:16", "remaining_time": "5:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 631, "total_steps": 3836, "loss": 0.1889, "learning_rate": 4.823073967336948e-06, "epoch": 0.16446746815234745, "percentage": 16.45, "elapsed_time": "0:59:22", "remaining_time": "5:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 3836, "loss": 0.2086, "learning_rate": 4.822276707621109e-06, "epoch": 0.1647281139021927, "percentage": 16.48, "elapsed_time": "0:59:28", "remaining_time": "5:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 633, "total_steps": 3836, "loss": 0.1814, "learning_rate": 4.821477721841058e-06, "epoch": 0.16498875965203794, "percentage": 16.5, "elapsed_time": "0:59:34", "remaining_time": "5:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 3836, "loss": 0.1912, "learning_rate": 4.820677010590652e-06, "epoch": 0.16524940540188315, "percentage": 16.53, "elapsed_time": "0:59:40", "remaining_time": "5:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 3836, "loss": 0.1949, "learning_rate": 4.819874574465031e-06, "epoch": 0.1655100511517284, "percentage": 16.55, "elapsed_time": "0:59:45", "remaining_time": "5:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 3836, "loss": 0.2109, "learning_rate": 4.819070414060616e-06, "epoch": 0.16577069690157364, "percentage": 16.58, "elapsed_time": "0:59:51", "remaining_time": "5:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 637, "total_steps": 3836, "loss": 0.2138, "learning_rate": 4.81826452997511e-06, "epoch": 0.1660313426514189, "percentage": 16.61, "elapsed_time": "0:59:57", "remaining_time": "5:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 3836, "loss": 0.1931, "learning_rate": 4.817456922807499e-06, "epoch": 0.16629198840126413, "percentage": 16.63, "elapsed_time": "1:00:02", "remaining_time": "5:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 639, "total_steps": 3836, "loss": 0.2032, "learning_rate": 4.816647593158047e-06, "epoch": 0.16655263415110938, "percentage": 16.66, "elapsed_time": "1:00:09", "remaining_time": "5:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 3836, "loss": 0.1964, "learning_rate": 4.815836541628299e-06, "epoch": 0.16681327990095463, "percentage": 16.68, "elapsed_time": "1:00:15", "remaining_time": "5:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 641, "total_steps": 3836, "loss": 0.1992, "learning_rate": 4.815023768821082e-06, "epoch": 0.16707392565079987, "percentage": 16.71, "elapsed_time": "1:00:20", "remaining_time": "5:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 3836, "loss": 0.1978, "learning_rate": 4.814209275340498e-06, "epoch": 0.1673345714006451, "percentage": 16.74, "elapsed_time": "1:00:26", "remaining_time": "5:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 643, "total_steps": 3836, "loss": 0.1922, "learning_rate": 4.813393061791933e-06, "epoch": 0.16759521715049033, "percentage": 16.76, "elapsed_time": "1:00:31", "remaining_time": "5:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 3836, "loss": 0.204, "learning_rate": 4.8125751287820484e-06, "epoch": 0.16785586290033558, "percentage": 16.79, "elapsed_time": "1:00:37", "remaining_time": "5:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 3836, "loss": 0.2011, "learning_rate": 4.8117554769187835e-06, "epoch": 0.16811650865018082, "percentage": 16.81, "elapsed_time": "1:00:43", "remaining_time": "5:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 3836, "loss": 0.1886, "learning_rate": 4.8109341068113566e-06, "epoch": 0.16837715440002607, "percentage": 16.84, "elapsed_time": "1:00:48", "remaining_time": "5:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 647, "total_steps": 3836, "loss": 0.1954, "learning_rate": 4.8101110190702616e-06, "epoch": 0.16863780014987131, "percentage": 16.87, "elapsed_time": "1:00:54", "remaining_time": "5:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 3836, "loss": 0.2093, "learning_rate": 4.8092862143072705e-06, "epoch": 0.16889844589971656, "percentage": 16.89, "elapsed_time": "1:01:00", "remaining_time": "5:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 649, "total_steps": 3836, "loss": 0.1946, "learning_rate": 4.8084596931354296e-06, "epoch": 0.16915909164956178, "percentage": 16.92, "elapsed_time": "1:01:05", "remaining_time": "5:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 3836, "loss": 0.2056, "learning_rate": 4.807631456169064e-06, "epoch": 0.16941973739940702, "percentage": 16.94, "elapsed_time": "1:01:11", "remaining_time": "4:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 651, "total_steps": 3836, "loss": 0.22, "learning_rate": 4.806801504023771e-06, "epoch": 0.16968038314925227, "percentage": 16.97, "elapsed_time": "1:01:17", "remaining_time": "4:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 3836, "loss": 0.2022, "learning_rate": 4.805969837316424e-06, "epoch": 0.1699410288990975, "percentage": 17.0, "elapsed_time": "1:01:22", "remaining_time": "4:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 653, "total_steps": 3836, "loss": 0.2011, "learning_rate": 4.805136456665172e-06, "epoch": 0.17020167464894276, "percentage": 17.02, "elapsed_time": "1:01:28", "remaining_time": "4:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 3836, "loss": 0.2085, "learning_rate": 4.804301362689435e-06, "epoch": 0.170462320398788, "percentage": 17.05, "elapsed_time": "1:01:33", "remaining_time": "4:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 3836, "loss": 0.2016, "learning_rate": 4.803464556009909e-06, "epoch": 0.17072296614863325, "percentage": 17.08, "elapsed_time": "1:01:39", "remaining_time": "4:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 3836, "loss": 0.1828, "learning_rate": 4.8026260372485625e-06, "epoch": 0.1709836118984785, "percentage": 17.1, "elapsed_time": "1:01:45", "remaining_time": "4:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 657, "total_steps": 3836, "loss": 0.2062, "learning_rate": 4.801785807028635e-06, "epoch": 0.1712442576483237, "percentage": 17.13, "elapsed_time": "1:01:50", "remaining_time": "4:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 3836, "loss": 0.2145, "learning_rate": 4.8009438659746396e-06, "epoch": 0.17150490339816896, "percentage": 17.15, "elapsed_time": "1:01:56", "remaining_time": "4:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 659, "total_steps": 3836, "loss": 0.1994, "learning_rate": 4.800100214712361e-06, "epoch": 0.1717655491480142, "percentage": 17.18, "elapsed_time": "1:02:02", "remaining_time": "4:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 3836, "loss": 0.1994, "learning_rate": 4.7992548538688554e-06, "epoch": 0.17202619489785945, "percentage": 17.21, "elapsed_time": "1:02:07", "remaining_time": "4:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 661, "total_steps": 3836, "loss": 0.1934, "learning_rate": 4.7984077840724475e-06, "epoch": 0.1722868406477047, "percentage": 17.23, "elapsed_time": "1:02:13", "remaining_time": "4:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 3836, "loss": 0.2082, "learning_rate": 4.797559005952733e-06, "epoch": 0.17254748639754994, "percentage": 17.26, "elapsed_time": "1:02:18", "remaining_time": "4:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 663, "total_steps": 3836, "loss": 0.2112, "learning_rate": 4.796708520140581e-06, "epoch": 0.17280813214739518, "percentage": 17.28, "elapsed_time": "1:02:24", "remaining_time": "4:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 3836, "loss": 0.2012, "learning_rate": 4.795856327268124e-06, "epoch": 0.1730687778972404, "percentage": 17.31, "elapsed_time": "1:02:30", "remaining_time": "4:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 3836, "loss": 0.1923, "learning_rate": 4.795002427968767e-06, "epoch": 0.17332942364708565, "percentage": 17.34, "elapsed_time": "1:02:35", "remaining_time": "4:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 3836, "loss": 0.1821, "learning_rate": 4.794146822877182e-06, "epoch": 0.1735900693969309, "percentage": 17.36, "elapsed_time": "1:02:40", "remaining_time": "4:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 667, "total_steps": 3836, "loss": 0.2159, "learning_rate": 4.79328951262931e-06, "epoch": 0.17385071514677614, "percentage": 17.39, "elapsed_time": "1:02:46", "remaining_time": "4:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 3836, "loss": 0.2008, "learning_rate": 4.792430497862358e-06, "epoch": 0.17411136089662138, "percentage": 17.41, "elapsed_time": "1:02:51", "remaining_time": "4:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 669, "total_steps": 3836, "loss": 0.2022, "learning_rate": 4.791569779214802e-06, "epoch": 0.17437200664646663, "percentage": 17.44, "elapsed_time": "1:02:57", "remaining_time": "4:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 3836, "loss": 0.2015, "learning_rate": 4.790707357326381e-06, "epoch": 0.17463265239631187, "percentage": 17.47, "elapsed_time": "1:03:03", "remaining_time": "4:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 671, "total_steps": 3836, "loss": 0.1877, "learning_rate": 4.789843232838104e-06, "epoch": 0.17489329814615712, "percentage": 17.49, "elapsed_time": "1:03:08", "remaining_time": "4:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 3836, "loss": 0.1907, "learning_rate": 4.788977406392242e-06, "epoch": 0.17515394389600233, "percentage": 17.52, "elapsed_time": "1:03:14", "remaining_time": "4:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 673, "total_steps": 3836, "loss": 0.2072, "learning_rate": 4.7881098786323325e-06, "epoch": 0.17541458964584758, "percentage": 17.54, "elapsed_time": "1:03:19", "remaining_time": "4:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 3836, "loss": 0.189, "learning_rate": 4.787240650203178e-06, "epoch": 0.17567523539569282, "percentage": 17.57, "elapsed_time": "1:03:25", "remaining_time": "4:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 3836, "loss": 0.1997, "learning_rate": 4.786369721750844e-06, "epoch": 0.17593588114553807, "percentage": 17.6, "elapsed_time": "1:03:30", "remaining_time": "4:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 3836, "loss": 0.1984, "learning_rate": 4.785497093922662e-06, "epoch": 0.17619652689538332, "percentage": 17.62, "elapsed_time": "1:03:36", "remaining_time": "4:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 677, "total_steps": 3836, "loss": 0.1942, "learning_rate": 4.784622767367222e-06, "epoch": 0.17645717264522856, "percentage": 17.65, "elapsed_time": "1:03:41", "remaining_time": "4:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 3836, "loss": 0.2092, "learning_rate": 4.78374674273438e-06, "epoch": 0.1767178183950738, "percentage": 17.67, "elapsed_time": "1:03:47", "remaining_time": "4:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 679, "total_steps": 3836, "loss": 0.2027, "learning_rate": 4.782869020675255e-06, "epoch": 0.17697846414491902, "percentage": 17.7, "elapsed_time": "1:03:53", "remaining_time": "4:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 3836, "loss": 0.1839, "learning_rate": 4.781989601842224e-06, "epoch": 0.17723910989476427, "percentage": 17.73, "elapsed_time": "1:03:58", "remaining_time": "4:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 681, "total_steps": 3836, "loss": 0.1918, "learning_rate": 4.7811084868889275e-06, "epoch": 0.1774997556446095, "percentage": 17.75, "elapsed_time": "1:04:04", "remaining_time": "4:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 3836, "loss": 0.1747, "learning_rate": 4.780225676470268e-06, "epoch": 0.17776040139445476, "percentage": 17.78, "elapsed_time": "1:04:09", "remaining_time": "4:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 683, "total_steps": 3836, "loss": 0.2075, "learning_rate": 4.779341171242405e-06, "epoch": 0.1780210471443, "percentage": 17.81, "elapsed_time": "1:04:15", "remaining_time": "4:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 3836, "loss": 0.1945, "learning_rate": 4.77845497186276e-06, "epoch": 0.17828169289414525, "percentage": 17.83, "elapsed_time": "1:04:20", "remaining_time": "4:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 3836, "loss": 0.2087, "learning_rate": 4.777567078990012e-06, "epoch": 0.1785423386439905, "percentage": 17.86, "elapsed_time": "1:04:26", "remaining_time": "4:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 3836, "loss": 0.2078, "learning_rate": 4.776677493284101e-06, "epoch": 0.17880298439383574, "percentage": 17.88, "elapsed_time": "1:04:31", "remaining_time": "4:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 687, "total_steps": 3836, "loss": 0.1916, "learning_rate": 4.775786215406223e-06, "epoch": 0.17906363014368096, "percentage": 17.91, "elapsed_time": "1:04:37", "remaining_time": "4:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 3836, "loss": 0.1955, "learning_rate": 4.774893246018831e-06, "epoch": 0.1793242758935262, "percentage": 17.94, "elapsed_time": "1:04:43", "remaining_time": "4:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 689, "total_steps": 3836, "loss": 0.2095, "learning_rate": 4.773998585785641e-06, "epoch": 0.17958492164337145, "percentage": 17.96, "elapsed_time": "1:04:49", "remaining_time": "4:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 3836, "loss": 0.1841, "learning_rate": 4.773102235371617e-06, "epoch": 0.1798455673932167, "percentage": 17.99, "elapsed_time": "1:04:54", "remaining_time": "4:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 691, "total_steps": 3836, "loss": 0.1938, "learning_rate": 4.772204195442986e-06, "epoch": 0.18010621314306194, "percentage": 18.01, "elapsed_time": "1:05:00", "remaining_time": "4:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 3836, "loss": 0.2016, "learning_rate": 4.771304466667229e-06, "epoch": 0.18036685889290718, "percentage": 18.04, "elapsed_time": "1:05:05", "remaining_time": "4:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 693, "total_steps": 3836, "loss": 0.1991, "learning_rate": 4.770403049713082e-06, "epoch": 0.18062750464275243, "percentage": 18.07, "elapsed_time": "1:05:10", "remaining_time": "4:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 3836, "loss": 0.2082, "learning_rate": 4.769499945250533e-06, "epoch": 0.18088815039259767, "percentage": 18.09, "elapsed_time": "1:05:16", "remaining_time": "4:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 3836, "loss": 0.2015, "learning_rate": 4.768595153950829e-06, "epoch": 0.1811487961424429, "percentage": 18.12, "elapsed_time": "1:05:21", "remaining_time": "4:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 3836, "loss": 0.1988, "learning_rate": 4.76768867648647e-06, "epoch": 0.18140944189228814, "percentage": 18.14, "elapsed_time": "1:05:27", "remaining_time": "4:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 697, "total_steps": 3836, "loss": 0.2071, "learning_rate": 4.766780513531205e-06, "epoch": 0.18167008764213338, "percentage": 18.17, "elapsed_time": "1:05:32", "remaining_time": "4:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 3836, "loss": 0.1923, "learning_rate": 4.7658706657600395e-06, "epoch": 0.18193073339197863, "percentage": 18.2, "elapsed_time": "1:05:38", "remaining_time": "4:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 699, "total_steps": 3836, "loss": 0.198, "learning_rate": 4.764959133849231e-06, "epoch": 0.18219137914182387, "percentage": 18.22, "elapsed_time": "1:05:44", "remaining_time": "4:55:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 3836, "loss": 0.1866, "learning_rate": 4.764045918476288e-06, "epoch": 0.18245202489166912, "percentage": 18.25, "elapsed_time": "1:05:49", "remaining_time": "4:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 701, "total_steps": 3836, "loss": 0.1982, "learning_rate": 4.7631310203199706e-06, "epoch": 0.18271267064151436, "percentage": 18.27, "elapsed_time": "1:05:54", "remaining_time": "4:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 3836, "loss": 0.1959, "learning_rate": 4.762214440060289e-06, "epoch": 0.18297331639135958, "percentage": 18.3, "elapsed_time": "1:06:00", "remaining_time": "4:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 703, "total_steps": 3836, "loss": 0.1769, "learning_rate": 4.761296178378504e-06, "epoch": 0.18323396214120483, "percentage": 18.33, "elapsed_time": "1:06:05", "remaining_time": "4:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 3836, "loss": 0.2002, "learning_rate": 4.760376235957127e-06, "epoch": 0.18349460789105007, "percentage": 18.35, "elapsed_time": "1:06:11", "remaining_time": "4:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 3836, "loss": 0.1969, "learning_rate": 4.759454613479918e-06, "epoch": 0.18375525364089532, "percentage": 18.38, "elapsed_time": "1:06:16", "remaining_time": "4:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 3836, "loss": 0.1884, "learning_rate": 4.758531311631884e-06, "epoch": 0.18401589939074056, "percentage": 18.4, "elapsed_time": "1:06:22", "remaining_time": "4:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 707, "total_steps": 3836, "loss": 0.1979, "learning_rate": 4.7576063310992835e-06, "epoch": 0.1842765451405858, "percentage": 18.43, "elapsed_time": "1:06:27", "remaining_time": "4:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 3836, "loss": 0.196, "learning_rate": 4.756679672569621e-06, "epoch": 0.18453719089043105, "percentage": 18.46, "elapsed_time": "1:06:32", "remaining_time": "4:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 709, "total_steps": 3836, "loss": 0.1823, "learning_rate": 4.7557513367316475e-06, "epoch": 0.1847978366402763, "percentage": 18.48, "elapsed_time": "1:06:38", "remaining_time": "4:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 3836, "loss": 0.211, "learning_rate": 4.7548213242753616e-06, "epoch": 0.18505848239012151, "percentage": 18.51, "elapsed_time": "1:06:44", "remaining_time": "4:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 711, "total_steps": 3836, "loss": 0.1855, "learning_rate": 4.753889635892008e-06, "epoch": 0.18531912813996676, "percentage": 18.53, "elapsed_time": "1:06:49", "remaining_time": "4:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 3836, "loss": 0.1998, "learning_rate": 4.752956272274078e-06, "epoch": 0.185579773889812, "percentage": 18.56, "elapsed_time": "1:06:55", "remaining_time": "4:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 713, "total_steps": 3836, "loss": 0.2003, "learning_rate": 4.752021234115304e-06, "epoch": 0.18584041963965725, "percentage": 18.59, "elapsed_time": "1:07:00", "remaining_time": "4:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 3836, "loss": 0.1918, "learning_rate": 4.751084522110669e-06, "epoch": 0.1861010653895025, "percentage": 18.61, "elapsed_time": "1:07:06", "remaining_time": "4:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 3836, "loss": 0.1898, "learning_rate": 4.750146136956396e-06, "epoch": 0.18636171113934774, "percentage": 18.64, "elapsed_time": "1:07:12", "remaining_time": "4:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 3836, "loss": 0.1929, "learning_rate": 4.749206079349952e-06, "epoch": 0.186622356889193, "percentage": 18.67, "elapsed_time": "1:07:17", "remaining_time": "4:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 717, "total_steps": 3836, "loss": 0.1708, "learning_rate": 4.74826434999005e-06, "epoch": 0.1868830026390382, "percentage": 18.69, "elapsed_time": "1:07:23", "remaining_time": "4:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 3836, "loss": 0.2003, "learning_rate": 4.747320949576641e-06, "epoch": 0.18714364838888345, "percentage": 18.72, "elapsed_time": "1:07:28", "remaining_time": "4:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 719, "total_steps": 3836, "loss": 0.2023, "learning_rate": 4.746375878810921e-06, "epoch": 0.1874042941387287, "percentage": 18.74, "elapsed_time": "1:07:34", "remaining_time": "4:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 3836, "loss": 0.1977, "learning_rate": 4.745429138395329e-06, "epoch": 0.18766493988857394, "percentage": 18.77, "elapsed_time": "1:07:39", "remaining_time": "4:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 721, "total_steps": 3836, "loss": 0.2136, "learning_rate": 4.744480729033539e-06, "epoch": 0.18792558563841918, "percentage": 18.8, "elapsed_time": "1:07:45", "remaining_time": "4:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 3836, "loss": 0.2055, "learning_rate": 4.743530651430472e-06, "epoch": 0.18818623138826443, "percentage": 18.82, "elapsed_time": "1:07:50", "remaining_time": "4:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 723, "total_steps": 3836, "loss": 0.2036, "learning_rate": 4.742578906292286e-06, "epoch": 0.18844687713810968, "percentage": 18.85, "elapsed_time": "1:07:55", "remaining_time": "4:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 3836, "loss": 0.2071, "learning_rate": 4.741625494326379e-06, "epoch": 0.18870752288795492, "percentage": 18.87, "elapsed_time": "1:08:01", "remaining_time": "4:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 3836, "loss": 0.1906, "learning_rate": 4.740670416241386e-06, "epoch": 0.18896816863780014, "percentage": 18.9, "elapsed_time": "1:08:07", "remaining_time": "4:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 3836, "loss": 0.2055, "learning_rate": 4.739713672747183e-06, "epoch": 0.18922881438764538, "percentage": 18.93, "elapsed_time": "1:08:12", "remaining_time": "4:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 727, "total_steps": 3836, "loss": 0.1926, "learning_rate": 4.7387552645548834e-06, "epoch": 0.18948946013749063, "percentage": 18.95, "elapsed_time": "1:08:18", "remaining_time": "4:52:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 3836, "loss": 0.2044, "learning_rate": 4.737795192376836e-06, "epoch": 0.18975010588733587, "percentage": 18.98, "elapsed_time": "1:08:23", "remaining_time": "4:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 729, "total_steps": 3836, "loss": 0.201, "learning_rate": 4.73683345692663e-06, "epoch": 0.19001075163718112, "percentage": 19.0, "elapsed_time": "1:08:29", "remaining_time": "4:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 3836, "loss": 0.1961, "learning_rate": 4.735870058919084e-06, "epoch": 0.19027139738702636, "percentage": 19.03, "elapsed_time": "1:08:34", "remaining_time": "4:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 731, "total_steps": 3836, "loss": 0.204, "learning_rate": 4.7349049990702624e-06, "epoch": 0.1905320431368716, "percentage": 19.06, "elapsed_time": "1:08:40", "remaining_time": "4:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 3836, "loss": 0.1883, "learning_rate": 4.733938278097456e-06, "epoch": 0.19079268888671685, "percentage": 19.08, "elapsed_time": "1:08:46", "remaining_time": "4:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 733, "total_steps": 3836, "loss": 0.2011, "learning_rate": 4.732969896719194e-06, "epoch": 0.19105333463656207, "percentage": 19.11, "elapsed_time": "1:08:52", "remaining_time": "4:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 3836, "loss": 0.1844, "learning_rate": 4.731999855655239e-06, "epoch": 0.19131398038640732, "percentage": 19.13, "elapsed_time": "1:08:57", "remaining_time": "4:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 3836, "loss": 0.1845, "learning_rate": 4.731028155626588e-06, "epoch": 0.19157462613625256, "percentage": 19.16, "elapsed_time": "1:09:02", "remaining_time": "4:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 3836, "loss": 0.1976, "learning_rate": 4.730054797355471e-06, "epoch": 0.1918352718860978, "percentage": 19.19, "elapsed_time": "1:09:08", "remaining_time": "4:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 737, "total_steps": 3836, "loss": 0.1927, "learning_rate": 4.729079781565349e-06, "epoch": 0.19209591763594305, "percentage": 19.21, "elapsed_time": "1:09:15", "remaining_time": "4:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 3836, "loss": 0.204, "learning_rate": 4.728103108980915e-06, "epoch": 0.1923565633857883, "percentage": 19.24, "elapsed_time": "1:09:21", "remaining_time": "4:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 739, "total_steps": 3836, "loss": 0.1737, "learning_rate": 4.727124780328097e-06, "epoch": 0.19261720913563354, "percentage": 19.26, "elapsed_time": "1:09:27", "remaining_time": "4:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 3836, "loss": 0.2055, "learning_rate": 4.726144796334049e-06, "epoch": 0.19287785488547876, "percentage": 19.29, "elapsed_time": "1:09:33", "remaining_time": "4:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 741, "total_steps": 3836, "loss": 0.1884, "learning_rate": 4.7251631577271585e-06, "epoch": 0.193138500635324, "percentage": 19.32, "elapsed_time": "1:09:39", "remaining_time": "4:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 3836, "loss": 0.1782, "learning_rate": 4.724179865237042e-06, "epoch": 0.19339914638516925, "percentage": 19.34, "elapsed_time": "1:09:44", "remaining_time": "4:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 743, "total_steps": 3836, "loss": 0.1993, "learning_rate": 4.723194919594545e-06, "epoch": 0.1936597921350145, "percentage": 19.37, "elapsed_time": "1:09:50", "remaining_time": "4:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 3836, "loss": 0.2008, "learning_rate": 4.722208321531743e-06, "epoch": 0.19392043788485974, "percentage": 19.4, "elapsed_time": "1:09:55", "remaining_time": "4:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 3836, "loss": 0.1918, "learning_rate": 4.721220071781936e-06, "epoch": 0.194181083634705, "percentage": 19.42, "elapsed_time": "1:10:01", "remaining_time": "4:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 3836, "loss": 0.2104, "learning_rate": 4.720230171079657e-06, "epoch": 0.19444172938455023, "percentage": 19.45, "elapsed_time": "1:10:06", "remaining_time": "4:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 747, "total_steps": 3836, "loss": 0.1904, "learning_rate": 4.719238620160662e-06, "epoch": 0.19470237513439548, "percentage": 19.47, "elapsed_time": "1:10:11", "remaining_time": "4:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 3836, "loss": 0.203, "learning_rate": 4.7182454197619355e-06, "epoch": 0.1949630208842407, "percentage": 19.5, "elapsed_time": "1:10:17", "remaining_time": "4:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 749, "total_steps": 3836, "loss": 0.1891, "learning_rate": 4.717250570621686e-06, "epoch": 0.19522366663408594, "percentage": 19.53, "elapsed_time": "1:10:22", "remaining_time": "4:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 3836, "loss": 0.196, "learning_rate": 4.716254073479352e-06, "epoch": 0.19548431238393119, "percentage": 19.55, "elapsed_time": "1:10:28", "remaining_time": "4:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 751, "total_steps": 3836, "loss": 0.1821, "learning_rate": 4.71525592907559e-06, "epoch": 0.19574495813377643, "percentage": 19.58, "elapsed_time": "1:10:34", "remaining_time": "4:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 3836, "loss": 0.1913, "learning_rate": 4.714256138152287e-06, "epoch": 0.19600560388362168, "percentage": 19.6, "elapsed_time": "1:10:39", "remaining_time": "4:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 753, "total_steps": 3836, "loss": 0.1873, "learning_rate": 4.71325470145255e-06, "epoch": 0.19626624963346692, "percentage": 19.63, "elapsed_time": "1:10:45", "remaining_time": "4:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 3836, "loss": 0.2, "learning_rate": 4.712251619720712e-06, "epoch": 0.19652689538331217, "percentage": 19.66, "elapsed_time": "1:10:50", "remaining_time": "4:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 3836, "loss": 0.1751, "learning_rate": 4.711246893702327e-06, "epoch": 0.19678754113315738, "percentage": 19.68, "elapsed_time": "1:10:55", "remaining_time": "4:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 3836, "loss": 0.2008, "learning_rate": 4.71024052414417e-06, "epoch": 0.19704818688300263, "percentage": 19.71, "elapsed_time": "1:11:01", "remaining_time": "4:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 757, "total_steps": 3836, "loss": 0.183, "learning_rate": 4.709232511794242e-06, "epoch": 0.19730883263284787, "percentage": 19.73, "elapsed_time": "1:11:07", "remaining_time": "4:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 3836, "loss": 0.1863, "learning_rate": 4.70822285740176e-06, "epoch": 0.19756947838269312, "percentage": 19.76, "elapsed_time": "1:11:13", "remaining_time": "4:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 759, "total_steps": 3836, "loss": 0.2063, "learning_rate": 4.707211561717162e-06, "epoch": 0.19783012413253837, "percentage": 19.79, "elapsed_time": "1:11:18", "remaining_time": "4:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 3836, "loss": 0.1937, "learning_rate": 4.706198625492111e-06, "epoch": 0.1980907698823836, "percentage": 19.81, "elapsed_time": "1:11:24", "remaining_time": "4:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 761, "total_steps": 3836, "loss": 0.1742, "learning_rate": 4.7051840494794845e-06, "epoch": 0.19835141563222886, "percentage": 19.84, "elapsed_time": "1:11:29", "remaining_time": "4:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 3836, "loss": 0.1992, "learning_rate": 4.704167834433378e-06, "epoch": 0.1986120613820741, "percentage": 19.86, "elapsed_time": "1:11:35", "remaining_time": "4:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 763, "total_steps": 3836, "loss": 0.2193, "learning_rate": 4.70314998110911e-06, "epoch": 0.19887270713191932, "percentage": 19.89, "elapsed_time": "1:11:41", "remaining_time": "4:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 3836, "loss": 0.2181, "learning_rate": 4.702130490263215e-06, "epoch": 0.19913335288176456, "percentage": 19.92, "elapsed_time": "1:11:46", "remaining_time": "4:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 3836, "loss": 0.1862, "learning_rate": 4.70110936265344e-06, "epoch": 0.1993939986316098, "percentage": 19.94, "elapsed_time": "1:11:51", "remaining_time": "4:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 3836, "loss": 0.2, "learning_rate": 4.700086599038755e-06, "epoch": 0.19965464438145505, "percentage": 19.97, "elapsed_time": "1:11:57", "remaining_time": "4:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 767, "total_steps": 3836, "loss": 0.195, "learning_rate": 4.69906220017934e-06, "epoch": 0.1999152901313003, "percentage": 19.99, "elapsed_time": "1:12:03", "remaining_time": "4:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 3836, "loss": 0.1978, "learning_rate": 4.698036166836598e-06, "epoch": 0.20017593588114554, "percentage": 20.02, "elapsed_time": "1:12:08", "remaining_time": "4:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 769, "total_steps": 3836, "loss": 0.2052, "learning_rate": 4.69700849977314e-06, "epoch": 0.2004365816309908, "percentage": 20.05, "elapsed_time": "1:12:14", "remaining_time": "4:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 3836, "loss": 0.1922, "learning_rate": 4.695979199752794e-06, "epoch": 0.200697227380836, "percentage": 20.07, "elapsed_time": "1:12:19", "remaining_time": "4:48:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 771, "total_steps": 3836, "loss": 0.1943, "learning_rate": 4.694948267540601e-06, "epoch": 0.20095787313068125, "percentage": 20.1, "elapsed_time": "1:12:25", "remaining_time": "4:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 3836, "loss": 0.1945, "learning_rate": 4.693915703902816e-06, "epoch": 0.2012185188805265, "percentage": 20.13, "elapsed_time": "1:12:30", "remaining_time": "4:47:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 773, "total_steps": 3836, "loss": 0.1837, "learning_rate": 4.692881509606906e-06, "epoch": 0.20147916463037174, "percentage": 20.15, "elapsed_time": "1:12:35", "remaining_time": "4:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 3836, "loss": 0.2192, "learning_rate": 4.691845685421551e-06, "epoch": 0.201739810380217, "percentage": 20.18, "elapsed_time": "1:12:41", "remaining_time": "4:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 3836, "loss": 0.1852, "learning_rate": 4.69080823211664e-06, "epoch": 0.20200045613006223, "percentage": 20.2, "elapsed_time": "1:12:47", "remaining_time": "4:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 3836, "loss": 0.1831, "learning_rate": 4.689769150463277e-06, "epoch": 0.20226110187990748, "percentage": 20.23, "elapsed_time": "1:12:52", "remaining_time": "4:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 777, "total_steps": 3836, "loss": 0.1886, "learning_rate": 4.688728441233771e-06, "epoch": 0.20252174762975272, "percentage": 20.26, "elapsed_time": "1:12:58", "remaining_time": "4:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 3836, "loss": 0.1933, "learning_rate": 4.687686105201645e-06, "epoch": 0.20278239337959794, "percentage": 20.28, "elapsed_time": "1:13:03", "remaining_time": "4:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 779, "total_steps": 3836, "loss": 0.1834, "learning_rate": 4.686642143141629e-06, "epoch": 0.2030430391294432, "percentage": 20.31, "elapsed_time": "1:13:09", "remaining_time": "4:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 3836, "loss": 0.1994, "learning_rate": 4.685596555829664e-06, "epoch": 0.20330368487928843, "percentage": 20.33, "elapsed_time": "1:13:15", "remaining_time": "4:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 781, "total_steps": 3836, "loss": 0.1904, "learning_rate": 4.684549344042894e-06, "epoch": 0.20356433062913368, "percentage": 20.36, "elapsed_time": "1:13:20", "remaining_time": "4:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 3836, "loss": 0.1783, "learning_rate": 4.683500508559676e-06, "epoch": 0.20382497637897892, "percentage": 20.39, "elapsed_time": "1:13:26", "remaining_time": "4:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 783, "total_steps": 3836, "loss": 0.2061, "learning_rate": 4.682450050159571e-06, "epoch": 0.20408562212882417, "percentage": 20.41, "elapsed_time": "1:13:31", "remaining_time": "4:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 3836, "loss": 0.1924, "learning_rate": 4.681397969623347e-06, "epoch": 0.2043462678786694, "percentage": 20.44, "elapsed_time": "1:13:37", "remaining_time": "4:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 3836, "loss": 0.2101, "learning_rate": 4.680344267732977e-06, "epoch": 0.20460691362851466, "percentage": 20.46, "elapsed_time": "1:13:42", "remaining_time": "4:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 3836, "loss": 0.1984, "learning_rate": 4.679288945271639e-06, "epoch": 0.20486755937835988, "percentage": 20.49, "elapsed_time": "1:13:48", "remaining_time": "4:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 787, "total_steps": 3836, "loss": 0.1792, "learning_rate": 4.678232003023716e-06, "epoch": 0.20512820512820512, "percentage": 20.52, "elapsed_time": "1:13:54", "remaining_time": "4:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 3836, "loss": 0.2004, "learning_rate": 4.677173441774796e-06, "epoch": 0.20538885087805037, "percentage": 20.54, "elapsed_time": "1:14:00", "remaining_time": "4:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 789, "total_steps": 3836, "loss": 0.1877, "learning_rate": 4.676113262311668e-06, "epoch": 0.2056494966278956, "percentage": 20.57, "elapsed_time": "1:14:05", "remaining_time": "4:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 3836, "loss": 0.2001, "learning_rate": 4.675051465422326e-06, "epoch": 0.20591014237774086, "percentage": 20.59, "elapsed_time": "1:14:11", "remaining_time": "4:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 791, "total_steps": 3836, "loss": 0.1902, "learning_rate": 4.673988051895965e-06, "epoch": 0.2061707881275861, "percentage": 20.62, "elapsed_time": "1:14:17", "remaining_time": "4:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 3836, "loss": 0.195, "learning_rate": 4.6729230225229815e-06, "epoch": 0.20643143387743135, "percentage": 20.65, "elapsed_time": "1:14:22", "remaining_time": "4:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 793, "total_steps": 3836, "loss": 0.1948, "learning_rate": 4.671856378094974e-06, "epoch": 0.20669207962727656, "percentage": 20.67, "elapsed_time": "1:14:28", "remaining_time": "4:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 3836, "loss": 0.1826, "learning_rate": 4.670788119404739e-06, "epoch": 0.2069527253771218, "percentage": 20.7, "elapsed_time": "1:14:33", "remaining_time": "4:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 3836, "loss": 0.1866, "learning_rate": 4.669718247246275e-06, "epoch": 0.20721337112696706, "percentage": 20.72, "elapsed_time": "1:14:38", "remaining_time": "4:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 3836, "loss": 0.1901, "learning_rate": 4.66864676241478e-06, "epoch": 0.2074740168768123, "percentage": 20.75, "elapsed_time": "1:14:44", "remaining_time": "4:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 797, "total_steps": 3836, "loss": 0.19, "learning_rate": 4.6675736657066504e-06, "epoch": 0.20773466262665755, "percentage": 20.78, "elapsed_time": "1:14:49", "remaining_time": "4:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 3836, "loss": 0.1898, "learning_rate": 4.666498957919479e-06, "epoch": 0.2079953083765028, "percentage": 20.8, "elapsed_time": "1:14:54", "remaining_time": "4:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 799, "total_steps": 3836, "loss": 0.1804, "learning_rate": 4.6654226398520574e-06, "epoch": 0.20825595412634804, "percentage": 20.83, "elapsed_time": "1:15:00", "remaining_time": "4:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 3836, "loss": 0.1859, "learning_rate": 4.664344712304375e-06, "epoch": 0.20851659987619328, "percentage": 20.86, "elapsed_time": "1:15:05", "remaining_time": "4:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 801, "total_steps": 3836, "loss": 0.1837, "learning_rate": 4.663265176077615e-06, "epoch": 0.2087772456260385, "percentage": 20.88, "elapsed_time": "1:15:11", "remaining_time": "4:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 3836, "loss": 0.1926, "learning_rate": 4.6621840319741576e-06, "epoch": 0.20903789137588374, "percentage": 20.91, "elapsed_time": "1:15:16", "remaining_time": "4:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 803, "total_steps": 3836, "loss": 0.2002, "learning_rate": 4.661101280797579e-06, "epoch": 0.209298537125729, "percentage": 20.93, "elapsed_time": "1:15:21", "remaining_time": "4:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 3836, "loss": 0.2066, "learning_rate": 4.660016923352648e-06, "epoch": 0.20955918287557423, "percentage": 20.96, "elapsed_time": "1:15:27", "remaining_time": "4:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 3836, "loss": 0.1931, "learning_rate": 4.6589309604453285e-06, "epoch": 0.20981982862541948, "percentage": 20.99, "elapsed_time": "1:15:33", "remaining_time": "4:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 3836, "loss": 0.1886, "learning_rate": 4.657843392882778e-06, "epoch": 0.21008047437526473, "percentage": 21.01, "elapsed_time": "1:15:38", "remaining_time": "4:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 807, "total_steps": 3836, "loss": 0.1892, "learning_rate": 4.656754221473346e-06, "epoch": 0.21034112012510997, "percentage": 21.04, "elapsed_time": "1:15:44", "remaining_time": "4:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 3836, "loss": 0.1901, "learning_rate": 4.6556634470265725e-06, "epoch": 0.2106017658749552, "percentage": 21.06, "elapsed_time": "1:15:50", "remaining_time": "4:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 809, "total_steps": 3836, "loss": 0.1838, "learning_rate": 4.654571070353193e-06, "epoch": 0.21086241162480043, "percentage": 21.09, "elapsed_time": "1:15:55", "remaining_time": "4:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 3836, "loss": 0.1885, "learning_rate": 4.6534770922651305e-06, "epoch": 0.21112305737464568, "percentage": 21.12, "elapsed_time": "1:16:00", "remaining_time": "4:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 811, "total_steps": 3836, "loss": 0.1887, "learning_rate": 4.6523815135754995e-06, "epoch": 0.21138370312449092, "percentage": 21.14, "elapsed_time": "1:16:06", "remaining_time": "4:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 3836, "loss": 0.1925, "learning_rate": 4.651284335098603e-06, "epoch": 0.21164434887433617, "percentage": 21.17, "elapsed_time": "1:16:12", "remaining_time": "4:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 813, "total_steps": 3836, "loss": 0.186, "learning_rate": 4.650185557649936e-06, "epoch": 0.21190499462418141, "percentage": 21.19, "elapsed_time": "1:16:18", "remaining_time": "4:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 3836, "loss": 0.2012, "learning_rate": 4.6490851820461785e-06, "epoch": 0.21216564037402666, "percentage": 21.22, "elapsed_time": "1:16:23", "remaining_time": "4:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 3836, "loss": 0.1946, "learning_rate": 4.6479832091052e-06, "epoch": 0.2124262861238719, "percentage": 21.25, "elapsed_time": "1:16:29", "remaining_time": "4:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 3836, "loss": 0.1745, "learning_rate": 4.646879639646058e-06, "epoch": 0.21268693187371712, "percentage": 21.27, "elapsed_time": "1:16:34", "remaining_time": "4:43:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 817, "total_steps": 3836, "loss": 0.2086, "learning_rate": 4.645774474488995e-06, "epoch": 0.21294757762356237, "percentage": 21.3, "elapsed_time": "1:16:40", "remaining_time": "4:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 3836, "loss": 0.1892, "learning_rate": 4.64466771445544e-06, "epoch": 0.2132082233734076, "percentage": 21.32, "elapsed_time": "1:16:45", "remaining_time": "4:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 819, "total_steps": 3836, "loss": 0.1951, "learning_rate": 4.643559360368008e-06, "epoch": 0.21346886912325286, "percentage": 21.35, "elapsed_time": "1:16:51", "remaining_time": "4:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 3836, "loss": 0.1937, "learning_rate": 4.642449413050499e-06, "epoch": 0.2137295148730981, "percentage": 21.38, "elapsed_time": "1:16:57", "remaining_time": "4:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 821, "total_steps": 3836, "loss": 0.2136, "learning_rate": 4.6413378733278945e-06, "epoch": 0.21399016062294335, "percentage": 21.4, "elapsed_time": "1:17:02", "remaining_time": "4:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 3836, "loss": 0.1869, "learning_rate": 4.640224742026365e-06, "epoch": 0.2142508063727886, "percentage": 21.43, "elapsed_time": "1:17:08", "remaining_time": "4:42:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 823, "total_steps": 3836, "loss": 0.1966, "learning_rate": 4.639110019973258e-06, "epoch": 0.21451145212263384, "percentage": 21.45, "elapsed_time": "1:17:14", "remaining_time": "4:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 3836, "loss": 0.1864, "learning_rate": 4.637993707997107e-06, "epoch": 0.21477209787247906, "percentage": 21.48, "elapsed_time": "1:17:19", "remaining_time": "4:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 3836, "loss": 0.1942, "learning_rate": 4.6368758069276274e-06, "epoch": 0.2150327436223243, "percentage": 21.51, "elapsed_time": "1:17:25", "remaining_time": "4:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 3836, "loss": 0.2042, "learning_rate": 4.635756317595714e-06, "epoch": 0.21529338937216955, "percentage": 21.53, "elapsed_time": "1:17:30", "remaining_time": "4:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 827, "total_steps": 3836, "loss": 0.1918, "learning_rate": 4.634635240833442e-06, "epoch": 0.2155540351220148, "percentage": 21.56, "elapsed_time": "1:17:35", "remaining_time": "4:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 3836, "loss": 0.1649, "learning_rate": 4.6335125774740665e-06, "epoch": 0.21581468087186004, "percentage": 21.58, "elapsed_time": "1:17:41", "remaining_time": "4:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 829, "total_steps": 3836, "loss": 0.1914, "learning_rate": 4.632388328352023e-06, "epoch": 0.21607532662170528, "percentage": 21.61, "elapsed_time": "1:17:47", "remaining_time": "4:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 3836, "loss": 0.1804, "learning_rate": 4.6312624943029275e-06, "epoch": 0.21633597237155053, "percentage": 21.64, "elapsed_time": "1:17:52", "remaining_time": "4:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 831, "total_steps": 3836, "loss": 0.1845, "learning_rate": 4.630135076163569e-06, "epoch": 0.21659661812139575, "percentage": 21.66, "elapsed_time": "1:17:58", "remaining_time": "4:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 3836, "loss": 0.1723, "learning_rate": 4.629006074771918e-06, "epoch": 0.216857263871241, "percentage": 21.69, "elapsed_time": "1:18:03", "remaining_time": "4:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 833, "total_steps": 3836, "loss": 0.2102, "learning_rate": 4.627875490967119e-06, "epoch": 0.21711790962108624, "percentage": 21.72, "elapsed_time": "1:18:09", "remaining_time": "4:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 3836, "loss": 0.1895, "learning_rate": 4.626743325589496e-06, "epoch": 0.21737855537093148, "percentage": 21.74, "elapsed_time": "1:18:15", "remaining_time": "4:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 3836, "loss": 0.1871, "learning_rate": 4.625609579480544e-06, "epoch": 0.21763920112077673, "percentage": 21.77, "elapsed_time": "1:18:20", "remaining_time": "4:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 3836, "loss": 0.1889, "learning_rate": 4.624474253482938e-06, "epoch": 0.21789984687062197, "percentage": 21.79, "elapsed_time": "1:18:26", "remaining_time": "4:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 837, "total_steps": 3836, "loss": 0.1933, "learning_rate": 4.623337348440524e-06, "epoch": 0.21816049262046722, "percentage": 21.82, "elapsed_time": "1:18:31", "remaining_time": "4:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 3836, "loss": 0.1933, "learning_rate": 4.622198865198321e-06, "epoch": 0.21842113837031246, "percentage": 21.85, "elapsed_time": "1:18:37", "remaining_time": "4:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 839, "total_steps": 3836, "loss": 0.1816, "learning_rate": 4.621058804602523e-06, "epoch": 0.21868178412015768, "percentage": 21.87, "elapsed_time": "1:18:42", "remaining_time": "4:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 3836, "loss": 0.2002, "learning_rate": 4.619917167500496e-06, "epoch": 0.21894242987000292, "percentage": 21.9, "elapsed_time": "1:18:47", "remaining_time": "4:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 841, "total_steps": 3836, "loss": 0.201, "learning_rate": 4.6187739547407785e-06, "epoch": 0.21920307561984817, "percentage": 21.92, "elapsed_time": "1:18:54", "remaining_time": "4:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 3836, "loss": 0.1819, "learning_rate": 4.617629167173078e-06, "epoch": 0.21946372136969342, "percentage": 21.95, "elapsed_time": "1:18:59", "remaining_time": "4:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 843, "total_steps": 3836, "loss": 0.1928, "learning_rate": 4.616482805648273e-06, "epoch": 0.21972436711953866, "percentage": 21.98, "elapsed_time": "1:19:05", "remaining_time": "4:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 3836, "loss": 0.1715, "learning_rate": 4.615334871018415e-06, "epoch": 0.2199850128693839, "percentage": 22.0, "elapsed_time": "1:19:10", "remaining_time": "4:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 3836, "loss": 0.1733, "learning_rate": 4.614185364136719e-06, "epoch": 0.22024565861922915, "percentage": 22.03, "elapsed_time": "1:19:15", "remaining_time": "4:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 3836, "loss": 0.1872, "learning_rate": 4.613034285857575e-06, "epoch": 0.22050630436907437, "percentage": 22.05, "elapsed_time": "1:19:21", "remaining_time": "4:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 847, "total_steps": 3836, "loss": 0.1919, "learning_rate": 4.611881637036536e-06, "epoch": 0.2207669501189196, "percentage": 22.08, "elapsed_time": "1:19:26", "remaining_time": "4:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 3836, "loss": 0.1872, "learning_rate": 4.610727418530324e-06, "epoch": 0.22102759586876486, "percentage": 22.11, "elapsed_time": "1:19:31", "remaining_time": "4:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 849, "total_steps": 3836, "loss": 0.1741, "learning_rate": 4.609571631196829e-06, "epoch": 0.2212882416186101, "percentage": 22.13, "elapsed_time": "1:19:37", "remaining_time": "4:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 3836, "loss": 0.1851, "learning_rate": 4.6084142758951055e-06, "epoch": 0.22154888736845535, "percentage": 22.16, "elapsed_time": "1:19:42", "remaining_time": "4:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 851, "total_steps": 3836, "loss": 0.198, "learning_rate": 4.607255353485373e-06, "epoch": 0.2218095331183006, "percentage": 22.18, "elapsed_time": "1:19:47", "remaining_time": "4:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 3836, "loss": 0.1725, "learning_rate": 4.606094864829016e-06, "epoch": 0.22207017886814584, "percentage": 22.21, "elapsed_time": "1:19:53", "remaining_time": "4:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 853, "total_steps": 3836, "loss": 0.1947, "learning_rate": 4.604932810788587e-06, "epoch": 0.22233082461799109, "percentage": 22.24, "elapsed_time": "1:19:58", "remaining_time": "4:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 3836, "loss": 0.1813, "learning_rate": 4.603769192227795e-06, "epoch": 0.2225914703678363, "percentage": 22.26, "elapsed_time": "1:20:03", "remaining_time": "4:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 3836, "loss": 0.1892, "learning_rate": 4.602604010011518e-06, "epoch": 0.22285211611768155, "percentage": 22.29, "elapsed_time": "1:20:09", "remaining_time": "4:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 3836, "loss": 0.205, "learning_rate": 4.601437265005792e-06, "epoch": 0.2231127618675268, "percentage": 22.31, "elapsed_time": "1:20:14", "remaining_time": "4:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 857, "total_steps": 3836, "loss": 0.1854, "learning_rate": 4.600268958077818e-06, "epoch": 0.22337340761737204, "percentage": 22.34, "elapsed_time": "1:20:20", "remaining_time": "4:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 3836, "loss": 0.1822, "learning_rate": 4.599099090095955e-06, "epoch": 0.22363405336721728, "percentage": 22.37, "elapsed_time": "1:20:25", "remaining_time": "4:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 859, "total_steps": 3836, "loss": 0.1925, "learning_rate": 4.5979276619297245e-06, "epoch": 0.22389469911706253, "percentage": 22.39, "elapsed_time": "1:20:32", "remaining_time": "4:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 3836, "loss": 0.1758, "learning_rate": 4.5967546744498044e-06, "epoch": 0.22415534486690777, "percentage": 22.42, "elapsed_time": "1:20:38", "remaining_time": "4:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 861, "total_steps": 3836, "loss": 0.2019, "learning_rate": 4.595580128528037e-06, "epoch": 0.22441599061675302, "percentage": 22.45, "elapsed_time": "1:20:43", "remaining_time": "4:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 3836, "loss": 0.2019, "learning_rate": 4.594404025037418e-06, "epoch": 0.22467663636659824, "percentage": 22.47, "elapsed_time": "1:20:49", "remaining_time": "4:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 863, "total_steps": 3836, "loss": 0.186, "learning_rate": 4.593226364852102e-06, "epoch": 0.22493728211644348, "percentage": 22.5, "elapsed_time": "1:20:55", "remaining_time": "4:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 3836, "loss": 0.2144, "learning_rate": 4.592047148847404e-06, "epoch": 0.22519792786628873, "percentage": 22.52, "elapsed_time": "1:21:00", "remaining_time": "4:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 3836, "loss": 0.1998, "learning_rate": 4.590866377899789e-06, "epoch": 0.22545857361613397, "percentage": 22.55, "elapsed_time": "1:21:05", "remaining_time": "4:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 3836, "loss": 0.1906, "learning_rate": 4.589684052886884e-06, "epoch": 0.22571921936597922, "percentage": 22.58, "elapsed_time": "1:21:10", "remaining_time": "4:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 867, "total_steps": 3836, "loss": 0.193, "learning_rate": 4.5885001746874665e-06, "epoch": 0.22597986511582446, "percentage": 22.6, "elapsed_time": "1:21:15", "remaining_time": "4:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 3836, "loss": 0.1939, "learning_rate": 4.587314744181471e-06, "epoch": 0.2262405108656697, "percentage": 22.63, "elapsed_time": "1:21:21", "remaining_time": "4:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 869, "total_steps": 3836, "loss": 0.1916, "learning_rate": 4.586127762249985e-06, "epoch": 0.22650115661551493, "percentage": 22.65, "elapsed_time": "1:21:27", "remaining_time": "4:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 3836, "loss": 0.1975, "learning_rate": 4.58493922977525e-06, "epoch": 0.22676180236536017, "percentage": 22.68, "elapsed_time": "1:21:32", "remaining_time": "4:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 871, "total_steps": 3836, "loss": 0.1826, "learning_rate": 4.583749147640658e-06, "epoch": 0.22702244811520542, "percentage": 22.71, "elapsed_time": "1:21:37", "remaining_time": "4:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 3836, "loss": 0.1832, "learning_rate": 4.582557516730755e-06, "epoch": 0.22728309386505066, "percentage": 22.73, "elapsed_time": "1:21:43", "remaining_time": "4:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 873, "total_steps": 3836, "loss": 0.1839, "learning_rate": 4.581364337931237e-06, "epoch": 0.2275437396148959, "percentage": 22.76, "elapsed_time": "1:21:48", "remaining_time": "4:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 3836, "loss": 0.2027, "learning_rate": 4.58016961212895e-06, "epoch": 0.22780438536474115, "percentage": 22.78, "elapsed_time": "1:21:54", "remaining_time": "4:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 3836, "loss": 0.1785, "learning_rate": 4.5789733402118895e-06, "epoch": 0.2280650311145864, "percentage": 22.81, "elapsed_time": "1:22:00", "remaining_time": "4:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 3836, "loss": 0.1903, "learning_rate": 4.577775523069204e-06, "epoch": 0.22832567686443164, "percentage": 22.84, "elapsed_time": "1:22:06", "remaining_time": "4:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 877, "total_steps": 3836, "loss": 0.1791, "learning_rate": 4.5765761615911856e-06, "epoch": 0.22858632261427686, "percentage": 22.86, "elapsed_time": "1:22:12", "remaining_time": "4:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 3836, "loss": 0.1897, "learning_rate": 4.575375256669276e-06, "epoch": 0.2288469683641221, "percentage": 22.89, "elapsed_time": "1:22:17", "remaining_time": "4:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 879, "total_steps": 3836, "loss": 0.1792, "learning_rate": 4.5741728091960645e-06, "epoch": 0.22910761411396735, "percentage": 22.91, "elapsed_time": "1:22:23", "remaining_time": "4:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 3836, "loss": 0.1991, "learning_rate": 4.572968820065288e-06, "epoch": 0.2293682598638126, "percentage": 22.94, "elapsed_time": "1:22:29", "remaining_time": "4:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 881, "total_steps": 3836, "loss": 0.1961, "learning_rate": 4.571763290171827e-06, "epoch": 0.22962890561365784, "percentage": 22.97, "elapsed_time": "1:22:34", "remaining_time": "4:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 3836, "loss": 0.2018, "learning_rate": 4.570556220411708e-06, "epoch": 0.2298895513635031, "percentage": 22.99, "elapsed_time": "1:22:39", "remaining_time": "4:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 883, "total_steps": 3836, "loss": 0.1871, "learning_rate": 4.569347611682104e-06, "epoch": 0.23015019711334833, "percentage": 23.02, "elapsed_time": "1:22:45", "remaining_time": "4:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 3836, "loss": 0.1947, "learning_rate": 4.568137464881328e-06, "epoch": 0.23041084286319355, "percentage": 23.04, "elapsed_time": "1:22:50", "remaining_time": "4:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 3836, "loss": 0.1963, "learning_rate": 4.5669257809088394e-06, "epoch": 0.2306714886130388, "percentage": 23.07, "elapsed_time": "1:22:56", "remaining_time": "4:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 3836, "loss": 0.187, "learning_rate": 4.5657125606652385e-06, "epoch": 0.23093213436288404, "percentage": 23.1, "elapsed_time": "1:23:01", "remaining_time": "4:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 887, "total_steps": 3836, "loss": 0.1841, "learning_rate": 4.564497805052269e-06, "epoch": 0.23119278011272928, "percentage": 23.12, "elapsed_time": "1:23:07", "remaining_time": "4:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 3836, "loss": 0.1938, "learning_rate": 4.563281514972814e-06, "epoch": 0.23145342586257453, "percentage": 23.15, "elapsed_time": "1:23:12", "remaining_time": "4:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 889, "total_steps": 3836, "loss": 0.2047, "learning_rate": 4.562063691330897e-06, "epoch": 0.23171407161241978, "percentage": 23.18, "elapsed_time": "1:23:17", "remaining_time": "4:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 3836, "loss": 0.1868, "learning_rate": 4.560844335031684e-06, "epoch": 0.23197471736226502, "percentage": 23.2, "elapsed_time": "1:23:23", "remaining_time": "4:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 891, "total_steps": 3836, "loss": 0.199, "learning_rate": 4.5596234469814775e-06, "epoch": 0.23223536311211027, "percentage": 23.23, "elapsed_time": "1:23:28", "remaining_time": "4:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 3836, "loss": 0.1947, "learning_rate": 4.55840102808772e-06, "epoch": 0.23249600886195548, "percentage": 23.25, "elapsed_time": "1:23:34", "remaining_time": "4:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 893, "total_steps": 3836, "loss": 0.1941, "learning_rate": 4.557177079258989e-06, "epoch": 0.23275665461180073, "percentage": 23.28, "elapsed_time": "1:23:40", "remaining_time": "4:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 3836, "loss": 0.1912, "learning_rate": 4.555951601405005e-06, "epoch": 0.23301730036164597, "percentage": 23.31, "elapsed_time": "1:23:45", "remaining_time": "4:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 3836, "loss": 0.2008, "learning_rate": 4.5547245954366185e-06, "epoch": 0.23327794611149122, "percentage": 23.33, "elapsed_time": "1:23:51", "remaining_time": "4:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 3836, "loss": 0.1915, "learning_rate": 4.55349606226582e-06, "epoch": 0.23353859186133646, "percentage": 23.36, "elapsed_time": "1:23:56", "remaining_time": "4:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 897, "total_steps": 3836, "loss": 0.1891, "learning_rate": 4.552266002805732e-06, "epoch": 0.2337992376111817, "percentage": 23.38, "elapsed_time": "1:24:02", "remaining_time": "4:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 3836, "loss": 0.1964, "learning_rate": 4.551034417970616e-06, "epoch": 0.23405988336102695, "percentage": 23.41, "elapsed_time": "1:24:08", "remaining_time": "4:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 899, "total_steps": 3836, "loss": 0.1796, "learning_rate": 4.549801308675862e-06, "epoch": 0.23432052911087217, "percentage": 23.44, "elapsed_time": "1:24:13", "remaining_time": "4:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 3836, "loss": 0.1938, "learning_rate": 4.548566675837996e-06, "epoch": 0.23458117486071742, "percentage": 23.46, "elapsed_time": "1:24:19", "remaining_time": "4:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 901, "total_steps": 3836, "loss": 0.1798, "learning_rate": 4.547330520374677e-06, "epoch": 0.23484182061056266, "percentage": 23.49, "elapsed_time": "1:24:24", "remaining_time": "4:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 3836, "loss": 0.1758, "learning_rate": 4.546092843204694e-06, "epoch": 0.2351024663604079, "percentage": 23.51, "elapsed_time": "1:24:30", "remaining_time": "4:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 903, "total_steps": 3836, "loss": 0.1895, "learning_rate": 4.544853645247966e-06, "epoch": 0.23536311211025315, "percentage": 23.54, "elapsed_time": "1:24:35", "remaining_time": "4:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 3836, "loss": 0.1804, "learning_rate": 4.543612927425547e-06, "epoch": 0.2356237578600984, "percentage": 23.57, "elapsed_time": "1:24:41", "remaining_time": "4:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 3836, "loss": 0.1938, "learning_rate": 4.542370690659615e-06, "epoch": 0.23588440360994364, "percentage": 23.59, "elapsed_time": "1:24:47", "remaining_time": "4:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 3836, "loss": 0.1717, "learning_rate": 4.541126935873481e-06, "epoch": 0.2361450493597889, "percentage": 23.62, "elapsed_time": "1:24:53", "remaining_time": "4:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 907, "total_steps": 3836, "loss": 0.1817, "learning_rate": 4.539881663991583e-06, "epoch": 0.2364056951096341, "percentage": 23.64, "elapsed_time": "1:24:58", "remaining_time": "4:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 3836, "loss": 0.1842, "learning_rate": 4.538634875939486e-06, "epoch": 0.23666634085947935, "percentage": 23.67, "elapsed_time": "1:25:04", "remaining_time": "4:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 909, "total_steps": 3836, "loss": 0.1742, "learning_rate": 4.537386572643882e-06, "epoch": 0.2369269866093246, "percentage": 23.7, "elapsed_time": "1:25:10", "remaining_time": "4:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 3836, "loss": 0.1848, "learning_rate": 4.536136755032592e-06, "epoch": 0.23718763235916984, "percentage": 23.72, "elapsed_time": "1:25:15", "remaining_time": "4:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 911, "total_steps": 3836, "loss": 0.2025, "learning_rate": 4.534885424034557e-06, "epoch": 0.2374482781090151, "percentage": 23.75, "elapsed_time": "1:25:20", "remaining_time": "4:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 3836, "loss": 0.1834, "learning_rate": 4.5336325805798475e-06, "epoch": 0.23770892385886033, "percentage": 23.77, "elapsed_time": "1:25:26", "remaining_time": "4:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 913, "total_steps": 3836, "loss": 0.1953, "learning_rate": 4.532378225599657e-06, "epoch": 0.23796956960870558, "percentage": 23.8, "elapsed_time": "1:25:31", "remaining_time": "4:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 3836, "loss": 0.1843, "learning_rate": 4.5311223600263016e-06, "epoch": 0.23823021535855082, "percentage": 23.83, "elapsed_time": "1:25:37", "remaining_time": "4:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 3836, "loss": 0.1801, "learning_rate": 4.529864984793221e-06, "epoch": 0.23849086110839604, "percentage": 23.85, "elapsed_time": "1:25:42", "remaining_time": "4:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 3836, "loss": 0.1772, "learning_rate": 4.528606100834976e-06, "epoch": 0.23875150685824129, "percentage": 23.88, "elapsed_time": "1:25:48", "remaining_time": "4:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 917, "total_steps": 3836, "loss": 0.1814, "learning_rate": 4.527345709087251e-06, "epoch": 0.23901215260808653, "percentage": 23.91, "elapsed_time": "1:25:55", "remaining_time": "4:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 3836, "loss": 0.1679, "learning_rate": 4.526083810486848e-06, "epoch": 0.23927279835793178, "percentage": 23.93, "elapsed_time": "1:26:01", "remaining_time": "4:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 919, "total_steps": 3836, "loss": 0.1945, "learning_rate": 4.524820405971691e-06, "epoch": 0.23953344410777702, "percentage": 23.96, "elapsed_time": "1:26:06", "remaining_time": "4:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 3836, "loss": 0.1873, "learning_rate": 4.523555496480824e-06, "epoch": 0.23979408985762227, "percentage": 23.98, "elapsed_time": "1:26:12", "remaining_time": "4:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 921, "total_steps": 3836, "loss": 0.1954, "learning_rate": 4.522289082954406e-06, "epoch": 0.2400547356074675, "percentage": 24.01, "elapsed_time": "1:26:18", "remaining_time": "4:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 3836, "loss": 0.1856, "learning_rate": 4.5210211663337195e-06, "epoch": 0.24031538135731273, "percentage": 24.04, "elapsed_time": "1:26:23", "remaining_time": "4:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 923, "total_steps": 3836, "loss": 0.1945, "learning_rate": 4.519751747561158e-06, "epoch": 0.24057602710715797, "percentage": 24.06, "elapsed_time": "1:26:28", "remaining_time": "4:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 3836, "loss": 0.1989, "learning_rate": 4.518480827580237e-06, "epoch": 0.24083667285700322, "percentage": 24.09, "elapsed_time": "1:26:34", "remaining_time": "4:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 3836, "loss": 0.1688, "learning_rate": 4.517208407335584e-06, "epoch": 0.24109731860684847, "percentage": 24.11, "elapsed_time": "1:26:40", "remaining_time": "4:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 3836, "loss": 0.2017, "learning_rate": 4.515934487772942e-06, "epoch": 0.2413579643566937, "percentage": 24.14, "elapsed_time": "1:26:46", "remaining_time": "4:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 927, "total_steps": 3836, "loss": 0.2061, "learning_rate": 4.5146590698391714e-06, "epoch": 0.24161861010653896, "percentage": 24.17, "elapsed_time": "1:26:51", "remaining_time": "4:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 3836, "loss": 0.1866, "learning_rate": 4.513382154482242e-06, "epoch": 0.2418792558563842, "percentage": 24.19, "elapsed_time": "1:26:56", "remaining_time": "4:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 929, "total_steps": 3836, "loss": 0.1826, "learning_rate": 4.512103742651241e-06, "epoch": 0.24213990160622945, "percentage": 24.22, "elapsed_time": "1:27:02", "remaining_time": "4:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 3836, "loss": 0.1873, "learning_rate": 4.510823835296364e-06, "epoch": 0.24240054735607466, "percentage": 24.24, "elapsed_time": "1:27:07", "remaining_time": "4:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 931, "total_steps": 3836, "loss": 0.1675, "learning_rate": 4.509542433368921e-06, "epoch": 0.2426611931059199, "percentage": 24.27, "elapsed_time": "1:27:13", "remaining_time": "4:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 3836, "loss": 0.1921, "learning_rate": 4.50825953782133e-06, "epoch": 0.24292183885576515, "percentage": 24.3, "elapsed_time": "1:27:19", "remaining_time": "4:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 933, "total_steps": 3836, "loss": 0.1926, "learning_rate": 4.5069751496071225e-06, "epoch": 0.2431824846056104, "percentage": 24.32, "elapsed_time": "1:27:24", "remaining_time": "4:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 3836, "loss": 0.1937, "learning_rate": 4.505689269680937e-06, "epoch": 0.24344313035545564, "percentage": 24.35, "elapsed_time": "1:27:29", "remaining_time": "4:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 3836, "loss": 0.2022, "learning_rate": 4.504401898998522e-06, "epoch": 0.2437037761053009, "percentage": 24.37, "elapsed_time": "1:27:35", "remaining_time": "4:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 3836, "loss": 0.1966, "learning_rate": 4.503113038516732e-06, "epoch": 0.24396442185514614, "percentage": 24.4, "elapsed_time": "1:27:41", "remaining_time": "4:31:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 937, "total_steps": 3836, "loss": 0.1808, "learning_rate": 4.501822689193532e-06, "epoch": 0.24422506760499135, "percentage": 24.43, "elapsed_time": "1:27:47", "remaining_time": "4:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 3836, "loss": 0.1942, "learning_rate": 4.500530851987992e-06, "epoch": 0.2444857133548366, "percentage": 24.45, "elapsed_time": "1:27:53", "remaining_time": "4:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 939, "total_steps": 3836, "loss": 0.1828, "learning_rate": 4.499237527860287e-06, "epoch": 0.24474635910468184, "percentage": 24.48, "elapsed_time": "1:27:58", "remaining_time": "4:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 3836, "loss": 0.1939, "learning_rate": 4.4979427177716974e-06, "epoch": 0.2450070048545271, "percentage": 24.5, "elapsed_time": "1:28:04", "remaining_time": "4:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 941, "total_steps": 3836, "loss": 0.167, "learning_rate": 4.4966464226846105e-06, "epoch": 0.24526765060437233, "percentage": 24.53, "elapsed_time": "1:28:09", "remaining_time": "4:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 3836, "loss": 0.1855, "learning_rate": 4.495348643562514e-06, "epoch": 0.24552829635421758, "percentage": 24.56, "elapsed_time": "1:28:15", "remaining_time": "4:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 943, "total_steps": 3836, "loss": 0.1745, "learning_rate": 4.494049381370002e-06, "epoch": 0.24578894210406282, "percentage": 24.58, "elapsed_time": "1:28:20", "remaining_time": "4:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 3836, "loss": 0.1715, "learning_rate": 4.4927486370727656e-06, "epoch": 0.24604958785390807, "percentage": 24.61, "elapsed_time": "1:28:26", "remaining_time": "4:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 3836, "loss": 0.1972, "learning_rate": 4.491446411637605e-06, "epoch": 0.2463102336037533, "percentage": 24.64, "elapsed_time": "1:28:31", "remaining_time": "4:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 3836, "loss": 0.1817, "learning_rate": 4.4901427060324135e-06, "epoch": 0.24657087935359853, "percentage": 24.66, "elapsed_time": "1:28:37", "remaining_time": "4:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 947, "total_steps": 3836, "loss": 0.1899, "learning_rate": 4.488837521226192e-06, "epoch": 0.24683152510344378, "percentage": 24.69, "elapsed_time": "1:28:42", "remaining_time": "4:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 3836, "loss": 0.187, "learning_rate": 4.487530858189033e-06, "epoch": 0.24709217085328902, "percentage": 24.71, "elapsed_time": "1:28:49", "remaining_time": "4:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 949, "total_steps": 3836, "loss": 0.1931, "learning_rate": 4.486222717892135e-06, "epoch": 0.24735281660313427, "percentage": 24.74, "elapsed_time": "1:28:54", "remaining_time": "4:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 3836, "loss": 0.1742, "learning_rate": 4.4849131013077915e-06, "epoch": 0.2476134623529795, "percentage": 24.77, "elapsed_time": "1:29:00", "remaining_time": "4:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 951, "total_steps": 3836, "loss": 0.1787, "learning_rate": 4.483602009409391e-06, "epoch": 0.24787410810282476, "percentage": 24.79, "elapsed_time": "1:29:05", "remaining_time": "4:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 3836, "loss": 0.1914, "learning_rate": 4.482289443171421e-06, "epoch": 0.24813475385267, "percentage": 24.82, "elapsed_time": "1:29:12", "remaining_time": "4:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 953, "total_steps": 3836, "loss": 0.1897, "learning_rate": 4.480975403569466e-06, "epoch": 0.24839539960251522, "percentage": 24.84, "elapsed_time": "1:29:17", "remaining_time": "4:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 3836, "loss": 0.1913, "learning_rate": 4.479659891580203e-06, "epoch": 0.24865604535236047, "percentage": 24.87, "elapsed_time": "1:29:23", "remaining_time": "4:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 3836, "loss": 0.1754, "learning_rate": 4.478342908181404e-06, "epoch": 0.2489166911022057, "percentage": 24.9, "elapsed_time": "1:29:29", "remaining_time": "4:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 3836, "loss": 0.1799, "learning_rate": 4.477024454351937e-06, "epoch": 0.24917733685205096, "percentage": 24.92, "elapsed_time": "1:29:35", "remaining_time": "4:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 957, "total_steps": 3836, "loss": 0.1886, "learning_rate": 4.475704531071759e-06, "epoch": 0.2494379826018962, "percentage": 24.95, "elapsed_time": "1:29:40", "remaining_time": "4:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 3836, "loss": 0.1853, "learning_rate": 4.4743831393219215e-06, "epoch": 0.24969862835174145, "percentage": 24.97, "elapsed_time": "1:29:45", "remaining_time": "4:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 959, "total_steps": 3836, "loss": 0.1985, "learning_rate": 4.473060280084568e-06, "epoch": 0.2499592741015867, "percentage": 25.0, "elapsed_time": "1:29:51", "remaining_time": "4:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 3836, "loss": 0.1996, "learning_rate": 4.471735954342932e-06, "epoch": 0.25021991985143194, "percentage": 25.03, "elapsed_time": "1:29:56", "remaining_time": "4:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 961, "total_steps": 3836, "loss": 0.1845, "learning_rate": 4.470410163081336e-06, "epoch": 0.2504805656012772, "percentage": 25.05, "elapsed_time": "1:30:02", "remaining_time": "4:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 3836, "loss": 0.189, "learning_rate": 4.469082907285192e-06, "epoch": 0.25074121135112243, "percentage": 25.08, "elapsed_time": "1:30:07", "remaining_time": "4:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 963, "total_steps": 3836, "loss": 0.1777, "learning_rate": 4.4677541879410025e-06, "epoch": 0.2510018571009677, "percentage": 25.1, "elapsed_time": "1:30:13", "remaining_time": "4:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 3836, "loss": 0.1882, "learning_rate": 4.4664240060363565e-06, "epoch": 0.25126250285081286, "percentage": 25.13, "elapsed_time": "1:30:19", "remaining_time": "4:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 3836, "loss": 0.1969, "learning_rate": 4.465092362559929e-06, "epoch": 0.2515231486006581, "percentage": 25.16, "elapsed_time": "1:30:24", "remaining_time": "4:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 3836, "loss": 0.1729, "learning_rate": 4.463759258501485e-06, "epoch": 0.25178379435050335, "percentage": 25.18, "elapsed_time": "1:30:30", "remaining_time": "4:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 967, "total_steps": 3836, "loss": 0.1969, "learning_rate": 4.4624246948518685e-06, "epoch": 0.2520444401003486, "percentage": 25.21, "elapsed_time": "1:30:35", "remaining_time": "4:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 3836, "loss": 0.1766, "learning_rate": 4.461088672603015e-06, "epoch": 0.25230508585019384, "percentage": 25.23, "elapsed_time": "1:30:41", "remaining_time": "4:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 969, "total_steps": 3836, "loss": 0.1886, "learning_rate": 4.459751192747941e-06, "epoch": 0.2525657316000391, "percentage": 25.26, "elapsed_time": "1:30:47", "remaining_time": "4:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 3836, "loss": 0.1851, "learning_rate": 4.458412256280747e-06, "epoch": 0.25282637734988433, "percentage": 25.29, "elapsed_time": "1:30:53", "remaining_time": "4:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 971, "total_steps": 3836, "loss": 0.1951, "learning_rate": 4.457071864196616e-06, "epoch": 0.2530870230997296, "percentage": 25.31, "elapsed_time": "1:30:59", "remaining_time": "4:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 3836, "loss": 0.1917, "learning_rate": 4.455730017491812e-06, "epoch": 0.2533476688495748, "percentage": 25.34, "elapsed_time": "1:31:04", "remaining_time": "4:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 973, "total_steps": 3836, "loss": 0.1927, "learning_rate": 4.454386717163682e-06, "epoch": 0.25360831459942007, "percentage": 25.36, "elapsed_time": "1:31:10", "remaining_time": "4:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 3836, "loss": 0.1936, "learning_rate": 4.453041964210653e-06, "epoch": 0.2538689603492653, "percentage": 25.39, "elapsed_time": "1:31:15", "remaining_time": "4:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 3836, "loss": 0.1883, "learning_rate": 4.451695759632229e-06, "epoch": 0.25412960609911056, "percentage": 25.42, "elapsed_time": "1:31:21", "remaining_time": "4:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 3836, "loss": 0.2, "learning_rate": 4.450348104428998e-06, "epoch": 0.2543902518489558, "percentage": 25.44, "elapsed_time": "1:31:26", "remaining_time": "4:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 977, "total_steps": 3836, "loss": 0.1839, "learning_rate": 4.448998999602621e-06, "epoch": 0.25465089759880105, "percentage": 25.47, "elapsed_time": "1:31:32", "remaining_time": "4:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 3836, "loss": 0.1873, "learning_rate": 4.447648446155841e-06, "epoch": 0.2549115433486463, "percentage": 25.5, "elapsed_time": "1:31:38", "remaining_time": "4:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 979, "total_steps": 3836, "loss": 0.1791, "learning_rate": 4.446296445092473e-06, "epoch": 0.2551721890984915, "percentage": 25.52, "elapsed_time": "1:31:43", "remaining_time": "4:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 3836, "loss": 0.1885, "learning_rate": 4.4449429974174115e-06, "epoch": 0.25543283484833673, "percentage": 25.55, "elapsed_time": "1:31:49", "remaining_time": "4:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 981, "total_steps": 3836, "loss": 0.1895, "learning_rate": 4.443588104136626e-06, "epoch": 0.255693480598182, "percentage": 25.57, "elapsed_time": "1:31:53", "remaining_time": "4:27:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 3836, "loss": 0.1707, "learning_rate": 4.442231766257159e-06, "epoch": 0.2559541263480272, "percentage": 25.6, "elapsed_time": "1:31:59", "remaining_time": "4:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 983, "total_steps": 3836, "loss": 0.1876, "learning_rate": 4.440873984787127e-06, "epoch": 0.25621477209787247, "percentage": 25.63, "elapsed_time": "1:32:05", "remaining_time": "4:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 3836, "loss": 0.1934, "learning_rate": 4.43951476073572e-06, "epoch": 0.2564754178477177, "percentage": 25.65, "elapsed_time": "1:32:10", "remaining_time": "4:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 3836, "loss": 0.1857, "learning_rate": 4.4381540951132e-06, "epoch": 0.25673606359756296, "percentage": 25.68, "elapsed_time": "1:32:16", "remaining_time": "4:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 3836, "loss": 0.1681, "learning_rate": 4.436791988930901e-06, "epoch": 0.2569967093474082, "percentage": 25.7, "elapsed_time": "1:32:21", "remaining_time": "4:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 987, "total_steps": 3836, "loss": 0.1648, "learning_rate": 4.435428443201226e-06, "epoch": 0.25725735509725345, "percentage": 25.73, "elapsed_time": "1:32:27", "remaining_time": "4:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 3836, "loss": 0.1788, "learning_rate": 4.434063458937652e-06, "epoch": 0.2575180008470987, "percentage": 25.76, "elapsed_time": "1:32:32", "remaining_time": "4:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 989, "total_steps": 3836, "loss": 0.1861, "learning_rate": 4.432697037154718e-06, "epoch": 0.25777864659694394, "percentage": 25.78, "elapsed_time": "1:32:38", "remaining_time": "4:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 3836, "loss": 0.1841, "learning_rate": 4.43132917886804e-06, "epoch": 0.2580392923467892, "percentage": 25.81, "elapsed_time": "1:32:44", "remaining_time": "4:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 991, "total_steps": 3836, "loss": 0.1999, "learning_rate": 4.429959885094295e-06, "epoch": 0.25829993809663443, "percentage": 25.83, "elapsed_time": "1:32:49", "remaining_time": "4:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 3836, "loss": 0.1956, "learning_rate": 4.428589156851231e-06, "epoch": 0.2585605838464797, "percentage": 25.86, "elapsed_time": "1:32:54", "remaining_time": "4:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 993, "total_steps": 3836, "loss": 0.1797, "learning_rate": 4.42721699515766e-06, "epoch": 0.2588212295963249, "percentage": 25.89, "elapsed_time": "1:32:59", "remaining_time": "4:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 3836, "loss": 0.199, "learning_rate": 4.42584340103346e-06, "epoch": 0.2590818753461701, "percentage": 25.91, "elapsed_time": "1:33:06", "remaining_time": "4:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 3836, "loss": 0.185, "learning_rate": 4.424468375499573e-06, "epoch": 0.25934252109601535, "percentage": 25.94, "elapsed_time": "1:33:12", "remaining_time": "4:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 3836, "loss": 0.1826, "learning_rate": 4.423091919578008e-06, "epoch": 0.2596031668458606, "percentage": 25.96, "elapsed_time": "1:33:18", "remaining_time": "4:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 997, "total_steps": 3836, "loss": 0.1762, "learning_rate": 4.421714034291833e-06, "epoch": 0.25986381259570585, "percentage": 25.99, "elapsed_time": "1:33:23", "remaining_time": "4:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 3836, "loss": 0.1741, "learning_rate": 4.4203347206651805e-06, "epoch": 0.2601244583455511, "percentage": 26.02, "elapsed_time": "1:33:29", "remaining_time": "4:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 999, "total_steps": 3836, "loss": 0.1985, "learning_rate": 4.418953979723244e-06, "epoch": 0.26038510409539634, "percentage": 26.04, "elapsed_time": "1:33:35", "remaining_time": "4:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 3836, "loss": 0.1762, "learning_rate": 4.417571812492279e-06, "epoch": 0.2606457498452416, "percentage": 26.07, "elapsed_time": "1:33:41", "remaining_time": "4:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 3836, "eval_loss": 0.18625357747077942, "epoch": 0.2606457498452416, "percentage": 26.07, "elapsed_time": "1:34:36", "remaining_time": "4:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1001, "total_steps": 3836, "loss": 0.1833, "learning_rate": 4.416188219999601e-06, "epoch": 0.2609063955950868, "percentage": 26.09, "elapsed_time": "1:34:41", "remaining_time": "4:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 3836, "loss": 0.1926, "learning_rate": 4.4148032032735835e-06, "epoch": 0.26116704134493207, "percentage": 26.12, "elapsed_time": "1:34:46", "remaining_time": "4:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1003, "total_steps": 3836, "loss": 0.1858, "learning_rate": 4.41341676334366e-06, "epoch": 0.2614276870947773, "percentage": 26.15, "elapsed_time": "1:34:52", "remaining_time": "4:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 3836, "loss": 0.183, "learning_rate": 4.4120289012403185e-06, "epoch": 0.26168833284462256, "percentage": 26.17, "elapsed_time": "1:34:57", "remaining_time": "4:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 3836, "loss": 0.175, "learning_rate": 4.410639617995109e-06, "epoch": 0.2619489785944678, "percentage": 26.2, "elapsed_time": "1:35:03", "remaining_time": "4:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 3836, "loss": 0.1828, "learning_rate": 4.409248914640636e-06, "epoch": 0.26220962434431305, "percentage": 26.23, "elapsed_time": "1:35:08", "remaining_time": "4:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1007, "total_steps": 3836, "loss": 0.1988, "learning_rate": 4.407856792210558e-06, "epoch": 0.2624702700941583, "percentage": 26.25, "elapsed_time": "1:35:13", "remaining_time": "4:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 3836, "loss": 0.1741, "learning_rate": 4.4064632517395875e-06, "epoch": 0.26273091584400354, "percentage": 26.28, "elapsed_time": "1:35:18", "remaining_time": "4:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1009, "total_steps": 3836, "loss": 0.1816, "learning_rate": 4.405068294263496e-06, "epoch": 0.26299156159384873, "percentage": 26.3, "elapsed_time": "1:35:24", "remaining_time": "4:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 3836, "loss": 0.1785, "learning_rate": 4.4036719208191025e-06, "epoch": 0.263252207343694, "percentage": 26.33, "elapsed_time": "1:35:30", "remaining_time": "4:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1011, "total_steps": 3836, "loss": 0.1748, "learning_rate": 4.402274132444282e-06, "epoch": 0.2635128530935392, "percentage": 26.36, "elapsed_time": "1:35:36", "remaining_time": "4:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 3836, "loss": 0.1839, "learning_rate": 4.400874930177959e-06, "epoch": 0.26377349884338447, "percentage": 26.38, "elapsed_time": "1:35:41", "remaining_time": "4:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1013, "total_steps": 3836, "loss": 0.1726, "learning_rate": 4.399474315060111e-06, "epoch": 0.2640341445932297, "percentage": 26.41, "elapsed_time": "1:35:47", "remaining_time": "4:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 3836, "loss": 0.1794, "learning_rate": 4.398072288131763e-06, "epoch": 0.26429479034307496, "percentage": 26.43, "elapsed_time": "1:35:52", "remaining_time": "4:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 3836, "loss": 0.1902, "learning_rate": 4.396668850434993e-06, "epoch": 0.2645554360929202, "percentage": 26.46, "elapsed_time": "1:35:58", "remaining_time": "4:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 3836, "loss": 0.1857, "learning_rate": 4.395264003012924e-06, "epoch": 0.26481608184276545, "percentage": 26.49, "elapsed_time": "1:36:04", "remaining_time": "4:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1017, "total_steps": 3836, "loss": 0.1832, "learning_rate": 4.393857746909728e-06, "epoch": 0.2650767275926107, "percentage": 26.51, "elapsed_time": "1:36:09", "remaining_time": "4:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 3836, "loss": 0.1692, "learning_rate": 4.392450083170625e-06, "epoch": 0.26533737334245594, "percentage": 26.54, "elapsed_time": "1:36:14", "remaining_time": "4:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1019, "total_steps": 3836, "loss": 0.2013, "learning_rate": 4.3910410128418805e-06, "epoch": 0.2655980190923012, "percentage": 26.56, "elapsed_time": "1:36:20", "remaining_time": "4:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 3836, "loss": 0.1824, "learning_rate": 4.389630536970806e-06, "epoch": 0.26585866484214643, "percentage": 26.59, "elapsed_time": "1:36:26", "remaining_time": "4:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1021, "total_steps": 3836, "loss": 0.1911, "learning_rate": 4.388218656605755e-06, "epoch": 0.2661193105919917, "percentage": 26.62, "elapsed_time": "1:36:31", "remaining_time": "4:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 3836, "loss": 0.1993, "learning_rate": 4.386805372796129e-06, "epoch": 0.2663799563418369, "percentage": 26.64, "elapsed_time": "1:36:37", "remaining_time": "4:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1023, "total_steps": 3836, "loss": 0.1782, "learning_rate": 4.38539068659237e-06, "epoch": 0.26664060209168217, "percentage": 26.67, "elapsed_time": "1:36:43", "remaining_time": "4:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 3836, "loss": 0.1876, "learning_rate": 4.383974599045963e-06, "epoch": 0.2669012478415274, "percentage": 26.69, "elapsed_time": "1:36:49", "remaining_time": "4:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 3836, "loss": 0.2014, "learning_rate": 4.382557111209436e-06, "epoch": 0.2671618935913726, "percentage": 26.72, "elapsed_time": "1:36:55", "remaining_time": "4:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1026, "total_steps": 3836, "loss": 0.1879, "learning_rate": 4.3811382241363545e-06, "epoch": 0.26742253934121785, "percentage": 26.75, "elapsed_time": "1:37:01", "remaining_time": "4:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1027, "total_steps": 3836, "loss": 0.1875, "learning_rate": 4.379717938881326e-06, "epoch": 0.2676831850910631, "percentage": 26.77, "elapsed_time": "1:37:07", "remaining_time": "4:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1028, "total_steps": 3836, "loss": 0.1713, "learning_rate": 4.378296256499998e-06, "epoch": 0.26794383084090834, "percentage": 26.8, "elapsed_time": "1:37:12", "remaining_time": "4:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1029, "total_steps": 3836, "loss": 0.1901, "learning_rate": 4.376873178049056e-06, "epoch": 0.2682044765907536, "percentage": 26.82, "elapsed_time": "1:37:18", "remaining_time": "4:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 3836, "loss": 0.1912, "learning_rate": 4.375448704586221e-06, "epoch": 0.2684651223405988, "percentage": 26.85, "elapsed_time": "1:37:23", "remaining_time": "4:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1031, "total_steps": 3836, "loss": 0.1911, "learning_rate": 4.374022837170254e-06, "epoch": 0.2687257680904441, "percentage": 26.88, "elapsed_time": "1:37:29", "remaining_time": "4:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1032, "total_steps": 3836, "loss": 0.2033, "learning_rate": 4.37259557686095e-06, "epoch": 0.2689864138402893, "percentage": 26.9, "elapsed_time": "1:37:35", "remaining_time": "4:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1033, "total_steps": 3836, "loss": 0.1725, "learning_rate": 4.37116692471914e-06, "epoch": 0.26924705959013456, "percentage": 26.93, "elapsed_time": "1:37:39", "remaining_time": "4:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1034, "total_steps": 3836, "loss": 0.1925, "learning_rate": 4.369736881806691e-06, "epoch": 0.2695077053399798, "percentage": 26.96, "elapsed_time": "1:37:44", "remaining_time": "4:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1035, "total_steps": 3836, "loss": 0.1754, "learning_rate": 4.368305449186499e-06, "epoch": 0.26976835108982505, "percentage": 26.98, "elapsed_time": "1:37:50", "remaining_time": "4:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1036, "total_steps": 3836, "loss": 0.184, "learning_rate": 4.366872627922498e-06, "epoch": 0.2700289968396703, "percentage": 27.01, "elapsed_time": "1:37:55", "remaining_time": "4:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1037, "total_steps": 3836, "loss": 0.1803, "learning_rate": 4.365438419079652e-06, "epoch": 0.27028964258951554, "percentage": 27.03, "elapsed_time": "1:38:00", "remaining_time": "4:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1038, "total_steps": 3836, "loss": 0.1915, "learning_rate": 4.364002823723956e-06, "epoch": 0.2705502883393608, "percentage": 27.06, "elapsed_time": "1:38:06", "remaining_time": "4:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1039, "total_steps": 3836, "loss": 0.1908, "learning_rate": 4.3625658429224374e-06, "epoch": 0.27081093408920603, "percentage": 27.09, "elapsed_time": "1:38:11", "remaining_time": "4:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 3836, "loss": 0.1831, "learning_rate": 4.36112747774315e-06, "epoch": 0.2710715798390512, "percentage": 27.11, "elapsed_time": "1:38:16", "remaining_time": "4:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1041, "total_steps": 3836, "loss": 0.1749, "learning_rate": 4.359687729255181e-06, "epoch": 0.27133222558889647, "percentage": 27.14, "elapsed_time": "1:38:21", "remaining_time": "4:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1042, "total_steps": 3836, "loss": 0.1884, "learning_rate": 4.358246598528641e-06, "epoch": 0.2715928713387417, "percentage": 27.16, "elapsed_time": "1:38:27", "remaining_time": "4:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1043, "total_steps": 3836, "loss": 0.1812, "learning_rate": 4.356804086634671e-06, "epoch": 0.27185351708858696, "percentage": 27.19, "elapsed_time": "1:38:32", "remaining_time": "4:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1044, "total_steps": 3836, "loss": 0.1825, "learning_rate": 4.355360194645439e-06, "epoch": 0.2721141628384322, "percentage": 27.22, "elapsed_time": "1:38:38", "remaining_time": "4:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1045, "total_steps": 3836, "loss": 0.1905, "learning_rate": 4.353914923634136e-06, "epoch": 0.27237480858827745, "percentage": 27.24, "elapsed_time": "1:38:44", "remaining_time": "4:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1046, "total_steps": 3836, "loss": 0.1707, "learning_rate": 4.35246827467498e-06, "epoch": 0.2726354543381227, "percentage": 27.27, "elapsed_time": "1:38:50", "remaining_time": "4:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1047, "total_steps": 3836, "loss": 0.1754, "learning_rate": 4.3510202488432155e-06, "epoch": 0.27289610008796794, "percentage": 27.29, "elapsed_time": "1:38:56", "remaining_time": "4:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1048, "total_steps": 3836, "loss": 0.1926, "learning_rate": 4.349570847215104e-06, "epoch": 0.2731567458378132, "percentage": 27.32, "elapsed_time": "1:39:02", "remaining_time": "4:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1049, "total_steps": 3836, "loss": 0.1776, "learning_rate": 4.348120070867934e-06, "epoch": 0.27341739158765843, "percentage": 27.35, "elapsed_time": "1:39:07", "remaining_time": "4:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 3836, "loss": 0.186, "learning_rate": 4.346667920880016e-06, "epoch": 0.2736780373375037, "percentage": 27.37, "elapsed_time": "1:39:13", "remaining_time": "4:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1051, "total_steps": 3836, "loss": 0.1825, "learning_rate": 4.34521439833068e-06, "epoch": 0.2739386830873489, "percentage": 27.4, "elapsed_time": "1:39:18", "remaining_time": "4:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1052, "total_steps": 3836, "loss": 0.1896, "learning_rate": 4.343759504300278e-06, "epoch": 0.27419932883719417, "percentage": 27.42, "elapsed_time": "1:39:24", "remaining_time": "4:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1053, "total_steps": 3836, "loss": 0.174, "learning_rate": 4.3423032398701785e-06, "epoch": 0.2744599745870394, "percentage": 27.45, "elapsed_time": "1:39:30", "remaining_time": "4:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1054, "total_steps": 3836, "loss": 0.1655, "learning_rate": 4.34084560612277e-06, "epoch": 0.27472062033688466, "percentage": 27.48, "elapsed_time": "1:39:36", "remaining_time": "4:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1055, "total_steps": 3836, "loss": 0.1879, "learning_rate": 4.33938660414146e-06, "epoch": 0.27498126608672985, "percentage": 27.5, "elapsed_time": "1:39:41", "remaining_time": "4:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1056, "total_steps": 3836, "loss": 0.1694, "learning_rate": 4.337926235010672e-06, "epoch": 0.2752419118365751, "percentage": 27.53, "elapsed_time": "1:39:47", "remaining_time": "4:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1057, "total_steps": 3836, "loss": 0.1764, "learning_rate": 4.336464499815844e-06, "epoch": 0.27550255758642034, "percentage": 27.55, "elapsed_time": "1:39:52", "remaining_time": "4:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1058, "total_steps": 3836, "loss": 0.1883, "learning_rate": 4.335001399643433e-06, "epoch": 0.2757632033362656, "percentage": 27.58, "elapsed_time": "1:39:58", "remaining_time": "4:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1059, "total_steps": 3836, "loss": 0.1737, "learning_rate": 4.333536935580905e-06, "epoch": 0.27602384908611083, "percentage": 27.61, "elapsed_time": "1:40:03", "remaining_time": "4:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 3836, "loss": 0.1819, "learning_rate": 4.332071108716747e-06, "epoch": 0.2762844948359561, "percentage": 27.63, "elapsed_time": "1:40:08", "remaining_time": "4:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1061, "total_steps": 3836, "loss": 0.1731, "learning_rate": 4.330603920140453e-06, "epoch": 0.2765451405858013, "percentage": 27.66, "elapsed_time": "1:40:13", "remaining_time": "4:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1062, "total_steps": 3836, "loss": 0.1692, "learning_rate": 4.329135370942531e-06, "epoch": 0.27680578633564656, "percentage": 27.69, "elapsed_time": "1:40:19", "remaining_time": "4:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1063, "total_steps": 3836, "loss": 0.1824, "learning_rate": 4.327665462214501e-06, "epoch": 0.2770664320854918, "percentage": 27.71, "elapsed_time": "1:40:24", "remaining_time": "4:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1064, "total_steps": 3836, "loss": 0.1831, "learning_rate": 4.326194195048894e-06, "epoch": 0.27732707783533705, "percentage": 27.74, "elapsed_time": "1:40:30", "remaining_time": "4:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1065, "total_steps": 3836, "loss": 0.1692, "learning_rate": 4.324721570539247e-06, "epoch": 0.2775877235851823, "percentage": 27.76, "elapsed_time": "1:40:36", "remaining_time": "4:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1066, "total_steps": 3836, "loss": 0.1753, "learning_rate": 4.323247589780111e-06, "epoch": 0.27784836933502755, "percentage": 27.79, "elapsed_time": "1:40:41", "remaining_time": "4:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1067, "total_steps": 3836, "loss": 0.1898, "learning_rate": 4.321772253867041e-06, "epoch": 0.2781090150848728, "percentage": 27.82, "elapsed_time": "1:40:46", "remaining_time": "4:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1068, "total_steps": 3836, "loss": 0.1723, "learning_rate": 4.320295563896601e-06, "epoch": 0.27836966083471804, "percentage": 27.84, "elapsed_time": "1:40:51", "remaining_time": "4:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1069, "total_steps": 3836, "loss": 0.1851, "learning_rate": 4.318817520966362e-06, "epoch": 0.2786303065845633, "percentage": 27.87, "elapsed_time": "1:40:56", "remaining_time": "4:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 3836, "loss": 0.1849, "learning_rate": 4.317338126174899e-06, "epoch": 0.27889095233440847, "percentage": 27.89, "elapsed_time": "1:41:02", "remaining_time": "4:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1071, "total_steps": 3836, "loss": 0.1862, "learning_rate": 4.315857380621794e-06, "epoch": 0.2791515980842537, "percentage": 27.92, "elapsed_time": "1:41:08", "remaining_time": "4:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1072, "total_steps": 3836, "loss": 0.1785, "learning_rate": 4.314375285407629e-06, "epoch": 0.27941224383409896, "percentage": 27.95, "elapsed_time": "1:41:13", "remaining_time": "4:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1073, "total_steps": 3836, "loss": 0.1718, "learning_rate": 4.312891841633995e-06, "epoch": 0.2796728895839442, "percentage": 27.97, "elapsed_time": "1:41:18", "remaining_time": "4:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1074, "total_steps": 3836, "loss": 0.1783, "learning_rate": 4.311407050403479e-06, "epoch": 0.27993353533378945, "percentage": 28.0, "elapsed_time": "1:41:23", "remaining_time": "4:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1075, "total_steps": 3836, "loss": 0.1823, "learning_rate": 4.309920912819674e-06, "epoch": 0.2801941810836347, "percentage": 28.02, "elapsed_time": "1:41:29", "remaining_time": "4:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1076, "total_steps": 3836, "loss": 0.1767, "learning_rate": 4.308433429987172e-06, "epoch": 0.28045482683347994, "percentage": 28.05, "elapsed_time": "1:41:35", "remaining_time": "4:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1077, "total_steps": 3836, "loss": 0.1892, "learning_rate": 4.306944603011565e-06, "epoch": 0.2807154725833252, "percentage": 28.08, "elapsed_time": "1:41:40", "remaining_time": "4:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1078, "total_steps": 3836, "loss": 0.1783, "learning_rate": 4.305454432999445e-06, "epoch": 0.28097611833317043, "percentage": 28.1, "elapsed_time": "1:41:46", "remaining_time": "4:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1079, "total_steps": 3836, "loss": 0.1748, "learning_rate": 4.303962921058401e-06, "epoch": 0.2812367640830157, "percentage": 28.13, "elapsed_time": "1:41:52", "remaining_time": "4:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 3836, "loss": 0.1886, "learning_rate": 4.302470068297019e-06, "epoch": 0.2814974098328609, "percentage": 28.15, "elapsed_time": "1:41:59", "remaining_time": "4:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1081, "total_steps": 3836, "loss": 0.1748, "learning_rate": 4.300975875824884e-06, "epoch": 0.28175805558270617, "percentage": 28.18, "elapsed_time": "1:42:04", "remaining_time": "4:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1082, "total_steps": 3836, "loss": 0.1803, "learning_rate": 4.2994803447525735e-06, "epoch": 0.2820187013325514, "percentage": 28.21, "elapsed_time": "1:42:10", "remaining_time": "4:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1083, "total_steps": 3836, "loss": 0.1902, "learning_rate": 4.297983476191663e-06, "epoch": 0.28227934708239666, "percentage": 28.23, "elapsed_time": "1:42:15", "remaining_time": "4:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1084, "total_steps": 3836, "loss": 0.1866, "learning_rate": 4.29648527125472e-06, "epoch": 0.2825399928322419, "percentage": 28.26, "elapsed_time": "1:42:21", "remaining_time": "4:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1085, "total_steps": 3836, "loss": 0.1935, "learning_rate": 4.294985731055306e-06, "epoch": 0.2828006385820871, "percentage": 28.28, "elapsed_time": "1:42:27", "remaining_time": "4:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1086, "total_steps": 3836, "loss": 0.1807, "learning_rate": 4.2934848567079745e-06, "epoch": 0.28306128433193234, "percentage": 28.31, "elapsed_time": "1:42:31", "remaining_time": "4:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1087, "total_steps": 3836, "loss": 0.179, "learning_rate": 4.2919826493282725e-06, "epoch": 0.2833219300817776, "percentage": 28.34, "elapsed_time": "1:42:37", "remaining_time": "4:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1088, "total_steps": 3836, "loss": 0.1887, "learning_rate": 4.290479110032735e-06, "epoch": 0.28358257583162283, "percentage": 28.36, "elapsed_time": "1:42:42", "remaining_time": "4:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1089, "total_steps": 3836, "loss": 0.1721, "learning_rate": 4.28897423993889e-06, "epoch": 0.2838432215814681, "percentage": 28.39, "elapsed_time": "1:42:47", "remaining_time": "4:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 3836, "loss": 0.1703, "learning_rate": 4.28746804016525e-06, "epoch": 0.2841038673313133, "percentage": 28.42, "elapsed_time": "1:42:53", "remaining_time": "4:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1091, "total_steps": 3836, "loss": 0.1719, "learning_rate": 4.285960511831322e-06, "epoch": 0.28436451308115857, "percentage": 28.44, "elapsed_time": "1:42:58", "remaining_time": "4:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1092, "total_steps": 3836, "loss": 0.191, "learning_rate": 4.284451656057595e-06, "epoch": 0.2846251588310038, "percentage": 28.47, "elapsed_time": "1:43:04", "remaining_time": "4:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1093, "total_steps": 3836, "loss": 0.1888, "learning_rate": 4.282941473965548e-06, "epoch": 0.28488580458084906, "percentage": 28.49, "elapsed_time": "1:43:10", "remaining_time": "4:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1094, "total_steps": 3836, "loss": 0.1772, "learning_rate": 4.281429966677644e-06, "epoch": 0.2851464503306943, "percentage": 28.52, "elapsed_time": "1:43:15", "remaining_time": "4:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1095, "total_steps": 3836, "loss": 0.1809, "learning_rate": 4.279917135317333e-06, "epoch": 0.28540709608053955, "percentage": 28.55, "elapsed_time": "1:43:20", "remaining_time": "4:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1096, "total_steps": 3836, "loss": 0.1795, "learning_rate": 4.2784029810090456e-06, "epoch": 0.2856677418303848, "percentage": 28.57, "elapsed_time": "1:43:26", "remaining_time": "4:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1097, "total_steps": 3836, "loss": 0.19, "learning_rate": 4.2768875048782e-06, "epoch": 0.28592838758023004, "percentage": 28.6, "elapsed_time": "1:43:32", "remaining_time": "4:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1098, "total_steps": 3836, "loss": 0.1823, "learning_rate": 4.275370708051194e-06, "epoch": 0.2861890333300753, "percentage": 28.62, "elapsed_time": "1:43:38", "remaining_time": "4:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1099, "total_steps": 3836, "loss": 0.193, "learning_rate": 4.2738525916554065e-06, "epoch": 0.2864496790799205, "percentage": 28.65, "elapsed_time": "1:43:42", "remaining_time": "4:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 3836, "loss": 0.1738, "learning_rate": 4.2723331568192004e-06, "epoch": 0.2867103248297657, "percentage": 28.68, "elapsed_time": "1:43:48", "remaining_time": "4:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1101, "total_steps": 3836, "loss": 0.1813, "learning_rate": 4.270812404671916e-06, "epoch": 0.28697097057961096, "percentage": 28.7, "elapsed_time": "1:43:53", "remaining_time": "4:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1102, "total_steps": 3836, "loss": 0.1979, "learning_rate": 4.269290336343873e-06, "epoch": 0.2872316163294562, "percentage": 28.73, "elapsed_time": "1:43:59", "remaining_time": "4:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1103, "total_steps": 3836, "loss": 0.2033, "learning_rate": 4.267766952966369e-06, "epoch": 0.28749226207930145, "percentage": 28.75, "elapsed_time": "1:44:04", "remaining_time": "4:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1104, "total_steps": 3836, "loss": 0.184, "learning_rate": 4.266242255671681e-06, "epoch": 0.2877529078291467, "percentage": 28.78, "elapsed_time": "1:44:10", "remaining_time": "4:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1105, "total_steps": 3836, "loss": 0.1778, "learning_rate": 4.2647162455930615e-06, "epoch": 0.28801355357899194, "percentage": 28.81, "elapsed_time": "1:44:15", "remaining_time": "4:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1106, "total_steps": 3836, "loss": 0.1829, "learning_rate": 4.2631889238647375e-06, "epoch": 0.2882741993288372, "percentage": 28.83, "elapsed_time": "1:44:21", "remaining_time": "4:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1107, "total_steps": 3836, "loss": 0.1978, "learning_rate": 4.261660291621912e-06, "epoch": 0.28853484507868243, "percentage": 28.86, "elapsed_time": "1:44:26", "remaining_time": "4:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1108, "total_steps": 3836, "loss": 0.1899, "learning_rate": 4.260130350000763e-06, "epoch": 0.2887954908285277, "percentage": 28.88, "elapsed_time": "1:44:32", "remaining_time": "4:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1109, "total_steps": 3836, "loss": 0.1783, "learning_rate": 4.258599100138439e-06, "epoch": 0.2890561365783729, "percentage": 28.91, "elapsed_time": "1:44:37", "remaining_time": "4:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 3836, "loss": 0.17, "learning_rate": 4.257066543173064e-06, "epoch": 0.28931678232821817, "percentage": 28.94, "elapsed_time": "1:44:42", "remaining_time": "4:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1111, "total_steps": 3836, "loss": 0.1914, "learning_rate": 4.255532680243732e-06, "epoch": 0.2895774280780634, "percentage": 28.96, "elapsed_time": "1:44:48", "remaining_time": "4:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1112, "total_steps": 3836, "loss": 0.1859, "learning_rate": 4.253997512490507e-06, "epoch": 0.28983807382790866, "percentage": 28.99, "elapsed_time": "1:44:53", "remaining_time": "4:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1113, "total_steps": 3836, "loss": 0.1881, "learning_rate": 4.252461041054426e-06, "epoch": 0.2900987195777539, "percentage": 29.01, "elapsed_time": "1:44:59", "remaining_time": "4:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1114, "total_steps": 3836, "loss": 0.1798, "learning_rate": 4.250923267077489e-06, "epoch": 0.29035936532759915, "percentage": 29.04, "elapsed_time": "1:45:04", "remaining_time": "4:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1115, "total_steps": 3836, "loss": 0.1871, "learning_rate": 4.249384191702671e-06, "epoch": 0.2906200110774444, "percentage": 29.07, "elapsed_time": "1:45:10", "remaining_time": "4:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1116, "total_steps": 3836, "loss": 0.1787, "learning_rate": 4.247843816073909e-06, "epoch": 0.2908806568272896, "percentage": 29.09, "elapsed_time": "1:45:15", "remaining_time": "4:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1117, "total_steps": 3836, "loss": 0.1856, "learning_rate": 4.246302141336108e-06, "epoch": 0.29114130257713483, "percentage": 29.12, "elapsed_time": "1:45:21", "remaining_time": "4:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1118, "total_steps": 3836, "loss": 0.1816, "learning_rate": 4.2447591686351406e-06, "epoch": 0.2914019483269801, "percentage": 29.14, "elapsed_time": "1:45:26", "remaining_time": "4:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1119, "total_steps": 3836, "loss": 0.189, "learning_rate": 4.243214899117842e-06, "epoch": 0.2916625940768253, "percentage": 29.17, "elapsed_time": "1:45:32", "remaining_time": "4:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 3836, "loss": 0.1855, "learning_rate": 4.2416693339320115e-06, "epoch": 0.29192323982667057, "percentage": 29.2, "elapsed_time": "1:45:37", "remaining_time": "4:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1121, "total_steps": 3836, "loss": 0.2116, "learning_rate": 4.240122474226413e-06, "epoch": 0.2921838855765158, "percentage": 29.22, "elapsed_time": "1:45:43", "remaining_time": "4:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1122, "total_steps": 3836, "loss": 0.1779, "learning_rate": 4.238574321150769e-06, "epoch": 0.29244453132636106, "percentage": 29.25, "elapsed_time": "1:45:48", "remaining_time": "4:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1123, "total_steps": 3836, "loss": 0.1829, "learning_rate": 4.237024875855768e-06, "epoch": 0.2927051770762063, "percentage": 29.28, "elapsed_time": "1:45:54", "remaining_time": "4:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1124, "total_steps": 3836, "loss": 0.1635, "learning_rate": 4.235474139493055e-06, "epoch": 0.29296582282605155, "percentage": 29.3, "elapsed_time": "1:45:59", "remaining_time": "4:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1125, "total_steps": 3836, "loss": 0.1811, "learning_rate": 4.233922113215237e-06, "epoch": 0.2932264685758968, "percentage": 29.33, "elapsed_time": "1:46:05", "remaining_time": "4:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1126, "total_steps": 3836, "loss": 0.1817, "learning_rate": 4.23236879817588e-06, "epoch": 0.29348711432574204, "percentage": 29.35, "elapsed_time": "1:46:10", "remaining_time": "4:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1127, "total_steps": 3836, "loss": 0.1952, "learning_rate": 4.230814195529504e-06, "epoch": 0.2937477600755873, "percentage": 29.38, "elapsed_time": "1:46:16", "remaining_time": "4:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1128, "total_steps": 3836, "loss": 0.1892, "learning_rate": 4.229258306431592e-06, "epoch": 0.29400840582543253, "percentage": 29.41, "elapsed_time": "1:46:21", "remaining_time": "4:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1129, "total_steps": 3836, "loss": 0.1821, "learning_rate": 4.227701132038576e-06, "epoch": 0.2942690515752778, "percentage": 29.43, "elapsed_time": "1:46:27", "remaining_time": "4:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 3836, "loss": 0.1765, "learning_rate": 4.226142673507852e-06, "epoch": 0.294529697325123, "percentage": 29.46, "elapsed_time": "1:46:32", "remaining_time": "4:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1131, "total_steps": 3836, "loss": 0.1898, "learning_rate": 4.2245829319977635e-06, "epoch": 0.2947903430749682, "percentage": 29.48, "elapsed_time": "1:46:38", "remaining_time": "4:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1132, "total_steps": 3836, "loss": 0.1927, "learning_rate": 4.22302190866761e-06, "epoch": 0.29505098882481345, "percentage": 29.51, "elapsed_time": "1:46:43", "remaining_time": "4:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1133, "total_steps": 3836, "loss": 0.1862, "learning_rate": 4.221459604677643e-06, "epoch": 0.2953116345746587, "percentage": 29.54, "elapsed_time": "1:46:49", "remaining_time": "4:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1134, "total_steps": 3836, "loss": 0.1877, "learning_rate": 4.219896021189067e-06, "epoch": 0.29557228032450394, "percentage": 29.56, "elapsed_time": "1:46:55", "remaining_time": "4:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1135, "total_steps": 3836, "loss": 0.1802, "learning_rate": 4.218331159364039e-06, "epoch": 0.2958329260743492, "percentage": 29.59, "elapsed_time": "1:47:00", "remaining_time": "4:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1136, "total_steps": 3836, "loss": 0.1846, "learning_rate": 4.2167650203656605e-06, "epoch": 0.29609357182419443, "percentage": 29.61, "elapsed_time": "1:47:06", "remaining_time": "4:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1137, "total_steps": 3836, "loss": 0.1978, "learning_rate": 4.215197605357989e-06, "epoch": 0.2963542175740397, "percentage": 29.64, "elapsed_time": "1:47:11", "remaining_time": "4:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1138, "total_steps": 3836, "loss": 0.1691, "learning_rate": 4.213628915506025e-06, "epoch": 0.2966148633238849, "percentage": 29.67, "elapsed_time": "1:47:17", "remaining_time": "4:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1139, "total_steps": 3836, "loss": 0.165, "learning_rate": 4.212058951975721e-06, "epoch": 0.29687550907373017, "percentage": 29.69, "elapsed_time": "1:47:23", "remaining_time": "4:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 3836, "loss": 0.1952, "learning_rate": 4.210487715933973e-06, "epoch": 0.2971361548235754, "percentage": 29.72, "elapsed_time": "1:47:28", "remaining_time": "4:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1141, "total_steps": 3836, "loss": 0.1668, "learning_rate": 4.208915208548624e-06, "epoch": 0.29739680057342066, "percentage": 29.74, "elapsed_time": "1:47:33", "remaining_time": "4:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1142, "total_steps": 3836, "loss": 0.1751, "learning_rate": 4.207341430988461e-06, "epoch": 0.2976574463232659, "percentage": 29.77, "elapsed_time": "1:47:39", "remaining_time": "4:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1143, "total_steps": 3836, "loss": 0.1873, "learning_rate": 4.205766384423218e-06, "epoch": 0.29791809207311115, "percentage": 29.8, "elapsed_time": "1:47:45", "remaining_time": "4:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1144, "total_steps": 3836, "loss": 0.177, "learning_rate": 4.204190070023567e-06, "epoch": 0.2981787378229564, "percentage": 29.82, "elapsed_time": "1:47:51", "remaining_time": "4:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1145, "total_steps": 3836, "loss": 0.1739, "learning_rate": 4.202612488961129e-06, "epoch": 0.29843938357280164, "percentage": 29.85, "elapsed_time": "1:47:56", "remaining_time": "4:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1146, "total_steps": 3836, "loss": 0.179, "learning_rate": 4.2010336424084596e-06, "epoch": 0.29870002932264683, "percentage": 29.87, "elapsed_time": "1:48:02", "remaining_time": "4:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1147, "total_steps": 3836, "loss": 0.1872, "learning_rate": 4.1994535315390605e-06, "epoch": 0.2989606750724921, "percentage": 29.9, "elapsed_time": "1:48:07", "remaining_time": "4:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1148, "total_steps": 3836, "loss": 0.1826, "learning_rate": 4.19787215752737e-06, "epoch": 0.2992213208223373, "percentage": 29.93, "elapsed_time": "1:48:12", "remaining_time": "4:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1149, "total_steps": 3836, "loss": 0.1807, "learning_rate": 4.196289521548767e-06, "epoch": 0.29948196657218257, "percentage": 29.95, "elapsed_time": "1:48:18", "remaining_time": "4:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 3836, "loss": 0.1777, "learning_rate": 4.194705624779566e-06, "epoch": 0.2997426123220278, "percentage": 29.98, "elapsed_time": "1:48:24", "remaining_time": "4:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1151, "total_steps": 3836, "loss": 0.1949, "learning_rate": 4.193120468397021e-06, "epoch": 0.30000325807187306, "percentage": 30.01, "elapsed_time": "1:48:29", "remaining_time": "4:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1152, "total_steps": 3836, "loss": 0.1764, "learning_rate": 4.191534053579322e-06, "epoch": 0.3002639038217183, "percentage": 30.03, "elapsed_time": "1:48:34", "remaining_time": "4:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1153, "total_steps": 3836, "loss": 0.1707, "learning_rate": 4.189946381505593e-06, "epoch": 0.30052454957156355, "percentage": 30.06, "elapsed_time": "1:48:40", "remaining_time": "4:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1154, "total_steps": 3836, "loss": 0.1885, "learning_rate": 4.188357453355893e-06, "epoch": 0.3007851953214088, "percentage": 30.08, "elapsed_time": "1:48:45", "remaining_time": "4:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1155, "total_steps": 3836, "loss": 0.1677, "learning_rate": 4.186767270311215e-06, "epoch": 0.30104584107125404, "percentage": 30.11, "elapsed_time": "1:48:51", "remaining_time": "4:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1156, "total_steps": 3836, "loss": 0.1922, "learning_rate": 4.1851758335534844e-06, "epoch": 0.3013064868210993, "percentage": 30.14, "elapsed_time": "1:48:57", "remaining_time": "4:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1157, "total_steps": 3836, "loss": 0.17, "learning_rate": 4.183583144265559e-06, "epoch": 0.30156713257094453, "percentage": 30.16, "elapsed_time": "1:49:02", "remaining_time": "4:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1158, "total_steps": 3836, "loss": 0.1867, "learning_rate": 4.181989203631227e-06, "epoch": 0.3018277783207898, "percentage": 30.19, "elapsed_time": "1:49:07", "remaining_time": "4:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1159, "total_steps": 3836, "loss": 0.1778, "learning_rate": 4.1803940128352055e-06, "epoch": 0.302088424070635, "percentage": 30.21, "elapsed_time": "1:49:13", "remaining_time": "4:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 3836, "loss": 0.18, "learning_rate": 4.178797573063144e-06, "epoch": 0.30234906982048027, "percentage": 30.24, "elapsed_time": "1:49:19", "remaining_time": "4:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1161, "total_steps": 3836, "loss": 0.1888, "learning_rate": 4.177199885501617e-06, "epoch": 0.30260971557032545, "percentage": 30.27, "elapsed_time": "1:49:25", "remaining_time": "4:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1162, "total_steps": 3836, "loss": 0.171, "learning_rate": 4.175600951338129e-06, "epoch": 0.3028703613201707, "percentage": 30.29, "elapsed_time": "1:49:30", "remaining_time": "4:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1163, "total_steps": 3836, "loss": 0.177, "learning_rate": 4.174000771761109e-06, "epoch": 0.30313100707001595, "percentage": 30.32, "elapsed_time": "1:49:35", "remaining_time": "4:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1164, "total_steps": 3836, "loss": 0.1741, "learning_rate": 4.172399347959912e-06, "epoch": 0.3033916528198612, "percentage": 30.34, "elapsed_time": "1:49:41", "remaining_time": "4:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1165, "total_steps": 3836, "loss": 0.1784, "learning_rate": 4.1707966811248206e-06, "epoch": 0.30365229856970644, "percentage": 30.37, "elapsed_time": "1:49:46", "remaining_time": "4:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1166, "total_steps": 3836, "loss": 0.1924, "learning_rate": 4.169192772447036e-06, "epoch": 0.3039129443195517, "percentage": 30.4, "elapsed_time": "1:49:52", "remaining_time": "4:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1167, "total_steps": 3836, "loss": 0.1768, "learning_rate": 4.167587623118687e-06, "epoch": 0.3041735900693969, "percentage": 30.42, "elapsed_time": "1:49:57", "remaining_time": "4:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1168, "total_steps": 3836, "loss": 0.1809, "learning_rate": 4.1659812343328246e-06, "epoch": 0.30443423581924217, "percentage": 30.45, "elapsed_time": "1:50:03", "remaining_time": "4:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1169, "total_steps": 3836, "loss": 0.1827, "learning_rate": 4.164373607283416e-06, "epoch": 0.3046948815690874, "percentage": 30.47, "elapsed_time": "1:50:09", "remaining_time": "4:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 3836, "loss": 0.1784, "learning_rate": 4.162764743165355e-06, "epoch": 0.30495552731893266, "percentage": 30.5, "elapsed_time": "1:50:14", "remaining_time": "4:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1171, "total_steps": 3836, "loss": 0.195, "learning_rate": 4.161154643174451e-06, "epoch": 0.3052161730687779, "percentage": 30.53, "elapsed_time": "1:50:19", "remaining_time": "4:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1172, "total_steps": 3836, "loss": 0.1864, "learning_rate": 4.1595433085074334e-06, "epoch": 0.30547681881862315, "percentage": 30.55, "elapsed_time": "1:50:25", "remaining_time": "4:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1173, "total_steps": 3836, "loss": 0.1817, "learning_rate": 4.157930740361949e-06, "epoch": 0.3057374645684684, "percentage": 30.58, "elapsed_time": "1:50:30", "remaining_time": "4:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1174, "total_steps": 3836, "loss": 0.1898, "learning_rate": 4.156316939936559e-06, "epoch": 0.30599811031831364, "percentage": 30.6, "elapsed_time": "1:50:35", "remaining_time": "4:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1175, "total_steps": 3836, "loss": 0.1572, "learning_rate": 4.154701908430747e-06, "epoch": 0.3062587560681589, "percentage": 30.63, "elapsed_time": "1:50:41", "remaining_time": "4:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1176, "total_steps": 3836, "loss": 0.1866, "learning_rate": 4.153085647044904e-06, "epoch": 0.3065194018180041, "percentage": 30.66, "elapsed_time": "1:50:47", "remaining_time": "4:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1177, "total_steps": 3836, "loss": 0.1814, "learning_rate": 4.15146815698034e-06, "epoch": 0.3067800475678493, "percentage": 30.68, "elapsed_time": "1:50:52", "remaining_time": "4:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1178, "total_steps": 3836, "loss": 0.1787, "learning_rate": 4.149849439439277e-06, "epoch": 0.30704069331769457, "percentage": 30.71, "elapsed_time": "1:50:57", "remaining_time": "4:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1179, "total_steps": 3836, "loss": 0.188, "learning_rate": 4.148229495624849e-06, "epoch": 0.3073013390675398, "percentage": 30.74, "elapsed_time": "1:51:03", "remaining_time": "4:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 3836, "loss": 0.1646, "learning_rate": 4.146608326741101e-06, "epoch": 0.30756198481738506, "percentage": 30.76, "elapsed_time": "1:51:08", "remaining_time": "4:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1181, "total_steps": 3836, "loss": 0.1826, "learning_rate": 4.144985933992989e-06, "epoch": 0.3078226305672303, "percentage": 30.79, "elapsed_time": "1:51:13", "remaining_time": "4:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1182, "total_steps": 3836, "loss": 0.1859, "learning_rate": 4.1433623185863805e-06, "epoch": 0.30808327631707555, "percentage": 30.81, "elapsed_time": "1:51:19", "remaining_time": "4:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1183, "total_steps": 3836, "loss": 0.1849, "learning_rate": 4.141737481728049e-06, "epoch": 0.3083439220669208, "percentage": 30.84, "elapsed_time": "1:51:24", "remaining_time": "4:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 3836, "loss": 0.1818, "learning_rate": 4.140111424625676e-06, "epoch": 0.30860456781676604, "percentage": 30.87, "elapsed_time": "1:51:30", "remaining_time": "4:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1185, "total_steps": 3836, "loss": 0.1716, "learning_rate": 4.138484148487853e-06, "epoch": 0.3088652135666113, "percentage": 30.89, "elapsed_time": "1:51:36", "remaining_time": "4:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1186, "total_steps": 3836, "loss": 0.1821, "learning_rate": 4.1368556545240724e-06, "epoch": 0.30912585931645653, "percentage": 30.92, "elapsed_time": "1:51:41", "remaining_time": "4:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1187, "total_steps": 3836, "loss": 0.1746, "learning_rate": 4.135225943944737e-06, "epoch": 0.3093865050663018, "percentage": 30.94, "elapsed_time": "1:51:47", "remaining_time": "4:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1188, "total_steps": 3836, "loss": 0.1824, "learning_rate": 4.133595017961152e-06, "epoch": 0.309647150816147, "percentage": 30.97, "elapsed_time": "1:51:52", "remaining_time": "4:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1189, "total_steps": 3836, "loss": 0.1951, "learning_rate": 4.131962877785525e-06, "epoch": 0.30990779656599227, "percentage": 31.0, "elapsed_time": "1:51:58", "remaining_time": "4:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 3836, "loss": 0.1666, "learning_rate": 4.130329524630966e-06, "epoch": 0.3101684423158375, "percentage": 31.02, "elapsed_time": "1:52:04", "remaining_time": "4:09:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1191, "total_steps": 3836, "loss": 0.1624, "learning_rate": 4.128694959711488e-06, "epoch": 0.31042908806568276, "percentage": 31.05, "elapsed_time": "1:52:09", "remaining_time": "4:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1192, "total_steps": 3836, "loss": 0.1699, "learning_rate": 4.127059184242004e-06, "epoch": 0.31068973381552795, "percentage": 31.07, "elapsed_time": "1:52:15", "remaining_time": "4:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1193, "total_steps": 3836, "loss": 0.1729, "learning_rate": 4.125422199438326e-06, "epoch": 0.3109503795653732, "percentage": 31.1, "elapsed_time": "1:52:20", "remaining_time": "4:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1194, "total_steps": 3836, "loss": 0.1852, "learning_rate": 4.123784006517166e-06, "epoch": 0.31121102531521844, "percentage": 31.13, "elapsed_time": "1:52:25", "remaining_time": "4:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1195, "total_steps": 3836, "loss": 0.1849, "learning_rate": 4.122144606696135e-06, "epoch": 0.3114716710650637, "percentage": 31.15, "elapsed_time": "1:52:31", "remaining_time": "4:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1196, "total_steps": 3836, "loss": 0.1929, "learning_rate": 4.120504001193737e-06, "epoch": 0.3117323168149089, "percentage": 31.18, "elapsed_time": "1:52:37", "remaining_time": "4:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1197, "total_steps": 3836, "loss": 0.1802, "learning_rate": 4.118862191229376e-06, "epoch": 0.3119929625647542, "percentage": 31.2, "elapsed_time": "1:52:42", "remaining_time": "4:08:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1198, "total_steps": 3836, "loss": 0.1748, "learning_rate": 4.117219178023349e-06, "epoch": 0.3122536083145994, "percentage": 31.23, "elapsed_time": "1:52:48", "remaining_time": "4:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1199, "total_steps": 3836, "loss": 0.1892, "learning_rate": 4.11557496279685e-06, "epoch": 0.31251425406444466, "percentage": 31.26, "elapsed_time": "1:52:53", "remaining_time": "4:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 3836, "loss": 0.1642, "learning_rate": 4.113929546771963e-06, "epoch": 0.3127748998142899, "percentage": 31.28, "elapsed_time": "1:52:58", "remaining_time": "4:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1201, "total_steps": 3836, "loss": 0.1851, "learning_rate": 4.112282931171668e-06, "epoch": 0.31303554556413515, "percentage": 31.31, "elapsed_time": "1:53:04", "remaining_time": "4:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1202, "total_steps": 3836, "loss": 0.1795, "learning_rate": 4.1106351172198325e-06, "epoch": 0.3132961913139804, "percentage": 31.33, "elapsed_time": "1:53:10", "remaining_time": "4:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1203, "total_steps": 3836, "loss": 0.169, "learning_rate": 4.1089861061412175e-06, "epoch": 0.31355683706382564, "percentage": 31.36, "elapsed_time": "1:53:15", "remaining_time": "4:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1204, "total_steps": 3836, "loss": 0.1866, "learning_rate": 4.1073358991614745e-06, "epoch": 0.3138174828136709, "percentage": 31.39, "elapsed_time": "1:53:21", "remaining_time": "4:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1205, "total_steps": 3836, "loss": 0.1871, "learning_rate": 4.105684497507141e-06, "epoch": 0.31407812856351613, "percentage": 31.41, "elapsed_time": "1:53:27", "remaining_time": "4:07:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1206, "total_steps": 3836, "loss": 0.1834, "learning_rate": 4.1040319024056465e-06, "epoch": 0.3143387743133614, "percentage": 31.44, "elapsed_time": "1:53:33", "remaining_time": "4:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1207, "total_steps": 3836, "loss": 0.1722, "learning_rate": 4.102378115085302e-06, "epoch": 0.31459942006320657, "percentage": 31.47, "elapsed_time": "1:53:39", "remaining_time": "4:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1208, "total_steps": 3836, "loss": 0.1835, "learning_rate": 4.10072313677531e-06, "epoch": 0.3148600658130518, "percentage": 31.49, "elapsed_time": "1:53:44", "remaining_time": "4:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1209, "total_steps": 3836, "loss": 0.1707, "learning_rate": 4.0990669687057545e-06, "epoch": 0.31512071156289706, "percentage": 31.52, "elapsed_time": "1:53:50", "remaining_time": "4:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 3836, "loss": 0.1874, "learning_rate": 4.0974096121076076e-06, "epoch": 0.3153813573127423, "percentage": 31.54, "elapsed_time": "1:53:56", "remaining_time": "4:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1211, "total_steps": 3836, "loss": 0.1843, "learning_rate": 4.09575106821272e-06, "epoch": 0.31564200306258755, "percentage": 31.57, "elapsed_time": "1:54:02", "remaining_time": "4:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1212, "total_steps": 3836, "loss": 0.1736, "learning_rate": 4.094091338253829e-06, "epoch": 0.3159026488124328, "percentage": 31.6, "elapsed_time": "1:54:07", "remaining_time": "4:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1213, "total_steps": 3836, "loss": 0.1811, "learning_rate": 4.092430423464549e-06, "epoch": 0.31616329456227804, "percentage": 31.62, "elapsed_time": "1:54:13", "remaining_time": "4:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1214, "total_steps": 3836, "loss": 0.1831, "learning_rate": 4.0907683250793814e-06, "epoch": 0.3164239403121233, "percentage": 31.65, "elapsed_time": "1:54:20", "remaining_time": "4:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1215, "total_steps": 3836, "loss": 0.1947, "learning_rate": 4.089105044333702e-06, "epoch": 0.31668458606196853, "percentage": 31.67, "elapsed_time": "1:54:25", "remaining_time": "4:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1216, "total_steps": 3836, "loss": 0.1702, "learning_rate": 4.0874405824637676e-06, "epoch": 0.3169452318118138, "percentage": 31.7, "elapsed_time": "1:54:31", "remaining_time": "4:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1217, "total_steps": 3836, "loss": 0.1843, "learning_rate": 4.085774940706712e-06, "epoch": 0.317205877561659, "percentage": 31.73, "elapsed_time": "1:54:36", "remaining_time": "4:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1218, "total_steps": 3836, "loss": 0.1844, "learning_rate": 4.084108120300546e-06, "epoch": 0.31746652331150427, "percentage": 31.75, "elapsed_time": "1:54:42", "remaining_time": "4:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1219, "total_steps": 3836, "loss": 0.1784, "learning_rate": 4.082440122484159e-06, "epoch": 0.3177271690613495, "percentage": 31.78, "elapsed_time": "1:54:48", "remaining_time": "4:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 3836, "loss": 0.1764, "learning_rate": 4.080770948497311e-06, "epoch": 0.31798781481119476, "percentage": 31.8, "elapsed_time": "1:54:52", "remaining_time": "4:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1221, "total_steps": 3836, "loss": 0.1764, "learning_rate": 4.07910059958064e-06, "epoch": 0.31824846056104, "percentage": 31.83, "elapsed_time": "1:54:58", "remaining_time": "4:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1222, "total_steps": 3836, "loss": 0.1722, "learning_rate": 4.077429076975655e-06, "epoch": 0.3185091063108852, "percentage": 31.86, "elapsed_time": "1:55:04", "remaining_time": "4:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1223, "total_steps": 3836, "loss": 0.1698, "learning_rate": 4.075756381924739e-06, "epoch": 0.31876975206073044, "percentage": 31.88, "elapsed_time": "1:55:09", "remaining_time": "4:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1224, "total_steps": 3836, "loss": 0.1819, "learning_rate": 4.074082515671145e-06, "epoch": 0.3190303978105757, "percentage": 31.91, "elapsed_time": "1:55:14", "remaining_time": "4:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1225, "total_steps": 3836, "loss": 0.1789, "learning_rate": 4.072407479458998e-06, "epoch": 0.31929104356042093, "percentage": 31.93, "elapsed_time": "1:55:19", "remaining_time": "4:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1226, "total_steps": 3836, "loss": 0.1731, "learning_rate": 4.070731274533291e-06, "epoch": 0.3195516893102662, "percentage": 31.96, "elapsed_time": "1:55:26", "remaining_time": "4:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1227, "total_steps": 3836, "loss": 0.1778, "learning_rate": 4.069053902139887e-06, "epoch": 0.3198123350601114, "percentage": 31.99, "elapsed_time": "1:55:31", "remaining_time": "4:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1228, "total_steps": 3836, "loss": 0.1786, "learning_rate": 4.067375363525516e-06, "epoch": 0.32007298080995666, "percentage": 32.01, "elapsed_time": "1:55:37", "remaining_time": "4:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1229, "total_steps": 3836, "loss": 0.1887, "learning_rate": 4.065695659937775e-06, "epoch": 0.3203336265598019, "percentage": 32.04, "elapsed_time": "1:55:43", "remaining_time": "4:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 3836, "loss": 0.1754, "learning_rate": 4.064014792625126e-06, "epoch": 0.32059427230964715, "percentage": 32.06, "elapsed_time": "1:55:49", "remaining_time": "4:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1231, "total_steps": 3836, "loss": 0.1644, "learning_rate": 4.062332762836899e-06, "epoch": 0.3208549180594924, "percentage": 32.09, "elapsed_time": "1:55:54", "remaining_time": "4:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1232, "total_steps": 3836, "loss": 0.1681, "learning_rate": 4.060649571823284e-06, "epoch": 0.32111556380933765, "percentage": 32.12, "elapsed_time": "1:55:59", "remaining_time": "4:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1233, "total_steps": 3836, "loss": 0.179, "learning_rate": 4.0589652208353355e-06, "epoch": 0.3213762095591829, "percentage": 32.14, "elapsed_time": "1:56:05", "remaining_time": "4:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1234, "total_steps": 3836, "loss": 0.1805, "learning_rate": 4.057279711124973e-06, "epoch": 0.32163685530902814, "percentage": 32.17, "elapsed_time": "1:56:11", "remaining_time": "4:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1235, "total_steps": 3836, "loss": 0.1994, "learning_rate": 4.055593043944973e-06, "epoch": 0.3218975010588734, "percentage": 32.19, "elapsed_time": "1:56:17", "remaining_time": "4:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1236, "total_steps": 3836, "loss": 0.1805, "learning_rate": 4.053905220548974e-06, "epoch": 0.3221581468087186, "percentage": 32.22, "elapsed_time": "1:56:23", "remaining_time": "4:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1237, "total_steps": 3836, "loss": 0.1814, "learning_rate": 4.052216242191475e-06, "epoch": 0.3224187925585638, "percentage": 32.25, "elapsed_time": "1:56:29", "remaining_time": "4:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1238, "total_steps": 3836, "loss": 0.1813, "learning_rate": 4.050526110127832e-06, "epoch": 0.32267943830840906, "percentage": 32.27, "elapsed_time": "1:56:35", "remaining_time": "4:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1239, "total_steps": 3836, "loss": 0.1839, "learning_rate": 4.0488348256142595e-06, "epoch": 0.3229400840582543, "percentage": 32.3, "elapsed_time": "1:56:41", "remaining_time": "4:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 3836, "loss": 0.1713, "learning_rate": 4.047142389907827e-06, "epoch": 0.32320072980809955, "percentage": 32.33, "elapsed_time": "1:56:47", "remaining_time": "4:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1241, "total_steps": 3836, "loss": 0.167, "learning_rate": 4.045448804266462e-06, "epoch": 0.3234613755579448, "percentage": 32.35, "elapsed_time": "1:56:52", "remaining_time": "4:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1242, "total_steps": 3836, "loss": 0.1743, "learning_rate": 4.043754069948944e-06, "epoch": 0.32372202130779004, "percentage": 32.38, "elapsed_time": "1:56:58", "remaining_time": "4:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1243, "total_steps": 3836, "loss": 0.179, "learning_rate": 4.042058188214909e-06, "epoch": 0.3239826670576353, "percentage": 32.4, "elapsed_time": "1:57:04", "remaining_time": "4:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1244, "total_steps": 3836, "loss": 0.1803, "learning_rate": 4.040361160324844e-06, "epoch": 0.32424331280748053, "percentage": 32.43, "elapsed_time": "1:57:09", "remaining_time": "4:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1245, "total_steps": 3836, "loss": 0.1886, "learning_rate": 4.038662987540088e-06, "epoch": 0.3245039585573258, "percentage": 32.46, "elapsed_time": "1:57:15", "remaining_time": "4:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1246, "total_steps": 3836, "loss": 0.1913, "learning_rate": 4.036963671122831e-06, "epoch": 0.324764604307171, "percentage": 32.48, "elapsed_time": "1:57:20", "remaining_time": "4:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1247, "total_steps": 3836, "loss": 0.1753, "learning_rate": 4.0352632123361155e-06, "epoch": 0.32502525005701627, "percentage": 32.51, "elapsed_time": "1:57:26", "remaining_time": "4:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1248, "total_steps": 3836, "loss": 0.1716, "learning_rate": 4.033561612443829e-06, "epoch": 0.3252858958068615, "percentage": 32.53, "elapsed_time": "1:57:32", "remaining_time": "4:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1249, "total_steps": 3836, "loss": 0.1765, "learning_rate": 4.031858872710709e-06, "epoch": 0.32554654155670676, "percentage": 32.56, "elapsed_time": "1:57:37", "remaining_time": "4:03:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 3836, "loss": 0.1937, "learning_rate": 4.030154994402341e-06, "epoch": 0.325807187306552, "percentage": 32.59, "elapsed_time": "1:57:43", "remaining_time": "4:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1251, "total_steps": 3836, "loss": 0.171, "learning_rate": 4.028449978785156e-06, "epoch": 0.32606783305639725, "percentage": 32.61, "elapsed_time": "1:57:48", "remaining_time": "4:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1252, "total_steps": 3836, "loss": 0.1795, "learning_rate": 4.0267438271264304e-06, "epoch": 0.32632847880624244, "percentage": 32.64, "elapsed_time": "1:57:53", "remaining_time": "4:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1253, "total_steps": 3836, "loss": 0.1803, "learning_rate": 4.025036540694285e-06, "epoch": 0.3265891245560877, "percentage": 32.66, "elapsed_time": "1:57:59", "remaining_time": "4:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1254, "total_steps": 3836, "loss": 0.1699, "learning_rate": 4.023328120757685e-06, "epoch": 0.32684977030593293, "percentage": 32.69, "elapsed_time": "1:58:05", "remaining_time": "4:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1255, "total_steps": 3836, "loss": 0.1641, "learning_rate": 4.021618568586434e-06, "epoch": 0.3271104160557782, "percentage": 32.72, "elapsed_time": "1:58:10", "remaining_time": "4:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1256, "total_steps": 3836, "loss": 0.1845, "learning_rate": 4.019907885451184e-06, "epoch": 0.3273710618056234, "percentage": 32.74, "elapsed_time": "1:58:16", "remaining_time": "4:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1257, "total_steps": 3836, "loss": 0.1749, "learning_rate": 4.018196072623421e-06, "epoch": 0.32763170755546867, "percentage": 32.77, "elapsed_time": "1:58:20", "remaining_time": "4:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1258, "total_steps": 3836, "loss": 0.191, "learning_rate": 4.016483131375476e-06, "epoch": 0.3278923533053139, "percentage": 32.79, "elapsed_time": "1:58:26", "remaining_time": "4:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1259, "total_steps": 3836, "loss": 0.1692, "learning_rate": 4.014769062980513e-06, "epoch": 0.32815299905515916, "percentage": 32.82, "elapsed_time": "1:58:32", "remaining_time": "4:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 3836, "loss": 0.1742, "learning_rate": 4.01305386871254e-06, "epoch": 0.3284136448050044, "percentage": 32.85, "elapsed_time": "1:58:38", "remaining_time": "4:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1261, "total_steps": 3836, "loss": 0.1922, "learning_rate": 4.011337549846398e-06, "epoch": 0.32867429055484965, "percentage": 32.87, "elapsed_time": "1:58:43", "remaining_time": "4:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1262, "total_steps": 3836, "loss": 0.178, "learning_rate": 4.009620107657763e-06, "epoch": 0.3289349363046949, "percentage": 32.9, "elapsed_time": "1:58:49", "remaining_time": "4:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1263, "total_steps": 3836, "loss": 0.1787, "learning_rate": 4.00790154342315e-06, "epoch": 0.32919558205454014, "percentage": 32.92, "elapsed_time": "1:58:55", "remaining_time": "4:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1264, "total_steps": 3836, "loss": 0.1725, "learning_rate": 4.006181858419905e-06, "epoch": 0.3294562278043854, "percentage": 32.95, "elapsed_time": "1:59:00", "remaining_time": "4:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1265, "total_steps": 3836, "loss": 0.1689, "learning_rate": 4.004461053926206e-06, "epoch": 0.3297168735542306, "percentage": 32.98, "elapsed_time": "1:59:05", "remaining_time": "4:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1266, "total_steps": 3836, "loss": 0.16, "learning_rate": 4.002739131221066e-06, "epoch": 0.3299775193040759, "percentage": 33.0, "elapsed_time": "1:59:11", "remaining_time": "4:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1267, "total_steps": 3836, "loss": 0.1767, "learning_rate": 4.0010160915843286e-06, "epoch": 0.33023816505392106, "percentage": 33.03, "elapsed_time": "1:59:17", "remaining_time": "4:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1268, "total_steps": 3836, "loss": 0.1881, "learning_rate": 3.999291936296664e-06, "epoch": 0.3304988108037663, "percentage": 33.06, "elapsed_time": "1:59:22", "remaining_time": "4:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1269, "total_steps": 3836, "loss": 0.1823, "learning_rate": 3.997566666639578e-06, "epoch": 0.33075945655361155, "percentage": 33.08, "elapsed_time": "1:59:28", "remaining_time": "4:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 3836, "loss": 0.1728, "learning_rate": 3.995840283895399e-06, "epoch": 0.3310201023034568, "percentage": 33.11, "elapsed_time": "1:59:33", "remaining_time": "4:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1271, "total_steps": 3836, "loss": 0.1791, "learning_rate": 3.9941127893472845e-06, "epoch": 0.33128074805330204, "percentage": 33.13, "elapsed_time": "1:59:39", "remaining_time": "4:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1272, "total_steps": 3836, "loss": 0.1658, "learning_rate": 3.99238418427922e-06, "epoch": 0.3315413938031473, "percentage": 33.16, "elapsed_time": "1:59:44", "remaining_time": "4:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1273, "total_steps": 3836, "loss": 0.1849, "learning_rate": 3.9906544699760145e-06, "epoch": 0.33180203955299253, "percentage": 33.19, "elapsed_time": "1:59:50", "remaining_time": "4:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1274, "total_steps": 3836, "loss": 0.1748, "learning_rate": 3.988923647723301e-06, "epoch": 0.3320626853028378, "percentage": 33.21, "elapsed_time": "1:59:56", "remaining_time": "4:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1275, "total_steps": 3836, "loss": 0.1736, "learning_rate": 3.987191718807538e-06, "epoch": 0.332323331052683, "percentage": 33.24, "elapsed_time": "2:00:01", "remaining_time": "4:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1276, "total_steps": 3836, "loss": 0.1797, "learning_rate": 3.9854586845160055e-06, "epoch": 0.33258397680252827, "percentage": 33.26, "elapsed_time": "2:00:06", "remaining_time": "4:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1277, "total_steps": 3836, "loss": 0.157, "learning_rate": 3.9837245461368055e-06, "epoch": 0.3328446225523735, "percentage": 33.29, "elapsed_time": "2:00:11", "remaining_time": "4:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1278, "total_steps": 3836, "loss": 0.1705, "learning_rate": 3.981989304958861e-06, "epoch": 0.33310526830221876, "percentage": 33.32, "elapsed_time": "2:00:16", "remaining_time": "4:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1279, "total_steps": 3836, "loss": 0.171, "learning_rate": 3.980252962271911e-06, "epoch": 0.333365914052064, "percentage": 33.34, "elapsed_time": "2:00:21", "remaining_time": "4:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 3836, "loss": 0.1881, "learning_rate": 3.978515519366519e-06, "epoch": 0.33362655980190925, "percentage": 33.37, "elapsed_time": "2:00:26", "remaining_time": "4:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1281, "total_steps": 3836, "loss": 0.1802, "learning_rate": 3.976776977534062e-06, "epoch": 0.3338872055517545, "percentage": 33.39, "elapsed_time": "2:00:32", "remaining_time": "4:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1282, "total_steps": 3836, "loss": 0.1815, "learning_rate": 3.975037338066736e-06, "epoch": 0.33414785130159974, "percentage": 33.42, "elapsed_time": "2:00:38", "remaining_time": "4:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1283, "total_steps": 3836, "loss": 0.1655, "learning_rate": 3.973296602257553e-06, "epoch": 0.33440849705144493, "percentage": 33.45, "elapsed_time": "2:00:43", "remaining_time": "4:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1284, "total_steps": 3836, "loss": 0.1855, "learning_rate": 3.9715547714003355e-06, "epoch": 0.3346691428012902, "percentage": 33.47, "elapsed_time": "2:00:49", "remaining_time": "4:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1285, "total_steps": 3836, "loss": 0.1702, "learning_rate": 3.969811846789727e-06, "epoch": 0.3349297885511354, "percentage": 33.5, "elapsed_time": "2:00:55", "remaining_time": "4:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1286, "total_steps": 3836, "loss": 0.1766, "learning_rate": 3.968067829721178e-06, "epoch": 0.33519043430098067, "percentage": 33.52, "elapsed_time": "2:01:00", "remaining_time": "3:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1287, "total_steps": 3836, "loss": 0.1673, "learning_rate": 3.966322721490954e-06, "epoch": 0.3354510800508259, "percentage": 33.55, "elapsed_time": "2:01:06", "remaining_time": "3:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1288, "total_steps": 3836, "loss": 0.1792, "learning_rate": 3.96457652339613e-06, "epoch": 0.33571172580067116, "percentage": 33.58, "elapsed_time": "2:01:12", "remaining_time": "3:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1289, "total_steps": 3836, "loss": 0.1617, "learning_rate": 3.9628292367345946e-06, "epoch": 0.3359723715505164, "percentage": 33.6, "elapsed_time": "2:01:18", "remaining_time": "3:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 3836, "loss": 0.175, "learning_rate": 3.961080862805039e-06, "epoch": 0.33623301730036165, "percentage": 33.63, "elapsed_time": "2:01:23", "remaining_time": "3:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1291, "total_steps": 3836, "loss": 0.1799, "learning_rate": 3.959331402906969e-06, "epoch": 0.3364936630502069, "percentage": 33.65, "elapsed_time": "2:01:28", "remaining_time": "3:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1292, "total_steps": 3836, "loss": 0.1902, "learning_rate": 3.9575808583406926e-06, "epoch": 0.33675430880005214, "percentage": 33.68, "elapsed_time": "2:01:34", "remaining_time": "3:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1293, "total_steps": 3836, "loss": 0.1894, "learning_rate": 3.955829230407328e-06, "epoch": 0.3370149545498974, "percentage": 33.71, "elapsed_time": "2:01:39", "remaining_time": "3:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1294, "total_steps": 3836, "loss": 0.171, "learning_rate": 3.954076520408796e-06, "epoch": 0.33727560029974263, "percentage": 33.73, "elapsed_time": "2:01:44", "remaining_time": "3:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1295, "total_steps": 3836, "loss": 0.1831, "learning_rate": 3.952322729647823e-06, "epoch": 0.3375362460495879, "percentage": 33.76, "elapsed_time": "2:01:50", "remaining_time": "3:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1296, "total_steps": 3836, "loss": 0.1971, "learning_rate": 3.950567859427938e-06, "epoch": 0.3377968917994331, "percentage": 33.79, "elapsed_time": "2:01:56", "remaining_time": "3:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1297, "total_steps": 3836, "loss": 0.1851, "learning_rate": 3.948811911053473e-06, "epoch": 0.33805753754927836, "percentage": 33.81, "elapsed_time": "2:02:01", "remaining_time": "3:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1298, "total_steps": 3836, "loss": 0.1644, "learning_rate": 3.947054885829559e-06, "epoch": 0.33831818329912355, "percentage": 33.84, "elapsed_time": "2:02:07", "remaining_time": "3:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1299, "total_steps": 3836, "loss": 0.2045, "learning_rate": 3.945296785062131e-06, "epoch": 0.3385788290489688, "percentage": 33.86, "elapsed_time": "2:02:13", "remaining_time": "3:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 3836, "loss": 0.1788, "learning_rate": 3.943537610057921e-06, "epoch": 0.33883947479881404, "percentage": 33.89, "elapsed_time": "2:02:18", "remaining_time": "3:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1301, "total_steps": 3836, "loss": 0.1767, "learning_rate": 3.941777362124461e-06, "epoch": 0.3391001205486593, "percentage": 33.92, "elapsed_time": "2:02:24", "remaining_time": "3:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1302, "total_steps": 3836, "loss": 0.1727, "learning_rate": 3.940016042570079e-06, "epoch": 0.33936076629850453, "percentage": 33.94, "elapsed_time": "2:02:29", "remaining_time": "3:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1303, "total_steps": 3836, "loss": 0.1686, "learning_rate": 3.9382536527039e-06, "epoch": 0.3396214120483498, "percentage": 33.97, "elapsed_time": "2:02:35", "remaining_time": "3:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1304, "total_steps": 3836, "loss": 0.1623, "learning_rate": 3.936490193835843e-06, "epoch": 0.339882057798195, "percentage": 33.99, "elapsed_time": "2:02:41", "remaining_time": "3:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1305, "total_steps": 3836, "loss": 0.1528, "learning_rate": 3.9347256672766255e-06, "epoch": 0.34014270354804027, "percentage": 34.02, "elapsed_time": "2:02:46", "remaining_time": "3:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1306, "total_steps": 3836, "loss": 0.1827, "learning_rate": 3.932960074337755e-06, "epoch": 0.3404033492978855, "percentage": 34.05, "elapsed_time": "2:02:51", "remaining_time": "3:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1307, "total_steps": 3836, "loss": 0.1791, "learning_rate": 3.931193416331534e-06, "epoch": 0.34066399504773076, "percentage": 34.07, "elapsed_time": "2:02:57", "remaining_time": "3:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1308, "total_steps": 3836, "loss": 0.1675, "learning_rate": 3.929425694571055e-06, "epoch": 0.340924640797576, "percentage": 34.1, "elapsed_time": "2:03:03", "remaining_time": "3:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1309, "total_steps": 3836, "loss": 0.1662, "learning_rate": 3.9276569103702e-06, "epoch": 0.34118528654742125, "percentage": 34.12, "elapsed_time": "2:03:08", "remaining_time": "3:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 3836, "loss": 0.1844, "learning_rate": 3.925887065043643e-06, "epoch": 0.3414459322972665, "percentage": 34.15, "elapsed_time": "2:03:14", "remaining_time": "3:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1311, "total_steps": 3836, "loss": 0.1723, "learning_rate": 3.924116159906848e-06, "epoch": 0.34170657804711174, "percentage": 34.18, "elapsed_time": "2:03:19", "remaining_time": "3:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1312, "total_steps": 3836, "loss": 0.1715, "learning_rate": 3.922344196276063e-06, "epoch": 0.341967223796957, "percentage": 34.2, "elapsed_time": "2:03:25", "remaining_time": "3:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1313, "total_steps": 3836, "loss": 0.1602, "learning_rate": 3.920571175468324e-06, "epoch": 0.3422278695468022, "percentage": 34.23, "elapsed_time": "2:03:31", "remaining_time": "3:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1314, "total_steps": 3836, "loss": 0.1747, "learning_rate": 3.918797098801453e-06, "epoch": 0.3424885152966474, "percentage": 34.25, "elapsed_time": "2:03:36", "remaining_time": "3:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1315, "total_steps": 3836, "loss": 0.1735, "learning_rate": 3.9170219675940595e-06, "epoch": 0.34274916104649267, "percentage": 34.28, "elapsed_time": "2:03:41", "remaining_time": "3:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1316, "total_steps": 3836, "loss": 0.1861, "learning_rate": 3.915245783165531e-06, "epoch": 0.3430098067963379, "percentage": 34.31, "elapsed_time": "2:03:47", "remaining_time": "3:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1317, "total_steps": 3836, "loss": 0.1809, "learning_rate": 3.9134685468360435e-06, "epoch": 0.34327045254618316, "percentage": 34.33, "elapsed_time": "2:03:53", "remaining_time": "3:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1318, "total_steps": 3836, "loss": 0.1762, "learning_rate": 3.911690259926551e-06, "epoch": 0.3435310982960284, "percentage": 34.36, "elapsed_time": "2:03:58", "remaining_time": "3:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1319, "total_steps": 3836, "loss": 0.1852, "learning_rate": 3.90991092375879e-06, "epoch": 0.34379174404587365, "percentage": 34.38, "elapsed_time": "2:04:04", "remaining_time": "3:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 3836, "loss": 0.1786, "learning_rate": 3.908130539655278e-06, "epoch": 0.3440523897957189, "percentage": 34.41, "elapsed_time": "2:04:10", "remaining_time": "3:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1321, "total_steps": 3836, "loss": 0.1672, "learning_rate": 3.906349108939308e-06, "epoch": 0.34431303554556414, "percentage": 34.44, "elapsed_time": "2:04:15", "remaining_time": "3:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1322, "total_steps": 3836, "loss": 0.1775, "learning_rate": 3.904566632934955e-06, "epoch": 0.3445736812954094, "percentage": 34.46, "elapsed_time": "2:04:21", "remaining_time": "3:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1323, "total_steps": 3836, "loss": 0.1716, "learning_rate": 3.902783112967067e-06, "epoch": 0.34483432704525463, "percentage": 34.49, "elapsed_time": "2:04:27", "remaining_time": "3:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1324, "total_steps": 3836, "loss": 0.1823, "learning_rate": 3.900998550361271e-06, "epoch": 0.3450949727950999, "percentage": 34.52, "elapsed_time": "2:04:33", "remaining_time": "3:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1325, "total_steps": 3836, "loss": 0.1717, "learning_rate": 3.899212946443967e-06, "epoch": 0.3453556185449451, "percentage": 34.54, "elapsed_time": "2:04:39", "remaining_time": "3:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1326, "total_steps": 3836, "loss": 0.1615, "learning_rate": 3.897426302542331e-06, "epoch": 0.34561626429479037, "percentage": 34.57, "elapsed_time": "2:04:44", "remaining_time": "3:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1327, "total_steps": 3836, "loss": 0.1883, "learning_rate": 3.89563861998431e-06, "epoch": 0.3458769100446356, "percentage": 34.59, "elapsed_time": "2:04:49", "remaining_time": "3:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1328, "total_steps": 3836, "loss": 0.1715, "learning_rate": 3.893849900098623e-06, "epoch": 0.3461375557944808, "percentage": 34.62, "elapsed_time": "2:04:55", "remaining_time": "3:55:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1329, "total_steps": 3836, "loss": 0.1761, "learning_rate": 3.8920601442147625e-06, "epoch": 0.34639820154432605, "percentage": 34.65, "elapsed_time": "2:05:00", "remaining_time": "3:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 3836, "loss": 0.1771, "learning_rate": 3.890269353662987e-06, "epoch": 0.3466588472941713, "percentage": 34.67, "elapsed_time": "2:05:05", "remaining_time": "3:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1331, "total_steps": 3836, "loss": 0.1643, "learning_rate": 3.888477529774328e-06, "epoch": 0.34691949304401654, "percentage": 34.7, "elapsed_time": "2:05:10", "remaining_time": "3:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1332, "total_steps": 3836, "loss": 0.1686, "learning_rate": 3.886684673880583e-06, "epoch": 0.3471801387938618, "percentage": 34.72, "elapsed_time": "2:05:16", "remaining_time": "3:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1333, "total_steps": 3836, "loss": 0.1577, "learning_rate": 3.884890787314316e-06, "epoch": 0.347440784543707, "percentage": 34.75, "elapsed_time": "2:05:22", "remaining_time": "3:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1334, "total_steps": 3836, "loss": 0.1719, "learning_rate": 3.8830958714088595e-06, "epoch": 0.34770143029355227, "percentage": 34.78, "elapsed_time": "2:05:28", "remaining_time": "3:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1335, "total_steps": 3836, "loss": 0.1828, "learning_rate": 3.8812999274983085e-06, "epoch": 0.3479620760433975, "percentage": 34.8, "elapsed_time": "2:05:34", "remaining_time": "3:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1336, "total_steps": 3836, "loss": 0.1722, "learning_rate": 3.879502956917524e-06, "epoch": 0.34822272179324276, "percentage": 34.83, "elapsed_time": "2:05:39", "remaining_time": "3:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1337, "total_steps": 3836, "loss": 0.1799, "learning_rate": 3.877704961002127e-06, "epoch": 0.348483367543088, "percentage": 34.85, "elapsed_time": "2:05:45", "remaining_time": "3:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1338, "total_steps": 3836, "loss": 0.1776, "learning_rate": 3.875905941088505e-06, "epoch": 0.34874401329293325, "percentage": 34.88, "elapsed_time": "2:05:51", "remaining_time": "3:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1339, "total_steps": 3836, "loss": 0.18, "learning_rate": 3.874105898513803e-06, "epoch": 0.3490046590427785, "percentage": 34.91, "elapsed_time": "2:05:56", "remaining_time": "3:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 3836, "loss": 0.1567, "learning_rate": 3.872304834615929e-06, "epoch": 0.34926530479262374, "percentage": 34.93, "elapsed_time": "2:06:02", "remaining_time": "3:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1341, "total_steps": 3836, "loss": 0.1679, "learning_rate": 3.870502750733547e-06, "epoch": 0.349525950542469, "percentage": 34.96, "elapsed_time": "2:06:09", "remaining_time": "3:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1342, "total_steps": 3836, "loss": 0.1645, "learning_rate": 3.868699648206081e-06, "epoch": 0.34978659629231423, "percentage": 34.98, "elapsed_time": "2:06:14", "remaining_time": "3:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1343, "total_steps": 3836, "loss": 0.1863, "learning_rate": 3.866895528373713e-06, "epoch": 0.3500472420421594, "percentage": 35.01, "elapsed_time": "2:06:20", "remaining_time": "3:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1344, "total_steps": 3836, "loss": 0.1717, "learning_rate": 3.8650903925773795e-06, "epoch": 0.35030788779200467, "percentage": 35.04, "elapsed_time": "2:06:25", "remaining_time": "3:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1345, "total_steps": 3836, "loss": 0.1798, "learning_rate": 3.863284242158772e-06, "epoch": 0.3505685335418499, "percentage": 35.06, "elapsed_time": "2:06:31", "remaining_time": "3:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1346, "total_steps": 3836, "loss": 0.1717, "learning_rate": 3.861477078460337e-06, "epoch": 0.35082917929169516, "percentage": 35.09, "elapsed_time": "2:06:37", "remaining_time": "3:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1347, "total_steps": 3836, "loss": 0.1871, "learning_rate": 3.859668902825274e-06, "epoch": 0.3510898250415404, "percentage": 35.11, "elapsed_time": "2:06:42", "remaining_time": "3:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1348, "total_steps": 3836, "loss": 0.1813, "learning_rate": 3.857859716597534e-06, "epoch": 0.35135047079138565, "percentage": 35.14, "elapsed_time": "2:06:48", "remaining_time": "3:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1349, "total_steps": 3836, "loss": 0.1616, "learning_rate": 3.8560495211218215e-06, "epoch": 0.3516111165412309, "percentage": 35.17, "elapsed_time": "2:06:53", "remaining_time": "3:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 3836, "loss": 0.163, "learning_rate": 3.854238317743586e-06, "epoch": 0.35187176229107614, "percentage": 35.19, "elapsed_time": "2:06:59", "remaining_time": "3:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1351, "total_steps": 3836, "loss": 0.1838, "learning_rate": 3.852426107809032e-06, "epoch": 0.3521324080409214, "percentage": 35.22, "elapsed_time": "2:07:05", "remaining_time": "3:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1352, "total_steps": 3836, "loss": 0.1802, "learning_rate": 3.8506128926651095e-06, "epoch": 0.35239305379076663, "percentage": 35.25, "elapsed_time": "2:07:11", "remaining_time": "3:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1353, "total_steps": 3836, "loss": 0.1706, "learning_rate": 3.8487986736595135e-06, "epoch": 0.3526536995406119, "percentage": 35.27, "elapsed_time": "2:07:17", "remaining_time": "3:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1354, "total_steps": 3836, "loss": 0.1711, "learning_rate": 3.846983452140689e-06, "epoch": 0.3529143452904571, "percentage": 35.3, "elapsed_time": "2:07:22", "remaining_time": "3:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1355, "total_steps": 3836, "loss": 0.1822, "learning_rate": 3.845167229457824e-06, "epoch": 0.35317499104030237, "percentage": 35.32, "elapsed_time": "2:07:27", "remaining_time": "3:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1356, "total_steps": 3836, "loss": 0.1806, "learning_rate": 3.843350006960852e-06, "epoch": 0.3534356367901476, "percentage": 35.35, "elapsed_time": "2:07:33", "remaining_time": "3:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1357, "total_steps": 3836, "loss": 0.1795, "learning_rate": 3.841531786000448e-06, "epoch": 0.35369628253999286, "percentage": 35.38, "elapsed_time": "2:07:38", "remaining_time": "3:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1358, "total_steps": 3836, "loss": 0.1758, "learning_rate": 3.83971256792803e-06, "epoch": 0.35395692828983805, "percentage": 35.4, "elapsed_time": "2:07:44", "remaining_time": "3:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1359, "total_steps": 3836, "loss": 0.1591, "learning_rate": 3.8378923540957555e-06, "epoch": 0.3542175740396833, "percentage": 35.43, "elapsed_time": "2:07:49", "remaining_time": "3:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 3836, "loss": 0.1788, "learning_rate": 3.836071145856526e-06, "epoch": 0.35447821978952854, "percentage": 35.45, "elapsed_time": "2:07:55", "remaining_time": "3:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1361, "total_steps": 3836, "loss": 0.1825, "learning_rate": 3.8342489445639776e-06, "epoch": 0.3547388655393738, "percentage": 35.48, "elapsed_time": "2:08:01", "remaining_time": "3:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1362, "total_steps": 3836, "loss": 0.1747, "learning_rate": 3.832425751572488e-06, "epoch": 0.354999511289219, "percentage": 35.51, "elapsed_time": "2:08:06", "remaining_time": "3:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1363, "total_steps": 3836, "loss": 0.1685, "learning_rate": 3.83060156823717e-06, "epoch": 0.3552601570390643, "percentage": 35.53, "elapsed_time": "2:08:12", "remaining_time": "3:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1364, "total_steps": 3836, "loss": 0.1557, "learning_rate": 3.828776395913872e-06, "epoch": 0.3555208027889095, "percentage": 35.56, "elapsed_time": "2:08:17", "remaining_time": "3:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1365, "total_steps": 3836, "loss": 0.1703, "learning_rate": 3.82695023595918e-06, "epoch": 0.35578144853875476, "percentage": 35.58, "elapsed_time": "2:08:22", "remaining_time": "3:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1366, "total_steps": 3836, "loss": 0.1792, "learning_rate": 3.825123089730413e-06, "epoch": 0.3560420942886, "percentage": 35.61, "elapsed_time": "2:08:28", "remaining_time": "3:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1367, "total_steps": 3836, "loss": 0.1561, "learning_rate": 3.823294958585621e-06, "epoch": 0.35630274003844525, "percentage": 35.64, "elapsed_time": "2:08:33", "remaining_time": "3:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1368, "total_steps": 3836, "loss": 0.1709, "learning_rate": 3.821465843883588e-06, "epoch": 0.3565633857882905, "percentage": 35.66, "elapsed_time": "2:08:38", "remaining_time": "3:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1369, "total_steps": 3836, "loss": 0.1756, "learning_rate": 3.819635746983829e-06, "epoch": 0.35682403153813574, "percentage": 35.69, "elapsed_time": "2:08:43", "remaining_time": "3:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 3836, "loss": 0.155, "learning_rate": 3.81780466924659e-06, "epoch": 0.357084677287981, "percentage": 35.71, "elapsed_time": "2:08:48", "remaining_time": "3:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1371, "total_steps": 3836, "loss": 0.1706, "learning_rate": 3.8159726120328434e-06, "epoch": 0.35734532303782623, "percentage": 35.74, "elapsed_time": "2:08:54", "remaining_time": "3:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1372, "total_steps": 3836, "loss": 0.173, "learning_rate": 3.814139576704291e-06, "epoch": 0.3576059687876715, "percentage": 35.77, "elapsed_time": "2:09:00", "remaining_time": "3:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1373, "total_steps": 3836, "loss": 0.1752, "learning_rate": 3.8123055646233626e-06, "epoch": 0.3578666145375167, "percentage": 35.79, "elapsed_time": "2:09:05", "remaining_time": "3:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1374, "total_steps": 3836, "loss": 0.1711, "learning_rate": 3.810470577153212e-06, "epoch": 0.3581272602873619, "percentage": 35.82, "elapsed_time": "2:09:10", "remaining_time": "3:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1375, "total_steps": 3836, "loss": 0.1682, "learning_rate": 3.808634615657719e-06, "epoch": 0.35838790603720716, "percentage": 35.84, "elapsed_time": "2:09:16", "remaining_time": "3:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1376, "total_steps": 3836, "loss": 0.1719, "learning_rate": 3.8067976815014885e-06, "epoch": 0.3586485517870524, "percentage": 35.87, "elapsed_time": "2:09:21", "remaining_time": "3:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1377, "total_steps": 3836, "loss": 0.1602, "learning_rate": 3.804959776049846e-06, "epoch": 0.35890919753689765, "percentage": 35.9, "elapsed_time": "2:09:26", "remaining_time": "3:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1378, "total_steps": 3836, "loss": 0.1739, "learning_rate": 3.8031209006688397e-06, "epoch": 0.3591698432867429, "percentage": 35.92, "elapsed_time": "2:09:32", "remaining_time": "3:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1379, "total_steps": 3836, "loss": 0.1801, "learning_rate": 3.8012810567252404e-06, "epoch": 0.35943048903658814, "percentage": 35.95, "elapsed_time": "2:09:38", "remaining_time": "3:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 3836, "loss": 0.1758, "learning_rate": 3.7994402455865375e-06, "epoch": 0.3596911347864334, "percentage": 35.97, "elapsed_time": "2:09:44", "remaining_time": "3:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1381, "total_steps": 3836, "loss": 0.1743, "learning_rate": 3.7975984686209376e-06, "epoch": 0.35995178053627863, "percentage": 36.0, "elapsed_time": "2:09:49", "remaining_time": "3:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1382, "total_steps": 3836, "loss": 0.1722, "learning_rate": 3.795755727197368e-06, "epoch": 0.3602124262861239, "percentage": 36.03, "elapsed_time": "2:09:55", "remaining_time": "3:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1383, "total_steps": 3836, "loss": 0.1732, "learning_rate": 3.7939120226854724e-06, "epoch": 0.3604730720359691, "percentage": 36.05, "elapsed_time": "2:10:00", "remaining_time": "3:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1384, "total_steps": 3836, "loss": 0.1732, "learning_rate": 3.7920673564556083e-06, "epoch": 0.36073371778581437, "percentage": 36.08, "elapsed_time": "2:10:05", "remaining_time": "3:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1385, "total_steps": 3836, "loss": 0.1881, "learning_rate": 3.79022172987885e-06, "epoch": 0.3609943635356596, "percentage": 36.11, "elapsed_time": "2:10:10", "remaining_time": "3:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1386, "total_steps": 3836, "loss": 0.1687, "learning_rate": 3.788375144326985e-06, "epoch": 0.36125500928550486, "percentage": 36.13, "elapsed_time": "2:10:16", "remaining_time": "3:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1387, "total_steps": 3836, "loss": 0.1743, "learning_rate": 3.786527601172513e-06, "epoch": 0.3615156550353501, "percentage": 36.16, "elapsed_time": "2:10:22", "remaining_time": "3:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1388, "total_steps": 3836, "loss": 0.163, "learning_rate": 3.784679101788647e-06, "epoch": 0.36177630078519535, "percentage": 36.18, "elapsed_time": "2:10:27", "remaining_time": "3:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1389, "total_steps": 3836, "loss": 0.1676, "learning_rate": 3.782829647549308e-06, "epoch": 0.36203694653504054, "percentage": 36.21, "elapsed_time": "2:10:32", "remaining_time": "3:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 3836, "loss": 0.1951, "learning_rate": 3.78097923982913e-06, "epoch": 0.3622975922848858, "percentage": 36.24, "elapsed_time": "2:10:39", "remaining_time": "3:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1391, "total_steps": 3836, "loss": 0.1738, "learning_rate": 3.7791278800034532e-06, "epoch": 0.36255823803473103, "percentage": 36.26, "elapsed_time": "2:10:44", "remaining_time": "3:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1392, "total_steps": 3836, "loss": 0.1797, "learning_rate": 3.7772755694483265e-06, "epoch": 0.3628188837845763, "percentage": 36.29, "elapsed_time": "2:10:49", "remaining_time": "3:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1393, "total_steps": 3836, "loss": 0.1702, "learning_rate": 3.775422309540505e-06, "epoch": 0.3630795295344215, "percentage": 36.31, "elapsed_time": "2:10:55", "remaining_time": "3:49:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1394, "total_steps": 3836, "loss": 0.1798, "learning_rate": 3.7735681016574504e-06, "epoch": 0.36334017528426676, "percentage": 36.34, "elapsed_time": "2:11:00", "remaining_time": "3:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1395, "total_steps": 3836, "loss": 0.1909, "learning_rate": 3.7717129471773283e-06, "epoch": 0.363600821034112, "percentage": 36.37, "elapsed_time": "2:11:06", "remaining_time": "3:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1396, "total_steps": 3836, "loss": 0.1768, "learning_rate": 3.7698568474790064e-06, "epoch": 0.36386146678395725, "percentage": 36.39, "elapsed_time": "2:11:12", "remaining_time": "3:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1397, "total_steps": 3836, "loss": 0.1802, "learning_rate": 3.7679998039420586e-06, "epoch": 0.3641221125338025, "percentage": 36.42, "elapsed_time": "2:11:17", "remaining_time": "3:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1398, "total_steps": 3836, "loss": 0.1671, "learning_rate": 3.766141817946757e-06, "epoch": 0.36438275828364775, "percentage": 36.44, "elapsed_time": "2:11:23", "remaining_time": "3:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1399, "total_steps": 3836, "loss": 0.1726, "learning_rate": 3.7642828908740746e-06, "epoch": 0.364643404033493, "percentage": 36.47, "elapsed_time": "2:11:29", "remaining_time": "3:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 3836, "loss": 0.1726, "learning_rate": 3.7624230241056854e-06, "epoch": 0.36490404978333824, "percentage": 36.5, "elapsed_time": "2:11:34", "remaining_time": "3:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1401, "total_steps": 3836, "loss": 0.1758, "learning_rate": 3.760562219023962e-06, "epoch": 0.3651646955331835, "percentage": 36.52, "elapsed_time": "2:11:40", "remaining_time": "3:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1402, "total_steps": 3836, "loss": 0.1643, "learning_rate": 3.7587004770119716e-06, "epoch": 0.3654253412830287, "percentage": 36.55, "elapsed_time": "2:11:45", "remaining_time": "3:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1403, "total_steps": 3836, "loss": 0.1567, "learning_rate": 3.756837799453481e-06, "epoch": 0.36568598703287397, "percentage": 36.57, "elapsed_time": "2:11:51", "remaining_time": "3:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1404, "total_steps": 3836, "loss": 0.1608, "learning_rate": 3.7549741877329504e-06, "epoch": 0.36594663278271916, "percentage": 36.6, "elapsed_time": "2:11:57", "remaining_time": "3:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1405, "total_steps": 3836, "loss": 0.1724, "learning_rate": 3.7531096432355345e-06, "epoch": 0.3662072785325644, "percentage": 36.63, "elapsed_time": "2:12:03", "remaining_time": "3:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1406, "total_steps": 3836, "loss": 0.1632, "learning_rate": 3.7512441673470836e-06, "epoch": 0.36646792428240965, "percentage": 36.65, "elapsed_time": "2:12:08", "remaining_time": "3:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1407, "total_steps": 3836, "loss": 0.1751, "learning_rate": 3.749377761454136e-06, "epoch": 0.3667285700322549, "percentage": 36.68, "elapsed_time": "2:12:14", "remaining_time": "3:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1408, "total_steps": 3836, "loss": 0.1832, "learning_rate": 3.747510426943925e-06, "epoch": 0.36698921578210014, "percentage": 36.7, "elapsed_time": "2:12:20", "remaining_time": "3:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1409, "total_steps": 3836, "loss": 0.1657, "learning_rate": 3.7456421652043727e-06, "epoch": 0.3672498615319454, "percentage": 36.73, "elapsed_time": "2:12:25", "remaining_time": "3:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 3836, "loss": 0.1655, "learning_rate": 3.7437729776240894e-06, "epoch": 0.36751050728179063, "percentage": 36.76, "elapsed_time": "2:12:30", "remaining_time": "3:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1411, "total_steps": 3836, "loss": 0.1985, "learning_rate": 3.741902865592376e-06, "epoch": 0.3677711530316359, "percentage": 36.78, "elapsed_time": "2:12:36", "remaining_time": "3:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1412, "total_steps": 3836, "loss": 0.1598, "learning_rate": 3.740031830499219e-06, "epoch": 0.3680317987814811, "percentage": 36.81, "elapsed_time": "2:12:42", "remaining_time": "3:47:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1413, "total_steps": 3836, "loss": 0.1795, "learning_rate": 3.738159873735289e-06, "epoch": 0.36829244453132637, "percentage": 36.84, "elapsed_time": "2:12:47", "remaining_time": "3:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1414, "total_steps": 3836, "loss": 0.1644, "learning_rate": 3.7362869966919467e-06, "epoch": 0.3685530902811716, "percentage": 36.86, "elapsed_time": "2:12:52", "remaining_time": "3:47:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1415, "total_steps": 3836, "loss": 0.1841, "learning_rate": 3.7344132007612317e-06, "epoch": 0.36881373603101686, "percentage": 36.89, "elapsed_time": "2:12:58", "remaining_time": "3:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1416, "total_steps": 3836, "loss": 0.1766, "learning_rate": 3.7325384873358695e-06, "epoch": 0.3690743817808621, "percentage": 36.91, "elapsed_time": "2:13:03", "remaining_time": "3:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1417, "total_steps": 3836, "loss": 0.1791, "learning_rate": 3.730662857809266e-06, "epoch": 0.36933502753070735, "percentage": 36.94, "elapsed_time": "2:13:09", "remaining_time": "3:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1418, "total_steps": 3836, "loss": 0.1672, "learning_rate": 3.7287863135755098e-06, "epoch": 0.3695956732805526, "percentage": 36.97, "elapsed_time": "2:13:15", "remaining_time": "3:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1419, "total_steps": 3836, "loss": 0.174, "learning_rate": 3.7269088560293677e-06, "epoch": 0.3698563190303978, "percentage": 36.99, "elapsed_time": "2:13:21", "remaining_time": "3:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 3836, "loss": 0.1677, "learning_rate": 3.7250304865662857e-06, "epoch": 0.37011696478024303, "percentage": 37.02, "elapsed_time": "2:13:26", "remaining_time": "3:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1421, "total_steps": 3836, "loss": 0.1732, "learning_rate": 3.723151206582388e-06, "epoch": 0.3703776105300883, "percentage": 37.04, "elapsed_time": "2:13:32", "remaining_time": "3:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1422, "total_steps": 3836, "loss": 0.176, "learning_rate": 3.7212710174744753e-06, "epoch": 0.3706382562799335, "percentage": 37.07, "elapsed_time": "2:13:37", "remaining_time": "3:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1423, "total_steps": 3836, "loss": 0.1826, "learning_rate": 3.719389920640025e-06, "epoch": 0.37089890202977877, "percentage": 37.1, "elapsed_time": "2:13:42", "remaining_time": "3:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1424, "total_steps": 3836, "loss": 0.1611, "learning_rate": 3.7175079174771872e-06, "epoch": 0.371159547779624, "percentage": 37.12, "elapsed_time": "2:13:48", "remaining_time": "3:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1425, "total_steps": 3836, "loss": 0.1692, "learning_rate": 3.7156250093847868e-06, "epoch": 0.37142019352946926, "percentage": 37.15, "elapsed_time": "2:13:54", "remaining_time": "3:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1426, "total_steps": 3836, "loss": 0.1602, "learning_rate": 3.713741197762323e-06, "epoch": 0.3716808392793145, "percentage": 37.17, "elapsed_time": "2:13:59", "remaining_time": "3:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1427, "total_steps": 3836, "loss": 0.1709, "learning_rate": 3.711856484009961e-06, "epoch": 0.37194148502915975, "percentage": 37.2, "elapsed_time": "2:14:06", "remaining_time": "3:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1428, "total_steps": 3836, "loss": 0.1657, "learning_rate": 3.7099708695285436e-06, "epoch": 0.372202130779005, "percentage": 37.23, "elapsed_time": "2:14:11", "remaining_time": "3:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1429, "total_steps": 3836, "loss": 0.1702, "learning_rate": 3.70808435571958e-06, "epoch": 0.37246277652885024, "percentage": 37.25, "elapsed_time": "2:14:17", "remaining_time": "3:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 3836, "loss": 0.1853, "learning_rate": 3.706196943985245e-06, "epoch": 0.3727234222786955, "percentage": 37.28, "elapsed_time": "2:14:23", "remaining_time": "3:46:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1431, "total_steps": 3836, "loss": 0.1667, "learning_rate": 3.704308635728385e-06, "epoch": 0.3729840680285407, "percentage": 37.3, "elapsed_time": "2:14:28", "remaining_time": "3:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1432, "total_steps": 3836, "loss": 0.172, "learning_rate": 3.7024194323525115e-06, "epoch": 0.373244713778386, "percentage": 37.33, "elapsed_time": "2:14:34", "remaining_time": "3:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1433, "total_steps": 3836, "loss": 0.1691, "learning_rate": 3.7005293352618e-06, "epoch": 0.3735053595282312, "percentage": 37.36, "elapsed_time": "2:14:40", "remaining_time": "3:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1434, "total_steps": 3836, "loss": 0.1872, "learning_rate": 3.6986383458610925e-06, "epoch": 0.3737660052780764, "percentage": 37.38, "elapsed_time": "2:14:46", "remaining_time": "3:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1435, "total_steps": 3836, "loss": 0.1599, "learning_rate": 3.6967464655558916e-06, "epoch": 0.37402665102792165, "percentage": 37.41, "elapsed_time": "2:14:51", "remaining_time": "3:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1436, "total_steps": 3836, "loss": 0.1614, "learning_rate": 3.694853695752364e-06, "epoch": 0.3742872967777669, "percentage": 37.43, "elapsed_time": "2:14:56", "remaining_time": "3:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1437, "total_steps": 3836, "loss": 0.1717, "learning_rate": 3.6929600378573373e-06, "epoch": 0.37454794252761214, "percentage": 37.46, "elapsed_time": "2:15:01", "remaining_time": "3:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1438, "total_steps": 3836, "loss": 0.1544, "learning_rate": 3.6910654932782984e-06, "epoch": 0.3748085882774574, "percentage": 37.49, "elapsed_time": "2:15:07", "remaining_time": "3:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1439, "total_steps": 3836, "loss": 0.1757, "learning_rate": 3.689170063423394e-06, "epoch": 0.37506923402730263, "percentage": 37.51, "elapsed_time": "2:15:12", "remaining_time": "3:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 3836, "loss": 0.1699, "learning_rate": 3.6872737497014286e-06, "epoch": 0.3753298797771479, "percentage": 37.54, "elapsed_time": "2:15:18", "remaining_time": "3:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1441, "total_steps": 3836, "loss": 0.1719, "learning_rate": 3.6853765535218632e-06, "epoch": 0.3755905255269931, "percentage": 37.57, "elapsed_time": "2:15:24", "remaining_time": "3:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1442, "total_steps": 3836, "loss": 0.1694, "learning_rate": 3.6834784762948156e-06, "epoch": 0.37585117127683837, "percentage": 37.59, "elapsed_time": "2:15:29", "remaining_time": "3:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1443, "total_steps": 3836, "loss": 0.1832, "learning_rate": 3.6815795194310567e-06, "epoch": 0.3761118170266836, "percentage": 37.62, "elapsed_time": "2:15:34", "remaining_time": "3:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1444, "total_steps": 3836, "loss": 0.1828, "learning_rate": 3.6796796843420134e-06, "epoch": 0.37637246277652886, "percentage": 37.64, "elapsed_time": "2:15:40", "remaining_time": "3:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1445, "total_steps": 3836, "loss": 0.168, "learning_rate": 3.677778972439765e-06, "epoch": 0.3766331085263741, "percentage": 37.67, "elapsed_time": "2:15:45", "remaining_time": "3:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1446, "total_steps": 3836, "loss": 0.1802, "learning_rate": 3.67587738513704e-06, "epoch": 0.37689375427621935, "percentage": 37.7, "elapsed_time": "2:15:51", "remaining_time": "3:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1447, "total_steps": 3836, "loss": 0.1785, "learning_rate": 3.6739749238472207e-06, "epoch": 0.3771544000260646, "percentage": 37.72, "elapsed_time": "2:15:56", "remaining_time": "3:44:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1448, "total_steps": 3836, "loss": 0.1804, "learning_rate": 3.672071589984337e-06, "epoch": 0.37741504577590984, "percentage": 37.75, "elapsed_time": "2:16:02", "remaining_time": "3:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1449, "total_steps": 3836, "loss": 0.1629, "learning_rate": 3.670167384963069e-06, "epoch": 0.37767569152575503, "percentage": 37.77, "elapsed_time": "2:16:07", "remaining_time": "3:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 3836, "loss": 0.1666, "learning_rate": 3.6682623101987423e-06, "epoch": 0.3779363372756003, "percentage": 37.8, "elapsed_time": "2:16:13", "remaining_time": "3:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1451, "total_steps": 3836, "loss": 0.1658, "learning_rate": 3.6663563671073317e-06, "epoch": 0.3781969830254455, "percentage": 37.83, "elapsed_time": "2:16:18", "remaining_time": "3:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1452, "total_steps": 3836, "loss": 0.1812, "learning_rate": 3.664449557105454e-06, "epoch": 0.37845762877529077, "percentage": 37.85, "elapsed_time": "2:16:24", "remaining_time": "3:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1453, "total_steps": 3836, "loss": 0.157, "learning_rate": 3.662541881610372e-06, "epoch": 0.378718274525136, "percentage": 37.88, "elapsed_time": "2:16:30", "remaining_time": "3:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1454, "total_steps": 3836, "loss": 0.1782, "learning_rate": 3.6606333420399933e-06, "epoch": 0.37897892027498126, "percentage": 37.9, "elapsed_time": "2:16:36", "remaining_time": "3:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1455, "total_steps": 3836, "loss": 0.1623, "learning_rate": 3.6587239398128644e-06, "epoch": 0.3792395660248265, "percentage": 37.93, "elapsed_time": "2:16:41", "remaining_time": "3:43:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1456, "total_steps": 3836, "loss": 0.1601, "learning_rate": 3.6568136763481766e-06, "epoch": 0.37950021177467175, "percentage": 37.96, "elapsed_time": "2:16:47", "remaining_time": "3:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1457, "total_steps": 3836, "loss": 0.1687, "learning_rate": 3.6549025530657588e-06, "epoch": 0.379760857524517, "percentage": 37.98, "elapsed_time": "2:16:52", "remaining_time": "3:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1458, "total_steps": 3836, "loss": 0.1908, "learning_rate": 3.652990571386079e-06, "epoch": 0.38002150327436224, "percentage": 38.01, "elapsed_time": "2:16:58", "remaining_time": "3:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1459, "total_steps": 3836, "loss": 0.1615, "learning_rate": 3.6510777327302455e-06, "epoch": 0.3802821490242075, "percentage": 38.03, "elapsed_time": "2:17:03", "remaining_time": "3:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 3836, "loss": 0.1833, "learning_rate": 3.649164038520001e-06, "epoch": 0.38054279477405273, "percentage": 38.06, "elapsed_time": "2:17:09", "remaining_time": "3:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1461, "total_steps": 3836, "loss": 0.173, "learning_rate": 3.6472494901777255e-06, "epoch": 0.380803440523898, "percentage": 38.09, "elapsed_time": "2:17:14", "remaining_time": "3:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1462, "total_steps": 3836, "loss": 0.1735, "learning_rate": 3.6453340891264344e-06, "epoch": 0.3810640862737432, "percentage": 38.11, "elapsed_time": "2:17:19", "remaining_time": "3:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1463, "total_steps": 3836, "loss": 0.1764, "learning_rate": 3.643417836789774e-06, "epoch": 0.38132473202358846, "percentage": 38.14, "elapsed_time": "2:17:24", "remaining_time": "3:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1464, "total_steps": 3836, "loss": 0.1733, "learning_rate": 3.641500734592026e-06, "epoch": 0.3815853777734337, "percentage": 38.16, "elapsed_time": "2:17:30", "remaining_time": "3:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1465, "total_steps": 3836, "loss": 0.1753, "learning_rate": 3.6395827839581046e-06, "epoch": 0.3818460235232789, "percentage": 38.19, "elapsed_time": "2:17:35", "remaining_time": "3:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1466, "total_steps": 3836, "loss": 0.1812, "learning_rate": 3.63766398631355e-06, "epoch": 0.38210666927312414, "percentage": 38.22, "elapsed_time": "2:17:41", "remaining_time": "3:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1467, "total_steps": 3836, "loss": 0.1697, "learning_rate": 3.6357443430845383e-06, "epoch": 0.3823673150229694, "percentage": 38.24, "elapsed_time": "2:17:46", "remaining_time": "3:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1468, "total_steps": 3836, "loss": 0.1708, "learning_rate": 3.633823855697869e-06, "epoch": 0.38262796077281463, "percentage": 38.27, "elapsed_time": "2:17:52", "remaining_time": "3:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1469, "total_steps": 3836, "loss": 0.1734, "learning_rate": 3.631902525580971e-06, "epoch": 0.3828886065226599, "percentage": 38.3, "elapsed_time": "2:17:57", "remaining_time": "3:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 3836, "loss": 0.1751, "learning_rate": 3.6299803541619e-06, "epoch": 0.3831492522725051, "percentage": 38.32, "elapsed_time": "2:18:03", "remaining_time": "3:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1471, "total_steps": 3836, "loss": 0.1802, "learning_rate": 3.6280573428693354e-06, "epoch": 0.38340989802235037, "percentage": 38.35, "elapsed_time": "2:18:09", "remaining_time": "3:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1472, "total_steps": 3836, "loss": 0.1697, "learning_rate": 3.6261334931325833e-06, "epoch": 0.3836705437721956, "percentage": 38.37, "elapsed_time": "2:18:14", "remaining_time": "3:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1473, "total_steps": 3836, "loss": 0.1777, "learning_rate": 3.6242088063815705e-06, "epoch": 0.38393118952204086, "percentage": 38.4, "elapsed_time": "2:18:19", "remaining_time": "3:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1474, "total_steps": 3836, "loss": 0.1608, "learning_rate": 3.622283284046847e-06, "epoch": 0.3841918352718861, "percentage": 38.43, "elapsed_time": "2:18:24", "remaining_time": "3:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1475, "total_steps": 3836, "loss": 0.1767, "learning_rate": 3.620356927559585e-06, "epoch": 0.38445248102173135, "percentage": 38.45, "elapsed_time": "2:18:30", "remaining_time": "3:41:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1476, "total_steps": 3836, "loss": 0.1772, "learning_rate": 3.618429738351574e-06, "epoch": 0.3847131267715766, "percentage": 38.48, "elapsed_time": "2:18:35", "remaining_time": "3:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1477, "total_steps": 3836, "loss": 0.1711, "learning_rate": 3.6165017178552252e-06, "epoch": 0.38497377252142184, "percentage": 38.5, "elapsed_time": "2:18:41", "remaining_time": "3:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1478, "total_steps": 3836, "loss": 0.1775, "learning_rate": 3.6145728675035658e-06, "epoch": 0.3852344182712671, "percentage": 38.53, "elapsed_time": "2:18:46", "remaining_time": "3:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1479, "total_steps": 3836, "loss": 0.1799, "learning_rate": 3.6126431887302397e-06, "epoch": 0.38549506402111233, "percentage": 38.56, "elapsed_time": "2:18:52", "remaining_time": "3:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 3836, "loss": 0.1704, "learning_rate": 3.6107126829695093e-06, "epoch": 0.3857557097709575, "percentage": 38.58, "elapsed_time": "2:18:57", "remaining_time": "3:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1481, "total_steps": 3836, "loss": 0.1628, "learning_rate": 3.608781351656249e-06, "epoch": 0.38601635552080277, "percentage": 38.61, "elapsed_time": "2:19:02", "remaining_time": "3:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1482, "total_steps": 3836, "loss": 0.1718, "learning_rate": 3.6068491962259457e-06, "epoch": 0.386277001270648, "percentage": 38.63, "elapsed_time": "2:19:08", "remaining_time": "3:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1483, "total_steps": 3836, "loss": 0.1673, "learning_rate": 3.604916218114702e-06, "epoch": 0.38653764702049326, "percentage": 38.66, "elapsed_time": "2:19:13", "remaining_time": "3:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1484, "total_steps": 3836, "loss": 0.1698, "learning_rate": 3.6029824187592304e-06, "epoch": 0.3867982927703385, "percentage": 38.69, "elapsed_time": "2:19:19", "remaining_time": "3:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1485, "total_steps": 3836, "loss": 0.1757, "learning_rate": 3.6010477995968548e-06, "epoch": 0.38705893852018375, "percentage": 38.71, "elapsed_time": "2:19:24", "remaining_time": "3:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1486, "total_steps": 3836, "loss": 0.171, "learning_rate": 3.599112362065506e-06, "epoch": 0.387319584270029, "percentage": 38.74, "elapsed_time": "2:19:30", "remaining_time": "3:40:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1487, "total_steps": 3836, "loss": 0.1775, "learning_rate": 3.5971761076037256e-06, "epoch": 0.38758023001987424, "percentage": 38.76, "elapsed_time": "2:19:35", "remaining_time": "3:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1488, "total_steps": 3836, "loss": 0.1659, "learning_rate": 3.5952390376506614e-06, "epoch": 0.3878408757697195, "percentage": 38.79, "elapsed_time": "2:19:41", "remaining_time": "3:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1489, "total_steps": 3836, "loss": 0.1762, "learning_rate": 3.593301153646067e-06, "epoch": 0.38810152151956473, "percentage": 38.82, "elapsed_time": "2:19:47", "remaining_time": "3:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 3836, "loss": 0.189, "learning_rate": 3.591362457030302e-06, "epoch": 0.38836216726941, "percentage": 38.84, "elapsed_time": "2:19:53", "remaining_time": "3:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1491, "total_steps": 3836, "loss": 0.1651, "learning_rate": 3.5894229492443284e-06, "epoch": 0.3886228130192552, "percentage": 38.87, "elapsed_time": "2:19:59", "remaining_time": "3:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1492, "total_steps": 3836, "loss": 0.1846, "learning_rate": 3.5874826317297135e-06, "epoch": 0.38888345876910047, "percentage": 38.89, "elapsed_time": "2:20:05", "remaining_time": "3:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1493, "total_steps": 3836, "loss": 0.1738, "learning_rate": 3.585541505928624e-06, "epoch": 0.3891441045189457, "percentage": 38.92, "elapsed_time": "2:20:11", "remaining_time": "3:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1494, "total_steps": 3836, "loss": 0.1846, "learning_rate": 3.5835995732838292e-06, "epoch": 0.38940475026879096, "percentage": 38.95, "elapsed_time": "2:20:16", "remaining_time": "3:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1495, "total_steps": 3836, "loss": 0.1695, "learning_rate": 3.581656835238697e-06, "epoch": 0.38966539601863615, "percentage": 38.97, "elapsed_time": "2:20:22", "remaining_time": "3:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1496, "total_steps": 3836, "loss": 0.1613, "learning_rate": 3.579713293237194e-06, "epoch": 0.3899260417684814, "percentage": 39.0, "elapsed_time": "2:20:28", "remaining_time": "3:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1497, "total_steps": 3836, "loss": 0.1513, "learning_rate": 3.577768948723885e-06, "epoch": 0.39018668751832664, "percentage": 39.03, "elapsed_time": "2:20:33", "remaining_time": "3:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1498, "total_steps": 3836, "loss": 0.1804, "learning_rate": 3.5758238031439306e-06, "epoch": 0.3904473332681719, "percentage": 39.05, "elapsed_time": "2:20:39", "remaining_time": "3:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1499, "total_steps": 3836, "loss": 0.1683, "learning_rate": 3.5738778579430867e-06, "epoch": 0.3907079790180171, "percentage": 39.08, "elapsed_time": "2:20:44", "remaining_time": "3:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 3836, "loss": 0.1704, "learning_rate": 3.5719311145677057e-06, "epoch": 0.39096862476786237, "percentage": 39.1, "elapsed_time": "2:20:50", "remaining_time": "3:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 3836, "eval_loss": 0.17104974389076233, "epoch": 0.39096862476786237, "percentage": 39.1, "elapsed_time": "2:21:45", "remaining_time": "3:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1501, "total_steps": 3836, "loss": 0.1827, "learning_rate": 3.5699835744647293e-06, "epoch": 0.3912292705177076, "percentage": 39.13, "elapsed_time": "2:21:50", "remaining_time": "3:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1502, "total_steps": 3836, "loss": 0.1736, "learning_rate": 3.5680352390816942e-06, "epoch": 0.39148991626755286, "percentage": 39.16, "elapsed_time": "2:21:56", "remaining_time": "3:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1503, "total_steps": 3836, "loss": 0.1622, "learning_rate": 3.566086109866729e-06, "epoch": 0.3917505620173981, "percentage": 39.18, "elapsed_time": "2:22:02", "remaining_time": "3:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1504, "total_steps": 3836, "loss": 0.168, "learning_rate": 3.5641361882685487e-06, "epoch": 0.39201120776724335, "percentage": 39.21, "elapsed_time": "2:22:07", "remaining_time": "3:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1505, "total_steps": 3836, "loss": 0.1764, "learning_rate": 3.562185475736461e-06, "epoch": 0.3922718535170886, "percentage": 39.23, "elapsed_time": "2:22:13", "remaining_time": "3:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1506, "total_steps": 3836, "loss": 0.1622, "learning_rate": 3.5602339737203593e-06, "epoch": 0.39253249926693384, "percentage": 39.26, "elapsed_time": "2:22:19", "remaining_time": "3:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1507, "total_steps": 3836, "loss": 0.1702, "learning_rate": 3.5582816836707248e-06, "epoch": 0.3927931450167791, "percentage": 39.29, "elapsed_time": "2:22:24", "remaining_time": "3:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1508, "total_steps": 3836, "loss": 0.1825, "learning_rate": 3.5563286070386237e-06, "epoch": 0.39305379076662433, "percentage": 39.31, "elapsed_time": "2:22:29", "remaining_time": "3:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1509, "total_steps": 3836, "loss": 0.1854, "learning_rate": 3.5543747452757067e-06, "epoch": 0.3933144365164696, "percentage": 39.34, "elapsed_time": "2:22:35", "remaining_time": "3:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 3836, "loss": 0.1804, "learning_rate": 3.5524200998342095e-06, "epoch": 0.39357508226631477, "percentage": 39.36, "elapsed_time": "2:22:40", "remaining_time": "3:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1511, "total_steps": 3836, "loss": 0.1651, "learning_rate": 3.5504646721669484e-06, "epoch": 0.39383572801616, "percentage": 39.39, "elapsed_time": "2:22:46", "remaining_time": "3:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1512, "total_steps": 3836, "loss": 0.1834, "learning_rate": 3.5485084637273225e-06, "epoch": 0.39409637376600526, "percentage": 39.42, "elapsed_time": "2:22:51", "remaining_time": "3:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1513, "total_steps": 3836, "loss": 0.1704, "learning_rate": 3.546551475969311e-06, "epoch": 0.3943570195158505, "percentage": 39.44, "elapsed_time": "2:22:56", "remaining_time": "3:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1514, "total_steps": 3836, "loss": 0.1618, "learning_rate": 3.5445937103474713e-06, "epoch": 0.39461766526569575, "percentage": 39.47, "elapsed_time": "2:23:02", "remaining_time": "3:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1515, "total_steps": 3836, "loss": 0.1657, "learning_rate": 3.5426351683169397e-06, "epoch": 0.394878311015541, "percentage": 39.49, "elapsed_time": "2:23:07", "remaining_time": "3:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1516, "total_steps": 3836, "loss": 0.1735, "learning_rate": 3.5406758513334316e-06, "epoch": 0.39513895676538624, "percentage": 39.52, "elapsed_time": "2:23:12", "remaining_time": "3:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1517, "total_steps": 3836, "loss": 0.1672, "learning_rate": 3.538715760853233e-06, "epoch": 0.3953996025152315, "percentage": 39.55, "elapsed_time": "2:23:17", "remaining_time": "3:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1518, "total_steps": 3836, "loss": 0.1655, "learning_rate": 3.536754898333211e-06, "epoch": 0.39566024826507673, "percentage": 39.57, "elapsed_time": "2:23:22", "remaining_time": "3:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1519, "total_steps": 3836, "loss": 0.1531, "learning_rate": 3.5347932652308025e-06, "epoch": 0.395920894014922, "percentage": 39.6, "elapsed_time": "2:23:28", "remaining_time": "3:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 3836, "loss": 0.1522, "learning_rate": 3.532830863004018e-06, "epoch": 0.3961815397647672, "percentage": 39.62, "elapsed_time": "2:23:33", "remaining_time": "3:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1521, "total_steps": 3836, "loss": 0.1618, "learning_rate": 3.5308676931114415e-06, "epoch": 0.39644218551461247, "percentage": 39.65, "elapsed_time": "2:23:40", "remaining_time": "3:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1522, "total_steps": 3836, "loss": 0.1707, "learning_rate": 3.5289037570122246e-06, "epoch": 0.3967028312644577, "percentage": 39.68, "elapsed_time": "2:23:45", "remaining_time": "3:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1523, "total_steps": 3836, "loss": 0.1489, "learning_rate": 3.526939056166091e-06, "epoch": 0.39696347701430296, "percentage": 39.7, "elapsed_time": "2:23:50", "remaining_time": "3:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1524, "total_steps": 3836, "loss": 0.166, "learning_rate": 3.5249735920333312e-06, "epoch": 0.3972241227641482, "percentage": 39.73, "elapsed_time": "2:23:55", "remaining_time": "3:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1525, "total_steps": 3836, "loss": 0.1602, "learning_rate": 3.523007366074804e-06, "epoch": 0.3974847685139934, "percentage": 39.75, "elapsed_time": "2:24:01", "remaining_time": "3:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1526, "total_steps": 3836, "loss": 0.16, "learning_rate": 3.521040379751933e-06, "epoch": 0.39774541426383864, "percentage": 39.78, "elapsed_time": "2:24:06", "remaining_time": "3:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1527, "total_steps": 3836, "loss": 0.167, "learning_rate": 3.519072634526709e-06, "epoch": 0.3980060600136839, "percentage": 39.81, "elapsed_time": "2:24:11", "remaining_time": "3:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1528, "total_steps": 3836, "loss": 0.1709, "learning_rate": 3.517104131861685e-06, "epoch": 0.3982667057635291, "percentage": 39.83, "elapsed_time": "2:24:17", "remaining_time": "3:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1529, "total_steps": 3836, "loss": 0.1814, "learning_rate": 3.5151348732199776e-06, "epoch": 0.3985273515133744, "percentage": 39.86, "elapsed_time": "2:24:23", "remaining_time": "3:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 3836, "loss": 0.1707, "learning_rate": 3.513164860065267e-06, "epoch": 0.3987879972632196, "percentage": 39.89, "elapsed_time": "2:24:28", "remaining_time": "3:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1531, "total_steps": 3836, "loss": 0.1658, "learning_rate": 3.5111940938617904e-06, "epoch": 0.39904864301306486, "percentage": 39.91, "elapsed_time": "2:24:34", "remaining_time": "3:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1532, "total_steps": 3836, "loss": 0.1785, "learning_rate": 3.509222576074349e-06, "epoch": 0.3993092887629101, "percentage": 39.94, "elapsed_time": "2:24:39", "remaining_time": "3:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1533, "total_steps": 3836, "loss": 0.1762, "learning_rate": 3.5072503081682995e-06, "epoch": 0.39956993451275535, "percentage": 39.96, "elapsed_time": "2:24:44", "remaining_time": "3:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1534, "total_steps": 3836, "loss": 0.16, "learning_rate": 3.5052772916095584e-06, "epoch": 0.3998305802626006, "percentage": 39.99, "elapsed_time": "2:24:49", "remaining_time": "3:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1535, "total_steps": 3836, "loss": 0.162, "learning_rate": 3.5033035278645955e-06, "epoch": 0.40009122601244584, "percentage": 40.02, "elapsed_time": "2:24:55", "remaining_time": "3:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1536, "total_steps": 3836, "loss": 0.1657, "learning_rate": 3.50132901840044e-06, "epoch": 0.4003518717622911, "percentage": 40.04, "elapsed_time": "2:25:01", "remaining_time": "3:37:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1537, "total_steps": 3836, "loss": 0.1584, "learning_rate": 3.499353764684672e-06, "epoch": 0.40061251751213633, "percentage": 40.07, "elapsed_time": "2:25:06", "remaining_time": "3:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1538, "total_steps": 3836, "loss": 0.1615, "learning_rate": 3.4973777681854265e-06, "epoch": 0.4008731632619816, "percentage": 40.09, "elapsed_time": "2:25:12", "remaining_time": "3:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1539, "total_steps": 3836, "loss": 0.1895, "learning_rate": 3.4954010303713902e-06, "epoch": 0.4011338090118268, "percentage": 40.12, "elapsed_time": "2:25:17", "remaining_time": "3:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 3836, "loss": 0.1668, "learning_rate": 3.4934235527118e-06, "epoch": 0.401394454761672, "percentage": 40.15, "elapsed_time": "2:25:23", "remaining_time": "3:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1541, "total_steps": 3836, "loss": 0.1746, "learning_rate": 3.4914453366764455e-06, "epoch": 0.40165510051151726, "percentage": 40.17, "elapsed_time": "2:25:29", "remaining_time": "3:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1542, "total_steps": 3836, "loss": 0.165, "learning_rate": 3.4894663837356607e-06, "epoch": 0.4019157462613625, "percentage": 40.2, "elapsed_time": "2:25:35", "remaining_time": "3:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1543, "total_steps": 3836, "loss": 0.1692, "learning_rate": 3.487486695360331e-06, "epoch": 0.40217639201120775, "percentage": 40.22, "elapsed_time": "2:25:41", "remaining_time": "3:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1544, "total_steps": 3836, "loss": 0.1628, "learning_rate": 3.485506273021887e-06, "epoch": 0.402437037761053, "percentage": 40.25, "elapsed_time": "2:25:46", "remaining_time": "3:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1545, "total_steps": 3836, "loss": 0.1462, "learning_rate": 3.483525118192304e-06, "epoch": 0.40269768351089824, "percentage": 40.28, "elapsed_time": "2:25:52", "remaining_time": "3:36:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1546, "total_steps": 3836, "loss": 0.1841, "learning_rate": 3.4815432323441043e-06, "epoch": 0.4029583292607435, "percentage": 40.3, "elapsed_time": "2:25:57", "remaining_time": "3:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1547, "total_steps": 3836, "loss": 0.1802, "learning_rate": 3.4795606169503506e-06, "epoch": 0.40321897501058873, "percentage": 40.33, "elapsed_time": "2:26:02", "remaining_time": "3:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1548, "total_steps": 3836, "loss": 0.1819, "learning_rate": 3.47757727348465e-06, "epoch": 0.403479620760434, "percentage": 40.35, "elapsed_time": "2:26:08", "remaining_time": "3:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1549, "total_steps": 3836, "loss": 0.1706, "learning_rate": 3.4755932034211493e-06, "epoch": 0.4037402665102792, "percentage": 40.38, "elapsed_time": "2:26:13", "remaining_time": "3:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 3836, "loss": 0.161, "learning_rate": 3.4736084082345355e-06, "epoch": 0.40400091226012447, "percentage": 40.41, "elapsed_time": "2:26:19", "remaining_time": "3:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1551, "total_steps": 3836, "loss": 0.1765, "learning_rate": 3.4716228894000366e-06, "epoch": 0.4042615580099697, "percentage": 40.43, "elapsed_time": "2:26:25", "remaining_time": "3:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1552, "total_steps": 3836, "loss": 0.1689, "learning_rate": 3.4696366483934156e-06, "epoch": 0.40452220375981496, "percentage": 40.46, "elapsed_time": "2:26:31", "remaining_time": "3:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1553, "total_steps": 3836, "loss": 0.1891, "learning_rate": 3.4676496866909736e-06, "epoch": 0.4047828495096602, "percentage": 40.48, "elapsed_time": "2:26:36", "remaining_time": "3:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1554, "total_steps": 3836, "loss": 0.1812, "learning_rate": 3.465662005769548e-06, "epoch": 0.40504349525950545, "percentage": 40.51, "elapsed_time": "2:26:42", "remaining_time": "3:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1555, "total_steps": 3836, "loss": 0.1821, "learning_rate": 3.463673607106509e-06, "epoch": 0.4053041410093507, "percentage": 40.54, "elapsed_time": "2:26:48", "remaining_time": "3:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1556, "total_steps": 3836, "loss": 0.185, "learning_rate": 3.461684492179763e-06, "epoch": 0.4055647867591959, "percentage": 40.56, "elapsed_time": "2:26:54", "remaining_time": "3:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1557, "total_steps": 3836, "loss": 0.177, "learning_rate": 3.459694662467745e-06, "epoch": 0.40582543250904113, "percentage": 40.59, "elapsed_time": "2:26:59", "remaining_time": "3:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1558, "total_steps": 3836, "loss": 0.1535, "learning_rate": 3.4577041194494253e-06, "epoch": 0.4060860782588864, "percentage": 40.62, "elapsed_time": "2:27:05", "remaining_time": "3:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1559, "total_steps": 3836, "loss": 0.1612, "learning_rate": 3.455712864604302e-06, "epoch": 0.4063467240087316, "percentage": 40.64, "elapsed_time": "2:27:10", "remaining_time": "3:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 3836, "loss": 0.1531, "learning_rate": 3.4537208994124015e-06, "epoch": 0.40660736975857686, "percentage": 40.67, "elapsed_time": "2:27:16", "remaining_time": "3:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1561, "total_steps": 3836, "loss": 0.1656, "learning_rate": 3.4517282253542806e-06, "epoch": 0.4068680155084221, "percentage": 40.69, "elapsed_time": "2:27:22", "remaining_time": "3:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1562, "total_steps": 3836, "loss": 0.157, "learning_rate": 3.449734843911022e-06, "epoch": 0.40712866125826735, "percentage": 40.72, "elapsed_time": "2:27:28", "remaining_time": "3:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1563, "total_steps": 3836, "loss": 0.1705, "learning_rate": 3.4477407565642333e-06, "epoch": 0.4073893070081126, "percentage": 40.75, "elapsed_time": "2:27:33", "remaining_time": "3:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1564, "total_steps": 3836, "loss": 0.1472, "learning_rate": 3.4457459647960477e-06, "epoch": 0.40764995275795785, "percentage": 40.77, "elapsed_time": "2:27:38", "remaining_time": "3:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1565, "total_steps": 3836, "loss": 0.1835, "learning_rate": 3.4437504700891215e-06, "epoch": 0.4079105985078031, "percentage": 40.8, "elapsed_time": "2:27:44", "remaining_time": "3:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1566, "total_steps": 3836, "loss": 0.1701, "learning_rate": 3.441754273926634e-06, "epoch": 0.40817124425764834, "percentage": 40.82, "elapsed_time": "2:27:50", "remaining_time": "3:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1567, "total_steps": 3836, "loss": 0.1738, "learning_rate": 3.4397573777922853e-06, "epoch": 0.4084318900074936, "percentage": 40.85, "elapsed_time": "2:27:55", "remaining_time": "3:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1568, "total_steps": 3836, "loss": 0.162, "learning_rate": 3.4377597831702962e-06, "epoch": 0.4086925357573388, "percentage": 40.88, "elapsed_time": "2:28:00", "remaining_time": "3:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1569, "total_steps": 3836, "loss": 0.1626, "learning_rate": 3.435761491545407e-06, "epoch": 0.40895318150718407, "percentage": 40.9, "elapsed_time": "2:28:06", "remaining_time": "3:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 3836, "loss": 0.1712, "learning_rate": 3.433762504402874e-06, "epoch": 0.4092138272570293, "percentage": 40.93, "elapsed_time": "2:28:12", "remaining_time": "3:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1571, "total_steps": 3836, "loss": 0.1556, "learning_rate": 3.4317628232284734e-06, "epoch": 0.4094744730068745, "percentage": 40.95, "elapsed_time": "2:28:17", "remaining_time": "3:33:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1572, "total_steps": 3836, "loss": 0.1777, "learning_rate": 3.429762449508495e-06, "epoch": 0.40973511875671975, "percentage": 40.98, "elapsed_time": "2:28:23", "remaining_time": "3:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1573, "total_steps": 3836, "loss": 0.1744, "learning_rate": 3.427761384729744e-06, "epoch": 0.409995764506565, "percentage": 41.01, "elapsed_time": "2:28:28", "remaining_time": "3:33:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1574, "total_steps": 3836, "loss": 0.1626, "learning_rate": 3.425759630379541e-06, "epoch": 0.41025641025641024, "percentage": 41.03, "elapsed_time": "2:28:34", "remaining_time": "3:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1575, "total_steps": 3836, "loss": 0.1686, "learning_rate": 3.423757187945716e-06, "epoch": 0.4105170560062555, "percentage": 41.06, "elapsed_time": "2:28:40", "remaining_time": "3:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1576, "total_steps": 3836, "loss": 0.1482, "learning_rate": 3.421754058916612e-06, "epoch": 0.41077770175610073, "percentage": 41.08, "elapsed_time": "2:28:45", "remaining_time": "3:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1577, "total_steps": 3836, "loss": 0.171, "learning_rate": 3.4197502447810836e-06, "epoch": 0.411038347505946, "percentage": 41.11, "elapsed_time": "2:28:51", "remaining_time": "3:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1578, "total_steps": 3836, "loss": 0.1564, "learning_rate": 3.4177457470284916e-06, "epoch": 0.4112989932557912, "percentage": 41.14, "elapsed_time": "2:28:56", "remaining_time": "3:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1579, "total_steps": 3836, "loss": 0.1811, "learning_rate": 3.4157405671487077e-06, "epoch": 0.41155963900563647, "percentage": 41.16, "elapsed_time": "2:29:02", "remaining_time": "3:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 3836, "loss": 0.1622, "learning_rate": 3.4137347066321097e-06, "epoch": 0.4118202847554817, "percentage": 41.19, "elapsed_time": "2:29:07", "remaining_time": "3:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1581, "total_steps": 3836, "loss": 0.1548, "learning_rate": 3.41172816696958e-06, "epoch": 0.41208093050532696, "percentage": 41.21, "elapsed_time": "2:29:13", "remaining_time": "3:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1582, "total_steps": 3836, "loss": 0.1714, "learning_rate": 3.4097209496525087e-06, "epoch": 0.4123415762551722, "percentage": 41.24, "elapsed_time": "2:29:17", "remaining_time": "3:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1583, "total_steps": 3836, "loss": 0.1659, "learning_rate": 3.4077130561727858e-06, "epoch": 0.41260222200501745, "percentage": 41.27, "elapsed_time": "2:29:23", "remaining_time": "3:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1584, "total_steps": 3836, "loss": 0.1584, "learning_rate": 3.4057044880228064e-06, "epoch": 0.4128628677548627, "percentage": 41.29, "elapsed_time": "2:29:29", "remaining_time": "3:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1585, "total_steps": 3836, "loss": 0.1773, "learning_rate": 3.4036952466954674e-06, "epoch": 0.41312351350470794, "percentage": 41.32, "elapsed_time": "2:29:35", "remaining_time": "3:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1586, "total_steps": 3836, "loss": 0.1741, "learning_rate": 3.4016853336841638e-06, "epoch": 0.41338415925455313, "percentage": 41.35, "elapsed_time": "2:29:41", "remaining_time": "3:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1587, "total_steps": 3836, "loss": 0.1777, "learning_rate": 3.3996747504827926e-06, "epoch": 0.4136448050043984, "percentage": 41.37, "elapsed_time": "2:29:46", "remaining_time": "3:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1588, "total_steps": 3836, "loss": 0.1654, "learning_rate": 3.397663498585747e-06, "epoch": 0.4139054507542436, "percentage": 41.4, "elapsed_time": "2:29:51", "remaining_time": "3:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1589, "total_steps": 3836, "loss": 0.1546, "learning_rate": 3.3956515794879166e-06, "epoch": 0.41416609650408887, "percentage": 41.42, "elapsed_time": "2:29:57", "remaining_time": "3:32:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 3836, "loss": 0.1684, "learning_rate": 3.39363899468469e-06, "epoch": 0.4144267422539341, "percentage": 41.45, "elapsed_time": "2:30:03", "remaining_time": "3:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1591, "total_steps": 3836, "loss": 0.1775, "learning_rate": 3.391625745671947e-06, "epoch": 0.41468738800377936, "percentage": 41.48, "elapsed_time": "2:30:08", "remaining_time": "3:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1592, "total_steps": 3836, "loss": 0.1573, "learning_rate": 3.3896118339460635e-06, "epoch": 0.4149480337536246, "percentage": 41.5, "elapsed_time": "2:30:14", "remaining_time": "3:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1593, "total_steps": 3836, "loss": 0.156, "learning_rate": 3.3875972610039075e-06, "epoch": 0.41520867950346985, "percentage": 41.53, "elapsed_time": "2:30:20", "remaining_time": "3:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1594, "total_steps": 3836, "loss": 0.1714, "learning_rate": 3.385582028342837e-06, "epoch": 0.4154693252533151, "percentage": 41.55, "elapsed_time": "2:30:25", "remaining_time": "3:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1595, "total_steps": 3836, "loss": 0.1696, "learning_rate": 3.383566137460702e-06, "epoch": 0.41572997100316034, "percentage": 41.58, "elapsed_time": "2:30:30", "remaining_time": "3:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1596, "total_steps": 3836, "loss": 0.1609, "learning_rate": 3.3815495898558424e-06, "epoch": 0.4159906167530056, "percentage": 41.61, "elapsed_time": "2:30:36", "remaining_time": "3:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1597, "total_steps": 3836, "loss": 0.1601, "learning_rate": 3.3795323870270837e-06, "epoch": 0.4162512625028508, "percentage": 41.63, "elapsed_time": "2:30:42", "remaining_time": "3:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1598, "total_steps": 3836, "loss": 0.1585, "learning_rate": 3.377514530473739e-06, "epoch": 0.4165119082526961, "percentage": 41.66, "elapsed_time": "2:30:48", "remaining_time": "3:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1599, "total_steps": 3836, "loss": 0.1521, "learning_rate": 3.37549602169561e-06, "epoch": 0.4167725540025413, "percentage": 41.68, "elapsed_time": "2:30:53", "remaining_time": "3:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 3836, "loss": 0.1612, "learning_rate": 3.3734768621929805e-06, "epoch": 0.41703319975238656, "percentage": 41.71, "elapsed_time": "2:30:59", "remaining_time": "3:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1601, "total_steps": 3836, "loss": 0.1631, "learning_rate": 3.3714570534666175e-06, "epoch": 0.41729384550223175, "percentage": 41.74, "elapsed_time": "2:31:05", "remaining_time": "3:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1602, "total_steps": 3836, "loss": 0.1563, "learning_rate": 3.369436597017774e-06, "epoch": 0.417554491252077, "percentage": 41.76, "elapsed_time": "2:31:10", "remaining_time": "3:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1603, "total_steps": 3836, "loss": 0.1692, "learning_rate": 3.3674154943481795e-06, "epoch": 0.41781513700192224, "percentage": 41.79, "elapsed_time": "2:31:16", "remaining_time": "3:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1604, "total_steps": 3836, "loss": 0.1638, "learning_rate": 3.3653937469600483e-06, "epoch": 0.4180757827517675, "percentage": 41.81, "elapsed_time": "2:31:22", "remaining_time": "3:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1605, "total_steps": 3836, "loss": 0.1665, "learning_rate": 3.363371356356072e-06, "epoch": 0.41833642850161273, "percentage": 41.84, "elapsed_time": "2:31:28", "remaining_time": "3:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1606, "total_steps": 3836, "loss": 0.1512, "learning_rate": 3.361348324039419e-06, "epoch": 0.418597074251458, "percentage": 41.87, "elapsed_time": "2:31:33", "remaining_time": "3:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1607, "total_steps": 3836, "loss": 0.1721, "learning_rate": 3.3593246515137373e-06, "epoch": 0.4188577200013032, "percentage": 41.89, "elapsed_time": "2:31:39", "remaining_time": "3:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1608, "total_steps": 3836, "loss": 0.1625, "learning_rate": 3.3573003402831487e-06, "epoch": 0.41911836575114847, "percentage": 41.92, "elapsed_time": "2:31:44", "remaining_time": "3:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1609, "total_steps": 3836, "loss": 0.1736, "learning_rate": 3.3552753918522507e-06, "epoch": 0.4193790115009937, "percentage": 41.94, "elapsed_time": "2:31:50", "remaining_time": "3:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 3836, "loss": 0.16, "learning_rate": 3.353249807726115e-06, "epoch": 0.41963965725083896, "percentage": 41.97, "elapsed_time": "2:31:56", "remaining_time": "3:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1611, "total_steps": 3836, "loss": 0.1624, "learning_rate": 3.351223589410283e-06, "epoch": 0.4199003030006842, "percentage": 42.0, "elapsed_time": "2:32:02", "remaining_time": "3:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1612, "total_steps": 3836, "loss": 0.1733, "learning_rate": 3.349196738410771e-06, "epoch": 0.42016094875052945, "percentage": 42.02, "elapsed_time": "2:32:08", "remaining_time": "3:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1613, "total_steps": 3836, "loss": 0.1661, "learning_rate": 3.347169256234064e-06, "epoch": 0.4204215945003747, "percentage": 42.05, "elapsed_time": "2:32:13", "remaining_time": "3:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1614, "total_steps": 3836, "loss": 0.1512, "learning_rate": 3.3451411443871145e-06, "epoch": 0.42068224025021994, "percentage": 42.08, "elapsed_time": "2:32:19", "remaining_time": "3:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1615, "total_steps": 3836, "loss": 0.1721, "learning_rate": 3.343112404377347e-06, "epoch": 0.4209428860000652, "percentage": 42.1, "elapsed_time": "2:32:24", "remaining_time": "3:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1616, "total_steps": 3836, "loss": 0.1796, "learning_rate": 3.341083037712649e-06, "epoch": 0.4212035317499104, "percentage": 42.13, "elapsed_time": "2:32:30", "remaining_time": "3:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1617, "total_steps": 3836, "loss": 0.1722, "learning_rate": 3.339053045901375e-06, "epoch": 0.4214641774997556, "percentage": 42.15, "elapsed_time": "2:32:35", "remaining_time": "3:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1618, "total_steps": 3836, "loss": 0.1569, "learning_rate": 3.337022430452346e-06, "epoch": 0.42172482324960087, "percentage": 42.18, "elapsed_time": "2:32:41", "remaining_time": "3:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1619, "total_steps": 3836, "loss": 0.1785, "learning_rate": 3.3349911928748424e-06, "epoch": 0.4219854689994461, "percentage": 42.21, "elapsed_time": "2:32:46", "remaining_time": "3:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 3836, "loss": 0.1658, "learning_rate": 3.3329593346786125e-06, "epoch": 0.42224611474929136, "percentage": 42.23, "elapsed_time": "2:32:52", "remaining_time": "3:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1621, "total_steps": 3836, "loss": 0.1661, "learning_rate": 3.3309268573738605e-06, "epoch": 0.4225067604991366, "percentage": 42.26, "elapsed_time": "2:32:57", "remaining_time": "3:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1622, "total_steps": 3836, "loss": 0.1886, "learning_rate": 3.328893762471255e-06, "epoch": 0.42276740624898185, "percentage": 42.28, "elapsed_time": "2:33:03", "remaining_time": "3:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1623, "total_steps": 3836, "loss": 0.1686, "learning_rate": 3.3268600514819214e-06, "epoch": 0.4230280519988271, "percentage": 42.31, "elapsed_time": "2:33:08", "remaining_time": "3:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1624, "total_steps": 3836, "loss": 0.1686, "learning_rate": 3.324825725917442e-06, "epoch": 0.42328869774867234, "percentage": 42.34, "elapsed_time": "2:33:14", "remaining_time": "3:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1625, "total_steps": 3836, "loss": 0.1768, "learning_rate": 3.32279078728986e-06, "epoch": 0.4235493434985176, "percentage": 42.36, "elapsed_time": "2:33:20", "remaining_time": "3:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1626, "total_steps": 3836, "loss": 0.1579, "learning_rate": 3.320755237111669e-06, "epoch": 0.42380998924836283, "percentage": 42.39, "elapsed_time": "2:33:25", "remaining_time": "3:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1627, "total_steps": 3836, "loss": 0.1656, "learning_rate": 3.318719076895821e-06, "epoch": 0.4240706349982081, "percentage": 42.41, "elapsed_time": "2:33:30", "remaining_time": "3:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1628, "total_steps": 3836, "loss": 0.1598, "learning_rate": 3.316682308155721e-06, "epoch": 0.4243312807480533, "percentage": 42.44, "elapsed_time": "2:33:35", "remaining_time": "3:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1629, "total_steps": 3836, "loss": 0.173, "learning_rate": 3.314644932405224e-06, "epoch": 0.42459192649789856, "percentage": 42.47, "elapsed_time": "2:33:41", "remaining_time": "3:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 3836, "loss": 0.1702, "learning_rate": 3.312606951158638e-06, "epoch": 0.4248525722477438, "percentage": 42.49, "elapsed_time": "2:33:47", "remaining_time": "3:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1631, "total_steps": 3836, "loss": 0.1592, "learning_rate": 3.3105683659307207e-06, "epoch": 0.425113217997589, "percentage": 42.52, "elapsed_time": "2:33:52", "remaining_time": "3:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1632, "total_steps": 3836, "loss": 0.1555, "learning_rate": 3.308529178236679e-06, "epoch": 0.42537386374743424, "percentage": 42.54, "elapsed_time": "2:33:57", "remaining_time": "3:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1633, "total_steps": 3836, "loss": 0.1721, "learning_rate": 3.306489389592168e-06, "epoch": 0.4256345094972795, "percentage": 42.57, "elapsed_time": "2:34:02", "remaining_time": "3:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1634, "total_steps": 3836, "loss": 0.1583, "learning_rate": 3.304449001513287e-06, "epoch": 0.42589515524712473, "percentage": 42.6, "elapsed_time": "2:34:08", "remaining_time": "3:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1635, "total_steps": 3836, "loss": 0.1486, "learning_rate": 3.3024080155165837e-06, "epoch": 0.42615580099697, "percentage": 42.62, "elapsed_time": "2:34:14", "remaining_time": "3:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1636, "total_steps": 3836, "loss": 0.1663, "learning_rate": 3.3003664331190487e-06, "epoch": 0.4264164467468152, "percentage": 42.65, "elapsed_time": "2:34:20", "remaining_time": "3:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1637, "total_steps": 3836, "loss": 0.176, "learning_rate": 3.2983242558381178e-06, "epoch": 0.42667709249666047, "percentage": 42.67, "elapsed_time": "2:34:25", "remaining_time": "3:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1638, "total_steps": 3836, "loss": 0.1579, "learning_rate": 3.296281485191665e-06, "epoch": 0.4269377382465057, "percentage": 42.7, "elapsed_time": "2:34:31", "remaining_time": "3:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1639, "total_steps": 3836, "loss": 0.1643, "learning_rate": 3.294238122698009e-06, "epoch": 0.42719838399635096, "percentage": 42.73, "elapsed_time": "2:34:36", "remaining_time": "3:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 3836, "loss": 0.1745, "learning_rate": 3.292194169875908e-06, "epoch": 0.4274590297461962, "percentage": 42.75, "elapsed_time": "2:34:40", "remaining_time": "3:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1641, "total_steps": 3836, "loss": 0.155, "learning_rate": 3.2901496282445567e-06, "epoch": 0.42771967549604145, "percentage": 42.78, "elapsed_time": "2:34:47", "remaining_time": "3:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1642, "total_steps": 3836, "loss": 0.1716, "learning_rate": 3.2881044993235893e-06, "epoch": 0.4279803212458867, "percentage": 42.81, "elapsed_time": "2:34:52", "remaining_time": "3:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1643, "total_steps": 3836, "loss": 0.165, "learning_rate": 3.2860587846330773e-06, "epoch": 0.42824096699573194, "percentage": 42.83, "elapsed_time": "2:34:58", "remaining_time": "3:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1644, "total_steps": 3836, "loss": 0.1813, "learning_rate": 3.284012485693524e-06, "epoch": 0.4285016127455772, "percentage": 42.86, "elapsed_time": "2:35:03", "remaining_time": "3:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1645, "total_steps": 3836, "loss": 0.1748, "learning_rate": 3.281965604025871e-06, "epoch": 0.42876225849542243, "percentage": 42.88, "elapsed_time": "2:35:09", "remaining_time": "3:26:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1646, "total_steps": 3836, "loss": 0.1927, "learning_rate": 3.279918141151492e-06, "epoch": 0.4290229042452677, "percentage": 42.91, "elapsed_time": "2:35:14", "remaining_time": "3:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1647, "total_steps": 3836, "loss": 0.1707, "learning_rate": 3.2778700985921897e-06, "epoch": 0.42928354999511287, "percentage": 42.94, "elapsed_time": "2:35:20", "remaining_time": "3:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1648, "total_steps": 3836, "loss": 0.1531, "learning_rate": 3.2758214778702026e-06, "epoch": 0.4295441957449581, "percentage": 42.96, "elapsed_time": "2:35:25", "remaining_time": "3:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1649, "total_steps": 3836, "loss": 0.156, "learning_rate": 3.273772280508194e-06, "epoch": 0.42980484149480336, "percentage": 42.99, "elapsed_time": "2:35:30", "remaining_time": "3:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 3836, "loss": 0.1628, "learning_rate": 3.2717225080292598e-06, "epoch": 0.4300654872446486, "percentage": 43.01, "elapsed_time": "2:35:36", "remaining_time": "3:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1651, "total_steps": 3836, "loss": 0.1789, "learning_rate": 3.2696721619569214e-06, "epoch": 0.43032613299449385, "percentage": 43.04, "elapsed_time": "2:35:41", "remaining_time": "3:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1652, "total_steps": 3836, "loss": 0.1513, "learning_rate": 3.2676212438151256e-06, "epoch": 0.4305867787443391, "percentage": 43.07, "elapsed_time": "2:35:47", "remaining_time": "3:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1653, "total_steps": 3836, "loss": 0.1626, "learning_rate": 3.2655697551282473e-06, "epoch": 0.43084742449418434, "percentage": 43.09, "elapsed_time": "2:35:52", "remaining_time": "3:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1654, "total_steps": 3836, "loss": 0.1547, "learning_rate": 3.2635176974210824e-06, "epoch": 0.4311080702440296, "percentage": 43.12, "elapsed_time": "2:35:57", "remaining_time": "3:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1655, "total_steps": 3836, "loss": 0.1718, "learning_rate": 3.2614650722188517e-06, "epoch": 0.43136871599387483, "percentage": 43.14, "elapsed_time": "2:36:02", "remaining_time": "3:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1656, "total_steps": 3836, "loss": 0.1522, "learning_rate": 3.2594118810471982e-06, "epoch": 0.4316293617437201, "percentage": 43.17, "elapsed_time": "2:36:08", "remaining_time": "3:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1657, "total_steps": 3836, "loss": 0.1567, "learning_rate": 3.2573581254321824e-06, "epoch": 0.4318900074935653, "percentage": 43.2, "elapsed_time": "2:36:13", "remaining_time": "3:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1658, "total_steps": 3836, "loss": 0.1549, "learning_rate": 3.2553038069002885e-06, "epoch": 0.43215065324341057, "percentage": 43.22, "elapsed_time": "2:36:19", "remaining_time": "3:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1659, "total_steps": 3836, "loss": 0.1559, "learning_rate": 3.253248926978416e-06, "epoch": 0.4324112989932558, "percentage": 43.25, "elapsed_time": "2:36:24", "remaining_time": "3:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 3836, "loss": 0.1818, "learning_rate": 3.2511934871938825e-06, "epoch": 0.43267194474310106, "percentage": 43.27, "elapsed_time": "2:36:29", "remaining_time": "3:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1661, "total_steps": 3836, "loss": 0.1649, "learning_rate": 3.249137489074423e-06, "epoch": 0.4329325904929463, "percentage": 43.3, "elapsed_time": "2:36:35", "remaining_time": "3:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1662, "total_steps": 3836, "loss": 0.1569, "learning_rate": 3.247080934148186e-06, "epoch": 0.4331932362427915, "percentage": 43.33, "elapsed_time": "2:36:41", "remaining_time": "3:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1663, "total_steps": 3836, "loss": 0.1592, "learning_rate": 3.2450238239437344e-06, "epoch": 0.43345388199263674, "percentage": 43.35, "elapsed_time": "2:36:48", "remaining_time": "3:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1664, "total_steps": 3836, "loss": 0.1523, "learning_rate": 3.242966159990044e-06, "epoch": 0.433714527742482, "percentage": 43.38, "elapsed_time": "2:36:53", "remaining_time": "3:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1665, "total_steps": 3836, "loss": 0.1856, "learning_rate": 3.2409079438165015e-06, "epoch": 0.4339751734923272, "percentage": 43.4, "elapsed_time": "2:36:59", "remaining_time": "3:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1666, "total_steps": 3836, "loss": 0.1638, "learning_rate": 3.238849176952904e-06, "epoch": 0.43423581924217247, "percentage": 43.43, "elapsed_time": "2:37:05", "remaining_time": "3:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1667, "total_steps": 3836, "loss": 0.1681, "learning_rate": 3.23678986092946e-06, "epoch": 0.4344964649920177, "percentage": 43.46, "elapsed_time": "2:37:11", "remaining_time": "3:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1668, "total_steps": 3836, "loss": 0.1539, "learning_rate": 3.2347299972767824e-06, "epoch": 0.43475711074186296, "percentage": 43.48, "elapsed_time": "2:37:16", "remaining_time": "3:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1669, "total_steps": 3836, "loss": 0.1689, "learning_rate": 3.232669587525895e-06, "epoch": 0.4350177564917082, "percentage": 43.51, "elapsed_time": "2:37:21", "remaining_time": "3:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 3836, "loss": 0.1606, "learning_rate": 3.230608633208225e-06, "epoch": 0.43527840224155345, "percentage": 43.53, "elapsed_time": "2:37:27", "remaining_time": "3:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1671, "total_steps": 3836, "loss": 0.1792, "learning_rate": 3.2285471358556063e-06, "epoch": 0.4355390479913987, "percentage": 43.56, "elapsed_time": "2:37:33", "remaining_time": "3:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1672, "total_steps": 3836, "loss": 0.1854, "learning_rate": 3.226485097000273e-06, "epoch": 0.43579969374124394, "percentage": 43.59, "elapsed_time": "2:37:39", "remaining_time": "3:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1673, "total_steps": 3836, "loss": 0.1647, "learning_rate": 3.2244225181748654e-06, "epoch": 0.4360603394910892, "percentage": 43.61, "elapsed_time": "2:37:44", "remaining_time": "3:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1674, "total_steps": 3836, "loss": 0.1763, "learning_rate": 3.2223594009124247e-06, "epoch": 0.43632098524093443, "percentage": 43.64, "elapsed_time": "2:37:50", "remaining_time": "3:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1675, "total_steps": 3836, "loss": 0.1618, "learning_rate": 3.2202957467463893e-06, "epoch": 0.4365816309907797, "percentage": 43.67, "elapsed_time": "2:37:56", "remaining_time": "3:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1676, "total_steps": 3836, "loss": 0.1686, "learning_rate": 3.2182315572105995e-06, "epoch": 0.4368422767406249, "percentage": 43.69, "elapsed_time": "2:38:01", "remaining_time": "3:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1677, "total_steps": 3836, "loss": 0.1739, "learning_rate": 3.2161668338392924e-06, "epoch": 0.4371029224904701, "percentage": 43.72, "elapsed_time": "2:38:07", "remaining_time": "3:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1678, "total_steps": 3836, "loss": 0.1674, "learning_rate": 3.2141015781671025e-06, "epoch": 0.43736356824031536, "percentage": 43.74, "elapsed_time": "2:38:13", "remaining_time": "3:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1679, "total_steps": 3836, "loss": 0.1631, "learning_rate": 3.2120357917290597e-06, "epoch": 0.4376242139901606, "percentage": 43.77, "elapsed_time": "2:38:18", "remaining_time": "3:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 3836, "loss": 0.1605, "learning_rate": 3.209969476060587e-06, "epoch": 0.43788485974000585, "percentage": 43.8, "elapsed_time": "2:38:24", "remaining_time": "3:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1681, "total_steps": 3836, "loss": 0.1594, "learning_rate": 3.2079026326975037e-06, "epoch": 0.4381455054898511, "percentage": 43.82, "elapsed_time": "2:38:29", "remaining_time": "3:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1682, "total_steps": 3836, "loss": 0.1634, "learning_rate": 3.2058352631760198e-06, "epoch": 0.43840615123969634, "percentage": 43.85, "elapsed_time": "2:38:34", "remaining_time": "3:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1683, "total_steps": 3836, "loss": 0.1623, "learning_rate": 3.2037673690327343e-06, "epoch": 0.4386667969895416, "percentage": 43.87, "elapsed_time": "2:38:40", "remaining_time": "3:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1684, "total_steps": 3836, "loss": 0.1588, "learning_rate": 3.2016989518046397e-06, "epoch": 0.43892744273938683, "percentage": 43.9, "elapsed_time": "2:38:46", "remaining_time": "3:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1685, "total_steps": 3836, "loss": 0.1633, "learning_rate": 3.199630013029115e-06, "epoch": 0.4391880884892321, "percentage": 43.93, "elapsed_time": "2:38:51", "remaining_time": "3:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1686, "total_steps": 3836, "loss": 0.1624, "learning_rate": 3.1975605542439276e-06, "epoch": 0.4394487342390773, "percentage": 43.95, "elapsed_time": "2:38:57", "remaining_time": "3:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1687, "total_steps": 3836, "loss": 0.1556, "learning_rate": 3.195490576987231e-06, "epoch": 0.43970937998892257, "percentage": 43.98, "elapsed_time": "2:39:02", "remaining_time": "3:22:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1688, "total_steps": 3836, "loss": 0.1752, "learning_rate": 3.1934200827975654e-06, "epoch": 0.4399700257387678, "percentage": 44.0, "elapsed_time": "2:39:07", "remaining_time": "3:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1689, "total_steps": 3836, "loss": 0.1592, "learning_rate": 3.1913490732138537e-06, "epoch": 0.44023067148861306, "percentage": 44.03, "elapsed_time": "2:39:13", "remaining_time": "3:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 3836, "loss": 0.1672, "learning_rate": 3.1892775497754014e-06, "epoch": 0.4404913172384583, "percentage": 44.06, "elapsed_time": "2:39:19", "remaining_time": "3:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1691, "total_steps": 3836, "loss": 0.1768, "learning_rate": 3.187205514021897e-06, "epoch": 0.44075196298830355, "percentage": 44.08, "elapsed_time": "2:39:25", "remaining_time": "3:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1692, "total_steps": 3836, "loss": 0.1841, "learning_rate": 3.1851329674934116e-06, "epoch": 0.44101260873814874, "percentage": 44.11, "elapsed_time": "2:39:31", "remaining_time": "3:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1693, "total_steps": 3836, "loss": 0.1544, "learning_rate": 3.183059911730392e-06, "epoch": 0.441273254487994, "percentage": 44.13, "elapsed_time": "2:39:36", "remaining_time": "3:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1694, "total_steps": 3836, "loss": 0.1626, "learning_rate": 3.1809863482736663e-06, "epoch": 0.4415339002378392, "percentage": 44.16, "elapsed_time": "2:39:41", "remaining_time": "3:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1695, "total_steps": 3836, "loss": 0.1546, "learning_rate": 3.1789122786644394e-06, "epoch": 0.4417945459876845, "percentage": 44.19, "elapsed_time": "2:39:47", "remaining_time": "3:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1696, "total_steps": 3836, "loss": 0.1778, "learning_rate": 3.176837704444291e-06, "epoch": 0.4420551917375297, "percentage": 44.21, "elapsed_time": "2:39:53", "remaining_time": "3:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1697, "total_steps": 3836, "loss": 0.1693, "learning_rate": 3.174762627155179e-06, "epoch": 0.44231583748737496, "percentage": 44.24, "elapsed_time": "2:39:58", "remaining_time": "3:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1698, "total_steps": 3836, "loss": 0.1531, "learning_rate": 3.1726870483394312e-06, "epoch": 0.4425764832372202, "percentage": 44.26, "elapsed_time": "2:40:04", "remaining_time": "3:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1699, "total_steps": 3836, "loss": 0.1715, "learning_rate": 3.1706109695397515e-06, "epoch": 0.44283712898706545, "percentage": 44.29, "elapsed_time": "2:40:10", "remaining_time": "3:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 3836, "loss": 0.1675, "learning_rate": 3.168534392299214e-06, "epoch": 0.4430977747369107, "percentage": 44.32, "elapsed_time": "2:40:15", "remaining_time": "3:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1701, "total_steps": 3836, "loss": 0.1793, "learning_rate": 3.1664573181612616e-06, "epoch": 0.44335842048675594, "percentage": 44.34, "elapsed_time": "2:40:21", "remaining_time": "3:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1702, "total_steps": 3836, "loss": 0.1759, "learning_rate": 3.1643797486697116e-06, "epoch": 0.4436190662366012, "percentage": 44.37, "elapsed_time": "2:40:27", "remaining_time": "3:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1703, "total_steps": 3836, "loss": 0.1823, "learning_rate": 3.1623016853687434e-06, "epoch": 0.44387971198644643, "percentage": 44.4, "elapsed_time": "2:40:32", "remaining_time": "3:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1704, "total_steps": 3836, "loss": 0.1733, "learning_rate": 3.1602231298029074e-06, "epoch": 0.4441403577362917, "percentage": 44.42, "elapsed_time": "2:40:38", "remaining_time": "3:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1705, "total_steps": 3836, "loss": 0.1781, "learning_rate": 3.1581440835171185e-06, "epoch": 0.4444010034861369, "percentage": 44.45, "elapsed_time": "2:40:43", "remaining_time": "3:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1706, "total_steps": 3836, "loss": 0.162, "learning_rate": 3.1560645480566566e-06, "epoch": 0.44466164923598217, "percentage": 44.47, "elapsed_time": "2:40:49", "remaining_time": "3:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1707, "total_steps": 3836, "loss": 0.1516, "learning_rate": 3.153984524967165e-06, "epoch": 0.44492229498582736, "percentage": 44.5, "elapsed_time": "2:40:54", "remaining_time": "3:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1708, "total_steps": 3836, "loss": 0.1662, "learning_rate": 3.15190401579465e-06, "epoch": 0.4451829407356726, "percentage": 44.53, "elapsed_time": "2:41:00", "remaining_time": "3:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1709, "total_steps": 3836, "loss": 0.1691, "learning_rate": 3.149823022085478e-06, "epoch": 0.44544358648551785, "percentage": 44.55, "elapsed_time": "2:41:05", "remaining_time": "3:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 3836, "loss": 0.1604, "learning_rate": 3.1477415453863772e-06, "epoch": 0.4457042322353631, "percentage": 44.58, "elapsed_time": "2:41:11", "remaining_time": "3:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1711, "total_steps": 3836, "loss": 0.1573, "learning_rate": 3.1456595872444332e-06, "epoch": 0.44596487798520834, "percentage": 44.6, "elapsed_time": "2:41:16", "remaining_time": "3:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1712, "total_steps": 3836, "loss": 0.1593, "learning_rate": 3.143577149207091e-06, "epoch": 0.4462255237350536, "percentage": 44.63, "elapsed_time": "2:41:22", "remaining_time": "3:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1713, "total_steps": 3836, "loss": 0.1535, "learning_rate": 3.1414942328221494e-06, "epoch": 0.44648616948489883, "percentage": 44.66, "elapsed_time": "2:41:28", "remaining_time": "3:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1714, "total_steps": 3836, "loss": 0.178, "learning_rate": 3.139410839637767e-06, "epoch": 0.4467468152347441, "percentage": 44.68, "elapsed_time": "2:41:33", "remaining_time": "3:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1715, "total_steps": 3836, "loss": 0.1614, "learning_rate": 3.1373269712024533e-06, "epoch": 0.4470074609845893, "percentage": 44.71, "elapsed_time": "2:41:39", "remaining_time": "3:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1716, "total_steps": 3836, "loss": 0.1635, "learning_rate": 3.135242629065073e-06, "epoch": 0.44726810673443457, "percentage": 44.73, "elapsed_time": "2:41:44", "remaining_time": "3:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1717, "total_steps": 3836, "loss": 0.1597, "learning_rate": 3.1331578147748416e-06, "epoch": 0.4475287524842798, "percentage": 44.76, "elapsed_time": "2:41:50", "remaining_time": "3:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1718, "total_steps": 3836, "loss": 0.1544, "learning_rate": 3.131072529881326e-06, "epoch": 0.44778939823412506, "percentage": 44.79, "elapsed_time": "2:41:56", "remaining_time": "3:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1719, "total_steps": 3836, "loss": 0.1613, "learning_rate": 3.1289867759344434e-06, "epoch": 0.4480500439839703, "percentage": 44.81, "elapsed_time": "2:42:01", "remaining_time": "3:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 3836, "loss": 0.1609, "learning_rate": 3.126900554484459e-06, "epoch": 0.44831068973381555, "percentage": 44.84, "elapsed_time": "2:42:06", "remaining_time": "3:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1721, "total_steps": 3836, "loss": 0.1616, "learning_rate": 3.1248138670819857e-06, "epoch": 0.4485713354836608, "percentage": 44.86, "elapsed_time": "2:42:12", "remaining_time": "3:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1722, "total_steps": 3836, "loss": 0.1711, "learning_rate": 3.122726715277983e-06, "epoch": 0.44883198123350604, "percentage": 44.89, "elapsed_time": "2:42:18", "remaining_time": "3:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1723, "total_steps": 3836, "loss": 0.149, "learning_rate": 3.120639100623755e-06, "epoch": 0.44909262698335123, "percentage": 44.92, "elapsed_time": "2:42:24", "remaining_time": "3:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1724, "total_steps": 3836, "loss": 0.1565, "learning_rate": 3.1185510246709487e-06, "epoch": 0.4493532727331965, "percentage": 44.94, "elapsed_time": "2:42:30", "remaining_time": "3:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1725, "total_steps": 3836, "loss": 0.1714, "learning_rate": 3.116462488971559e-06, "epoch": 0.4496139184830417, "percentage": 44.97, "elapsed_time": "2:42:35", "remaining_time": "3:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1726, "total_steps": 3836, "loss": 0.1511, "learning_rate": 3.1143734950779155e-06, "epoch": 0.44987456423288696, "percentage": 44.99, "elapsed_time": "2:42:41", "remaining_time": "3:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1727, "total_steps": 3836, "loss": 0.1688, "learning_rate": 3.1122840445426927e-06, "epoch": 0.4501352099827322, "percentage": 45.02, "elapsed_time": "2:42:46", "remaining_time": "3:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1728, "total_steps": 3836, "loss": 0.1642, "learning_rate": 3.1101941389189045e-06, "epoch": 0.45039585573257745, "percentage": 45.05, "elapsed_time": "2:42:51", "remaining_time": "3:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1729, "total_steps": 3836, "loss": 0.1697, "learning_rate": 3.1081037797599006e-06, "epoch": 0.4506565014824227, "percentage": 45.07, "elapsed_time": "2:42:56", "remaining_time": "3:18:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 3836, "loss": 0.1677, "learning_rate": 3.106012968619371e-06, "epoch": 0.45091714723226795, "percentage": 45.1, "elapsed_time": "2:43:02", "remaining_time": "3:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1731, "total_steps": 3836, "loss": 0.1664, "learning_rate": 3.103921707051338e-06, "epoch": 0.4511777929821132, "percentage": 45.13, "elapsed_time": "2:43:07", "remaining_time": "3:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1732, "total_steps": 3836, "loss": 0.1865, "learning_rate": 3.1018299966101624e-06, "epoch": 0.45143843873195844, "percentage": 45.15, "elapsed_time": "2:43:13", "remaining_time": "3:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1733, "total_steps": 3836, "loss": 0.1667, "learning_rate": 3.0997378388505354e-06, "epoch": 0.4516990844818037, "percentage": 45.18, "elapsed_time": "2:43:19", "remaining_time": "3:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1734, "total_steps": 3836, "loss": 0.1649, "learning_rate": 3.097645235327483e-06, "epoch": 0.4519597302316489, "percentage": 45.2, "elapsed_time": "2:43:24", "remaining_time": "3:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1735, "total_steps": 3836, "loss": 0.1582, "learning_rate": 3.095552187596361e-06, "epoch": 0.45222037598149417, "percentage": 45.23, "elapsed_time": "2:43:30", "remaining_time": "3:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1736, "total_steps": 3836, "loss": 0.1695, "learning_rate": 3.0934586972128574e-06, "epoch": 0.4524810217313394, "percentage": 45.26, "elapsed_time": "2:43:36", "remaining_time": "3:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1737, "total_steps": 3836, "loss": 0.141, "learning_rate": 3.091364765732986e-06, "epoch": 0.45274166748118466, "percentage": 45.28, "elapsed_time": "2:43:42", "remaining_time": "3:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1738, "total_steps": 3836, "loss": 0.1635, "learning_rate": 3.0892703947130914e-06, "epoch": 0.45300231323102985, "percentage": 45.31, "elapsed_time": "2:43:47", "remaining_time": "3:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1739, "total_steps": 3836, "loss": 0.1797, "learning_rate": 3.087175585709844e-06, "epoch": 0.4532629589808751, "percentage": 45.33, "elapsed_time": "2:43:53", "remaining_time": "3:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1740, "total_steps": 3836, "loss": 0.157, "learning_rate": 3.085080340280239e-06, "epoch": 0.45352360473072034, "percentage": 45.36, "elapsed_time": "2:43:58", "remaining_time": "3:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1741, "total_steps": 3836, "loss": 0.1758, "learning_rate": 3.082984659981596e-06, "epoch": 0.4537842504805656, "percentage": 45.39, "elapsed_time": "2:44:04", "remaining_time": "3:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1742, "total_steps": 3836, "loss": 0.157, "learning_rate": 3.0808885463715584e-06, "epoch": 0.45404489623041083, "percentage": 45.41, "elapsed_time": "2:44:10", "remaining_time": "3:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1743, "total_steps": 3836, "loss": 0.1638, "learning_rate": 3.0787920010080923e-06, "epoch": 0.4543055419802561, "percentage": 45.44, "elapsed_time": "2:44:16", "remaining_time": "3:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1744, "total_steps": 3836, "loss": 0.1653, "learning_rate": 3.076695025449484e-06, "epoch": 0.4545661877301013, "percentage": 45.46, "elapsed_time": "2:44:21", "remaining_time": "3:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1745, "total_steps": 3836, "loss": 0.1544, "learning_rate": 3.0745976212543393e-06, "epoch": 0.45482683347994657, "percentage": 45.49, "elapsed_time": "2:44:27", "remaining_time": "3:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1746, "total_steps": 3836, "loss": 0.1579, "learning_rate": 3.072499789981582e-06, "epoch": 0.4550874792297918, "percentage": 45.52, "elapsed_time": "2:44:32", "remaining_time": "3:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1747, "total_steps": 3836, "loss": 0.1602, "learning_rate": 3.070401533190455e-06, "epoch": 0.45534812497963706, "percentage": 45.54, "elapsed_time": "2:44:37", "remaining_time": "3:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1748, "total_steps": 3836, "loss": 0.1638, "learning_rate": 3.068302852440517e-06, "epoch": 0.4556087707294823, "percentage": 45.57, "elapsed_time": "2:44:43", "remaining_time": "3:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1749, "total_steps": 3836, "loss": 0.1685, "learning_rate": 3.0662037492916397e-06, "epoch": 0.45586941647932755, "percentage": 45.59, "elapsed_time": "2:44:48", "remaining_time": "3:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 3836, "loss": 0.1632, "learning_rate": 3.064104225304013e-06, "epoch": 0.4561300622291728, "percentage": 45.62, "elapsed_time": "2:44:54", "remaining_time": "3:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1751, "total_steps": 3836, "loss": 0.158, "learning_rate": 3.0620042820381344e-06, "epoch": 0.45639070797901804, "percentage": 45.65, "elapsed_time": "2:44:59", "remaining_time": "3:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1752, "total_steps": 3836, "loss": 0.1657, "learning_rate": 3.059903921054818e-06, "epoch": 0.4566513537288633, "percentage": 45.67, "elapsed_time": "2:45:05", "remaining_time": "3:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1753, "total_steps": 3836, "loss": 0.1588, "learning_rate": 3.0578031439151855e-06, "epoch": 0.4569119994787085, "percentage": 45.7, "elapsed_time": "2:45:11", "remaining_time": "3:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1754, "total_steps": 3836, "loss": 0.1549, "learning_rate": 3.0557019521806667e-06, "epoch": 0.4571726452285537, "percentage": 45.72, "elapsed_time": "2:45:16", "remaining_time": "3:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1755, "total_steps": 3836, "loss": 0.1737, "learning_rate": 3.053600347413004e-06, "epoch": 0.45743329097839897, "percentage": 45.75, "elapsed_time": "2:45:22", "remaining_time": "3:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1756, "total_steps": 3836, "loss": 0.1561, "learning_rate": 3.0514983311742426e-06, "epoch": 0.4576939367282442, "percentage": 45.78, "elapsed_time": "2:45:27", "remaining_time": "3:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1757, "total_steps": 3836, "loss": 0.1537, "learning_rate": 3.0493959050267347e-06, "epoch": 0.45795458247808946, "percentage": 45.8, "elapsed_time": "2:45:33", "remaining_time": "3:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1758, "total_steps": 3836, "loss": 0.1597, "learning_rate": 3.04729307053314e-06, "epoch": 0.4582152282279347, "percentage": 45.83, "elapsed_time": "2:45:38", "remaining_time": "3:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1759, "total_steps": 3836, "loss": 0.1643, "learning_rate": 3.045189829256416e-06, "epoch": 0.45847587397777995, "percentage": 45.86, "elapsed_time": "2:45:43", "remaining_time": "3:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1760, "total_steps": 3836, "loss": 0.1674, "learning_rate": 3.0430861827598277e-06, "epoch": 0.4587365197276252, "percentage": 45.88, "elapsed_time": "2:45:49", "remaining_time": "3:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1761, "total_steps": 3836, "loss": 0.1544, "learning_rate": 3.0409821326069387e-06, "epoch": 0.45899716547747044, "percentage": 45.91, "elapsed_time": "2:45:54", "remaining_time": "3:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1762, "total_steps": 3836, "loss": 0.143, "learning_rate": 3.0388776803616138e-06, "epoch": 0.4592578112273157, "percentage": 45.93, "elapsed_time": "2:46:00", "remaining_time": "3:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1763, "total_steps": 3836, "loss": 0.1657, "learning_rate": 3.036772827588017e-06, "epoch": 0.4595184569771609, "percentage": 45.96, "elapsed_time": "2:46:05", "remaining_time": "3:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1764, "total_steps": 3836, "loss": 0.1652, "learning_rate": 3.034667575850607e-06, "epoch": 0.4597791027270062, "percentage": 45.99, "elapsed_time": "2:46:11", "remaining_time": "3:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1765, "total_steps": 3836, "loss": 0.1464, "learning_rate": 3.032561926714142e-06, "epoch": 0.4600397484768514, "percentage": 46.01, "elapsed_time": "2:46:16", "remaining_time": "3:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1766, "total_steps": 3836, "loss": 0.1511, "learning_rate": 3.0304558817436767e-06, "epoch": 0.46030039422669666, "percentage": 46.04, "elapsed_time": "2:46:21", "remaining_time": "3:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1767, "total_steps": 3836, "loss": 0.1755, "learning_rate": 3.028349442504556e-06, "epoch": 0.4605610399765419, "percentage": 46.06, "elapsed_time": "2:46:27", "remaining_time": "3:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1768, "total_steps": 3836, "loss": 0.1722, "learning_rate": 3.02624261056242e-06, "epoch": 0.4608216857263871, "percentage": 46.09, "elapsed_time": "2:46:33", "remaining_time": "3:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1769, "total_steps": 3836, "loss": 0.1677, "learning_rate": 3.0241353874832015e-06, "epoch": 0.46108233147623234, "percentage": 46.12, "elapsed_time": "2:46:39", "remaining_time": "3:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1770, "total_steps": 3836, "loss": 0.1593, "learning_rate": 3.0220277748331223e-06, "epoch": 0.4613429772260776, "percentage": 46.14, "elapsed_time": "2:46:44", "remaining_time": "3:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1771, "total_steps": 3836, "loss": 0.18, "learning_rate": 3.019919774178695e-06, "epoch": 0.46160362297592283, "percentage": 46.17, "elapsed_time": "2:46:51", "remaining_time": "3:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1772, "total_steps": 3836, "loss": 0.1668, "learning_rate": 3.017811387086721e-06, "epoch": 0.4618642687257681, "percentage": 46.19, "elapsed_time": "2:46:56", "remaining_time": "3:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1773, "total_steps": 3836, "loss": 0.1606, "learning_rate": 3.015702615124287e-06, "epoch": 0.4621249144756133, "percentage": 46.22, "elapsed_time": "2:47:02", "remaining_time": "3:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1774, "total_steps": 3836, "loss": 0.1627, "learning_rate": 3.013593459858767e-06, "epoch": 0.46238556022545857, "percentage": 46.25, "elapsed_time": "2:47:07", "remaining_time": "3:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1775, "total_steps": 3836, "loss": 0.1685, "learning_rate": 3.0114839228578197e-06, "epoch": 0.4626462059753038, "percentage": 46.27, "elapsed_time": "2:47:12", "remaining_time": "3:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1776, "total_steps": 3836, "loss": 0.1594, "learning_rate": 3.0093740056893882e-06, "epoch": 0.46290685172514906, "percentage": 46.3, "elapsed_time": "2:47:18", "remaining_time": "3:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1777, "total_steps": 3836, "loss": 0.1539, "learning_rate": 3.007263709921697e-06, "epoch": 0.4631674974749943, "percentage": 46.32, "elapsed_time": "2:47:24", "remaining_time": "3:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1778, "total_steps": 3836, "loss": 0.1586, "learning_rate": 3.005153037123253e-06, "epoch": 0.46342814322483955, "percentage": 46.35, "elapsed_time": "2:47:29", "remaining_time": "3:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1779, "total_steps": 3836, "loss": 0.1748, "learning_rate": 3.003041988862842e-06, "epoch": 0.4636887889746848, "percentage": 46.38, "elapsed_time": "2:47:35", "remaining_time": "3:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1780, "total_steps": 3836, "loss": 0.161, "learning_rate": 3.000930566709531e-06, "epoch": 0.46394943472453004, "percentage": 46.4, "elapsed_time": "2:47:40", "remaining_time": "3:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1781, "total_steps": 3836, "loss": 0.1715, "learning_rate": 2.998818772232663e-06, "epoch": 0.4642100804743753, "percentage": 46.43, "elapsed_time": "2:47:46", "remaining_time": "3:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1782, "total_steps": 3836, "loss": 0.1671, "learning_rate": 2.996706607001858e-06, "epoch": 0.46447072622422053, "percentage": 46.45, "elapsed_time": "2:47:53", "remaining_time": "3:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1783, "total_steps": 3836, "loss": 0.1507, "learning_rate": 2.9945940725870127e-06, "epoch": 0.4647313719740657, "percentage": 46.48, "elapsed_time": "2:47:58", "remaining_time": "3:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1784, "total_steps": 3836, "loss": 0.1489, "learning_rate": 2.9924811705582966e-06, "epoch": 0.46499201772391097, "percentage": 46.51, "elapsed_time": "2:48:03", "remaining_time": "3:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1785, "total_steps": 3836, "loss": 0.1597, "learning_rate": 2.990367902486155e-06, "epoch": 0.4652526634737562, "percentage": 46.53, "elapsed_time": "2:48:09", "remaining_time": "3:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1786, "total_steps": 3836, "loss": 0.1705, "learning_rate": 2.988254269941302e-06, "epoch": 0.46551330922360146, "percentage": 46.56, "elapsed_time": "2:48:15", "remaining_time": "3:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1787, "total_steps": 3836, "loss": 0.151, "learning_rate": 2.986140274494723e-06, "epoch": 0.4657739549734467, "percentage": 46.58, "elapsed_time": "2:48:20", "remaining_time": "3:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1788, "total_steps": 3836, "loss": 0.1602, "learning_rate": 2.984025917717678e-06, "epoch": 0.46603460072329195, "percentage": 46.61, "elapsed_time": "2:48:25", "remaining_time": "3:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1789, "total_steps": 3836, "loss": 0.1765, "learning_rate": 2.9819112011816886e-06, "epoch": 0.4662952464731372, "percentage": 46.64, "elapsed_time": "2:48:31", "remaining_time": "3:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1790, "total_steps": 3836, "loss": 0.1618, "learning_rate": 2.979796126458548e-06, "epoch": 0.46655589222298244, "percentage": 46.66, "elapsed_time": "2:48:36", "remaining_time": "3:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1791, "total_steps": 3836, "loss": 0.1612, "learning_rate": 2.9776806951203154e-06, "epoch": 0.4668165379728277, "percentage": 46.69, "elapsed_time": "2:48:42", "remaining_time": "3:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1792, "total_steps": 3836, "loss": 0.1663, "learning_rate": 2.975564908739313e-06, "epoch": 0.46707718372267293, "percentage": 46.72, "elapsed_time": "2:48:48", "remaining_time": "3:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1793, "total_steps": 3836, "loss": 0.1712, "learning_rate": 2.9734487688881294e-06, "epoch": 0.4673378294725182, "percentage": 46.74, "elapsed_time": "2:48:54", "remaining_time": "3:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1794, "total_steps": 3836, "loss": 0.1602, "learning_rate": 2.9713322771396147e-06, "epoch": 0.4675984752223634, "percentage": 46.77, "elapsed_time": "2:48:59", "remaining_time": "3:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1795, "total_steps": 3836, "loss": 0.1589, "learning_rate": 2.9692154350668797e-06, "epoch": 0.46785912097220866, "percentage": 46.79, "elapsed_time": "2:49:05", "remaining_time": "3:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1796, "total_steps": 3836, "loss": 0.1727, "learning_rate": 2.967098244243297e-06, "epoch": 0.4681197667220539, "percentage": 46.82, "elapsed_time": "2:49:11", "remaining_time": "3:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1797, "total_steps": 3836, "loss": 0.1697, "learning_rate": 2.9649807062424984e-06, "epoch": 0.46838041247189915, "percentage": 46.85, "elapsed_time": "2:49:16", "remaining_time": "3:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1798, "total_steps": 3836, "loss": 0.1611, "learning_rate": 2.962862822638372e-06, "epoch": 0.46864105822174434, "percentage": 46.87, "elapsed_time": "2:49:22", "remaining_time": "3:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1799, "total_steps": 3836, "loss": 0.1448, "learning_rate": 2.960744595005066e-06, "epoch": 0.4689017039715896, "percentage": 46.9, "elapsed_time": "2:49:27", "remaining_time": "3:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 3836, "loss": 0.1499, "learning_rate": 2.95862602491698e-06, "epoch": 0.46916234972143483, "percentage": 46.92, "elapsed_time": "2:49:33", "remaining_time": "3:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1801, "total_steps": 3836, "loss": 0.1631, "learning_rate": 2.956507113948772e-06, "epoch": 0.4694229954712801, "percentage": 46.95, "elapsed_time": "2:49:38", "remaining_time": "3:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1802, "total_steps": 3836, "loss": 0.1698, "learning_rate": 2.9543878636753514e-06, "epoch": 0.4696836412211253, "percentage": 46.98, "elapsed_time": "2:49:44", "remaining_time": "3:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1803, "total_steps": 3836, "loss": 0.1487, "learning_rate": 2.9522682756718796e-06, "epoch": 0.46994428697097057, "percentage": 47.0, "elapsed_time": "2:49:49", "remaining_time": "3:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1804, "total_steps": 3836, "loss": 0.1531, "learning_rate": 2.950148351513771e-06, "epoch": 0.4702049327208158, "percentage": 47.03, "elapsed_time": "2:49:55", "remaining_time": "3:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1805, "total_steps": 3836, "loss": 0.1629, "learning_rate": 2.9480280927766875e-06, "epoch": 0.47046557847066106, "percentage": 47.05, "elapsed_time": "2:50:01", "remaining_time": "3:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1806, "total_steps": 3836, "loss": 0.1631, "learning_rate": 2.9459075010365406e-06, "epoch": 0.4707262242205063, "percentage": 47.08, "elapsed_time": "2:50:06", "remaining_time": "3:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1807, "total_steps": 3836, "loss": 0.1667, "learning_rate": 2.9437865778694903e-06, "epoch": 0.47098686997035155, "percentage": 47.11, "elapsed_time": "2:50:12", "remaining_time": "3:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1808, "total_steps": 3836, "loss": 0.1538, "learning_rate": 2.9416653248519404e-06, "epoch": 0.4712475157201968, "percentage": 47.13, "elapsed_time": "2:50:18", "remaining_time": "3:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1809, "total_steps": 3836, "loss": 0.1704, "learning_rate": 2.9395437435605435e-06, "epoch": 0.47150816147004204, "percentage": 47.16, "elapsed_time": "2:50:24", "remaining_time": "3:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1810, "total_steps": 3836, "loss": 0.1542, "learning_rate": 2.9374218355721925e-06, "epoch": 0.4717688072198873, "percentage": 47.18, "elapsed_time": "2:50:29", "remaining_time": "3:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1811, "total_steps": 3836, "loss": 0.1583, "learning_rate": 2.935299602464025e-06, "epoch": 0.47202945296973253, "percentage": 47.21, "elapsed_time": "2:50:35", "remaining_time": "3:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1812, "total_steps": 3836, "loss": 0.1667, "learning_rate": 2.933177045813421e-06, "epoch": 0.4722900987195778, "percentage": 47.24, "elapsed_time": "2:50:41", "remaining_time": "3:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1813, "total_steps": 3836, "loss": 0.1758, "learning_rate": 2.931054167198e-06, "epoch": 0.472550744469423, "percentage": 47.26, "elapsed_time": "2:50:47", "remaining_time": "3:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1814, "total_steps": 3836, "loss": 0.1659, "learning_rate": 2.9289309681956194e-06, "epoch": 0.4728113902192682, "percentage": 47.29, "elapsed_time": "2:50:52", "remaining_time": "3:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1815, "total_steps": 3836, "loss": 0.1581, "learning_rate": 2.926807450384377e-06, "epoch": 0.47307203596911346, "percentage": 47.31, "elapsed_time": "2:50:57", "remaining_time": "3:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1816, "total_steps": 3836, "loss": 0.1508, "learning_rate": 2.924683615342607e-06, "epoch": 0.4733326817189587, "percentage": 47.34, "elapsed_time": "2:51:03", "remaining_time": "3:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1817, "total_steps": 3836, "loss": 0.1699, "learning_rate": 2.92255946464888e-06, "epoch": 0.47359332746880395, "percentage": 47.37, "elapsed_time": "2:51:08", "remaining_time": "3:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1818, "total_steps": 3836, "loss": 0.1642, "learning_rate": 2.920434999881998e-06, "epoch": 0.4738539732186492, "percentage": 47.39, "elapsed_time": "2:51:14", "remaining_time": "3:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1819, "total_steps": 3836, "loss": 0.1393, "learning_rate": 2.918310222621001e-06, "epoch": 0.47411461896849444, "percentage": 47.42, "elapsed_time": "2:51:19", "remaining_time": "3:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1820, "total_steps": 3836, "loss": 0.1643, "learning_rate": 2.9161851344451563e-06, "epoch": 0.4743752647183397, "percentage": 47.45, "elapsed_time": "2:51:25", "remaining_time": "3:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1821, "total_steps": 3836, "loss": 0.1605, "learning_rate": 2.9140597369339684e-06, "epoch": 0.47463591046818493, "percentage": 47.47, "elapsed_time": "2:51:31", "remaining_time": "3:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1822, "total_steps": 3836, "loss": 0.1528, "learning_rate": 2.9119340316671663e-06, "epoch": 0.4748965562180302, "percentage": 47.5, "elapsed_time": "2:51:36", "remaining_time": "3:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1823, "total_steps": 3836, "loss": 0.1643, "learning_rate": 2.9098080202247093e-06, "epoch": 0.4751572019678754, "percentage": 47.52, "elapsed_time": "2:51:41", "remaining_time": "3:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1824, "total_steps": 3836, "loss": 0.1572, "learning_rate": 2.9076817041867863e-06, "epoch": 0.47541784771772067, "percentage": 47.55, "elapsed_time": "2:51:47", "remaining_time": "3:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1825, "total_steps": 3836, "loss": 0.1665, "learning_rate": 2.90555508513381e-06, "epoch": 0.4756784934675659, "percentage": 47.58, "elapsed_time": "2:51:52", "remaining_time": "3:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1826, "total_steps": 3836, "loss": 0.1482, "learning_rate": 2.9034281646464197e-06, "epoch": 0.47593913921741116, "percentage": 47.6, "elapsed_time": "2:51:57", "remaining_time": "3:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1827, "total_steps": 3836, "loss": 0.1773, "learning_rate": 2.901300944305479e-06, "epoch": 0.4761997849672564, "percentage": 47.63, "elapsed_time": "2:52:02", "remaining_time": "3:09:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1828, "total_steps": 3836, "loss": 0.1522, "learning_rate": 2.8991734256920723e-06, "epoch": 0.47646043071710165, "percentage": 47.65, "elapsed_time": "2:52:08", "remaining_time": "3:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1829, "total_steps": 3836, "loss": 0.1688, "learning_rate": 2.8970456103875083e-06, "epoch": 0.47672107646694684, "percentage": 47.68, "elapsed_time": "2:52:14", "remaining_time": "3:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1830, "total_steps": 3836, "loss": 0.1695, "learning_rate": 2.894917499973315e-06, "epoch": 0.4769817222167921, "percentage": 47.71, "elapsed_time": "2:52:20", "remaining_time": "3:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1831, "total_steps": 3836, "loss": 0.1625, "learning_rate": 2.892789096031239e-06, "epoch": 0.4772423679666373, "percentage": 47.73, "elapsed_time": "2:52:26", "remaining_time": "3:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1832, "total_steps": 3836, "loss": 0.1602, "learning_rate": 2.890660400143248e-06, "epoch": 0.47750301371648257, "percentage": 47.76, "elapsed_time": "2:52:31", "remaining_time": "3:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1833, "total_steps": 3836, "loss": 0.1588, "learning_rate": 2.8885314138915215e-06, "epoch": 0.4777636594663278, "percentage": 47.78, "elapsed_time": "2:52:37", "remaining_time": "3:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1834, "total_steps": 3836, "loss": 0.1446, "learning_rate": 2.8864021388584606e-06, "epoch": 0.47802430521617306, "percentage": 47.81, "elapsed_time": "2:52:43", "remaining_time": "3:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1835, "total_steps": 3836, "loss": 0.1731, "learning_rate": 2.884272576626677e-06, "epoch": 0.4782849509660183, "percentage": 47.84, "elapsed_time": "2:52:49", "remaining_time": "3:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1836, "total_steps": 3836, "loss": 0.1719, "learning_rate": 2.882142728778997e-06, "epoch": 0.47854559671586355, "percentage": 47.86, "elapsed_time": "2:52:54", "remaining_time": "3:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1837, "total_steps": 3836, "loss": 0.161, "learning_rate": 2.880012596898461e-06, "epoch": 0.4788062424657088, "percentage": 47.89, "elapsed_time": "2:53:00", "remaining_time": "3:08:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1838, "total_steps": 3836, "loss": 0.1452, "learning_rate": 2.877882182568317e-06, "epoch": 0.47906688821555404, "percentage": 47.91, "elapsed_time": "2:53:06", "remaining_time": "3:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1839, "total_steps": 3836, "loss": 0.1565, "learning_rate": 2.875751487372026e-06, "epoch": 0.4793275339653993, "percentage": 47.94, "elapsed_time": "2:53:11", "remaining_time": "3:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1840, "total_steps": 3836, "loss": 0.157, "learning_rate": 2.873620512893257e-06, "epoch": 0.47958817971524453, "percentage": 47.97, "elapsed_time": "2:53:17", "remaining_time": "3:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1841, "total_steps": 3836, "loss": 0.1598, "learning_rate": 2.8714892607158847e-06, "epoch": 0.4798488254650898, "percentage": 47.99, "elapsed_time": "2:53:21", "remaining_time": "3:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1842, "total_steps": 3836, "loss": 0.1751, "learning_rate": 2.8693577324239925e-06, "epoch": 0.480109471214935, "percentage": 48.02, "elapsed_time": "2:53:27", "remaining_time": "3:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1843, "total_steps": 3836, "loss": 0.1714, "learning_rate": 2.8672259296018683e-06, "epoch": 0.48037011696478027, "percentage": 48.04, "elapsed_time": "2:53:33", "remaining_time": "3:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1844, "total_steps": 3836, "loss": 0.1633, "learning_rate": 2.865093853834004e-06, "epoch": 0.48063076271462546, "percentage": 48.07, "elapsed_time": "2:53:39", "remaining_time": "3:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1845, "total_steps": 3836, "loss": 0.1682, "learning_rate": 2.8629615067050942e-06, "epoch": 0.4808914084644707, "percentage": 48.1, "elapsed_time": "2:53:45", "remaining_time": "3:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1846, "total_steps": 3836, "loss": 0.1541, "learning_rate": 2.8608288898000356e-06, "epoch": 0.48115205421431595, "percentage": 48.12, "elapsed_time": "2:53:50", "remaining_time": "3:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1847, "total_steps": 3836, "loss": 0.1626, "learning_rate": 2.8586960047039248e-06, "epoch": 0.4814126999641612, "percentage": 48.15, "elapsed_time": "2:53:55", "remaining_time": "3:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1848, "total_steps": 3836, "loss": 0.1631, "learning_rate": 2.8565628530020584e-06, "epoch": 0.48167334571400644, "percentage": 48.18, "elapsed_time": "2:54:01", "remaining_time": "3:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1849, "total_steps": 3836, "loss": 0.1585, "learning_rate": 2.8544294362799298e-06, "epoch": 0.4819339914638517, "percentage": 48.2, "elapsed_time": "2:54:07", "remaining_time": "3:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 3836, "loss": 0.1474, "learning_rate": 2.8522957561232323e-06, "epoch": 0.48219463721369693, "percentage": 48.23, "elapsed_time": "2:54:12", "remaining_time": "3:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1851, "total_steps": 3836, "loss": 0.1696, "learning_rate": 2.8501618141178515e-06, "epoch": 0.4824552829635422, "percentage": 48.25, "elapsed_time": "2:54:17", "remaining_time": "3:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1852, "total_steps": 3836, "loss": 0.1476, "learning_rate": 2.84802761184987e-06, "epoch": 0.4827159287133874, "percentage": 48.28, "elapsed_time": "2:54:22", "remaining_time": "3:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1853, "total_steps": 3836, "loss": 0.1543, "learning_rate": 2.8458931509055626e-06, "epoch": 0.48297657446323267, "percentage": 48.31, "elapsed_time": "2:54:28", "remaining_time": "3:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1854, "total_steps": 3836, "loss": 0.1631, "learning_rate": 2.8437584328713976e-06, "epoch": 0.4832372202130779, "percentage": 48.33, "elapsed_time": "2:54:33", "remaining_time": "3:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1855, "total_steps": 3836, "loss": 0.1571, "learning_rate": 2.841623459334033e-06, "epoch": 0.48349786596292316, "percentage": 48.36, "elapsed_time": "2:54:38", "remaining_time": "3:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1856, "total_steps": 3836, "loss": 0.1529, "learning_rate": 2.8394882318803174e-06, "epoch": 0.4837585117127684, "percentage": 48.38, "elapsed_time": "2:54:43", "remaining_time": "3:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1857, "total_steps": 3836, "loss": 0.1598, "learning_rate": 2.8373527520972884e-06, "epoch": 0.48401915746261365, "percentage": 48.41, "elapsed_time": "2:54:49", "remaining_time": "3:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1858, "total_steps": 3836, "loss": 0.1551, "learning_rate": 2.835217021572171e-06, "epoch": 0.4842798032124589, "percentage": 48.44, "elapsed_time": "2:54:55", "remaining_time": "3:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1859, "total_steps": 3836, "loss": 0.1769, "learning_rate": 2.8330810418923752e-06, "epoch": 0.4845404489623041, "percentage": 48.46, "elapsed_time": "2:55:00", "remaining_time": "3:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1860, "total_steps": 3836, "loss": 0.1492, "learning_rate": 2.8309448146454993e-06, "epoch": 0.4848010947121493, "percentage": 48.49, "elapsed_time": "2:55:06", "remaining_time": "3:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1861, "total_steps": 3836, "loss": 0.1611, "learning_rate": 2.828808341419321e-06, "epoch": 0.4850617404619946, "percentage": 48.51, "elapsed_time": "2:55:12", "remaining_time": "3:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1862, "total_steps": 3836, "loss": 0.1695, "learning_rate": 2.8266716238018065e-06, "epoch": 0.4853223862118398, "percentage": 48.54, "elapsed_time": "2:55:17", "remaining_time": "3:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1863, "total_steps": 3836, "loss": 0.1581, "learning_rate": 2.8245346633810995e-06, "epoch": 0.48558303196168506, "percentage": 48.57, "elapsed_time": "2:55:22", "remaining_time": "3:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1864, "total_steps": 3836, "loss": 0.1762, "learning_rate": 2.822397461745524e-06, "epoch": 0.4858436777115303, "percentage": 48.59, "elapsed_time": "2:55:28", "remaining_time": "3:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1865, "total_steps": 3836, "loss": 0.1616, "learning_rate": 2.8202600204835865e-06, "epoch": 0.48610432346137555, "percentage": 48.62, "elapsed_time": "2:55:34", "remaining_time": "3:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1866, "total_steps": 3836, "loss": 0.1541, "learning_rate": 2.8181223411839686e-06, "epoch": 0.4863649692112208, "percentage": 48.64, "elapsed_time": "2:55:39", "remaining_time": "3:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1867, "total_steps": 3836, "loss": 0.1604, "learning_rate": 2.8159844254355295e-06, "epoch": 0.48662561496106604, "percentage": 48.67, "elapsed_time": "2:55:45", "remaining_time": "3:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1868, "total_steps": 3836, "loss": 0.1607, "learning_rate": 2.8138462748273072e-06, "epoch": 0.4868862607109113, "percentage": 48.7, "elapsed_time": "2:55:50", "remaining_time": "3:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1869, "total_steps": 3836, "loss": 0.1615, "learning_rate": 2.811707890948508e-06, "epoch": 0.48714690646075653, "percentage": 48.72, "elapsed_time": "2:55:56", "remaining_time": "3:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1870, "total_steps": 3836, "loss": 0.1608, "learning_rate": 2.8095692753885177e-06, "epoch": 0.4874075522106018, "percentage": 48.75, "elapsed_time": "2:56:02", "remaining_time": "3:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1871, "total_steps": 3836, "loss": 0.154, "learning_rate": 2.8074304297368913e-06, "epoch": 0.487668197960447, "percentage": 48.77, "elapsed_time": "2:56:08", "remaining_time": "3:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1872, "total_steps": 3836, "loss": 0.1791, "learning_rate": 2.805291355583355e-06, "epoch": 0.48792884371029227, "percentage": 48.8, "elapsed_time": "2:56:14", "remaining_time": "3:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1873, "total_steps": 3836, "loss": 0.165, "learning_rate": 2.803152054517806e-06, "epoch": 0.4881894894601375, "percentage": 48.83, "elapsed_time": "2:56:19", "remaining_time": "3:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1874, "total_steps": 3836, "loss": 0.1565, "learning_rate": 2.8010125281303076e-06, "epoch": 0.4884501352099827, "percentage": 48.85, "elapsed_time": "2:56:24", "remaining_time": "3:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1875, "total_steps": 3836, "loss": 0.1546, "learning_rate": 2.798872778011094e-06, "epoch": 0.48871078095982795, "percentage": 48.88, "elapsed_time": "2:56:29", "remaining_time": "3:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1876, "total_steps": 3836, "loss": 0.1746, "learning_rate": 2.7967328057505637e-06, "epoch": 0.4889714267096732, "percentage": 48.91, "elapsed_time": "2:56:35", "remaining_time": "3:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1877, "total_steps": 3836, "loss": 0.1567, "learning_rate": 2.7945926129392797e-06, "epoch": 0.48923207245951844, "percentage": 48.93, "elapsed_time": "2:56:40", "remaining_time": "3:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1878, "total_steps": 3836, "loss": 0.1678, "learning_rate": 2.792452201167971e-06, "epoch": 0.4894927182093637, "percentage": 48.96, "elapsed_time": "2:56:46", "remaining_time": "3:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1879, "total_steps": 3836, "loss": 0.1561, "learning_rate": 2.790311572027528e-06, "epoch": 0.48975336395920893, "percentage": 48.98, "elapsed_time": "2:56:52", "remaining_time": "3:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1880, "total_steps": 3836, "loss": 0.1641, "learning_rate": 2.7881707271090018e-06, "epoch": 0.4900140097090542, "percentage": 49.01, "elapsed_time": "2:56:57", "remaining_time": "3:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1881, "total_steps": 3836, "loss": 0.1529, "learning_rate": 2.7860296680036064e-06, "epoch": 0.4902746554588994, "percentage": 49.04, "elapsed_time": "2:57:03", "remaining_time": "3:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1882, "total_steps": 3836, "loss": 0.1559, "learning_rate": 2.7838883963027118e-06, "epoch": 0.49053530120874467, "percentage": 49.06, "elapsed_time": "2:57:08", "remaining_time": "3:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1883, "total_steps": 3836, "loss": 0.1572, "learning_rate": 2.7817469135978496e-06, "epoch": 0.4907959469585899, "percentage": 49.09, "elapsed_time": "2:57:14", "remaining_time": "3:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1884, "total_steps": 3836, "loss": 0.1519, "learning_rate": 2.779605221480706e-06, "epoch": 0.49105659270843516, "percentage": 49.11, "elapsed_time": "2:57:19", "remaining_time": "3:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1885, "total_steps": 3836, "loss": 0.1532, "learning_rate": 2.7774633215431213e-06, "epoch": 0.4913172384582804, "percentage": 49.14, "elapsed_time": "2:57:25", "remaining_time": "3:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1886, "total_steps": 3836, "loss": 0.1675, "learning_rate": 2.7753212153770947e-06, "epoch": 0.49157788420812565, "percentage": 49.17, "elapsed_time": "2:57:30", "remaining_time": "3:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1887, "total_steps": 3836, "loss": 0.1526, "learning_rate": 2.7731789045747746e-06, "epoch": 0.4918385299579709, "percentage": 49.19, "elapsed_time": "2:57:36", "remaining_time": "3:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1888, "total_steps": 3836, "loss": 0.1619, "learning_rate": 2.7710363907284643e-06, "epoch": 0.49209917570781614, "percentage": 49.22, "elapsed_time": "2:57:41", "remaining_time": "3:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1889, "total_steps": 3836, "loss": 0.1517, "learning_rate": 2.768893675430615e-06, "epoch": 0.49235982145766133, "percentage": 49.24, "elapsed_time": "2:57:46", "remaining_time": "3:03:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1890, "total_steps": 3836, "loss": 0.1582, "learning_rate": 2.766750760273831e-06, "epoch": 0.4926204672075066, "percentage": 49.27, "elapsed_time": "2:57:51", "remaining_time": "3:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1891, "total_steps": 3836, "loss": 0.1527, "learning_rate": 2.764607646850863e-06, "epoch": 0.4928811129573518, "percentage": 49.3, "elapsed_time": "2:57:57", "remaining_time": "3:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1892, "total_steps": 3836, "loss": 0.1471, "learning_rate": 2.76246433675461e-06, "epoch": 0.49314175870719706, "percentage": 49.32, "elapsed_time": "2:58:02", "remaining_time": "3:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1893, "total_steps": 3836, "loss": 0.1557, "learning_rate": 2.7603208315781164e-06, "epoch": 0.4934024044570423, "percentage": 49.35, "elapsed_time": "2:58:07", "remaining_time": "3:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1894, "total_steps": 3836, "loss": 0.1569, "learning_rate": 2.7581771329145713e-06, "epoch": 0.49366305020688755, "percentage": 49.37, "elapsed_time": "2:58:13", "remaining_time": "3:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1895, "total_steps": 3836, "loss": 0.1567, "learning_rate": 2.75603324235731e-06, "epoch": 0.4939236959567328, "percentage": 49.4, "elapsed_time": "2:58:18", "remaining_time": "3:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1896, "total_steps": 3836, "loss": 0.1711, "learning_rate": 2.7538891614998074e-06, "epoch": 0.49418434170657805, "percentage": 49.43, "elapsed_time": "2:58:23", "remaining_time": "3:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1897, "total_steps": 3836, "loss": 0.1509, "learning_rate": 2.7517448919356815e-06, "epoch": 0.4944449874564233, "percentage": 49.45, "elapsed_time": "2:58:29", "remaining_time": "3:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1898, "total_steps": 3836, "loss": 0.1689, "learning_rate": 2.749600435258691e-06, "epoch": 0.49470563320626854, "percentage": 49.48, "elapsed_time": "2:58:34", "remaining_time": "3:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1899, "total_steps": 3836, "loss": 0.1631, "learning_rate": 2.747455793062732e-06, "epoch": 0.4949662789561138, "percentage": 49.5, "elapsed_time": "2:58:39", "remaining_time": "3:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 3836, "loss": 0.143, "learning_rate": 2.745310966941839e-06, "epoch": 0.495226924705959, "percentage": 49.53, "elapsed_time": "2:58:45", "remaining_time": "3:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1901, "total_steps": 3836, "loss": 0.1715, "learning_rate": 2.743165958490186e-06, "epoch": 0.49548757045580427, "percentage": 49.56, "elapsed_time": "2:58:51", "remaining_time": "3:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1902, "total_steps": 3836, "loss": 0.1537, "learning_rate": 2.741020769302077e-06, "epoch": 0.4957482162056495, "percentage": 49.58, "elapsed_time": "2:58:56", "remaining_time": "3:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1903, "total_steps": 3836, "loss": 0.1619, "learning_rate": 2.7388754009719553e-06, "epoch": 0.49600886195549476, "percentage": 49.61, "elapsed_time": "2:59:02", "remaining_time": "3:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1904, "total_steps": 3836, "loss": 0.1607, "learning_rate": 2.7367298550943954e-06, "epoch": 0.49626950770534, "percentage": 49.64, "elapsed_time": "2:59:07", "remaining_time": "3:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1905, "total_steps": 3836, "loss": 0.161, "learning_rate": 2.7345841332641027e-06, "epoch": 0.4965301534551852, "percentage": 49.66, "elapsed_time": "2:59:13", "remaining_time": "3:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1906, "total_steps": 3836, "loss": 0.1645, "learning_rate": 2.7324382370759174e-06, "epoch": 0.49679079920503044, "percentage": 49.69, "elapsed_time": "2:59:18", "remaining_time": "3:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1907, "total_steps": 3836, "loss": 0.16, "learning_rate": 2.730292168124802e-06, "epoch": 0.4970514449548757, "percentage": 49.71, "elapsed_time": "2:59:24", "remaining_time": "3:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1908, "total_steps": 3836, "loss": 0.1457, "learning_rate": 2.7281459280058563e-06, "epoch": 0.49731209070472093, "percentage": 49.74, "elapsed_time": "2:59:30", "remaining_time": "3:01:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1909, "total_steps": 3836, "loss": 0.1467, "learning_rate": 2.7259995183143004e-06, "epoch": 0.4975727364545662, "percentage": 49.77, "elapsed_time": "2:59:35", "remaining_time": "3:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1910, "total_steps": 3836, "loss": 0.1603, "learning_rate": 2.7238529406454834e-06, "epoch": 0.4978333822044114, "percentage": 49.79, "elapsed_time": "2:59:41", "remaining_time": "3:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1911, "total_steps": 3836, "loss": 0.1537, "learning_rate": 2.7217061965948794e-06, "epoch": 0.49809402795425667, "percentage": 49.82, "elapsed_time": "2:59:47", "remaining_time": "3:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1912, "total_steps": 3836, "loss": 0.1478, "learning_rate": 2.719559287758085e-06, "epoch": 0.4983546737041019, "percentage": 49.84, "elapsed_time": "2:59:52", "remaining_time": "3:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1913, "total_steps": 3836, "loss": 0.1589, "learning_rate": 2.717412215730819e-06, "epoch": 0.49861531945394716, "percentage": 49.87, "elapsed_time": "2:59:58", "remaining_time": "3:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1914, "total_steps": 3836, "loss": 0.1635, "learning_rate": 2.7152649821089245e-06, "epoch": 0.4988759652037924, "percentage": 49.9, "elapsed_time": "3:00:04", "remaining_time": "3:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1915, "total_steps": 3836, "loss": 0.1593, "learning_rate": 2.7131175884883604e-06, "epoch": 0.49913661095363765, "percentage": 49.92, "elapsed_time": "3:00:10", "remaining_time": "3:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1916, "total_steps": 3836, "loss": 0.1545, "learning_rate": 2.7109700364652075e-06, "epoch": 0.4993972567034829, "percentage": 49.95, "elapsed_time": "3:00:15", "remaining_time": "3:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1917, "total_steps": 3836, "loss": 0.163, "learning_rate": 2.7088223276356635e-06, "epoch": 0.49965790245332814, "percentage": 49.97, "elapsed_time": "3:00:21", "remaining_time": "3:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1918, "total_steps": 3836, "loss": 0.1545, "learning_rate": 2.7066744635960423e-06, "epoch": 0.4999185482031734, "percentage": 50.0, "elapsed_time": "3:00:27", "remaining_time": "3:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1919, "total_steps": 3836, "loss": 0.164, "learning_rate": 2.7045264459427737e-06, "epoch": 0.5001791939530186, "percentage": 50.03, "elapsed_time": "3:00:32", "remaining_time": "3:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1920, "total_steps": 3836, "loss": 0.1491, "learning_rate": 2.702378276272402e-06, "epoch": 0.5004398397028639, "percentage": 50.05, "elapsed_time": "3:00:38", "remaining_time": "3:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1921, "total_steps": 3836, "loss": 0.1572, "learning_rate": 2.7002299561815838e-06, "epoch": 0.5007004854527091, "percentage": 50.08, "elapsed_time": "3:00:43", "remaining_time": "3:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1922, "total_steps": 3836, "loss": 0.1559, "learning_rate": 2.6980814872670863e-06, "epoch": 0.5009611312025544, "percentage": 50.1, "elapsed_time": "3:00:49", "remaining_time": "3:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1923, "total_steps": 3836, "loss": 0.1625, "learning_rate": 2.6959328711257905e-06, "epoch": 0.5012217769523996, "percentage": 50.13, "elapsed_time": "3:00:55", "remaining_time": "2:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1924, "total_steps": 3836, "loss": 0.1677, "learning_rate": 2.6937841093546842e-06, "epoch": 0.5014824227022449, "percentage": 50.16, "elapsed_time": "3:01:00", "remaining_time": "2:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1925, "total_steps": 3836, "loss": 0.1628, "learning_rate": 2.6916352035508637e-06, "epoch": 0.50174306845209, "percentage": 50.18, "elapsed_time": "3:01:06", "remaining_time": "2:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1926, "total_steps": 3836, "loss": 0.1582, "learning_rate": 2.6894861553115337e-06, "epoch": 0.5020037142019353, "percentage": 50.21, "elapsed_time": "3:01:12", "remaining_time": "2:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1927, "total_steps": 3836, "loss": 0.1672, "learning_rate": 2.6873369662340036e-06, "epoch": 0.5022643599517805, "percentage": 50.23, "elapsed_time": "3:01:17", "remaining_time": "2:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1928, "total_steps": 3836, "loss": 0.1735, "learning_rate": 2.6851876379156884e-06, "epoch": 0.5025250057016257, "percentage": 50.26, "elapsed_time": "3:01:22", "remaining_time": "2:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1929, "total_steps": 3836, "loss": 0.1606, "learning_rate": 2.6830381719541047e-06, "epoch": 0.502785651451471, "percentage": 50.29, "elapsed_time": "3:01:28", "remaining_time": "2:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1930, "total_steps": 3836, "loss": 0.1563, "learning_rate": 2.680888569946874e-06, "epoch": 0.5030462972013162, "percentage": 50.31, "elapsed_time": "3:01:33", "remaining_time": "2:59:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1931, "total_steps": 3836, "loss": 0.1619, "learning_rate": 2.6787388334917175e-06, "epoch": 0.5033069429511615, "percentage": 50.34, "elapsed_time": "3:01:39", "remaining_time": "2:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1932, "total_steps": 3836, "loss": 0.1575, "learning_rate": 2.6765889641864562e-06, "epoch": 0.5035675887010067, "percentage": 50.36, "elapsed_time": "3:01:44", "remaining_time": "2:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1933, "total_steps": 3836, "loss": 0.1595, "learning_rate": 2.67443896362901e-06, "epoch": 0.503828234450852, "percentage": 50.39, "elapsed_time": "3:01:50", "remaining_time": "2:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1934, "total_steps": 3836, "loss": 0.17, "learning_rate": 2.6722888334173974e-06, "epoch": 0.5040888802006972, "percentage": 50.42, "elapsed_time": "3:01:56", "remaining_time": "2:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1935, "total_steps": 3836, "loss": 0.162, "learning_rate": 2.6701385751497304e-06, "epoch": 0.5043495259505425, "percentage": 50.44, "elapsed_time": "3:02:02", "remaining_time": "2:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1936, "total_steps": 3836, "loss": 0.1536, "learning_rate": 2.6679881904242198e-06, "epoch": 0.5046101717003877, "percentage": 50.47, "elapsed_time": "3:02:08", "remaining_time": "2:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1937, "total_steps": 3836, "loss": 0.1611, "learning_rate": 2.665837680839169e-06, "epoch": 0.504870817450233, "percentage": 50.5, "elapsed_time": "3:02:13", "remaining_time": "2:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1938, "total_steps": 3836, "loss": 0.1566, "learning_rate": 2.663687047992972e-06, "epoch": 0.5051314632000782, "percentage": 50.52, "elapsed_time": "3:02:19", "remaining_time": "2:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1939, "total_steps": 3836, "loss": 0.1454, "learning_rate": 2.6615362934841192e-06, "epoch": 0.5053921089499235, "percentage": 50.55, "elapsed_time": "3:02:24", "remaining_time": "2:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1940, "total_steps": 3836, "loss": 0.147, "learning_rate": 2.6593854189111857e-06, "epoch": 0.5056527546997687, "percentage": 50.57, "elapsed_time": "3:02:29", "remaining_time": "2:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1941, "total_steps": 3836, "loss": 0.1525, "learning_rate": 2.65723442587284e-06, "epoch": 0.505913400449614, "percentage": 50.6, "elapsed_time": "3:02:35", "remaining_time": "2:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1942, "total_steps": 3836, "loss": 0.1616, "learning_rate": 2.655083315967838e-06, "epoch": 0.5061740461994592, "percentage": 50.63, "elapsed_time": "3:02:41", "remaining_time": "2:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1943, "total_steps": 3836, "loss": 0.1609, "learning_rate": 2.6529320907950202e-06, "epoch": 0.5064346919493043, "percentage": 50.65, "elapsed_time": "3:02:47", "remaining_time": "2:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1944, "total_steps": 3836, "loss": 0.1517, "learning_rate": 2.650780751953316e-06, "epoch": 0.5066953376991497, "percentage": 50.68, "elapsed_time": "3:02:52", "remaining_time": "2:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1945, "total_steps": 3836, "loss": 0.1611, "learning_rate": 2.648629301041737e-06, "epoch": 0.5069559834489948, "percentage": 50.7, "elapsed_time": "3:02:57", "remaining_time": "2:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1946, "total_steps": 3836, "loss": 0.1586, "learning_rate": 2.646477739659378e-06, "epoch": 0.5072166291988401, "percentage": 50.73, "elapsed_time": "3:03:02", "remaining_time": "2:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1947, "total_steps": 3836, "loss": 0.1525, "learning_rate": 2.644326069405419e-06, "epoch": 0.5074772749486853, "percentage": 50.76, "elapsed_time": "3:03:07", "remaining_time": "2:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1948, "total_steps": 3836, "loss": 0.1622, "learning_rate": 2.6421742918791155e-06, "epoch": 0.5077379206985306, "percentage": 50.78, "elapsed_time": "3:03:13", "remaining_time": "2:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1949, "total_steps": 3836, "loss": 0.1472, "learning_rate": 2.640022408679808e-06, "epoch": 0.5079985664483758, "percentage": 50.81, "elapsed_time": "3:03:19", "remaining_time": "2:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 3836, "loss": 0.1778, "learning_rate": 2.6378704214069133e-06, "epoch": 0.5082592121982211, "percentage": 50.83, "elapsed_time": "3:03:25", "remaining_time": "2:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1951, "total_steps": 3836, "loss": 0.1608, "learning_rate": 2.6357183316599243e-06, "epoch": 0.5085198579480663, "percentage": 50.86, "elapsed_time": "3:03:30", "remaining_time": "2:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1952, "total_steps": 3836, "loss": 0.1691, "learning_rate": 2.633566141038413e-06, "epoch": 0.5087805036979116, "percentage": 50.89, "elapsed_time": "3:03:35", "remaining_time": "2:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1953, "total_steps": 3836, "loss": 0.1482, "learning_rate": 2.631413851142024e-06, "epoch": 0.5090411494477568, "percentage": 50.91, "elapsed_time": "3:03:40", "remaining_time": "2:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1954, "total_steps": 3836, "loss": 0.1442, "learning_rate": 2.629261463570476e-06, "epoch": 0.5093017951976021, "percentage": 50.94, "elapsed_time": "3:03:45", "remaining_time": "2:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1955, "total_steps": 3836, "loss": 0.1459, "learning_rate": 2.627108979923562e-06, "epoch": 0.5095624409474473, "percentage": 50.96, "elapsed_time": "3:03:50", "remaining_time": "2:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1956, "total_steps": 3836, "loss": 0.1595, "learning_rate": 2.6249564018011437e-06, "epoch": 0.5098230866972926, "percentage": 50.99, "elapsed_time": "3:03:56", "remaining_time": "2:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1957, "total_steps": 3836, "loss": 0.1592, "learning_rate": 2.6228037308031557e-06, "epoch": 0.5100837324471378, "percentage": 51.02, "elapsed_time": "3:04:02", "remaining_time": "2:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1958, "total_steps": 3836, "loss": 0.1647, "learning_rate": 2.6206509685296e-06, "epoch": 0.510344378196983, "percentage": 51.04, "elapsed_time": "3:04:07", "remaining_time": "2:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1959, "total_steps": 3836, "loss": 0.167, "learning_rate": 2.618498116580546e-06, "epoch": 0.5106050239468283, "percentage": 51.07, "elapsed_time": "3:04:13", "remaining_time": "2:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1960, "total_steps": 3836, "loss": 0.1559, "learning_rate": 2.6163451765561324e-06, "epoch": 0.5108656696966735, "percentage": 51.09, "elapsed_time": "3:04:19", "remaining_time": "2:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1961, "total_steps": 3836, "loss": 0.1474, "learning_rate": 2.614192150056561e-06, "epoch": 0.5111263154465188, "percentage": 51.12, "elapsed_time": "3:04:24", "remaining_time": "2:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1962, "total_steps": 3836, "loss": 0.1619, "learning_rate": 2.6120390386820975e-06, "epoch": 0.511386961196364, "percentage": 51.15, "elapsed_time": "3:04:30", "remaining_time": "2:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1963, "total_steps": 3836, "loss": 0.152, "learning_rate": 2.609885844033072e-06, "epoch": 0.5116476069462093, "percentage": 51.17, "elapsed_time": "3:04:35", "remaining_time": "2:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1964, "total_steps": 3836, "loss": 0.1613, "learning_rate": 2.607732567709877e-06, "epoch": 0.5119082526960544, "percentage": 51.2, "elapsed_time": "3:04:40", "remaining_time": "2:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1965, "total_steps": 3836, "loss": 0.1535, "learning_rate": 2.605579211312964e-06, "epoch": 0.5121688984458997, "percentage": 51.23, "elapsed_time": "3:04:46", "remaining_time": "2:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1966, "total_steps": 3836, "loss": 0.1552, "learning_rate": 2.6034257764428456e-06, "epoch": 0.5124295441957449, "percentage": 51.25, "elapsed_time": "3:04:51", "remaining_time": "2:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1967, "total_steps": 3836, "loss": 0.1639, "learning_rate": 2.601272264700091e-06, "epoch": 0.5126901899455902, "percentage": 51.28, "elapsed_time": "3:04:57", "remaining_time": "2:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1968, "total_steps": 3836, "loss": 0.1702, "learning_rate": 2.5991186776853277e-06, "epoch": 0.5129508356954354, "percentage": 51.3, "elapsed_time": "3:05:02", "remaining_time": "2:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1969, "total_steps": 3836, "loss": 0.1518, "learning_rate": 2.59696501699924e-06, "epoch": 0.5132114814452807, "percentage": 51.33, "elapsed_time": "3:05:08", "remaining_time": "2:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1970, "total_steps": 3836, "loss": 0.1494, "learning_rate": 2.594811284242565e-06, "epoch": 0.5134721271951259, "percentage": 51.36, "elapsed_time": "3:05:13", "remaining_time": "2:55:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1971, "total_steps": 3836, "loss": 0.1705, "learning_rate": 2.5926574810160936e-06, "epoch": 0.5137327729449712, "percentage": 51.38, "elapsed_time": "3:05:18", "remaining_time": "2:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1972, "total_steps": 3836, "loss": 0.1678, "learning_rate": 2.590503608920672e-06, "epoch": 0.5139934186948164, "percentage": 51.41, "elapsed_time": "3:05:23", "remaining_time": "2:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1973, "total_steps": 3836, "loss": 0.166, "learning_rate": 2.5883496695571934e-06, "epoch": 0.5142540644446616, "percentage": 51.43, "elapsed_time": "3:05:29", "remaining_time": "2:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1974, "total_steps": 3836, "loss": 0.1681, "learning_rate": 2.5861956645266036e-06, "epoch": 0.5145147101945069, "percentage": 51.46, "elapsed_time": "3:05:34", "remaining_time": "2:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1975, "total_steps": 3836, "loss": 0.1579, "learning_rate": 2.584041595429897e-06, "epoch": 0.5147753559443521, "percentage": 51.49, "elapsed_time": "3:05:40", "remaining_time": "2:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1976, "total_steps": 3836, "loss": 0.1533, "learning_rate": 2.581887463868114e-06, "epoch": 0.5150360016941974, "percentage": 51.51, "elapsed_time": "3:05:45", "remaining_time": "2:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1977, "total_steps": 3836, "loss": 0.1501, "learning_rate": 2.579733271442344e-06, "epoch": 0.5152966474440426, "percentage": 51.54, "elapsed_time": "3:05:51", "remaining_time": "2:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1978, "total_steps": 3836, "loss": 0.1601, "learning_rate": 2.57757901975372e-06, "epoch": 0.5155572931938879, "percentage": 51.56, "elapsed_time": "3:05:57", "remaining_time": "2:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1979, "total_steps": 3836, "loss": 0.1548, "learning_rate": 2.5754247104034177e-06, "epoch": 0.5158179389437331, "percentage": 51.59, "elapsed_time": "3:06:03", "remaining_time": "2:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1980, "total_steps": 3836, "loss": 0.1517, "learning_rate": 2.5732703449926595e-06, "epoch": 0.5160785846935784, "percentage": 51.62, "elapsed_time": "3:06:09", "remaining_time": "2:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1981, "total_steps": 3836, "loss": 0.157, "learning_rate": 2.5711159251227053e-06, "epoch": 0.5163392304434236, "percentage": 51.64, "elapsed_time": "3:06:14", "remaining_time": "2:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1982, "total_steps": 3836, "loss": 0.158, "learning_rate": 2.568961452394859e-06, "epoch": 0.5165998761932689, "percentage": 51.67, "elapsed_time": "3:06:20", "remaining_time": "2:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1983, "total_steps": 3836, "loss": 0.1443, "learning_rate": 2.5668069284104614e-06, "epoch": 0.516860521943114, "percentage": 51.69, "elapsed_time": "3:06:25", "remaining_time": "2:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1984, "total_steps": 3836, "loss": 0.1516, "learning_rate": 2.564652354770892e-06, "epoch": 0.5171211676929593, "percentage": 51.72, "elapsed_time": "3:06:31", "remaining_time": "2:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1985, "total_steps": 3836, "loss": 0.1546, "learning_rate": 2.5624977330775676e-06, "epoch": 0.5173818134428045, "percentage": 51.75, "elapsed_time": "3:06:37", "remaining_time": "2:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1986, "total_steps": 3836, "loss": 0.1563, "learning_rate": 2.560343064931941e-06, "epoch": 0.5176424591926498, "percentage": 51.77, "elapsed_time": "3:06:43", "remaining_time": "2:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1987, "total_steps": 3836, "loss": 0.1632, "learning_rate": 2.5581883519354976e-06, "epoch": 0.517903104942495, "percentage": 51.8, "elapsed_time": "3:06:49", "remaining_time": "2:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1988, "total_steps": 3836, "loss": 0.1586, "learning_rate": 2.5560335956897603e-06, "epoch": 0.5181637506923402, "percentage": 51.82, "elapsed_time": "3:06:54", "remaining_time": "2:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1989, "total_steps": 3836, "loss": 0.1508, "learning_rate": 2.553878797796278e-06, "epoch": 0.5184243964421855, "percentage": 51.85, "elapsed_time": "3:06:59", "remaining_time": "2:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1990, "total_steps": 3836, "loss": 0.1423, "learning_rate": 2.551723959856637e-06, "epoch": 0.5186850421920307, "percentage": 51.88, "elapsed_time": "3:07:05", "remaining_time": "2:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1991, "total_steps": 3836, "loss": 0.1526, "learning_rate": 2.5495690834724478e-06, "epoch": 0.518945687941876, "percentage": 51.9, "elapsed_time": "3:07:10", "remaining_time": "2:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1992, "total_steps": 3836, "loss": 0.1613, "learning_rate": 2.5474141702453536e-06, "epoch": 0.5192063336917212, "percentage": 51.93, "elapsed_time": "3:07:16", "remaining_time": "2:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1993, "total_steps": 3836, "loss": 0.1694, "learning_rate": 2.5452592217770233e-06, "epoch": 0.5194669794415665, "percentage": 51.96, "elapsed_time": "3:07:22", "remaining_time": "2:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1994, "total_steps": 3836, "loss": 0.1546, "learning_rate": 2.543104239669152e-06, "epoch": 0.5197276251914117, "percentage": 51.98, "elapsed_time": "3:07:28", "remaining_time": "2:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1995, "total_steps": 3836, "loss": 0.1455, "learning_rate": 2.54094922552346e-06, "epoch": 0.519988270941257, "percentage": 52.01, "elapsed_time": "3:07:33", "remaining_time": "2:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1996, "total_steps": 3836, "loss": 0.161, "learning_rate": 2.5387941809416895e-06, "epoch": 0.5202489166911022, "percentage": 52.03, "elapsed_time": "3:07:40", "remaining_time": "2:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1997, "total_steps": 3836, "loss": 0.1569, "learning_rate": 2.53663910752561e-06, "epoch": 0.5205095624409475, "percentage": 52.06, "elapsed_time": "3:07:45", "remaining_time": "2:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1998, "total_steps": 3836, "loss": 0.1456, "learning_rate": 2.5344840068770076e-06, "epoch": 0.5207702081907927, "percentage": 52.09, "elapsed_time": "3:07:50", "remaining_time": "2:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1999, "total_steps": 3836, "loss": 0.1718, "learning_rate": 2.5323288805976915e-06, "epoch": 0.521030853940638, "percentage": 52.11, "elapsed_time": "3:07:56", "remaining_time": "2:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 3836, "loss": 0.1529, "learning_rate": 2.530173730289488e-06, "epoch": 0.5212914996904832, "percentage": 52.14, "elapsed_time": "3:08:02", "remaining_time": "2:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 3836, "eval_loss": 0.15785683691501617, "epoch": 0.5212914996904832, "percentage": 52.14, "elapsed_time": "3:08:57", "remaining_time": "2:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2001, "total_steps": 3836, "loss": 0.1542, "learning_rate": 2.5280185575542438e-06, "epoch": 0.5215521454403285, "percentage": 52.16, "elapsed_time": "3:09:03", "remaining_time": "2:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2002, "total_steps": 3836, "loss": 0.1522, "learning_rate": 2.5258633639938195e-06, "epoch": 0.5218127911901737, "percentage": 52.19, "elapsed_time": "3:09:08", "remaining_time": "2:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2003, "total_steps": 3836, "loss": 0.152, "learning_rate": 2.5237081512100935e-06, "epoch": 0.5220734369400188, "percentage": 52.22, "elapsed_time": "3:09:14", "remaining_time": "2:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2004, "total_steps": 3836, "loss": 0.1514, "learning_rate": 2.521552920804956e-06, "epoch": 0.5223340826898641, "percentage": 52.24, "elapsed_time": "3:09:19", "remaining_time": "2:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2005, "total_steps": 3836, "loss": 0.1512, "learning_rate": 2.5193976743803138e-06, "epoch": 0.5225947284397093, "percentage": 52.27, "elapsed_time": "3:09:25", "remaining_time": "2:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2006, "total_steps": 3836, "loss": 0.1725, "learning_rate": 2.5172424135380817e-06, "epoch": 0.5228553741895546, "percentage": 52.29, "elapsed_time": "3:09:30", "remaining_time": "2:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2007, "total_steps": 3836, "loss": 0.1565, "learning_rate": 2.515087139880188e-06, "epoch": 0.5231160199393998, "percentage": 52.32, "elapsed_time": "3:09:36", "remaining_time": "2:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2008, "total_steps": 3836, "loss": 0.147, "learning_rate": 2.51293185500857e-06, "epoch": 0.5233766656892451, "percentage": 52.35, "elapsed_time": "3:09:42", "remaining_time": "2:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2009, "total_steps": 3836, "loss": 0.1546, "learning_rate": 2.510776560525171e-06, "epoch": 0.5236373114390903, "percentage": 52.37, "elapsed_time": "3:09:48", "remaining_time": "2:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2010, "total_steps": 3836, "loss": 0.1596, "learning_rate": 2.5086212580319457e-06, "epoch": 0.5238979571889356, "percentage": 52.4, "elapsed_time": "3:09:54", "remaining_time": "2:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2011, "total_steps": 3836, "loss": 0.1566, "learning_rate": 2.5064659491308514e-06, "epoch": 0.5241586029387808, "percentage": 52.42, "elapsed_time": "3:09:59", "remaining_time": "2:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2012, "total_steps": 3836, "loss": 0.1523, "learning_rate": 2.50431063542385e-06, "epoch": 0.5244192486886261, "percentage": 52.45, "elapsed_time": "3:10:05", "remaining_time": "2:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2013, "total_steps": 3836, "loss": 0.159, "learning_rate": 2.502155318512911e-06, "epoch": 0.5246798944384713, "percentage": 52.48, "elapsed_time": "3:10:10", "remaining_time": "2:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2014, "total_steps": 3836, "loss": 0.1661, "learning_rate": 2.5e-06, "epoch": 0.5249405401883166, "percentage": 52.5, "elapsed_time": "3:10:16", "remaining_time": "2:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2015, "total_steps": 3836, "loss": 0.1496, "learning_rate": 2.49784468148709e-06, "epoch": 0.5252011859381618, "percentage": 52.53, "elapsed_time": "3:10:22", "remaining_time": "2:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2016, "total_steps": 3836, "loss": 0.1327, "learning_rate": 2.49568936457615e-06, "epoch": 0.5254618316880071, "percentage": 52.55, "elapsed_time": "3:10:26", "remaining_time": "2:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2017, "total_steps": 3836, "loss": 0.1573, "learning_rate": 2.4935340508691502e-06, "epoch": 0.5257224774378523, "percentage": 52.58, "elapsed_time": "3:10:32", "remaining_time": "2:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2018, "total_steps": 3836, "loss": 0.147, "learning_rate": 2.491378741968055e-06, "epoch": 0.5259831231876975, "percentage": 52.61, "elapsed_time": "3:10:37", "remaining_time": "2:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2019, "total_steps": 3836, "loss": 0.1659, "learning_rate": 2.4892234394748296e-06, "epoch": 0.5262437689375428, "percentage": 52.63, "elapsed_time": "3:10:42", "remaining_time": "2:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2020, "total_steps": 3836, "loss": 0.1736, "learning_rate": 2.487068144991431e-06, "epoch": 0.526504414687388, "percentage": 52.66, "elapsed_time": "3:10:47", "remaining_time": "2:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2021, "total_steps": 3836, "loss": 0.1387, "learning_rate": 2.484912860119812e-06, "epoch": 0.5267650604372333, "percentage": 52.69, "elapsed_time": "3:10:53", "remaining_time": "2:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2022, "total_steps": 3836, "loss": 0.1583, "learning_rate": 2.4827575864619183e-06, "epoch": 0.5270257061870784, "percentage": 52.71, "elapsed_time": "3:10:58", "remaining_time": "2:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2023, "total_steps": 3836, "loss": 0.1543, "learning_rate": 2.480602325619687e-06, "epoch": 0.5272863519369237, "percentage": 52.74, "elapsed_time": "3:11:03", "remaining_time": "2:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2024, "total_steps": 3836, "loss": 0.1627, "learning_rate": 2.4784470791950442e-06, "epoch": 0.5275469976867689, "percentage": 52.76, "elapsed_time": "3:11:09", "remaining_time": "2:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2025, "total_steps": 3836, "loss": 0.155, "learning_rate": 2.476291848789907e-06, "epoch": 0.5278076434366142, "percentage": 52.79, "elapsed_time": "3:11:14", "remaining_time": "2:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2026, "total_steps": 3836, "loss": 0.1536, "learning_rate": 2.4741366360061813e-06, "epoch": 0.5280682891864594, "percentage": 52.82, "elapsed_time": "3:11:19", "remaining_time": "2:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2027, "total_steps": 3836, "loss": 0.1648, "learning_rate": 2.4719814424457566e-06, "epoch": 0.5283289349363047, "percentage": 52.84, "elapsed_time": "3:11:24", "remaining_time": "2:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2028, "total_steps": 3836, "loss": 0.1629, "learning_rate": 2.4698262697105128e-06, "epoch": 0.5285895806861499, "percentage": 52.87, "elapsed_time": "3:11:30", "remaining_time": "2:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2029, "total_steps": 3836, "loss": 0.1606, "learning_rate": 2.4676711194023102e-06, "epoch": 0.5288502264359952, "percentage": 52.89, "elapsed_time": "3:11:36", "remaining_time": "2:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2030, "total_steps": 3836, "loss": 0.1688, "learning_rate": 2.4655159931229932e-06, "epoch": 0.5291108721858404, "percentage": 52.92, "elapsed_time": "3:11:41", "remaining_time": "2:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2031, "total_steps": 3836, "loss": 0.1595, "learning_rate": 2.463360892474391e-06, "epoch": 0.5293715179356857, "percentage": 52.95, "elapsed_time": "3:11:47", "remaining_time": "2:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2032, "total_steps": 3836, "loss": 0.1487, "learning_rate": 2.461205819058311e-06, "epoch": 0.5296321636855309, "percentage": 52.97, "elapsed_time": "3:11:53", "remaining_time": "2:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2033, "total_steps": 3836, "loss": 0.1585, "learning_rate": 2.4590507744765414e-06, "epoch": 0.5298928094353762, "percentage": 53.0, "elapsed_time": "3:11:58", "remaining_time": "2:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2034, "total_steps": 3836, "loss": 0.1393, "learning_rate": 2.4568957603308494e-06, "epoch": 0.5301534551852214, "percentage": 53.02, "elapsed_time": "3:12:04", "remaining_time": "2:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2035, "total_steps": 3836, "loss": 0.1454, "learning_rate": 2.4547407782229775e-06, "epoch": 0.5304141009350666, "percentage": 53.05, "elapsed_time": "3:12:09", "remaining_time": "2:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2036, "total_steps": 3836, "loss": 0.173, "learning_rate": 2.452585829754647e-06, "epoch": 0.5306747466849119, "percentage": 53.08, "elapsed_time": "3:12:15", "remaining_time": "2:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2037, "total_steps": 3836, "loss": 0.1731, "learning_rate": 2.4504309165275527e-06, "epoch": 0.5309353924347571, "percentage": 53.1, "elapsed_time": "3:12:20", "remaining_time": "2:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2038, "total_steps": 3836, "loss": 0.1531, "learning_rate": 2.448276040143364e-06, "epoch": 0.5311960381846024, "percentage": 53.13, "elapsed_time": "3:12:26", "remaining_time": "2:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2039, "total_steps": 3836, "loss": 0.1469, "learning_rate": 2.446121202203723e-06, "epoch": 0.5314566839344476, "percentage": 53.15, "elapsed_time": "3:12:31", "remaining_time": "2:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2040, "total_steps": 3836, "loss": 0.1586, "learning_rate": 2.4439664043102414e-06, "epoch": 0.5317173296842929, "percentage": 53.18, "elapsed_time": "3:12:37", "remaining_time": "2:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2041, "total_steps": 3836, "loss": 0.1589, "learning_rate": 2.441811648064503e-06, "epoch": 0.531977975434138, "percentage": 53.21, "elapsed_time": "3:12:43", "remaining_time": "2:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2042, "total_steps": 3836, "loss": 0.1556, "learning_rate": 2.43965693506806e-06, "epoch": 0.5322386211839834, "percentage": 53.23, "elapsed_time": "3:12:48", "remaining_time": "2:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2043, "total_steps": 3836, "loss": 0.1627, "learning_rate": 2.4375022669224328e-06, "epoch": 0.5324992669338285, "percentage": 53.26, "elapsed_time": "3:12:54", "remaining_time": "2:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2044, "total_steps": 3836, "loss": 0.1682, "learning_rate": 2.4353476452291086e-06, "epoch": 0.5327599126836738, "percentage": 53.28, "elapsed_time": "3:13:00", "remaining_time": "2:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2045, "total_steps": 3836, "loss": 0.1515, "learning_rate": 2.43319307158954e-06, "epoch": 0.533020558433519, "percentage": 53.31, "elapsed_time": "3:13:06", "remaining_time": "2:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2046, "total_steps": 3836, "loss": 0.153, "learning_rate": 2.431038547605142e-06, "epoch": 0.5332812041833643, "percentage": 53.34, "elapsed_time": "3:13:12", "remaining_time": "2:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2047, "total_steps": 3836, "loss": 0.1531, "learning_rate": 2.4288840748772955e-06, "epoch": 0.5335418499332095, "percentage": 53.36, "elapsed_time": "3:13:18", "remaining_time": "2:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2048, "total_steps": 3836, "loss": 0.1514, "learning_rate": 2.4267296550073413e-06, "epoch": 0.5338024956830548, "percentage": 53.39, "elapsed_time": "3:13:23", "remaining_time": "2:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2049, "total_steps": 3836, "loss": 0.155, "learning_rate": 2.4245752895965828e-06, "epoch": 0.5340631414329, "percentage": 53.42, "elapsed_time": "3:13:29", "remaining_time": "2:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 3836, "loss": 0.1509, "learning_rate": 2.4224209802462818e-06, "epoch": 0.5343237871827452, "percentage": 53.44, "elapsed_time": "3:13:34", "remaining_time": "2:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2051, "total_steps": 3836, "loss": 0.1531, "learning_rate": 2.420266728557657e-06, "epoch": 0.5345844329325905, "percentage": 53.47, "elapsed_time": "3:13:39", "remaining_time": "2:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2052, "total_steps": 3836, "loss": 0.1495, "learning_rate": 2.4181125361318868e-06, "epoch": 0.5348450786824357, "percentage": 53.49, "elapsed_time": "3:13:45", "remaining_time": "2:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2053, "total_steps": 3836, "loss": 0.1588, "learning_rate": 2.4159584045701037e-06, "epoch": 0.535105724432281, "percentage": 53.52, "elapsed_time": "3:13:50", "remaining_time": "2:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2054, "total_steps": 3836, "loss": 0.1613, "learning_rate": 2.413804335473397e-06, "epoch": 0.5353663701821262, "percentage": 53.55, "elapsed_time": "3:13:56", "remaining_time": "2:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2055, "total_steps": 3836, "loss": 0.1612, "learning_rate": 2.411650330442807e-06, "epoch": 0.5356270159319715, "percentage": 53.57, "elapsed_time": "3:14:01", "remaining_time": "2:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2056, "total_steps": 3836, "loss": 0.1531, "learning_rate": 2.409496391079329e-06, "epoch": 0.5358876616818167, "percentage": 53.6, "elapsed_time": "3:14:08", "remaining_time": "2:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2057, "total_steps": 3836, "loss": 0.1552, "learning_rate": 2.4073425189839068e-06, "epoch": 0.536148307431662, "percentage": 53.62, "elapsed_time": "3:14:13", "remaining_time": "2:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2058, "total_steps": 3836, "loss": 0.146, "learning_rate": 2.4051887157574356e-06, "epoch": 0.5364089531815072, "percentage": 53.65, "elapsed_time": "3:14:19", "remaining_time": "2:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2059, "total_steps": 3836, "loss": 0.1498, "learning_rate": 2.4030349830007607e-06, "epoch": 0.5366695989313525, "percentage": 53.68, "elapsed_time": "3:14:24", "remaining_time": "2:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2060, "total_steps": 3836, "loss": 0.1556, "learning_rate": 2.4008813223146723e-06, "epoch": 0.5369302446811977, "percentage": 53.7, "elapsed_time": "3:14:29", "remaining_time": "2:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2061, "total_steps": 3836, "loss": 0.1434, "learning_rate": 2.39872773529991e-06, "epoch": 0.537190890431043, "percentage": 53.73, "elapsed_time": "3:14:35", "remaining_time": "2:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2062, "total_steps": 3836, "loss": 0.154, "learning_rate": 2.3965742235571557e-06, "epoch": 0.5374515361808881, "percentage": 53.75, "elapsed_time": "3:14:40", "remaining_time": "2:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2063, "total_steps": 3836, "loss": 0.1564, "learning_rate": 2.3944207886870364e-06, "epoch": 0.5377121819307334, "percentage": 53.78, "elapsed_time": "3:14:46", "remaining_time": "2:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2064, "total_steps": 3836, "loss": 0.1673, "learning_rate": 2.3922674322901236e-06, "epoch": 0.5379728276805786, "percentage": 53.81, "elapsed_time": "3:14:52", "remaining_time": "2:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2065, "total_steps": 3836, "loss": 0.148, "learning_rate": 2.390114155966928e-06, "epoch": 0.5382334734304238, "percentage": 53.83, "elapsed_time": "3:14:57", "remaining_time": "2:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2066, "total_steps": 3836, "loss": 0.1611, "learning_rate": 2.387960961317903e-06, "epoch": 0.5384941191802691, "percentage": 53.86, "elapsed_time": "3:15:03", "remaining_time": "2:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2067, "total_steps": 3836, "loss": 0.1532, "learning_rate": 2.38580784994344e-06, "epoch": 0.5387547649301143, "percentage": 53.88, "elapsed_time": "3:15:08", "remaining_time": "2:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2068, "total_steps": 3836, "loss": 0.1499, "learning_rate": 2.383654823443868e-06, "epoch": 0.5390154106799596, "percentage": 53.91, "elapsed_time": "3:15:13", "remaining_time": "2:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2069, "total_steps": 3836, "loss": 0.1649, "learning_rate": 2.3815018834194542e-06, "epoch": 0.5392760564298048, "percentage": 53.94, "elapsed_time": "3:15:19", "remaining_time": "2:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2070, "total_steps": 3836, "loss": 0.1481, "learning_rate": 2.3793490314704005e-06, "epoch": 0.5395367021796501, "percentage": 53.96, "elapsed_time": "3:15:25", "remaining_time": "2:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2071, "total_steps": 3836, "loss": 0.1573, "learning_rate": 2.377196269196845e-06, "epoch": 0.5397973479294953, "percentage": 53.99, "elapsed_time": "3:15:30", "remaining_time": "2:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2072, "total_steps": 3836, "loss": 0.1482, "learning_rate": 2.3750435981988576e-06, "epoch": 0.5400579936793406, "percentage": 54.01, "elapsed_time": "3:15:36", "remaining_time": "2:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2073, "total_steps": 3836, "loss": 0.144, "learning_rate": 2.3728910200764394e-06, "epoch": 0.5403186394291858, "percentage": 54.04, "elapsed_time": "3:15:41", "remaining_time": "2:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2074, "total_steps": 3836, "loss": 0.1563, "learning_rate": 2.3707385364295245e-06, "epoch": 0.5405792851790311, "percentage": 54.07, "elapsed_time": "3:15:47", "remaining_time": "2:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2075, "total_steps": 3836, "loss": 0.1585, "learning_rate": 2.368586148857977e-06, "epoch": 0.5408399309288763, "percentage": 54.09, "elapsed_time": "3:15:53", "remaining_time": "2:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2076, "total_steps": 3836, "loss": 0.1527, "learning_rate": 2.366433858961587e-06, "epoch": 0.5411005766787216, "percentage": 54.12, "elapsed_time": "3:15:58", "remaining_time": "2:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2077, "total_steps": 3836, "loss": 0.1528, "learning_rate": 2.3642816683400756e-06, "epoch": 0.5413612224285668, "percentage": 54.14, "elapsed_time": "3:16:04", "remaining_time": "2:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2078, "total_steps": 3836, "loss": 0.1652, "learning_rate": 2.362129578593088e-06, "epoch": 0.5416218681784121, "percentage": 54.17, "elapsed_time": "3:16:09", "remaining_time": "2:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2079, "total_steps": 3836, "loss": 0.154, "learning_rate": 2.3599775913201924e-06, "epoch": 0.5418825139282573, "percentage": 54.2, "elapsed_time": "3:16:15", "remaining_time": "2:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2080, "total_steps": 3836, "loss": 0.1558, "learning_rate": 2.3578257081208853e-06, "epoch": 0.5421431596781024, "percentage": 54.22, "elapsed_time": "3:16:20", "remaining_time": "2:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2081, "total_steps": 3836, "loss": 0.1649, "learning_rate": 2.355673930594582e-06, "epoch": 0.5424038054279477, "percentage": 54.25, "elapsed_time": "3:16:26", "remaining_time": "2:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2082, "total_steps": 3836, "loss": 0.1808, "learning_rate": 2.3535222603406223e-06, "epoch": 0.5426644511777929, "percentage": 54.28, "elapsed_time": "3:16:32", "remaining_time": "2:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2083, "total_steps": 3836, "loss": 0.1766, "learning_rate": 2.3513706989582643e-06, "epoch": 0.5429250969276382, "percentage": 54.3, "elapsed_time": "3:16:37", "remaining_time": "2:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2084, "total_steps": 3836, "loss": 0.1552, "learning_rate": 2.3492192480466845e-06, "epoch": 0.5431857426774834, "percentage": 54.33, "elapsed_time": "3:16:42", "remaining_time": "2:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2085, "total_steps": 3836, "loss": 0.1488, "learning_rate": 2.3470679092049806e-06, "epoch": 0.5434463884273287, "percentage": 54.35, "elapsed_time": "3:16:48", "remaining_time": "2:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2086, "total_steps": 3836, "loss": 0.1505, "learning_rate": 2.344916684032163e-06, "epoch": 0.5437070341771739, "percentage": 54.38, "elapsed_time": "3:16:54", "remaining_time": "2:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2087, "total_steps": 3836, "loss": 0.1525, "learning_rate": 2.3427655741271605e-06, "epoch": 0.5439676799270192, "percentage": 54.41, "elapsed_time": "3:16:59", "remaining_time": "2:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2088, "total_steps": 3836, "loss": 0.1422, "learning_rate": 2.3406145810888143e-06, "epoch": 0.5442283256768644, "percentage": 54.43, "elapsed_time": "3:17:04", "remaining_time": "2:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2089, "total_steps": 3836, "loss": 0.1482, "learning_rate": 2.338463706515882e-06, "epoch": 0.5444889714267097, "percentage": 54.46, "elapsed_time": "3:17:10", "remaining_time": "2:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2090, "total_steps": 3836, "loss": 0.1424, "learning_rate": 2.3363129520070286e-06, "epoch": 0.5447496171765549, "percentage": 54.48, "elapsed_time": "3:17:15", "remaining_time": "2:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2091, "total_steps": 3836, "loss": 0.1498, "learning_rate": 2.334162319160832e-06, "epoch": 0.5450102629264002, "percentage": 54.51, "elapsed_time": "3:17:21", "remaining_time": "2:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2092, "total_steps": 3836, "loss": 0.1652, "learning_rate": 2.3320118095757806e-06, "epoch": 0.5452709086762454, "percentage": 54.54, "elapsed_time": "3:17:26", "remaining_time": "2:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2093, "total_steps": 3836, "loss": 0.1564, "learning_rate": 2.3298614248502696e-06, "epoch": 0.5455315544260907, "percentage": 54.56, "elapsed_time": "3:17:32", "remaining_time": "2:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2094, "total_steps": 3836, "loss": 0.1434, "learning_rate": 2.327711166582604e-06, "epoch": 0.5457922001759359, "percentage": 54.59, "elapsed_time": "3:17:37", "remaining_time": "2:44:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2095, "total_steps": 3836, "loss": 0.1764, "learning_rate": 2.325561036370991e-06, "epoch": 0.5460528459257811, "percentage": 54.61, "elapsed_time": "3:17:43", "remaining_time": "2:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2096, "total_steps": 3836, "loss": 0.1639, "learning_rate": 2.3234110358135446e-06, "epoch": 0.5463134916756264, "percentage": 54.64, "elapsed_time": "3:17:48", "remaining_time": "2:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2097, "total_steps": 3836, "loss": 0.1469, "learning_rate": 2.3212611665082834e-06, "epoch": 0.5465741374254716, "percentage": 54.67, "elapsed_time": "3:17:54", "remaining_time": "2:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2098, "total_steps": 3836, "loss": 0.1593, "learning_rate": 2.319111430053126e-06, "epoch": 0.5468347831753169, "percentage": 54.69, "elapsed_time": "3:18:00", "remaining_time": "2:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2099, "total_steps": 3836, "loss": 0.1482, "learning_rate": 2.3169618280458957e-06, "epoch": 0.547095428925162, "percentage": 54.72, "elapsed_time": "3:18:06", "remaining_time": "2:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 3836, "loss": 0.1412, "learning_rate": 2.3148123620843132e-06, "epoch": 0.5473560746750074, "percentage": 54.74, "elapsed_time": "3:18:11", "remaining_time": "2:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2101, "total_steps": 3836, "loss": 0.151, "learning_rate": 2.3126630337659973e-06, "epoch": 0.5476167204248525, "percentage": 54.77, "elapsed_time": "3:18:18", "remaining_time": "2:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2102, "total_steps": 3836, "loss": 0.1515, "learning_rate": 2.310513844688467e-06, "epoch": 0.5478773661746978, "percentage": 54.8, "elapsed_time": "3:18:23", "remaining_time": "2:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2103, "total_steps": 3836, "loss": 0.1603, "learning_rate": 2.3083647964491367e-06, "epoch": 0.548138011924543, "percentage": 54.82, "elapsed_time": "3:18:29", "remaining_time": "2:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2104, "total_steps": 3836, "loss": 0.1605, "learning_rate": 2.306215890645316e-06, "epoch": 0.5483986576743883, "percentage": 54.85, "elapsed_time": "3:18:34", "remaining_time": "2:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2105, "total_steps": 3836, "loss": 0.1458, "learning_rate": 2.3040671288742103e-06, "epoch": 0.5486593034242335, "percentage": 54.87, "elapsed_time": "3:18:40", "remaining_time": "2:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2106, "total_steps": 3836, "loss": 0.1618, "learning_rate": 2.3019185127329145e-06, "epoch": 0.5489199491740788, "percentage": 54.9, "elapsed_time": "3:18:45", "remaining_time": "2:43:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2107, "total_steps": 3836, "loss": 0.1509, "learning_rate": 2.299770043818417e-06, "epoch": 0.549180594923924, "percentage": 54.93, "elapsed_time": "3:18:50", "remaining_time": "2:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2108, "total_steps": 3836, "loss": 0.1499, "learning_rate": 2.2976217237275983e-06, "epoch": 0.5494412406737693, "percentage": 54.95, "elapsed_time": "3:18:56", "remaining_time": "2:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2109, "total_steps": 3836, "loss": 0.1549, "learning_rate": 2.2954735540572263e-06, "epoch": 0.5497018864236145, "percentage": 54.98, "elapsed_time": "3:19:01", "remaining_time": "2:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2110, "total_steps": 3836, "loss": 0.156, "learning_rate": 2.293325536403958e-06, "epoch": 0.5499625321734597, "percentage": 55.01, "elapsed_time": "3:19:07", "remaining_time": "2:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2111, "total_steps": 3836, "loss": 0.1591, "learning_rate": 2.2911776723643378e-06, "epoch": 0.550223177923305, "percentage": 55.03, "elapsed_time": "3:19:13", "remaining_time": "2:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2112, "total_steps": 3836, "loss": 0.1683, "learning_rate": 2.2890299635347933e-06, "epoch": 0.5504838236731502, "percentage": 55.06, "elapsed_time": "3:19:19", "remaining_time": "2:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2113, "total_steps": 3836, "loss": 0.1636, "learning_rate": 2.2868824115116404e-06, "epoch": 0.5507444694229955, "percentage": 55.08, "elapsed_time": "3:19:24", "remaining_time": "2:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2114, "total_steps": 3836, "loss": 0.1533, "learning_rate": 2.2847350178910763e-06, "epoch": 0.5510051151728407, "percentage": 55.11, "elapsed_time": "3:19:29", "remaining_time": "2:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2115, "total_steps": 3836, "loss": 0.1578, "learning_rate": 2.2825877842691813e-06, "epoch": 0.551265760922686, "percentage": 55.14, "elapsed_time": "3:19:34", "remaining_time": "2:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2116, "total_steps": 3836, "loss": 0.1628, "learning_rate": 2.2804407122419165e-06, "epoch": 0.5515264066725312, "percentage": 55.16, "elapsed_time": "3:19:40", "remaining_time": "2:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2117, "total_steps": 3836, "loss": 0.1535, "learning_rate": 2.2782938034051214e-06, "epoch": 0.5517870524223765, "percentage": 55.19, "elapsed_time": "3:19:44", "remaining_time": "2:42:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2118, "total_steps": 3836, "loss": 0.1568, "learning_rate": 2.276147059354517e-06, "epoch": 0.5520476981722217, "percentage": 55.21, "elapsed_time": "3:19:50", "remaining_time": "2:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2119, "total_steps": 3836, "loss": 0.1759, "learning_rate": 2.2740004816857e-06, "epoch": 0.552308343922067, "percentage": 55.24, "elapsed_time": "3:19:56", "remaining_time": "2:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2120, "total_steps": 3836, "loss": 0.1533, "learning_rate": 2.271854071994144e-06, "epoch": 0.5525689896719121, "percentage": 55.27, "elapsed_time": "3:20:02", "remaining_time": "2:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2121, "total_steps": 3836, "loss": 0.1461, "learning_rate": 2.2697078318751974e-06, "epoch": 0.5528296354217574, "percentage": 55.29, "elapsed_time": "3:20:07", "remaining_time": "2:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2122, "total_steps": 3836, "loss": 0.1383, "learning_rate": 2.2675617629240842e-06, "epoch": 0.5530902811716026, "percentage": 55.32, "elapsed_time": "3:20:12", "remaining_time": "2:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2123, "total_steps": 3836, "loss": 0.1634, "learning_rate": 2.2654158667358977e-06, "epoch": 0.5533509269214479, "percentage": 55.34, "elapsed_time": "3:20:17", "remaining_time": "2:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2124, "total_steps": 3836, "loss": 0.1517, "learning_rate": 2.2632701449056054e-06, "epoch": 0.5536115726712931, "percentage": 55.37, "elapsed_time": "3:20:23", "remaining_time": "2:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2125, "total_steps": 3836, "loss": 0.1594, "learning_rate": 2.2611245990280455e-06, "epoch": 0.5538722184211383, "percentage": 55.4, "elapsed_time": "3:20:29", "remaining_time": "2:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2126, "total_steps": 3836, "loss": 0.1669, "learning_rate": 2.258979230697923e-06, "epoch": 0.5541328641709836, "percentage": 55.42, "elapsed_time": "3:20:34", "remaining_time": "2:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2127, "total_steps": 3836, "loss": 0.1447, "learning_rate": 2.2568340415098154e-06, "epoch": 0.5543935099208288, "percentage": 55.45, "elapsed_time": "3:20:40", "remaining_time": "2:41:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2128, "total_steps": 3836, "loss": 0.1632, "learning_rate": 2.2546890330581616e-06, "epoch": 0.5546541556706741, "percentage": 55.47, "elapsed_time": "3:20:45", "remaining_time": "2:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2129, "total_steps": 3836, "loss": 0.1404, "learning_rate": 2.2525442069372687e-06, "epoch": 0.5549148014205193, "percentage": 55.5, "elapsed_time": "3:20:51", "remaining_time": "2:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2130, "total_steps": 3836, "loss": 0.1546, "learning_rate": 2.25039956474131e-06, "epoch": 0.5551754471703646, "percentage": 55.53, "elapsed_time": "3:20:56", "remaining_time": "2:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2131, "total_steps": 3836, "loss": 0.1562, "learning_rate": 2.2482551080643185e-06, "epoch": 0.5554360929202098, "percentage": 55.55, "elapsed_time": "3:21:01", "remaining_time": "2:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2132, "total_steps": 3836, "loss": 0.157, "learning_rate": 2.246110838500194e-06, "epoch": 0.5556967386700551, "percentage": 55.58, "elapsed_time": "3:21:07", "remaining_time": "2:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2133, "total_steps": 3836, "loss": 0.1427, "learning_rate": 2.2439667576426905e-06, "epoch": 0.5559573844199003, "percentage": 55.6, "elapsed_time": "3:21:13", "remaining_time": "2:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2134, "total_steps": 3836, "loss": 0.1534, "learning_rate": 2.241822867085429e-06, "epoch": 0.5562180301697456, "percentage": 55.63, "elapsed_time": "3:21:19", "remaining_time": "2:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2135, "total_steps": 3836, "loss": 0.1488, "learning_rate": 2.2396791684218844e-06, "epoch": 0.5564786759195908, "percentage": 55.66, "elapsed_time": "3:21:24", "remaining_time": "2:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2136, "total_steps": 3836, "loss": 0.1503, "learning_rate": 2.2375356632453906e-06, "epoch": 0.5567393216694361, "percentage": 55.68, "elapsed_time": "3:21:30", "remaining_time": "2:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2137, "total_steps": 3836, "loss": 0.151, "learning_rate": 2.235392353149137e-06, "epoch": 0.5569999674192813, "percentage": 55.71, "elapsed_time": "3:21:36", "remaining_time": "2:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2138, "total_steps": 3836, "loss": 0.1577, "learning_rate": 2.2332492397261695e-06, "epoch": 0.5572606131691266, "percentage": 55.74, "elapsed_time": "3:21:41", "remaining_time": "2:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2139, "total_steps": 3836, "loss": 0.1618, "learning_rate": 2.231106324569386e-06, "epoch": 0.5575212589189718, "percentage": 55.76, "elapsed_time": "3:21:47", "remaining_time": "2:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2140, "total_steps": 3836, "loss": 0.1447, "learning_rate": 2.2289636092715365e-06, "epoch": 0.5577819046688169, "percentage": 55.79, "elapsed_time": "3:21:53", "remaining_time": "2:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2141, "total_steps": 3836, "loss": 0.1516, "learning_rate": 2.2268210954252258e-06, "epoch": 0.5580425504186622, "percentage": 55.81, "elapsed_time": "3:21:58", "remaining_time": "2:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2142, "total_steps": 3836, "loss": 0.148, "learning_rate": 2.2246787846229057e-06, "epoch": 0.5583031961685074, "percentage": 55.84, "elapsed_time": "3:22:03", "remaining_time": "2:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2143, "total_steps": 3836, "loss": 0.1576, "learning_rate": 2.2225366784568796e-06, "epoch": 0.5585638419183527, "percentage": 55.87, "elapsed_time": "3:22:09", "remaining_time": "2:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2144, "total_steps": 3836, "loss": 0.133, "learning_rate": 2.2203947785192954e-06, "epoch": 0.5588244876681979, "percentage": 55.89, "elapsed_time": "3:22:15", "remaining_time": "2:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2145, "total_steps": 3836, "loss": 0.1485, "learning_rate": 2.2182530864021508e-06, "epoch": 0.5590851334180432, "percentage": 55.92, "elapsed_time": "3:22:21", "remaining_time": "2:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2146, "total_steps": 3836, "loss": 0.166, "learning_rate": 2.2161116036972886e-06, "epoch": 0.5593457791678884, "percentage": 55.94, "elapsed_time": "3:22:27", "remaining_time": "2:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2147, "total_steps": 3836, "loss": 0.1545, "learning_rate": 2.2139703319963945e-06, "epoch": 0.5596064249177337, "percentage": 55.97, "elapsed_time": "3:22:32", "remaining_time": "2:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2148, "total_steps": 3836, "loss": 0.1609, "learning_rate": 2.2118292728909986e-06, "epoch": 0.5598670706675789, "percentage": 56.0, "elapsed_time": "3:22:37", "remaining_time": "2:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2149, "total_steps": 3836, "loss": 0.1515, "learning_rate": 2.2096884279724733e-06, "epoch": 0.5601277164174242, "percentage": 56.02, "elapsed_time": "3:22:43", "remaining_time": "2:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 3836, "loss": 0.1482, "learning_rate": 2.2075477988320295e-06, "epoch": 0.5603883621672694, "percentage": 56.05, "elapsed_time": "3:22:48", "remaining_time": "2:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2151, "total_steps": 3836, "loss": 0.1536, "learning_rate": 2.205407387060721e-06, "epoch": 0.5606490079171147, "percentage": 56.07, "elapsed_time": "3:22:54", "remaining_time": "2:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2152, "total_steps": 3836, "loss": 0.154, "learning_rate": 2.2032671942494367e-06, "epoch": 0.5609096536669599, "percentage": 56.1, "elapsed_time": "3:22:59", "remaining_time": "2:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2153, "total_steps": 3836, "loss": 0.162, "learning_rate": 2.2011272219889067e-06, "epoch": 0.5611702994168052, "percentage": 56.13, "elapsed_time": "3:23:05", "remaining_time": "2:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2154, "total_steps": 3836, "loss": 0.1453, "learning_rate": 2.1989874718696936e-06, "epoch": 0.5614309451666504, "percentage": 56.15, "elapsed_time": "3:23:11", "remaining_time": "2:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2155, "total_steps": 3836, "loss": 0.1605, "learning_rate": 2.196847945482195e-06, "epoch": 0.5616915909164956, "percentage": 56.18, "elapsed_time": "3:23:16", "remaining_time": "2:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2156, "total_steps": 3836, "loss": 0.1637, "learning_rate": 2.194708644416646e-06, "epoch": 0.5619522366663409, "percentage": 56.2, "elapsed_time": "3:23:22", "remaining_time": "2:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2157, "total_steps": 3836, "loss": 0.1477, "learning_rate": 2.192569570263109e-06, "epoch": 0.562212882416186, "percentage": 56.23, "elapsed_time": "3:23:27", "remaining_time": "2:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2158, "total_steps": 3836, "loss": 0.151, "learning_rate": 2.1904307246114827e-06, "epoch": 0.5624735281660314, "percentage": 56.26, "elapsed_time": "3:23:33", "remaining_time": "2:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2159, "total_steps": 3836, "loss": 0.1552, "learning_rate": 2.1882921090514923e-06, "epoch": 0.5627341739158765, "percentage": 56.28, "elapsed_time": "3:23:38", "remaining_time": "2:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2160, "total_steps": 3836, "loss": 0.1589, "learning_rate": 2.1861537251726944e-06, "epoch": 0.5629948196657218, "percentage": 56.31, "elapsed_time": "3:23:44", "remaining_time": "2:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2161, "total_steps": 3836, "loss": 0.1536, "learning_rate": 2.184015574564471e-06, "epoch": 0.563255465415567, "percentage": 56.33, "elapsed_time": "3:23:50", "remaining_time": "2:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2162, "total_steps": 3836, "loss": 0.1536, "learning_rate": 2.1818776588160323e-06, "epoch": 0.5635161111654123, "percentage": 56.36, "elapsed_time": "3:23:55", "remaining_time": "2:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2163, "total_steps": 3836, "loss": 0.1628, "learning_rate": 2.179739979516414e-06, "epoch": 0.5637767569152575, "percentage": 56.39, "elapsed_time": "3:24:00", "remaining_time": "2:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2164, "total_steps": 3836, "loss": 0.1612, "learning_rate": 2.1776025382544765e-06, "epoch": 0.5640374026651028, "percentage": 56.41, "elapsed_time": "3:24:06", "remaining_time": "2:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2165, "total_steps": 3836, "loss": 0.1487, "learning_rate": 2.1754653366189018e-06, "epoch": 0.564298048414948, "percentage": 56.44, "elapsed_time": "3:24:11", "remaining_time": "2:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2166, "total_steps": 3836, "loss": 0.1537, "learning_rate": 2.173328376198194e-06, "epoch": 0.5645586941647933, "percentage": 56.47, "elapsed_time": "3:24:16", "remaining_time": "2:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2167, "total_steps": 3836, "loss": 0.1593, "learning_rate": 2.1711916585806793e-06, "epoch": 0.5648193399146385, "percentage": 56.49, "elapsed_time": "3:24:22", "remaining_time": "2:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2168, "total_steps": 3836, "loss": 0.1573, "learning_rate": 2.1690551853545016e-06, "epoch": 0.5650799856644838, "percentage": 56.52, "elapsed_time": "3:24:28", "remaining_time": "2:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2169, "total_steps": 3836, "loss": 0.1473, "learning_rate": 2.166918958107625e-06, "epoch": 0.565340631414329, "percentage": 56.54, "elapsed_time": "3:24:34", "remaining_time": "2:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2170, "total_steps": 3836, "loss": 0.1355, "learning_rate": 2.1647829784278294e-06, "epoch": 0.5656012771641742, "percentage": 56.57, "elapsed_time": "3:24:39", "remaining_time": "2:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2171, "total_steps": 3836, "loss": 0.1543, "learning_rate": 2.1626472479027125e-06, "epoch": 0.5658619229140195, "percentage": 56.6, "elapsed_time": "3:24:44", "remaining_time": "2:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2172, "total_steps": 3836, "loss": 0.1502, "learning_rate": 2.1605117681196834e-06, "epoch": 0.5661225686638647, "percentage": 56.62, "elapsed_time": "3:24:50", "remaining_time": "2:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2173, "total_steps": 3836, "loss": 0.1469, "learning_rate": 2.1583765406659678e-06, "epoch": 0.56638321441371, "percentage": 56.65, "elapsed_time": "3:24:56", "remaining_time": "2:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2174, "total_steps": 3836, "loss": 0.1415, "learning_rate": 2.1562415671286032e-06, "epoch": 0.5666438601635552, "percentage": 56.67, "elapsed_time": "3:25:01", "remaining_time": "2:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2175, "total_steps": 3836, "loss": 0.1531, "learning_rate": 2.154106849094438e-06, "epoch": 0.5669045059134005, "percentage": 56.7, "elapsed_time": "3:25:07", "remaining_time": "2:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2176, "total_steps": 3836, "loss": 0.1526, "learning_rate": 2.151972388150131e-06, "epoch": 0.5671651516632457, "percentage": 56.73, "elapsed_time": "3:25:12", "remaining_time": "2:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2177, "total_steps": 3836, "loss": 0.1635, "learning_rate": 2.1498381858821497e-06, "epoch": 0.567425797413091, "percentage": 56.75, "elapsed_time": "3:25:18", "remaining_time": "2:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2178, "total_steps": 3836, "loss": 0.152, "learning_rate": 2.1477042438767685e-06, "epoch": 0.5676864431629361, "percentage": 56.78, "elapsed_time": "3:25:23", "remaining_time": "2:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2179, "total_steps": 3836, "loss": 0.1576, "learning_rate": 2.1455705637200706e-06, "epoch": 0.5679470889127815, "percentage": 56.8, "elapsed_time": "3:25:28", "remaining_time": "2:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2180, "total_steps": 3836, "loss": 0.1607, "learning_rate": 2.1434371469979424e-06, "epoch": 0.5682077346626266, "percentage": 56.83, "elapsed_time": "3:25:33", "remaining_time": "2:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2181, "total_steps": 3836, "loss": 0.1629, "learning_rate": 2.1413039952960756e-06, "epoch": 0.5684683804124719, "percentage": 56.86, "elapsed_time": "3:25:39", "remaining_time": "2:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2182, "total_steps": 3836, "loss": 0.1367, "learning_rate": 2.1391711101999656e-06, "epoch": 0.5687290261623171, "percentage": 56.88, "elapsed_time": "3:25:44", "remaining_time": "2:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2183, "total_steps": 3836, "loss": 0.1271, "learning_rate": 2.1370384932949066e-06, "epoch": 0.5689896719121624, "percentage": 56.91, "elapsed_time": "3:25:49", "remaining_time": "2:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2184, "total_steps": 3836, "loss": 0.1574, "learning_rate": 2.1349061461659966e-06, "epoch": 0.5692503176620076, "percentage": 56.93, "elapsed_time": "3:25:55", "remaining_time": "2:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2185, "total_steps": 3836, "loss": 0.1581, "learning_rate": 2.132774070398132e-06, "epoch": 0.5695109634118528, "percentage": 56.96, "elapsed_time": "3:26:00", "remaining_time": "2:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2186, "total_steps": 3836, "loss": 0.1531, "learning_rate": 2.130642267576008e-06, "epoch": 0.5697716091616981, "percentage": 56.99, "elapsed_time": "3:26:06", "remaining_time": "2:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2187, "total_steps": 3836, "loss": 0.1595, "learning_rate": 2.1285107392841166e-06, "epoch": 0.5700322549115433, "percentage": 57.01, "elapsed_time": "3:26:11", "remaining_time": "2:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2188, "total_steps": 3836, "loss": 0.1461, "learning_rate": 2.1263794871067443e-06, "epoch": 0.5702929006613886, "percentage": 57.04, "elapsed_time": "3:26:17", "remaining_time": "2:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2189, "total_steps": 3836, "loss": 0.1548, "learning_rate": 2.124248512627975e-06, "epoch": 0.5705535464112338, "percentage": 57.06, "elapsed_time": "3:26:23", "remaining_time": "2:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2190, "total_steps": 3836, "loss": 0.1478, "learning_rate": 2.1221178174316833e-06, "epoch": 0.5708141921610791, "percentage": 57.09, "elapsed_time": "3:26:28", "remaining_time": "2:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2191, "total_steps": 3836, "loss": 0.1628, "learning_rate": 2.1199874031015395e-06, "epoch": 0.5710748379109243, "percentage": 57.12, "elapsed_time": "3:26:33", "remaining_time": "2:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2192, "total_steps": 3836, "loss": 0.1555, "learning_rate": 2.117857271221003e-06, "epoch": 0.5713354836607696, "percentage": 57.14, "elapsed_time": "3:26:39", "remaining_time": "2:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2193, "total_steps": 3836, "loss": 0.1605, "learning_rate": 2.1157274233733242e-06, "epoch": 0.5715961294106148, "percentage": 57.17, "elapsed_time": "3:26:46", "remaining_time": "2:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2194, "total_steps": 3836, "loss": 0.1468, "learning_rate": 2.11359786114154e-06, "epoch": 0.5718567751604601, "percentage": 57.19, "elapsed_time": "3:26:51", "remaining_time": "2:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2195, "total_steps": 3836, "loss": 0.1481, "learning_rate": 2.1114685861084793e-06, "epoch": 0.5721174209103053, "percentage": 57.22, "elapsed_time": "3:26:56", "remaining_time": "2:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2196, "total_steps": 3836, "loss": 0.1667, "learning_rate": 2.1093395998567527e-06, "epoch": 0.5723780666601506, "percentage": 57.25, "elapsed_time": "3:27:02", "remaining_time": "2:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2197, "total_steps": 3836, "loss": 0.1492, "learning_rate": 2.107210903968761e-06, "epoch": 0.5726387124099958, "percentage": 57.27, "elapsed_time": "3:27:08", "remaining_time": "2:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2198, "total_steps": 3836, "loss": 0.1472, "learning_rate": 2.1050825000266862e-06, "epoch": 0.572899358159841, "percentage": 57.3, "elapsed_time": "3:27:13", "remaining_time": "2:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2199, "total_steps": 3836, "loss": 0.1561, "learning_rate": 2.1029543896124925e-06, "epoch": 0.5731600039096862, "percentage": 57.33, "elapsed_time": "3:27:19", "remaining_time": "2:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 3836, "loss": 0.1523, "learning_rate": 2.1008265743079286e-06, "epoch": 0.5734206496595314, "percentage": 57.35, "elapsed_time": "3:27:25", "remaining_time": "2:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2201, "total_steps": 3836, "loss": 0.1546, "learning_rate": 2.098699055694522e-06, "epoch": 0.5736812954093767, "percentage": 57.38, "elapsed_time": "3:27:30", "remaining_time": "2:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2202, "total_steps": 3836, "loss": 0.1422, "learning_rate": 2.0965718353535807e-06, "epoch": 0.5739419411592219, "percentage": 57.4, "elapsed_time": "3:27:36", "remaining_time": "2:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2203, "total_steps": 3836, "loss": 0.1408, "learning_rate": 2.0944449148661898e-06, "epoch": 0.5742025869090672, "percentage": 57.43, "elapsed_time": "3:27:41", "remaining_time": "2:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2204, "total_steps": 3836, "loss": 0.1476, "learning_rate": 2.0923182958132146e-06, "epoch": 0.5744632326589124, "percentage": 57.46, "elapsed_time": "3:27:46", "remaining_time": "2:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2205, "total_steps": 3836, "loss": 0.1423, "learning_rate": 2.0901919797752915e-06, "epoch": 0.5747238784087577, "percentage": 57.48, "elapsed_time": "3:27:52", "remaining_time": "2:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2206, "total_steps": 3836, "loss": 0.1568, "learning_rate": 2.0880659683328346e-06, "epoch": 0.5749845241586029, "percentage": 57.51, "elapsed_time": "3:27:58", "remaining_time": "2:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2207, "total_steps": 3836, "loss": 0.1596, "learning_rate": 2.0859402630660324e-06, "epoch": 0.5752451699084482, "percentage": 57.53, "elapsed_time": "3:28:03", "remaining_time": "2:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2208, "total_steps": 3836, "loss": 0.1425, "learning_rate": 2.0838148655548433e-06, "epoch": 0.5755058156582934, "percentage": 57.56, "elapsed_time": "3:28:09", "remaining_time": "2:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2209, "total_steps": 3836, "loss": 0.1499, "learning_rate": 2.0816897773790002e-06, "epoch": 0.5757664614081387, "percentage": 57.59, "elapsed_time": "3:28:14", "remaining_time": "2:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2210, "total_steps": 3836, "loss": 0.1443, "learning_rate": 2.0795650001180028e-06, "epoch": 0.5760271071579839, "percentage": 57.61, "elapsed_time": "3:28:20", "remaining_time": "2:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2211, "total_steps": 3836, "loss": 0.1487, "learning_rate": 2.077440535351121e-06, "epoch": 0.5762877529078292, "percentage": 57.64, "elapsed_time": "3:28:25", "remaining_time": "2:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2212, "total_steps": 3836, "loss": 0.1381, "learning_rate": 2.0753163846573933e-06, "epoch": 0.5765483986576744, "percentage": 57.66, "elapsed_time": "3:28:30", "remaining_time": "2:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2213, "total_steps": 3836, "loss": 0.1495, "learning_rate": 2.073192549615623e-06, "epoch": 0.5768090444075197, "percentage": 57.69, "elapsed_time": "3:28:36", "remaining_time": "2:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2214, "total_steps": 3836, "loss": 0.1568, "learning_rate": 2.0710690318043814e-06, "epoch": 0.5770696901573649, "percentage": 57.72, "elapsed_time": "3:28:42", "remaining_time": "2:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2215, "total_steps": 3836, "loss": 0.1679, "learning_rate": 2.0689458328020017e-06, "epoch": 0.5773303359072102, "percentage": 57.74, "elapsed_time": "3:28:48", "remaining_time": "2:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2216, "total_steps": 3836, "loss": 0.1459, "learning_rate": 2.0668229541865796e-06, "epoch": 0.5775909816570554, "percentage": 57.77, "elapsed_time": "3:28:53", "remaining_time": "2:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2217, "total_steps": 3836, "loss": 0.149, "learning_rate": 2.0647003975359757e-06, "epoch": 0.5778516274069005, "percentage": 57.79, "elapsed_time": "3:28:58", "remaining_time": "2:32:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2218, "total_steps": 3836, "loss": 0.1478, "learning_rate": 2.0625781644278083e-06, "epoch": 0.5781122731567458, "percentage": 57.82, "elapsed_time": "3:29:04", "remaining_time": "2:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2219, "total_steps": 3836, "loss": 0.1535, "learning_rate": 2.060456256439457e-06, "epoch": 0.578372918906591, "percentage": 57.85, "elapsed_time": "3:29:09", "remaining_time": "2:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2220, "total_steps": 3836, "loss": 0.165, "learning_rate": 2.058334675148061e-06, "epoch": 0.5786335646564363, "percentage": 57.87, "elapsed_time": "3:29:15", "remaining_time": "2:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2221, "total_steps": 3836, "loss": 0.1356, "learning_rate": 2.056213422130511e-06, "epoch": 0.5788942104062815, "percentage": 57.9, "elapsed_time": "3:29:20", "remaining_time": "2:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2222, "total_steps": 3836, "loss": 0.1716, "learning_rate": 2.05409249896346e-06, "epoch": 0.5791548561561268, "percentage": 57.92, "elapsed_time": "3:29:26", "remaining_time": "2:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2223, "total_steps": 3836, "loss": 0.1515, "learning_rate": 2.0519719072233133e-06, "epoch": 0.579415501905972, "percentage": 57.95, "elapsed_time": "3:29:31", "remaining_time": "2:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2224, "total_steps": 3836, "loss": 0.1369, "learning_rate": 2.049851648486229e-06, "epoch": 0.5796761476558173, "percentage": 57.98, "elapsed_time": "3:29:37", "remaining_time": "2:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2225, "total_steps": 3836, "loss": 0.1509, "learning_rate": 2.0477317243281204e-06, "epoch": 0.5799367934056625, "percentage": 58.0, "elapsed_time": "3:29:43", "remaining_time": "2:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2226, "total_steps": 3836, "loss": 0.1503, "learning_rate": 2.04561213632465e-06, "epoch": 0.5801974391555078, "percentage": 58.03, "elapsed_time": "3:29:48", "remaining_time": "2:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2227, "total_steps": 3836, "loss": 0.1465, "learning_rate": 2.043492886051229e-06, "epoch": 0.580458084905353, "percentage": 58.06, "elapsed_time": "3:29:53", "remaining_time": "2:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2228, "total_steps": 3836, "loss": 0.174, "learning_rate": 2.041373975083021e-06, "epoch": 0.5807187306551983, "percentage": 58.08, "elapsed_time": "3:29:59", "remaining_time": "2:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2229, "total_steps": 3836, "loss": 0.1437, "learning_rate": 2.0392554049949348e-06, "epoch": 0.5809793764050435, "percentage": 58.11, "elapsed_time": "3:30:05", "remaining_time": "2:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2230, "total_steps": 3836, "loss": 0.1605, "learning_rate": 2.037137177361628e-06, "epoch": 0.5812400221548888, "percentage": 58.13, "elapsed_time": "3:30:11", "remaining_time": "2:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2231, "total_steps": 3836, "loss": 0.1346, "learning_rate": 2.035019293757503e-06, "epoch": 0.581500667904734, "percentage": 58.16, "elapsed_time": "3:30:17", "remaining_time": "2:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2232, "total_steps": 3836, "loss": 0.143, "learning_rate": 2.0329017557567034e-06, "epoch": 0.5817613136545792, "percentage": 58.19, "elapsed_time": "3:30:22", "remaining_time": "2:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2233, "total_steps": 3836, "loss": 0.1423, "learning_rate": 2.030784564933121e-06, "epoch": 0.5820219594044245, "percentage": 58.21, "elapsed_time": "3:30:28", "remaining_time": "2:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2234, "total_steps": 3836, "loss": 0.1541, "learning_rate": 2.028667722860386e-06, "epoch": 0.5822826051542697, "percentage": 58.24, "elapsed_time": "3:30:33", "remaining_time": "2:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2235, "total_steps": 3836, "loss": 0.1487, "learning_rate": 2.026551231111871e-06, "epoch": 0.582543250904115, "percentage": 58.26, "elapsed_time": "3:30:39", "remaining_time": "2:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2236, "total_steps": 3836, "loss": 0.1479, "learning_rate": 2.024435091260687e-06, "epoch": 0.5828038966539602, "percentage": 58.29, "elapsed_time": "3:30:45", "remaining_time": "2:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2237, "total_steps": 3836, "loss": 0.1459, "learning_rate": 2.022319304879686e-06, "epoch": 0.5830645424038055, "percentage": 58.32, "elapsed_time": "3:30:50", "remaining_time": "2:30:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2238, "total_steps": 3836, "loss": 0.1471, "learning_rate": 2.0202038735414532e-06, "epoch": 0.5833251881536506, "percentage": 58.34, "elapsed_time": "3:30:55", "remaining_time": "2:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2239, "total_steps": 3836, "loss": 0.1502, "learning_rate": 2.018088798818312e-06, "epoch": 0.5835858339034959, "percentage": 58.37, "elapsed_time": "3:31:01", "remaining_time": "2:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2240, "total_steps": 3836, "loss": 0.1602, "learning_rate": 2.0159740822823233e-06, "epoch": 0.5838464796533411, "percentage": 58.39, "elapsed_time": "3:31:07", "remaining_time": "2:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2241, "total_steps": 3836, "loss": 0.134, "learning_rate": 2.0138597255052766e-06, "epoch": 0.5841071254031864, "percentage": 58.42, "elapsed_time": "3:31:12", "remaining_time": "2:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2242, "total_steps": 3836, "loss": 0.1598, "learning_rate": 2.0117457300586996e-06, "epoch": 0.5843677711530316, "percentage": 58.45, "elapsed_time": "3:31:18", "remaining_time": "2:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2243, "total_steps": 3836, "loss": 0.1534, "learning_rate": 2.0096320975138463e-06, "epoch": 0.5846284169028769, "percentage": 58.47, "elapsed_time": "3:31:24", "remaining_time": "2:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2244, "total_steps": 3836, "loss": 0.1504, "learning_rate": 2.007518829441704e-06, "epoch": 0.5848890626527221, "percentage": 58.5, "elapsed_time": "3:31:29", "remaining_time": "2:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2245, "total_steps": 3836, "loss": 0.1456, "learning_rate": 2.005405927412988e-06, "epoch": 0.5851497084025674, "percentage": 58.52, "elapsed_time": "3:31:34", "remaining_time": "2:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2246, "total_steps": 3836, "loss": 0.1511, "learning_rate": 2.0032933929981425e-06, "epoch": 0.5854103541524126, "percentage": 58.55, "elapsed_time": "3:31:40", "remaining_time": "2:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2247, "total_steps": 3836, "loss": 0.1484, "learning_rate": 2.0011812277673375e-06, "epoch": 0.5856709999022578, "percentage": 58.58, "elapsed_time": "3:31:45", "remaining_time": "2:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2248, "total_steps": 3836, "loss": 0.1382, "learning_rate": 1.9990694332904705e-06, "epoch": 0.5859316456521031, "percentage": 58.6, "elapsed_time": "3:31:51", "remaining_time": "2:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2249, "total_steps": 3836, "loss": 0.1385, "learning_rate": 1.9969580111371587e-06, "epoch": 0.5861922914019483, "percentage": 58.63, "elapsed_time": "3:31:56", "remaining_time": "2:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 3836, "loss": 0.1388, "learning_rate": 1.9948469628767475e-06, "epoch": 0.5864529371517936, "percentage": 58.65, "elapsed_time": "3:32:02", "remaining_time": "2:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2251, "total_steps": 3836, "loss": 0.1534, "learning_rate": 1.9927362900783037e-06, "epoch": 0.5867135829016388, "percentage": 58.68, "elapsed_time": "3:32:07", "remaining_time": "2:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2252, "total_steps": 3836, "loss": 0.1481, "learning_rate": 1.990625994310612e-06, "epoch": 0.5869742286514841, "percentage": 58.71, "elapsed_time": "3:32:12", "remaining_time": "2:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2253, "total_steps": 3836, "loss": 0.1469, "learning_rate": 1.988516077142181e-06, "epoch": 0.5872348744013293, "percentage": 58.73, "elapsed_time": "3:32:18", "remaining_time": "2:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2254, "total_steps": 3836, "loss": 0.1548, "learning_rate": 1.986406540141234e-06, "epoch": 0.5874955201511746, "percentage": 58.76, "elapsed_time": "3:32:24", "remaining_time": "2:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2255, "total_steps": 3836, "loss": 0.1457, "learning_rate": 1.984297384875714e-06, "epoch": 0.5877561659010198, "percentage": 58.79, "elapsed_time": "3:32:29", "remaining_time": "2:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2256, "total_steps": 3836, "loss": 0.1436, "learning_rate": 1.98218861291328e-06, "epoch": 0.5880168116508651, "percentage": 58.81, "elapsed_time": "3:32:35", "remaining_time": "2:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2257, "total_steps": 3836, "loss": 0.1383, "learning_rate": 1.980080225821305e-06, "epoch": 0.5882774574007102, "percentage": 58.84, "elapsed_time": "3:32:40", "remaining_time": "2:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2258, "total_steps": 3836, "loss": 0.1597, "learning_rate": 1.977972225166878e-06, "epoch": 0.5885381031505555, "percentage": 58.86, "elapsed_time": "3:32:46", "remaining_time": "2:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2259, "total_steps": 3836, "loss": 0.1588, "learning_rate": 1.9758646125167997e-06, "epoch": 0.5887987489004007, "percentage": 58.89, "elapsed_time": "3:32:51", "remaining_time": "2:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2260, "total_steps": 3836, "loss": 0.1507, "learning_rate": 1.973757389437581e-06, "epoch": 0.589059394650246, "percentage": 58.92, "elapsed_time": "3:32:57", "remaining_time": "2:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2261, "total_steps": 3836, "loss": 0.1417, "learning_rate": 1.9716505574954455e-06, "epoch": 0.5893200404000912, "percentage": 58.94, "elapsed_time": "3:33:02", "remaining_time": "2:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2262, "total_steps": 3836, "loss": 0.1462, "learning_rate": 1.9695441182563237e-06, "epoch": 0.5895806861499364, "percentage": 58.97, "elapsed_time": "3:33:08", "remaining_time": "2:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2263, "total_steps": 3836, "loss": 0.1461, "learning_rate": 1.967438073285858e-06, "epoch": 0.5898413318997817, "percentage": 58.99, "elapsed_time": "3:33:13", "remaining_time": "2:28:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2264, "total_steps": 3836, "loss": 0.1532, "learning_rate": 1.965332424149394e-06, "epoch": 0.5901019776496269, "percentage": 59.02, "elapsed_time": "3:33:19", "remaining_time": "2:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2265, "total_steps": 3836, "loss": 0.1565, "learning_rate": 1.963227172411984e-06, "epoch": 0.5903626233994722, "percentage": 59.05, "elapsed_time": "3:33:24", "remaining_time": "2:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2266, "total_steps": 3836, "loss": 0.1513, "learning_rate": 1.9611223196383866e-06, "epoch": 0.5906232691493174, "percentage": 59.07, "elapsed_time": "3:33:29", "remaining_time": "2:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2267, "total_steps": 3836, "loss": 0.1561, "learning_rate": 1.9590178673930617e-06, "epoch": 0.5908839148991627, "percentage": 59.1, "elapsed_time": "3:33:34", "remaining_time": "2:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2268, "total_steps": 3836, "loss": 0.1656, "learning_rate": 1.956913817240173e-06, "epoch": 0.5911445606490079, "percentage": 59.12, "elapsed_time": "3:33:40", "remaining_time": "2:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2269, "total_steps": 3836, "loss": 0.1464, "learning_rate": 1.9548101707435845e-06, "epoch": 0.5914052063988532, "percentage": 59.15, "elapsed_time": "3:33:46", "remaining_time": "2:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2270, "total_steps": 3836, "loss": 0.1487, "learning_rate": 1.9527069294668617e-06, "epoch": 0.5916658521486984, "percentage": 59.18, "elapsed_time": "3:33:51", "remaining_time": "2:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2271, "total_steps": 3836, "loss": 0.1593, "learning_rate": 1.9506040949732657e-06, "epoch": 0.5919264978985437, "percentage": 59.2, "elapsed_time": "3:33:57", "remaining_time": "2:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2272, "total_steps": 3836, "loss": 0.148, "learning_rate": 1.9485016688257578e-06, "epoch": 0.5921871436483889, "percentage": 59.23, "elapsed_time": "3:34:02", "remaining_time": "2:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2273, "total_steps": 3836, "loss": 0.1535, "learning_rate": 1.946399652586997e-06, "epoch": 0.5924477893982342, "percentage": 59.25, "elapsed_time": "3:34:08", "remaining_time": "2:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2274, "total_steps": 3836, "loss": 0.1589, "learning_rate": 1.9442980478193332e-06, "epoch": 0.5927084351480794, "percentage": 59.28, "elapsed_time": "3:34:14", "remaining_time": "2:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2275, "total_steps": 3836, "loss": 0.1394, "learning_rate": 1.9421968560848158e-06, "epoch": 0.5929690808979247, "percentage": 59.31, "elapsed_time": "3:34:19", "remaining_time": "2:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2276, "total_steps": 3836, "loss": 0.147, "learning_rate": 1.9400960789451827e-06, "epoch": 0.5932297266477699, "percentage": 59.33, "elapsed_time": "3:34:26", "remaining_time": "2:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2277, "total_steps": 3836, "loss": 0.1669, "learning_rate": 1.937995717961866e-06, "epoch": 0.593490372397615, "percentage": 59.36, "elapsed_time": "3:34:31", "remaining_time": "2:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2278, "total_steps": 3836, "loss": 0.1541, "learning_rate": 1.935895774695988e-06, "epoch": 0.5937510181474603, "percentage": 59.38, "elapsed_time": "3:34:37", "remaining_time": "2:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2279, "total_steps": 3836, "loss": 0.1508, "learning_rate": 1.9337962507083603e-06, "epoch": 0.5940116638973055, "percentage": 59.41, "elapsed_time": "3:34:42", "remaining_time": "2:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2280, "total_steps": 3836, "loss": 0.1539, "learning_rate": 1.9316971475594835e-06, "epoch": 0.5942723096471508, "percentage": 59.44, "elapsed_time": "3:34:47", "remaining_time": "2:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2281, "total_steps": 3836, "loss": 0.17, "learning_rate": 1.9295984668095457e-06, "epoch": 0.594532955396996, "percentage": 59.46, "elapsed_time": "3:34:52", "remaining_time": "2:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2282, "total_steps": 3836, "loss": 0.1643, "learning_rate": 1.9275002100184186e-06, "epoch": 0.5947936011468413, "percentage": 59.49, "elapsed_time": "3:34:58", "remaining_time": "2:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2283, "total_steps": 3836, "loss": 0.1454, "learning_rate": 1.9254023787456615e-06, "epoch": 0.5950542468966865, "percentage": 59.52, "elapsed_time": "3:35:03", "remaining_time": "2:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2284, "total_steps": 3836, "loss": 0.1454, "learning_rate": 1.9233049745505167e-06, "epoch": 0.5953148926465318, "percentage": 59.54, "elapsed_time": "3:35:09", "remaining_time": "2:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2285, "total_steps": 3836, "loss": 0.1576, "learning_rate": 1.9212079989919073e-06, "epoch": 0.595575538396377, "percentage": 59.57, "elapsed_time": "3:35:15", "remaining_time": "2:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2286, "total_steps": 3836, "loss": 0.1431, "learning_rate": 1.919111453628442e-06, "epoch": 0.5958361841462223, "percentage": 59.59, "elapsed_time": "3:35:21", "remaining_time": "2:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2287, "total_steps": 3836, "loss": 0.1601, "learning_rate": 1.9170153400184054e-06, "epoch": 0.5960968298960675, "percentage": 59.62, "elapsed_time": "3:35:27", "remaining_time": "2:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2288, "total_steps": 3836, "loss": 0.1526, "learning_rate": 1.914919659719762e-06, "epoch": 0.5963574756459128, "percentage": 59.65, "elapsed_time": "3:35:31", "remaining_time": "2:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2289, "total_steps": 3836, "loss": 0.1574, "learning_rate": 1.912824414290157e-06, "epoch": 0.596618121395758, "percentage": 59.67, "elapsed_time": "3:35:37", "remaining_time": "2:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2290, "total_steps": 3836, "loss": 0.1392, "learning_rate": 1.9107296052869086e-06, "epoch": 0.5968787671456033, "percentage": 59.7, "elapsed_time": "3:35:42", "remaining_time": "2:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2291, "total_steps": 3836, "loss": 0.1426, "learning_rate": 1.9086352342670144e-06, "epoch": 0.5971394128954485, "percentage": 59.72, "elapsed_time": "3:35:47", "remaining_time": "2:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2292, "total_steps": 3836, "loss": 0.157, "learning_rate": 1.9065413027871437e-06, "epoch": 0.5974000586452937, "percentage": 59.75, "elapsed_time": "3:35:53", "remaining_time": "2:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2293, "total_steps": 3836, "loss": 0.1567, "learning_rate": 1.9044478124036395e-06, "epoch": 0.597660704395139, "percentage": 59.78, "elapsed_time": "3:35:58", "remaining_time": "2:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2294, "total_steps": 3836, "loss": 0.1421, "learning_rate": 1.902354764672518e-06, "epoch": 0.5979213501449842, "percentage": 59.8, "elapsed_time": "3:36:03", "remaining_time": "2:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2295, "total_steps": 3836, "loss": 0.152, "learning_rate": 1.9002621611494654e-06, "epoch": 0.5981819958948295, "percentage": 59.83, "elapsed_time": "3:36:09", "remaining_time": "2:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2296, "total_steps": 3836, "loss": 0.1433, "learning_rate": 1.8981700033898387e-06, "epoch": 0.5984426416446746, "percentage": 59.85, "elapsed_time": "3:36:15", "remaining_time": "2:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2297, "total_steps": 3836, "loss": 0.1395, "learning_rate": 1.896078292948663e-06, "epoch": 0.59870328739452, "percentage": 59.88, "elapsed_time": "3:36:21", "remaining_time": "2:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2298, "total_steps": 3836, "loss": 0.1627, "learning_rate": 1.8939870313806302e-06, "epoch": 0.5989639331443651, "percentage": 59.91, "elapsed_time": "3:36:27", "remaining_time": "2:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2299, "total_steps": 3836, "loss": 0.158, "learning_rate": 1.8918962202401003e-06, "epoch": 0.5992245788942104, "percentage": 59.93, "elapsed_time": "3:36:33", "remaining_time": "2:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 3836, "loss": 0.1639, "learning_rate": 1.8898058610810963e-06, "epoch": 0.5994852246440556, "percentage": 59.96, "elapsed_time": "3:36:38", "remaining_time": "2:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2301, "total_steps": 3836, "loss": 0.1481, "learning_rate": 1.887715955457308e-06, "epoch": 0.5997458703939009, "percentage": 59.98, "elapsed_time": "3:36:44", "remaining_time": "2:24:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2302, "total_steps": 3836, "loss": 0.1525, "learning_rate": 1.8856265049220852e-06, "epoch": 0.6000065161437461, "percentage": 60.01, "elapsed_time": "3:36:50", "remaining_time": "2:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2303, "total_steps": 3836, "loss": 0.1564, "learning_rate": 1.8835375110284424e-06, "epoch": 0.6002671618935914, "percentage": 60.04, "elapsed_time": "3:36:55", "remaining_time": "2:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2304, "total_steps": 3836, "loss": 0.153, "learning_rate": 1.8814489753290517e-06, "epoch": 0.6005278076434366, "percentage": 60.06, "elapsed_time": "3:37:01", "remaining_time": "2:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2305, "total_steps": 3836, "loss": 0.1426, "learning_rate": 1.8793608993762464e-06, "epoch": 0.6007884533932819, "percentage": 60.09, "elapsed_time": "3:37:06", "remaining_time": "2:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2306, "total_steps": 3836, "loss": 0.1516, "learning_rate": 1.8772732847220182e-06, "epoch": 0.6010490991431271, "percentage": 60.11, "elapsed_time": "3:37:12", "remaining_time": "2:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2307, "total_steps": 3836, "loss": 0.1494, "learning_rate": 1.8751861329180149e-06, "epoch": 0.6013097448929723, "percentage": 60.14, "elapsed_time": "3:37:18", "remaining_time": "2:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2308, "total_steps": 3836, "loss": 0.1471, "learning_rate": 1.873099445515542e-06, "epoch": 0.6015703906428176, "percentage": 60.17, "elapsed_time": "3:37:23", "remaining_time": "2:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2309, "total_steps": 3836, "loss": 0.1394, "learning_rate": 1.8710132240655575e-06, "epoch": 0.6018310363926628, "percentage": 60.19, "elapsed_time": "3:37:29", "remaining_time": "2:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2310, "total_steps": 3836, "loss": 0.1537, "learning_rate": 1.868927470118675e-06, "epoch": 0.6020916821425081, "percentage": 60.22, "elapsed_time": "3:37:34", "remaining_time": "2:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2311, "total_steps": 3836, "loss": 0.141, "learning_rate": 1.8668421852251588e-06, "epoch": 0.6023523278923533, "percentage": 60.25, "elapsed_time": "3:37:40", "remaining_time": "2:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2312, "total_steps": 3836, "loss": 0.1561, "learning_rate": 1.8647573709349275e-06, "epoch": 0.6026129736421986, "percentage": 60.27, "elapsed_time": "3:37:46", "remaining_time": "2:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2313, "total_steps": 3836, "loss": 0.1477, "learning_rate": 1.8626730287975467e-06, "epoch": 0.6028736193920438, "percentage": 60.3, "elapsed_time": "3:37:52", "remaining_time": "2:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2314, "total_steps": 3836, "loss": 0.147, "learning_rate": 1.860589160362234e-06, "epoch": 0.6031342651418891, "percentage": 60.32, "elapsed_time": "3:37:58", "remaining_time": "2:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2315, "total_steps": 3836, "loss": 0.1466, "learning_rate": 1.8585057671778512e-06, "epoch": 0.6033949108917342, "percentage": 60.35, "elapsed_time": "3:38:03", "remaining_time": "2:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2316, "total_steps": 3836, "loss": 0.1567, "learning_rate": 1.8564228507929099e-06, "epoch": 0.6036555566415795, "percentage": 60.38, "elapsed_time": "3:38:09", "remaining_time": "2:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2317, "total_steps": 3836, "loss": 0.1437, "learning_rate": 1.8543404127555672e-06, "epoch": 0.6039162023914247, "percentage": 60.4, "elapsed_time": "3:38:14", "remaining_time": "2:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2318, "total_steps": 3836, "loss": 0.1517, "learning_rate": 1.852258454613623e-06, "epoch": 0.60417684814127, "percentage": 60.43, "elapsed_time": "3:38:19", "remaining_time": "2:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2319, "total_steps": 3836, "loss": 0.1548, "learning_rate": 1.8501769779145223e-06, "epoch": 0.6044374938911152, "percentage": 60.45, "elapsed_time": "3:38:25", "remaining_time": "2:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2320, "total_steps": 3836, "loss": 0.1606, "learning_rate": 1.8480959842053508e-06, "epoch": 0.6046981396409605, "percentage": 60.48, "elapsed_time": "3:38:30", "remaining_time": "2:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2321, "total_steps": 3836, "loss": 0.1427, "learning_rate": 1.8460154750328351e-06, "epoch": 0.6049587853908057, "percentage": 60.51, "elapsed_time": "3:38:35", "remaining_time": "2:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2322, "total_steps": 3836, "loss": 0.1582, "learning_rate": 1.843935451943344e-06, "epoch": 0.6052194311406509, "percentage": 60.53, "elapsed_time": "3:38:41", "remaining_time": "2:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2323, "total_steps": 3836, "loss": 0.1556, "learning_rate": 1.841855916482882e-06, "epoch": 0.6054800768904962, "percentage": 60.56, "elapsed_time": "3:38:46", "remaining_time": "2:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2324, "total_steps": 3836, "loss": 0.1589, "learning_rate": 1.839776870197093e-06, "epoch": 0.6057407226403414, "percentage": 60.58, "elapsed_time": "3:38:52", "remaining_time": "2:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2325, "total_steps": 3836, "loss": 0.1456, "learning_rate": 1.8376983146312577e-06, "epoch": 0.6060013683901867, "percentage": 60.61, "elapsed_time": "3:38:58", "remaining_time": "2:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2326, "total_steps": 3836, "loss": 0.1523, "learning_rate": 1.8356202513302896e-06, "epoch": 0.6062620141400319, "percentage": 60.64, "elapsed_time": "3:39:03", "remaining_time": "2:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2327, "total_steps": 3836, "loss": 0.1413, "learning_rate": 1.8335426818387386e-06, "epoch": 0.6065226598898772, "percentage": 60.66, "elapsed_time": "3:39:09", "remaining_time": "2:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2328, "total_steps": 3836, "loss": 0.1416, "learning_rate": 1.831465607700787e-06, "epoch": 0.6067833056397224, "percentage": 60.69, "elapsed_time": "3:39:14", "remaining_time": "2:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2329, "total_steps": 3836, "loss": 0.1542, "learning_rate": 1.8293890304602491e-06, "epoch": 0.6070439513895677, "percentage": 60.71, "elapsed_time": "3:39:19", "remaining_time": "2:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2330, "total_steps": 3836, "loss": 0.1534, "learning_rate": 1.8273129516605698e-06, "epoch": 0.6073045971394129, "percentage": 60.74, "elapsed_time": "3:39:25", "remaining_time": "2:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2331, "total_steps": 3836, "loss": 0.1406, "learning_rate": 1.825237372844822e-06, "epoch": 0.6075652428892582, "percentage": 60.77, "elapsed_time": "3:39:31", "remaining_time": "2:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2332, "total_steps": 3836, "loss": 0.1525, "learning_rate": 1.8231622955557094e-06, "epoch": 0.6078258886391034, "percentage": 60.79, "elapsed_time": "3:39:36", "remaining_time": "2:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2333, "total_steps": 3836, "loss": 0.1472, "learning_rate": 1.8210877213355613e-06, "epoch": 0.6080865343889487, "percentage": 60.82, "elapsed_time": "3:39:41", "remaining_time": "2:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2334, "total_steps": 3836, "loss": 0.1503, "learning_rate": 1.819013651726334e-06, "epoch": 0.6083471801387939, "percentage": 60.84, "elapsed_time": "3:39:46", "remaining_time": "2:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2335, "total_steps": 3836, "loss": 0.1507, "learning_rate": 1.8169400882696081e-06, "epoch": 0.6086078258886392, "percentage": 60.87, "elapsed_time": "3:39:52", "remaining_time": "2:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2336, "total_steps": 3836, "loss": 0.148, "learning_rate": 1.8148670325065893e-06, "epoch": 0.6088684716384843, "percentage": 60.9, "elapsed_time": "3:39:57", "remaining_time": "2:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2337, "total_steps": 3836, "loss": 0.1486, "learning_rate": 1.8127944859781037e-06, "epoch": 0.6091291173883295, "percentage": 60.92, "elapsed_time": "3:40:02", "remaining_time": "2:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2338, "total_steps": 3836, "loss": 0.1553, "learning_rate": 1.8107224502245997e-06, "epoch": 0.6093897631381748, "percentage": 60.95, "elapsed_time": "3:40:08", "remaining_time": "2:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2339, "total_steps": 3836, "loss": 0.1451, "learning_rate": 1.8086509267861472e-06, "epoch": 0.60965040888802, "percentage": 60.97, "elapsed_time": "3:40:13", "remaining_time": "2:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2340, "total_steps": 3836, "loss": 0.1436, "learning_rate": 1.806579917202435e-06, "epoch": 0.6099110546378653, "percentage": 61.0, "elapsed_time": "3:40:19", "remaining_time": "2:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2341, "total_steps": 3836, "loss": 0.143, "learning_rate": 1.8045094230127697e-06, "epoch": 0.6101717003877105, "percentage": 61.03, "elapsed_time": "3:40:25", "remaining_time": "2:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2342, "total_steps": 3836, "loss": 0.1543, "learning_rate": 1.802439445756073e-06, "epoch": 0.6104323461375558, "percentage": 61.05, "elapsed_time": "3:40:31", "remaining_time": "2:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2343, "total_steps": 3836, "loss": 0.1567, "learning_rate": 1.8003699869708858e-06, "epoch": 0.610692991887401, "percentage": 61.08, "elapsed_time": "3:40:36", "remaining_time": "2:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2344, "total_steps": 3836, "loss": 0.1478, "learning_rate": 1.7983010481953605e-06, "epoch": 0.6109536376372463, "percentage": 61.11, "elapsed_time": "3:40:41", "remaining_time": "2:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2345, "total_steps": 3836, "loss": 0.1595, "learning_rate": 1.7962326309672661e-06, "epoch": 0.6112142833870915, "percentage": 61.13, "elapsed_time": "3:40:47", "remaining_time": "2:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2346, "total_steps": 3836, "loss": 0.1487, "learning_rate": 1.7941647368239806e-06, "epoch": 0.6114749291369368, "percentage": 61.16, "elapsed_time": "3:40:52", "remaining_time": "2:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2347, "total_steps": 3836, "loss": 0.1407, "learning_rate": 1.7920973673024967e-06, "epoch": 0.611735574886782, "percentage": 61.18, "elapsed_time": "3:40:57", "remaining_time": "2:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2348, "total_steps": 3836, "loss": 0.1612, "learning_rate": 1.7900305239394134e-06, "epoch": 0.6119962206366273, "percentage": 61.21, "elapsed_time": "3:41:03", "remaining_time": "2:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2349, "total_steps": 3836, "loss": 0.1374, "learning_rate": 1.7879642082709411e-06, "epoch": 0.6122568663864725, "percentage": 61.24, "elapsed_time": "3:41:08", "remaining_time": "2:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 3836, "loss": 0.14, "learning_rate": 1.785898421832898e-06, "epoch": 0.6125175121363178, "percentage": 61.26, "elapsed_time": "3:41:13", "remaining_time": "2:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2351, "total_steps": 3836, "loss": 0.148, "learning_rate": 1.7838331661607078e-06, "epoch": 0.612778157886163, "percentage": 61.29, "elapsed_time": "3:41:19", "remaining_time": "2:19:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2352, "total_steps": 3836, "loss": 0.1536, "learning_rate": 1.7817684427894016e-06, "epoch": 0.6130388036360082, "percentage": 61.31, "elapsed_time": "3:41:24", "remaining_time": "2:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2353, "total_steps": 3836, "loss": 0.1476, "learning_rate": 1.7797042532536118e-06, "epoch": 0.6132994493858535, "percentage": 61.34, "elapsed_time": "3:41:30", "remaining_time": "2:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2354, "total_steps": 3836, "loss": 0.1544, "learning_rate": 1.7776405990875761e-06, "epoch": 0.6135600951356986, "percentage": 61.37, "elapsed_time": "3:41:35", "remaining_time": "2:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2355, "total_steps": 3836, "loss": 0.1555, "learning_rate": 1.7755774818251348e-06, "epoch": 0.613820740885544, "percentage": 61.39, "elapsed_time": "3:41:40", "remaining_time": "2:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2356, "total_steps": 3836, "loss": 0.1477, "learning_rate": 1.7735149029997273e-06, "epoch": 0.6140813866353891, "percentage": 61.42, "elapsed_time": "3:41:46", "remaining_time": "2:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2357, "total_steps": 3836, "loss": 0.1479, "learning_rate": 1.7714528641443952e-06, "epoch": 0.6143420323852344, "percentage": 61.44, "elapsed_time": "3:41:51", "remaining_time": "2:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2358, "total_steps": 3836, "loss": 0.1366, "learning_rate": 1.7693913667917757e-06, "epoch": 0.6146026781350796, "percentage": 61.47, "elapsed_time": "3:41:57", "remaining_time": "2:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2359, "total_steps": 3836, "loss": 0.1497, "learning_rate": 1.7673304124741055e-06, "epoch": 0.6148633238849249, "percentage": 61.5, "elapsed_time": "3:42:03", "remaining_time": "2:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2360, "total_steps": 3836, "loss": 0.139, "learning_rate": 1.7652700027232184e-06, "epoch": 0.6151239696347701, "percentage": 61.52, "elapsed_time": "3:42:08", "remaining_time": "2:18:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2361, "total_steps": 3836, "loss": 0.1472, "learning_rate": 1.7632101390705408e-06, "epoch": 0.6153846153846154, "percentage": 61.55, "elapsed_time": "3:42:14", "remaining_time": "2:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2362, "total_steps": 3836, "loss": 0.1395, "learning_rate": 1.7611508230470963e-06, "epoch": 0.6156452611344606, "percentage": 61.57, "elapsed_time": "3:42:19", "remaining_time": "2:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2363, "total_steps": 3836, "loss": 0.1531, "learning_rate": 1.7590920561835002e-06, "epoch": 0.6159059068843059, "percentage": 61.6, "elapsed_time": "3:42:24", "remaining_time": "2:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2364, "total_steps": 3836, "loss": 0.1475, "learning_rate": 1.7570338400099569e-06, "epoch": 0.6161665526341511, "percentage": 61.63, "elapsed_time": "3:42:30", "remaining_time": "2:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2365, "total_steps": 3836, "loss": 0.1275, "learning_rate": 1.7549761760562662e-06, "epoch": 0.6164271983839964, "percentage": 61.65, "elapsed_time": "3:42:35", "remaining_time": "2:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2366, "total_steps": 3836, "loss": 0.1544, "learning_rate": 1.7529190658518142e-06, "epoch": 0.6166878441338416, "percentage": 61.68, "elapsed_time": "3:42:40", "remaining_time": "2:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2367, "total_steps": 3836, "loss": 0.1551, "learning_rate": 1.750862510925577e-06, "epoch": 0.6169484898836868, "percentage": 61.7, "elapsed_time": "3:42:46", "remaining_time": "2:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2368, "total_steps": 3836, "loss": 0.1345, "learning_rate": 1.7488065128061187e-06, "epoch": 0.6172091356335321, "percentage": 61.73, "elapsed_time": "3:42:52", "remaining_time": "2:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2369, "total_steps": 3836, "loss": 0.1582, "learning_rate": 1.7467510730215854e-06, "epoch": 0.6174697813833773, "percentage": 61.76, "elapsed_time": "3:42:57", "remaining_time": "2:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2370, "total_steps": 3836, "loss": 0.1627, "learning_rate": 1.7446961930997126e-06, "epoch": 0.6177304271332226, "percentage": 61.78, "elapsed_time": "3:43:03", "remaining_time": "2:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2371, "total_steps": 3836, "loss": 0.1605, "learning_rate": 1.7426418745678182e-06, "epoch": 0.6179910728830678, "percentage": 61.81, "elapsed_time": "3:43:08", "remaining_time": "2:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2372, "total_steps": 3836, "loss": 0.142, "learning_rate": 1.7405881189528024e-06, "epoch": 0.6182517186329131, "percentage": 61.84, "elapsed_time": "3:43:14", "remaining_time": "2:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2373, "total_steps": 3836, "loss": 0.1571, "learning_rate": 1.7385349277811483e-06, "epoch": 0.6185123643827583, "percentage": 61.86, "elapsed_time": "3:43:20", "remaining_time": "2:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2374, "total_steps": 3836, "loss": 0.144, "learning_rate": 1.7364823025789184e-06, "epoch": 0.6187730101326036, "percentage": 61.89, "elapsed_time": "3:43:27", "remaining_time": "2:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2375, "total_steps": 3836, "loss": 0.1419, "learning_rate": 1.7344302448717537e-06, "epoch": 0.6190336558824487, "percentage": 61.91, "elapsed_time": "3:43:32", "remaining_time": "2:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2376, "total_steps": 3836, "loss": 0.1513, "learning_rate": 1.732378756184875e-06, "epoch": 0.619294301632294, "percentage": 61.94, "elapsed_time": "3:43:37", "remaining_time": "2:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2377, "total_steps": 3836, "loss": 0.1302, "learning_rate": 1.7303278380430794e-06, "epoch": 0.6195549473821392, "percentage": 61.97, "elapsed_time": "3:43:43", "remaining_time": "2:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2378, "total_steps": 3836, "loss": 0.1407, "learning_rate": 1.7282774919707406e-06, "epoch": 0.6198155931319845, "percentage": 61.99, "elapsed_time": "3:43:48", "remaining_time": "2:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2379, "total_steps": 3836, "loss": 0.1581, "learning_rate": 1.726227719491807e-06, "epoch": 0.6200762388818297, "percentage": 62.02, "elapsed_time": "3:43:53", "remaining_time": "2:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2380, "total_steps": 3836, "loss": 0.1461, "learning_rate": 1.7241785221297984e-06, "epoch": 0.620336884631675, "percentage": 62.04, "elapsed_time": "3:43:59", "remaining_time": "2:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2381, "total_steps": 3836, "loss": 0.1547, "learning_rate": 1.7221299014078107e-06, "epoch": 0.6205975303815202, "percentage": 62.07, "elapsed_time": "3:44:04", "remaining_time": "2:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2382, "total_steps": 3836, "loss": 0.1648, "learning_rate": 1.7200818588485088e-06, "epoch": 0.6208581761313655, "percentage": 62.1, "elapsed_time": "3:44:09", "remaining_time": "2:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2383, "total_steps": 3836, "loss": 0.1604, "learning_rate": 1.7180343959741292e-06, "epoch": 0.6211188218812107, "percentage": 62.12, "elapsed_time": "3:44:14", "remaining_time": "2:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2384, "total_steps": 3836, "loss": 0.1549, "learning_rate": 1.715987514306476e-06, "epoch": 0.6213794676310559, "percentage": 62.15, "elapsed_time": "3:44:20", "remaining_time": "2:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2385, "total_steps": 3836, "loss": 0.1465, "learning_rate": 1.713941215366924e-06, "epoch": 0.6216401133809012, "percentage": 62.17, "elapsed_time": "3:44:25", "remaining_time": "2:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2386, "total_steps": 3836, "loss": 0.1425, "learning_rate": 1.7118955006764116e-06, "epoch": 0.6219007591307464, "percentage": 62.2, "elapsed_time": "3:44:30", "remaining_time": "2:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2387, "total_steps": 3836, "loss": 0.149, "learning_rate": 1.7098503717554437e-06, "epoch": 0.6221614048805917, "percentage": 62.23, "elapsed_time": "3:44:36", "remaining_time": "2:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2388, "total_steps": 3836, "loss": 0.1578, "learning_rate": 1.707805830124093e-06, "epoch": 0.6224220506304369, "percentage": 62.25, "elapsed_time": "3:44:42", "remaining_time": "2:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2389, "total_steps": 3836, "loss": 0.1594, "learning_rate": 1.705761877301991e-06, "epoch": 0.6226826963802822, "percentage": 62.28, "elapsed_time": "3:44:48", "remaining_time": "2:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2390, "total_steps": 3836, "loss": 0.1361, "learning_rate": 1.703718514808336e-06, "epoch": 0.6229433421301274, "percentage": 62.3, "elapsed_time": "3:44:53", "remaining_time": "2:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2391, "total_steps": 3836, "loss": 0.1376, "learning_rate": 1.7016757441618837e-06, "epoch": 0.6232039878799727, "percentage": 62.33, "elapsed_time": "3:44:58", "remaining_time": "2:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2392, "total_steps": 3836, "loss": 0.1489, "learning_rate": 1.6996335668809515e-06, "epoch": 0.6234646336298179, "percentage": 62.36, "elapsed_time": "3:45:03", "remaining_time": "2:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2393, "total_steps": 3836, "loss": 0.1391, "learning_rate": 1.6975919844834172e-06, "epoch": 0.6237252793796632, "percentage": 62.38, "elapsed_time": "3:45:09", "remaining_time": "2:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2394, "total_steps": 3836, "loss": 0.1531, "learning_rate": 1.6955509984867136e-06, "epoch": 0.6239859251295083, "percentage": 62.41, "elapsed_time": "3:45:14", "remaining_time": "2:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2395, "total_steps": 3836, "loss": 0.1586, "learning_rate": 1.6935106104078325e-06, "epoch": 0.6242465708793536, "percentage": 62.43, "elapsed_time": "3:45:19", "remaining_time": "2:15:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2396, "total_steps": 3836, "loss": 0.1504, "learning_rate": 1.691470821763322e-06, "epoch": 0.6245072166291988, "percentage": 62.46, "elapsed_time": "3:45:25", "remaining_time": "2:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2397, "total_steps": 3836, "loss": 0.1308, "learning_rate": 1.6894316340692802e-06, "epoch": 0.6247678623790441, "percentage": 62.49, "elapsed_time": "3:45:31", "remaining_time": "2:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2398, "total_steps": 3836, "loss": 0.1292, "learning_rate": 1.6873930488413628e-06, "epoch": 0.6250285081288893, "percentage": 62.51, "elapsed_time": "3:45:37", "remaining_time": "2:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2399, "total_steps": 3836, "loss": 0.1594, "learning_rate": 1.6853550675947772e-06, "epoch": 0.6252891538787345, "percentage": 62.54, "elapsed_time": "3:45:43", "remaining_time": "2:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 3836, "loss": 0.1371, "learning_rate": 1.6833176918442796e-06, "epoch": 0.6255497996285798, "percentage": 62.57, "elapsed_time": "3:45:48", "remaining_time": "2:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2401, "total_steps": 3836, "loss": 0.1428, "learning_rate": 1.6812809231041794e-06, "epoch": 0.625810445378425, "percentage": 62.59, "elapsed_time": "3:45:53", "remaining_time": "2:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2402, "total_steps": 3836, "loss": 0.1477, "learning_rate": 1.6792447628883318e-06, "epoch": 0.6260710911282703, "percentage": 62.62, "elapsed_time": "3:45:59", "remaining_time": "2:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2403, "total_steps": 3836, "loss": 0.1434, "learning_rate": 1.6772092127101407e-06, "epoch": 0.6263317368781155, "percentage": 62.64, "elapsed_time": "3:46:04", "remaining_time": "2:14:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2404, "total_steps": 3836, "loss": 0.1612, "learning_rate": 1.6751742740825583e-06, "epoch": 0.6265923826279608, "percentage": 62.67, "elapsed_time": "3:46:10", "remaining_time": "2:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2405, "total_steps": 3836, "loss": 0.1417, "learning_rate": 1.673139948518079e-06, "epoch": 0.626853028377806, "percentage": 62.7, "elapsed_time": "3:46:15", "remaining_time": "2:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2406, "total_steps": 3836, "loss": 0.1533, "learning_rate": 1.6711062375287451e-06, "epoch": 0.6271136741276513, "percentage": 62.72, "elapsed_time": "3:46:21", "remaining_time": "2:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2407, "total_steps": 3836, "loss": 0.1585, "learning_rate": 1.6690731426261403e-06, "epoch": 0.6273743198774965, "percentage": 62.75, "elapsed_time": "3:46:26", "remaining_time": "2:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2408, "total_steps": 3836, "loss": 0.1548, "learning_rate": 1.6670406653213883e-06, "epoch": 0.6276349656273418, "percentage": 62.77, "elapsed_time": "3:46:32", "remaining_time": "2:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2409, "total_steps": 3836, "loss": 0.1535, "learning_rate": 1.665008807125158e-06, "epoch": 0.627895611377187, "percentage": 62.8, "elapsed_time": "3:46:38", "remaining_time": "2:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2410, "total_steps": 3836, "loss": 0.152, "learning_rate": 1.6629775695476551e-06, "epoch": 0.6281562571270323, "percentage": 62.83, "elapsed_time": "3:46:43", "remaining_time": "2:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2411, "total_steps": 3836, "loss": 0.1474, "learning_rate": 1.6609469540986257e-06, "epoch": 0.6284169028768775, "percentage": 62.85, "elapsed_time": "3:46:49", "remaining_time": "2:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2412, "total_steps": 3836, "loss": 0.1427, "learning_rate": 1.6589169622873524e-06, "epoch": 0.6286775486267228, "percentage": 62.88, "elapsed_time": "3:46:55", "remaining_time": "2:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2413, "total_steps": 3836, "loss": 0.1489, "learning_rate": 1.6568875956226537e-06, "epoch": 0.628938194376568, "percentage": 62.9, "elapsed_time": "3:47:00", "remaining_time": "2:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2414, "total_steps": 3836, "loss": 0.1491, "learning_rate": 1.654858855612886e-06, "epoch": 0.6291988401264131, "percentage": 62.93, "elapsed_time": "3:47:05", "remaining_time": "2:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2415, "total_steps": 3836, "loss": 0.1438, "learning_rate": 1.6528307437659369e-06, "epoch": 0.6294594858762584, "percentage": 62.96, "elapsed_time": "3:47:11", "remaining_time": "2:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2416, "total_steps": 3836, "loss": 0.1409, "learning_rate": 1.6508032615892294e-06, "epoch": 0.6297201316261036, "percentage": 62.98, "elapsed_time": "3:47:16", "remaining_time": "2:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2417, "total_steps": 3836, "loss": 0.1556, "learning_rate": 1.6487764105897172e-06, "epoch": 0.6299807773759489, "percentage": 63.01, "elapsed_time": "3:47:22", "remaining_time": "2:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2418, "total_steps": 3836, "loss": 0.137, "learning_rate": 1.6467501922738862e-06, "epoch": 0.6302414231257941, "percentage": 63.03, "elapsed_time": "3:47:27", "remaining_time": "2:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2419, "total_steps": 3836, "loss": 0.1522, "learning_rate": 1.6447246081477503e-06, "epoch": 0.6305020688756394, "percentage": 63.06, "elapsed_time": "3:47:33", "remaining_time": "2:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2420, "total_steps": 3836, "loss": 0.1579, "learning_rate": 1.6426996597168517e-06, "epoch": 0.6307627146254846, "percentage": 63.09, "elapsed_time": "3:47:38", "remaining_time": "2:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2421, "total_steps": 3836, "loss": 0.1501, "learning_rate": 1.6406753484862636e-06, "epoch": 0.6310233603753299, "percentage": 63.11, "elapsed_time": "3:47:44", "remaining_time": "2:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2422, "total_steps": 3836, "loss": 0.1373, "learning_rate": 1.6386516759605813e-06, "epoch": 0.6312840061251751, "percentage": 63.14, "elapsed_time": "3:47:50", "remaining_time": "2:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2423, "total_steps": 3836, "loss": 0.1467, "learning_rate": 1.6366286436439294e-06, "epoch": 0.6315446518750204, "percentage": 63.16, "elapsed_time": "3:47:56", "remaining_time": "2:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2424, "total_steps": 3836, "loss": 0.1445, "learning_rate": 1.6346062530399525e-06, "epoch": 0.6318052976248656, "percentage": 63.19, "elapsed_time": "3:48:02", "remaining_time": "2:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2425, "total_steps": 3836, "loss": 0.1525, "learning_rate": 1.6325845056518211e-06, "epoch": 0.6320659433747109, "percentage": 63.22, "elapsed_time": "3:48:08", "remaining_time": "2:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2426, "total_steps": 3836, "loss": 0.1531, "learning_rate": 1.6305634029822267e-06, "epoch": 0.6323265891245561, "percentage": 63.24, "elapsed_time": "3:48:13", "remaining_time": "2:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2427, "total_steps": 3836, "loss": 0.1537, "learning_rate": 1.6285429465333827e-06, "epoch": 0.6325872348744014, "percentage": 63.27, "elapsed_time": "3:48:18", "remaining_time": "2:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2428, "total_steps": 3836, "loss": 0.1585, "learning_rate": 1.6265231378070197e-06, "epoch": 0.6328478806242466, "percentage": 63.3, "elapsed_time": "3:48:24", "remaining_time": "2:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2429, "total_steps": 3836, "loss": 0.1547, "learning_rate": 1.6245039783043905e-06, "epoch": 0.6331085263740918, "percentage": 63.32, "elapsed_time": "3:48:29", "remaining_time": "2:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2430, "total_steps": 3836, "loss": 0.1576, "learning_rate": 1.6224854695262616e-06, "epoch": 0.6333691721239371, "percentage": 63.35, "elapsed_time": "3:48:34", "remaining_time": "2:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2431, "total_steps": 3836, "loss": 0.1473, "learning_rate": 1.6204676129729175e-06, "epoch": 0.6336298178737823, "percentage": 63.37, "elapsed_time": "3:48:39", "remaining_time": "2:12:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2432, "total_steps": 3836, "loss": 0.163, "learning_rate": 1.6184504101441584e-06, "epoch": 0.6338904636236276, "percentage": 63.4, "elapsed_time": "3:48:45", "remaining_time": "2:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2433, "total_steps": 3836, "loss": 0.1448, "learning_rate": 1.6164338625392977e-06, "epoch": 0.6341511093734727, "percentage": 63.43, "elapsed_time": "3:48:50", "remaining_time": "2:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2434, "total_steps": 3836, "loss": 0.1476, "learning_rate": 1.614417971657164e-06, "epoch": 0.634411755123318, "percentage": 63.45, "elapsed_time": "3:48:56", "remaining_time": "2:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2435, "total_steps": 3836, "loss": 0.1513, "learning_rate": 1.6124027389960938e-06, "epoch": 0.6346724008731632, "percentage": 63.48, "elapsed_time": "3:49:02", "remaining_time": "2:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2436, "total_steps": 3836, "loss": 0.133, "learning_rate": 1.6103881660539369e-06, "epoch": 0.6349330466230085, "percentage": 63.5, "elapsed_time": "3:49:07", "remaining_time": "2:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2437, "total_steps": 3836, "loss": 0.1434, "learning_rate": 1.6083742543280537e-06, "epoch": 0.6351936923728537, "percentage": 63.53, "elapsed_time": "3:49:12", "remaining_time": "2:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2438, "total_steps": 3836, "loss": 0.142, "learning_rate": 1.6063610053153106e-06, "epoch": 0.635454338122699, "percentage": 63.56, "elapsed_time": "3:49:18", "remaining_time": "2:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2439, "total_steps": 3836, "loss": 0.1394, "learning_rate": 1.6043484205120834e-06, "epoch": 0.6357149838725442, "percentage": 63.58, "elapsed_time": "3:49:23", "remaining_time": "2:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2440, "total_steps": 3836, "loss": 0.1616, "learning_rate": 1.6023365014142544e-06, "epoch": 0.6359756296223895, "percentage": 63.61, "elapsed_time": "3:49:29", "remaining_time": "2:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2441, "total_steps": 3836, "loss": 0.1523, "learning_rate": 1.600325249517208e-06, "epoch": 0.6362362753722347, "percentage": 63.63, "elapsed_time": "3:49:35", "remaining_time": "2:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2442, "total_steps": 3836, "loss": 0.1566, "learning_rate": 1.5983146663158368e-06, "epoch": 0.63649692112208, "percentage": 63.66, "elapsed_time": "3:49:41", "remaining_time": "2:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2443, "total_steps": 3836, "loss": 0.1474, "learning_rate": 1.5963047533045334e-06, "epoch": 0.6367575668719252, "percentage": 63.69, "elapsed_time": "3:49:46", "remaining_time": "2:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2444, "total_steps": 3836, "loss": 0.1462, "learning_rate": 1.5942955119771942e-06, "epoch": 0.6370182126217704, "percentage": 63.71, "elapsed_time": "3:49:52", "remaining_time": "2:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2445, "total_steps": 3836, "loss": 0.1488, "learning_rate": 1.592286943827216e-06, "epoch": 0.6372788583716157, "percentage": 63.74, "elapsed_time": "3:49:58", "remaining_time": "2:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2446, "total_steps": 3836, "loss": 0.1554, "learning_rate": 1.5902790503474928e-06, "epoch": 0.6375395041214609, "percentage": 63.76, "elapsed_time": "3:50:03", "remaining_time": "2:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2447, "total_steps": 3836, "loss": 0.1441, "learning_rate": 1.5882718330304209e-06, "epoch": 0.6378001498713062, "percentage": 63.79, "elapsed_time": "3:50:08", "remaining_time": "2:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2448, "total_steps": 3836, "loss": 0.1326, "learning_rate": 1.586265293367891e-06, "epoch": 0.6380607956211514, "percentage": 63.82, "elapsed_time": "3:50:13", "remaining_time": "2:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2449, "total_steps": 3836, "loss": 0.1532, "learning_rate": 1.5842594328512927e-06, "epoch": 0.6383214413709967, "percentage": 63.84, "elapsed_time": "3:50:19", "remaining_time": "2:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 3836, "loss": 0.1319, "learning_rate": 1.5822542529715084e-06, "epoch": 0.6385820871208419, "percentage": 63.87, "elapsed_time": "3:50:24", "remaining_time": "2:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2451, "total_steps": 3836, "loss": 0.135, "learning_rate": 1.5802497552189177e-06, "epoch": 0.6388427328706872, "percentage": 63.89, "elapsed_time": "3:50:30", "remaining_time": "2:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2452, "total_steps": 3836, "loss": 0.1508, "learning_rate": 1.578245941083389e-06, "epoch": 0.6391033786205323, "percentage": 63.92, "elapsed_time": "3:50:36", "remaining_time": "2:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2453, "total_steps": 3836, "loss": 0.1435, "learning_rate": 1.576242812054285e-06, "epoch": 0.6393640243703776, "percentage": 63.95, "elapsed_time": "3:50:42", "remaining_time": "2:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2454, "total_steps": 3836, "loss": 0.1387, "learning_rate": 1.57424036962046e-06, "epoch": 0.6396246701202228, "percentage": 63.97, "elapsed_time": "3:50:48", "remaining_time": "2:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2455, "total_steps": 3836, "loss": 0.1505, "learning_rate": 1.572238615270256e-06, "epoch": 0.6398853158700681, "percentage": 64.0, "elapsed_time": "3:50:53", "remaining_time": "2:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2456, "total_steps": 3836, "loss": 0.1407, "learning_rate": 1.5702375504915062e-06, "epoch": 0.6401459616199133, "percentage": 64.03, "elapsed_time": "3:50:58", "remaining_time": "2:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2457, "total_steps": 3836, "loss": 0.1424, "learning_rate": 1.5682371767715276e-06, "epoch": 0.6404066073697586, "percentage": 64.05, "elapsed_time": "3:51:04", "remaining_time": "2:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2458, "total_steps": 3836, "loss": 0.1518, "learning_rate": 1.5662374955971268e-06, "epoch": 0.6406672531196038, "percentage": 64.08, "elapsed_time": "3:51:09", "remaining_time": "2:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2459, "total_steps": 3836, "loss": 0.1366, "learning_rate": 1.5642385084545936e-06, "epoch": 0.640927898869449, "percentage": 64.1, "elapsed_time": "3:51:14", "remaining_time": "2:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2460, "total_steps": 3836, "loss": 0.1509, "learning_rate": 1.562240216829704e-06, "epoch": 0.6411885446192943, "percentage": 64.13, "elapsed_time": "3:51:20", "remaining_time": "2:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2461, "total_steps": 3836, "loss": 0.1574, "learning_rate": 1.5602426222077144e-06, "epoch": 0.6414491903691395, "percentage": 64.16, "elapsed_time": "3:51:27", "remaining_time": "2:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2462, "total_steps": 3836, "loss": 0.1602, "learning_rate": 1.5582457260733664e-06, "epoch": 0.6417098361189848, "percentage": 64.18, "elapsed_time": "3:51:32", "remaining_time": "2:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2463, "total_steps": 3836, "loss": 0.1429, "learning_rate": 1.5562495299108793e-06, "epoch": 0.64197048186883, "percentage": 64.21, "elapsed_time": "3:51:37", "remaining_time": "2:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2464, "total_steps": 3836, "loss": 0.1469, "learning_rate": 1.5542540352039525e-06, "epoch": 0.6422311276186753, "percentage": 64.23, "elapsed_time": "3:51:43", "remaining_time": "2:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2465, "total_steps": 3836, "loss": 0.144, "learning_rate": 1.552259243435767e-06, "epoch": 0.6424917733685205, "percentage": 64.26, "elapsed_time": "3:51:48", "remaining_time": "2:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2466, "total_steps": 3836, "loss": 0.1453, "learning_rate": 1.550265156088978e-06, "epoch": 0.6427524191183658, "percentage": 64.29, "elapsed_time": "3:51:54", "remaining_time": "2:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2467, "total_steps": 3836, "loss": 0.1361, "learning_rate": 1.5482717746457199e-06, "epoch": 0.643013064868211, "percentage": 64.31, "elapsed_time": "3:51:59", "remaining_time": "2:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2468, "total_steps": 3836, "loss": 0.1325, "learning_rate": 1.5462791005875994e-06, "epoch": 0.6432737106180563, "percentage": 64.34, "elapsed_time": "3:52:04", "remaining_time": "2:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2469, "total_steps": 3836, "loss": 0.1476, "learning_rate": 1.544287135395699e-06, "epoch": 0.6435343563679015, "percentage": 64.36, "elapsed_time": "3:52:09", "remaining_time": "2:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2470, "total_steps": 3836, "loss": 0.1463, "learning_rate": 1.542295880550575e-06, "epoch": 0.6437950021177468, "percentage": 64.39, "elapsed_time": "3:52:15", "remaining_time": "2:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2471, "total_steps": 3836, "loss": 0.1438, "learning_rate": 1.5403053375322548e-06, "epoch": 0.644055647867592, "percentage": 64.42, "elapsed_time": "3:52:21", "remaining_time": "2:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2472, "total_steps": 3836, "loss": 0.1475, "learning_rate": 1.5383155078202377e-06, "epoch": 0.6443162936174373, "percentage": 64.44, "elapsed_time": "3:52:26", "remaining_time": "2:08:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2473, "total_steps": 3836, "loss": 0.152, "learning_rate": 1.5363263928934919e-06, "epoch": 0.6445769393672824, "percentage": 64.47, "elapsed_time": "3:52:32", "remaining_time": "2:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2474, "total_steps": 3836, "loss": 0.1498, "learning_rate": 1.534337994230453e-06, "epoch": 0.6448375851171276, "percentage": 64.49, "elapsed_time": "3:52:37", "remaining_time": "2:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2475, "total_steps": 3836, "loss": 0.1549, "learning_rate": 1.5323503133090273e-06, "epoch": 0.6450982308669729, "percentage": 64.52, "elapsed_time": "3:52:43", "remaining_time": "2:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2476, "total_steps": 3836, "loss": 0.1435, "learning_rate": 1.5303633516065852e-06, "epoch": 0.6453588766168181, "percentage": 64.55, "elapsed_time": "3:52:48", "remaining_time": "2:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2477, "total_steps": 3836, "loss": 0.1348, "learning_rate": 1.528377110599964e-06, "epoch": 0.6456195223666634, "percentage": 64.57, "elapsed_time": "3:52:54", "remaining_time": "2:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2478, "total_steps": 3836, "loss": 0.138, "learning_rate": 1.5263915917654654e-06, "epoch": 0.6458801681165086, "percentage": 64.6, "elapsed_time": "3:52:59", "remaining_time": "2:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2479, "total_steps": 3836, "loss": 0.1424, "learning_rate": 1.5244067965788518e-06, "epoch": 0.6461408138663539, "percentage": 64.62, "elapsed_time": "3:53:05", "remaining_time": "2:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2480, "total_steps": 3836, "loss": 0.1585, "learning_rate": 1.5224227265153512e-06, "epoch": 0.6464014596161991, "percentage": 64.65, "elapsed_time": "3:53:11", "remaining_time": "2:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2481, "total_steps": 3836, "loss": 0.1471, "learning_rate": 1.52043938304965e-06, "epoch": 0.6466621053660444, "percentage": 64.68, "elapsed_time": "3:53:17", "remaining_time": "2:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2482, "total_steps": 3836, "loss": 0.1447, "learning_rate": 1.5184567676558965e-06, "epoch": 0.6469227511158896, "percentage": 64.7, "elapsed_time": "3:53:22", "remaining_time": "2:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2483, "total_steps": 3836, "loss": 0.1422, "learning_rate": 1.5164748818076964e-06, "epoch": 0.6471833968657349, "percentage": 64.73, "elapsed_time": "3:53:28", "remaining_time": "2:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2484, "total_steps": 3836, "loss": 0.155, "learning_rate": 1.5144937269781142e-06, "epoch": 0.6474440426155801, "percentage": 64.75, "elapsed_time": "3:53:33", "remaining_time": "2:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2485, "total_steps": 3836, "loss": 0.1548, "learning_rate": 1.5125133046396699e-06, "epoch": 0.6477046883654254, "percentage": 64.78, "elapsed_time": "3:53:38", "remaining_time": "2:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2486, "total_steps": 3836, "loss": 0.1524, "learning_rate": 1.5105336162643403e-06, "epoch": 0.6479653341152706, "percentage": 64.81, "elapsed_time": "3:53:44", "remaining_time": "2:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2487, "total_steps": 3836, "loss": 0.1526, "learning_rate": 1.5085546633235554e-06, "epoch": 0.6482259798651159, "percentage": 64.83, "elapsed_time": "3:53:49", "remaining_time": "2:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2488, "total_steps": 3836, "loss": 0.1404, "learning_rate": 1.5065764472882e-06, "epoch": 0.6484866256149611, "percentage": 64.86, "elapsed_time": "3:53:55", "remaining_time": "2:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2489, "total_steps": 3836, "loss": 0.1417, "learning_rate": 1.5045989696286112e-06, "epoch": 0.6487472713648063, "percentage": 64.89, "elapsed_time": "3:54:01", "remaining_time": "2:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2490, "total_steps": 3836, "loss": 0.1451, "learning_rate": 1.5026222318145745e-06, "epoch": 0.6490079171146516, "percentage": 64.91, "elapsed_time": "3:54:06", "remaining_time": "2:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2491, "total_steps": 3836, "loss": 0.1482, "learning_rate": 1.500646235315329e-06, "epoch": 0.6492685628644967, "percentage": 64.94, "elapsed_time": "3:54:12", "remaining_time": "2:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2492, "total_steps": 3836, "loss": 0.1489, "learning_rate": 1.4986709815995604e-06, "epoch": 0.649529208614342, "percentage": 64.96, "elapsed_time": "3:54:18", "remaining_time": "2:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2493, "total_steps": 3836, "loss": 0.1541, "learning_rate": 1.4966964721354047e-06, "epoch": 0.6497898543641872, "percentage": 64.99, "elapsed_time": "3:54:24", "remaining_time": "2:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2494, "total_steps": 3836, "loss": 0.1402, "learning_rate": 1.494722708390442e-06, "epoch": 0.6500505001140325, "percentage": 65.02, "elapsed_time": "3:54:30", "remaining_time": "2:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2495, "total_steps": 3836, "loss": 0.1423, "learning_rate": 1.4927496918317009e-06, "epoch": 0.6503111458638777, "percentage": 65.04, "elapsed_time": "3:54:35", "remaining_time": "2:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2496, "total_steps": 3836, "loss": 0.1537, "learning_rate": 1.4907774239256517e-06, "epoch": 0.650571791613723, "percentage": 65.07, "elapsed_time": "3:54:40", "remaining_time": "2:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2497, "total_steps": 3836, "loss": 0.1472, "learning_rate": 1.4888059061382098e-06, "epoch": 0.6508324373635682, "percentage": 65.09, "elapsed_time": "3:54:46", "remaining_time": "2:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2498, "total_steps": 3836, "loss": 0.1585, "learning_rate": 1.486835139934734e-06, "epoch": 0.6510930831134135, "percentage": 65.12, "elapsed_time": "3:54:51", "remaining_time": "2:05:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2499, "total_steps": 3836, "loss": 0.1389, "learning_rate": 1.4848651267800224e-06, "epoch": 0.6513537288632587, "percentage": 65.15, "elapsed_time": "3:54:56", "remaining_time": "2:05:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 3836, "loss": 0.1393, "learning_rate": 1.4828958681383163e-06, "epoch": 0.651614374613104, "percentage": 65.17, "elapsed_time": "3:55:02", "remaining_time": "2:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 3836, "eval_loss": 0.14706705510616302, "epoch": 0.651614374613104, "percentage": 65.17, "elapsed_time": "3:55:57", "remaining_time": "2:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2501, "total_steps": 3836, "loss": 0.159, "learning_rate": 1.4809273654732925e-06, "epoch": 0.6518750203629492, "percentage": 65.2, "elapsed_time": "3:56:03", "remaining_time": "2:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2502, "total_steps": 3836, "loss": 0.1563, "learning_rate": 1.4789596202480678e-06, "epoch": 0.6521356661127945, "percentage": 65.22, "elapsed_time": "3:56:08", "remaining_time": "2:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2503, "total_steps": 3836, "loss": 0.1517, "learning_rate": 1.4769926339251972e-06, "epoch": 0.6523963118626397, "percentage": 65.25, "elapsed_time": "3:56:14", "remaining_time": "2:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2504, "total_steps": 3836, "loss": 0.1567, "learning_rate": 1.475026407966669e-06, "epoch": 0.6526569576124849, "percentage": 65.28, "elapsed_time": "3:56:20", "remaining_time": "2:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2505, "total_steps": 3836, "loss": 0.1487, "learning_rate": 1.4730609438339095e-06, "epoch": 0.6529176033623302, "percentage": 65.3, "elapsed_time": "3:56:25", "remaining_time": "2:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2506, "total_steps": 3836, "loss": 0.1533, "learning_rate": 1.4710962429877763e-06, "epoch": 0.6531782491121754, "percentage": 65.33, "elapsed_time": "3:56:30", "remaining_time": "2:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2507, "total_steps": 3836, "loss": 0.1375, "learning_rate": 1.4691323068885593e-06, "epoch": 0.6534388948620207, "percentage": 65.35, "elapsed_time": "3:56:36", "remaining_time": "2:05:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2508, "total_steps": 3836, "loss": 0.1458, "learning_rate": 1.4671691369959826e-06, "epoch": 0.6536995406118659, "percentage": 65.38, "elapsed_time": "3:56:42", "remaining_time": "2:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2509, "total_steps": 3836, "loss": 0.1454, "learning_rate": 1.4652067347691985e-06, "epoch": 0.6539601863617112, "percentage": 65.41, "elapsed_time": "3:56:47", "remaining_time": "2:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2510, "total_steps": 3836, "loss": 0.1454, "learning_rate": 1.4632451016667899e-06, "epoch": 0.6542208321115563, "percentage": 65.43, "elapsed_time": "3:56:51", "remaining_time": "2:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2511, "total_steps": 3836, "loss": 0.1515, "learning_rate": 1.461284239146768e-06, "epoch": 0.6544814778614017, "percentage": 65.46, "elapsed_time": "3:56:57", "remaining_time": "2:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2512, "total_steps": 3836, "loss": 0.1501, "learning_rate": 1.4593241486665705e-06, "epoch": 0.6547421236112468, "percentage": 65.48, "elapsed_time": "3:57:03", "remaining_time": "2:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2513, "total_steps": 3836, "loss": 0.1389, "learning_rate": 1.45736483168306e-06, "epoch": 0.6550027693610921, "percentage": 65.51, "elapsed_time": "3:57:08", "remaining_time": "2:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2514, "total_steps": 3836, "loss": 0.138, "learning_rate": 1.4554062896525295e-06, "epoch": 0.6552634151109373, "percentage": 65.54, "elapsed_time": "3:57:14", "remaining_time": "2:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2515, "total_steps": 3836, "loss": 0.1561, "learning_rate": 1.45344852403069e-06, "epoch": 0.6555240608607826, "percentage": 65.56, "elapsed_time": "3:57:19", "remaining_time": "2:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2516, "total_steps": 3836, "loss": 0.1306, "learning_rate": 1.4514915362726773e-06, "epoch": 0.6557847066106278, "percentage": 65.59, "elapsed_time": "3:57:24", "remaining_time": "2:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2517, "total_steps": 3836, "loss": 0.1511, "learning_rate": 1.4495353278330527e-06, "epoch": 0.6560453523604731, "percentage": 65.62, "elapsed_time": "3:57:30", "remaining_time": "2:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2518, "total_steps": 3836, "loss": 0.1399, "learning_rate": 1.447579900165792e-06, "epoch": 0.6563059981103183, "percentage": 65.64, "elapsed_time": "3:57:36", "remaining_time": "2:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2519, "total_steps": 3836, "loss": 0.1393, "learning_rate": 1.4456252547242935e-06, "epoch": 0.6565666438601635, "percentage": 65.67, "elapsed_time": "3:57:41", "remaining_time": "2:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2520, "total_steps": 3836, "loss": 0.1485, "learning_rate": 1.4436713929613771e-06, "epoch": 0.6568272896100088, "percentage": 65.69, "elapsed_time": "3:57:47", "remaining_time": "2:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2521, "total_steps": 3836, "loss": 0.145, "learning_rate": 1.4417183163292759e-06, "epoch": 0.657087935359854, "percentage": 65.72, "elapsed_time": "3:57:52", "remaining_time": "2:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2522, "total_steps": 3836, "loss": 0.1444, "learning_rate": 1.4397660262796411e-06, "epoch": 0.6573485811096993, "percentage": 65.75, "elapsed_time": "3:57:58", "remaining_time": "2:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2523, "total_steps": 3836, "loss": 0.1403, "learning_rate": 1.4378145242635397e-06, "epoch": 0.6576092268595445, "percentage": 65.77, "elapsed_time": "3:58:04", "remaining_time": "2:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2524, "total_steps": 3836, "loss": 0.1379, "learning_rate": 1.4358638117314521e-06, "epoch": 0.6578698726093898, "percentage": 65.8, "elapsed_time": "3:58:09", "remaining_time": "2:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2525, "total_steps": 3836, "loss": 0.1442, "learning_rate": 1.4339138901332723e-06, "epoch": 0.658130518359235, "percentage": 65.82, "elapsed_time": "3:58:15", "remaining_time": "2:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2526, "total_steps": 3836, "loss": 0.1403, "learning_rate": 1.4319647609183058e-06, "epoch": 0.6583911641090803, "percentage": 65.85, "elapsed_time": "3:58:22", "remaining_time": "2:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2527, "total_steps": 3836, "loss": 0.1293, "learning_rate": 1.430016425535271e-06, "epoch": 0.6586518098589255, "percentage": 65.88, "elapsed_time": "3:58:27", "remaining_time": "2:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2528, "total_steps": 3836, "loss": 0.1451, "learning_rate": 1.428068885432296e-06, "epoch": 0.6589124556087708, "percentage": 65.9, "elapsed_time": "3:58:33", "remaining_time": "2:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2529, "total_steps": 3836, "loss": 0.1444, "learning_rate": 1.4261221420569135e-06, "epoch": 0.659173101358616, "percentage": 65.93, "elapsed_time": "3:58:38", "remaining_time": "2:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2530, "total_steps": 3836, "loss": 0.1535, "learning_rate": 1.4241761968560703e-06, "epoch": 0.6594337471084613, "percentage": 65.95, "elapsed_time": "3:58:45", "remaining_time": "2:03:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2531, "total_steps": 3836, "loss": 0.1375, "learning_rate": 1.4222310512761162e-06, "epoch": 0.6596943928583064, "percentage": 65.98, "elapsed_time": "3:58:50", "remaining_time": "2:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2532, "total_steps": 3836, "loss": 0.1554, "learning_rate": 1.4202867067628068e-06, "epoch": 0.6599550386081517, "percentage": 66.01, "elapsed_time": "3:58:56", "remaining_time": "2:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2533, "total_steps": 3836, "loss": 0.1408, "learning_rate": 1.418343164761304e-06, "epoch": 0.6602156843579969, "percentage": 66.03, "elapsed_time": "3:59:01", "remaining_time": "2:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2534, "total_steps": 3836, "loss": 0.1438, "learning_rate": 1.4164004267161718e-06, "epoch": 0.6604763301078421, "percentage": 66.06, "elapsed_time": "3:59:07", "remaining_time": "2:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2535, "total_steps": 3836, "loss": 0.1544, "learning_rate": 1.4144584940713769e-06, "epoch": 0.6607369758576874, "percentage": 66.08, "elapsed_time": "3:59:12", "remaining_time": "2:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2536, "total_steps": 3836, "loss": 0.1375, "learning_rate": 1.4125173682702869e-06, "epoch": 0.6609976216075326, "percentage": 66.11, "elapsed_time": "3:59:18", "remaining_time": "2:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2537, "total_steps": 3836, "loss": 0.1513, "learning_rate": 1.4105770507556718e-06, "epoch": 0.6612582673573779, "percentage": 66.14, "elapsed_time": "3:59:23", "remaining_time": "2:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2538, "total_steps": 3836, "loss": 0.1453, "learning_rate": 1.4086375429696987e-06, "epoch": 0.6615189131072231, "percentage": 66.16, "elapsed_time": "3:59:29", "remaining_time": "2:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2539, "total_steps": 3836, "loss": 0.1442, "learning_rate": 1.4066988463539338e-06, "epoch": 0.6617795588570684, "percentage": 66.19, "elapsed_time": "3:59:35", "remaining_time": "2:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2540, "total_steps": 3836, "loss": 0.1494, "learning_rate": 1.4047609623493396e-06, "epoch": 0.6620402046069136, "percentage": 66.21, "elapsed_time": "3:59:40", "remaining_time": "2:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2541, "total_steps": 3836, "loss": 0.1366, "learning_rate": 1.4028238923962753e-06, "epoch": 0.6623008503567589, "percentage": 66.24, "elapsed_time": "3:59:46", "remaining_time": "2:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2542, "total_steps": 3836, "loss": 0.1422, "learning_rate": 1.400887637934495e-06, "epoch": 0.6625614961066041, "percentage": 66.27, "elapsed_time": "3:59:52", "remaining_time": "2:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2543, "total_steps": 3836, "loss": 0.1319, "learning_rate": 1.3989522004031457e-06, "epoch": 0.6628221418564494, "percentage": 66.29, "elapsed_time": "3:59:58", "remaining_time": "2:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2544, "total_steps": 3836, "loss": 0.1481, "learning_rate": 1.3970175812407705e-06, "epoch": 0.6630827876062946, "percentage": 66.32, "elapsed_time": "4:00:03", "remaining_time": "2:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2545, "total_steps": 3836, "loss": 0.1398, "learning_rate": 1.3950837818852982e-06, "epoch": 0.6633434333561399, "percentage": 66.35, "elapsed_time": "4:00:09", "remaining_time": "2:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2546, "total_steps": 3836, "loss": 0.1391, "learning_rate": 1.393150803774055e-06, "epoch": 0.6636040791059851, "percentage": 66.37, "elapsed_time": "4:00:14", "remaining_time": "2:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2547, "total_steps": 3836, "loss": 0.15, "learning_rate": 1.3912186483437522e-06, "epoch": 0.6638647248558304, "percentage": 66.4, "elapsed_time": "4:00:19", "remaining_time": "2:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2548, "total_steps": 3836, "loss": 0.1477, "learning_rate": 1.3892873170304913e-06, "epoch": 0.6641253706056756, "percentage": 66.42, "elapsed_time": "4:00:24", "remaining_time": "2:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2549, "total_steps": 3836, "loss": 0.1529, "learning_rate": 1.3873568112697596e-06, "epoch": 0.6643860163555207, "percentage": 66.45, "elapsed_time": "4:00:30", "remaining_time": "2:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 3836, "loss": 0.1555, "learning_rate": 1.3854271324964353e-06, "epoch": 0.664646662105366, "percentage": 66.48, "elapsed_time": "4:00:35", "remaining_time": "2:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2551, "total_steps": 3836, "loss": 0.1384, "learning_rate": 1.3834982821447762e-06, "epoch": 0.6649073078552112, "percentage": 66.5, "elapsed_time": "4:00:41", "remaining_time": "2:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2552, "total_steps": 3836, "loss": 0.1609, "learning_rate": 1.3815702616484262e-06, "epoch": 0.6651679536050565, "percentage": 66.53, "elapsed_time": "4:00:47", "remaining_time": "2:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2553, "total_steps": 3836, "loss": 0.16, "learning_rate": 1.3796430724404155e-06, "epoch": 0.6654285993549017, "percentage": 66.55, "elapsed_time": "4:00:53", "remaining_time": "2:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2554, "total_steps": 3836, "loss": 0.1431, "learning_rate": 1.3777167159531532e-06, "epoch": 0.665689245104747, "percentage": 66.58, "elapsed_time": "4:00:58", "remaining_time": "2:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2555, "total_steps": 3836, "loss": 0.1345, "learning_rate": 1.3757911936184303e-06, "epoch": 0.6659498908545922, "percentage": 66.61, "elapsed_time": "4:01:04", "remaining_time": "2:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2556, "total_steps": 3836, "loss": 0.1385, "learning_rate": 1.3738665068674176e-06, "epoch": 0.6662105366044375, "percentage": 66.63, "elapsed_time": "4:01:10", "remaining_time": "2:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2557, "total_steps": 3836, "loss": 0.1483, "learning_rate": 1.3719426571306654e-06, "epoch": 0.6664711823542827, "percentage": 66.66, "elapsed_time": "4:01:16", "remaining_time": "2:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2558, "total_steps": 3836, "loss": 0.1337, "learning_rate": 1.3700196458381012e-06, "epoch": 0.666731828104128, "percentage": 66.68, "elapsed_time": "4:01:22", "remaining_time": "2:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2559, "total_steps": 3836, "loss": 0.1381, "learning_rate": 1.368097474419029e-06, "epoch": 0.6669924738539732, "percentage": 66.71, "elapsed_time": "4:01:27", "remaining_time": "2:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2560, "total_steps": 3836, "loss": 0.163, "learning_rate": 1.3661761443021316e-06, "epoch": 0.6672531196038185, "percentage": 66.74, "elapsed_time": "4:01:33", "remaining_time": "2:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2561, "total_steps": 3836, "loss": 0.1409, "learning_rate": 1.364255656915463e-06, "epoch": 0.6675137653536637, "percentage": 66.76, "elapsed_time": "4:01:39", "remaining_time": "2:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2562, "total_steps": 3836, "loss": 0.1578, "learning_rate": 1.36233601368645e-06, "epoch": 0.667774411103509, "percentage": 66.79, "elapsed_time": "4:01:43", "remaining_time": "2:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2563, "total_steps": 3836, "loss": 0.1491, "learning_rate": 1.3604172160418965e-06, "epoch": 0.6680350568533542, "percentage": 66.81, "elapsed_time": "4:01:49", "remaining_time": "2:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2564, "total_steps": 3836, "loss": 0.1445, "learning_rate": 1.3584992654079742e-06, "epoch": 0.6682957026031995, "percentage": 66.84, "elapsed_time": "4:01:55", "remaining_time": "2:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2565, "total_steps": 3836, "loss": 0.1397, "learning_rate": 1.3565821632102269e-06, "epoch": 0.6685563483530447, "percentage": 66.87, "elapsed_time": "4:02:00", "remaining_time": "1:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2566, "total_steps": 3836, "loss": 0.1435, "learning_rate": 1.3546659108735666e-06, "epoch": 0.6688169941028899, "percentage": 66.89, "elapsed_time": "4:02:06", "remaining_time": "1:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2567, "total_steps": 3836, "loss": 0.1414, "learning_rate": 1.352750509822275e-06, "epoch": 0.6690776398527352, "percentage": 66.92, "elapsed_time": "4:02:11", "remaining_time": "1:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2568, "total_steps": 3836, "loss": 0.1419, "learning_rate": 1.3508359614799998e-06, "epoch": 0.6693382856025804, "percentage": 66.94, "elapsed_time": "4:02:16", "remaining_time": "1:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2569, "total_steps": 3836, "loss": 0.1364, "learning_rate": 1.3489222672697545e-06, "epoch": 0.6695989313524257, "percentage": 66.97, "elapsed_time": "4:02:22", "remaining_time": "1:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2570, "total_steps": 3836, "loss": 0.1393, "learning_rate": 1.3470094286139213e-06, "epoch": 0.6698595771022708, "percentage": 67.0, "elapsed_time": "4:02:28", "remaining_time": "1:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2571, "total_steps": 3836, "loss": 0.1609, "learning_rate": 1.345097446934242e-06, "epoch": 0.6701202228521161, "percentage": 67.02, "elapsed_time": "4:02:34", "remaining_time": "1:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2572, "total_steps": 3836, "loss": 0.1386, "learning_rate": 1.3431863236518242e-06, "epoch": 0.6703808686019613, "percentage": 67.05, "elapsed_time": "4:02:40", "remaining_time": "1:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2573, "total_steps": 3836, "loss": 0.1488, "learning_rate": 1.3412760601871364e-06, "epoch": 0.6706415143518066, "percentage": 67.08, "elapsed_time": "4:02:45", "remaining_time": "1:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2574, "total_steps": 3836, "loss": 0.139, "learning_rate": 1.3393666579600078e-06, "epoch": 0.6709021601016518, "percentage": 67.1, "elapsed_time": "4:02:50", "remaining_time": "1:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2575, "total_steps": 3836, "loss": 0.1425, "learning_rate": 1.337458118389628e-06, "epoch": 0.6711628058514971, "percentage": 67.13, "elapsed_time": "4:02:56", "remaining_time": "1:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2576, "total_steps": 3836, "loss": 0.1395, "learning_rate": 1.3355504428945464e-06, "epoch": 0.6714234516013423, "percentage": 67.15, "elapsed_time": "4:03:01", "remaining_time": "1:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2577, "total_steps": 3836, "loss": 0.1506, "learning_rate": 1.3336436328926697e-06, "epoch": 0.6716840973511876, "percentage": 67.18, "elapsed_time": "4:03:07", "remaining_time": "1:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2578, "total_steps": 3836, "loss": 0.1348, "learning_rate": 1.3317376898012573e-06, "epoch": 0.6719447431010328, "percentage": 67.21, "elapsed_time": "4:03:13", "remaining_time": "1:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2579, "total_steps": 3836, "loss": 0.1444, "learning_rate": 1.3298326150369313e-06, "epoch": 0.6722053888508781, "percentage": 67.23, "elapsed_time": "4:03:19", "remaining_time": "1:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2580, "total_steps": 3836, "loss": 0.1376, "learning_rate": 1.3279284100156633e-06, "epoch": 0.6724660346007233, "percentage": 67.26, "elapsed_time": "4:03:24", "remaining_time": "1:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2581, "total_steps": 3836, "loss": 0.1419, "learning_rate": 1.3260250761527802e-06, "epoch": 0.6727266803505685, "percentage": 67.28, "elapsed_time": "4:03:30", "remaining_time": "1:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2582, "total_steps": 3836, "loss": 0.1474, "learning_rate": 1.32412261486296e-06, "epoch": 0.6729873261004138, "percentage": 67.31, "elapsed_time": "4:03:34", "remaining_time": "1:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2583, "total_steps": 3836, "loss": 0.1453, "learning_rate": 1.3222210275602364e-06, "epoch": 0.673247971850259, "percentage": 67.34, "elapsed_time": "4:03:39", "remaining_time": "1:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2584, "total_steps": 3836, "loss": 0.1468, "learning_rate": 1.3203203156579875e-06, "epoch": 0.6735086176001043, "percentage": 67.36, "elapsed_time": "4:03:45", "remaining_time": "1:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2585, "total_steps": 3836, "loss": 0.1479, "learning_rate": 1.3184204805689435e-06, "epoch": 0.6737692633499495, "percentage": 67.39, "elapsed_time": "4:03:50", "remaining_time": "1:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2586, "total_steps": 3836, "loss": 0.1385, "learning_rate": 1.316521523705185e-06, "epoch": 0.6740299090997948, "percentage": 67.41, "elapsed_time": "4:03:55", "remaining_time": "1:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2587, "total_steps": 3836, "loss": 0.1448, "learning_rate": 1.3146234464781372e-06, "epoch": 0.67429055484964, "percentage": 67.44, "elapsed_time": "4:04:01", "remaining_time": "1:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2588, "total_steps": 3836, "loss": 0.1418, "learning_rate": 1.3127262502985722e-06, "epoch": 0.6745512005994853, "percentage": 67.47, "elapsed_time": "4:04:05", "remaining_time": "1:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2589, "total_steps": 3836, "loss": 0.1443, "learning_rate": 1.3108299365766064e-06, "epoch": 0.6748118463493304, "percentage": 67.49, "elapsed_time": "4:04:12", "remaining_time": "1:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2590, "total_steps": 3836, "loss": 0.1585, "learning_rate": 1.3089345067217025e-06, "epoch": 0.6750724920991757, "percentage": 67.52, "elapsed_time": "4:04:17", "remaining_time": "1:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2591, "total_steps": 3836, "loss": 0.1461, "learning_rate": 1.307039962142664e-06, "epoch": 0.6753331378490209, "percentage": 67.54, "elapsed_time": "4:04:23", "remaining_time": "1:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2592, "total_steps": 3836, "loss": 0.1374, "learning_rate": 1.3051463042476358e-06, "epoch": 0.6755937835988662, "percentage": 67.57, "elapsed_time": "4:04:29", "remaining_time": "1:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2593, "total_steps": 3836, "loss": 0.1463, "learning_rate": 1.3032535344441096e-06, "epoch": 0.6758544293487114, "percentage": 67.6, "elapsed_time": "4:04:34", "remaining_time": "1:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2594, "total_steps": 3836, "loss": 0.1418, "learning_rate": 1.301361654138909e-06, "epoch": 0.6761150750985567, "percentage": 67.62, "elapsed_time": "4:04:40", "remaining_time": "1:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2595, "total_steps": 3836, "loss": 0.1456, "learning_rate": 1.2994706647382001e-06, "epoch": 0.6763757208484019, "percentage": 67.65, "elapsed_time": "4:04:45", "remaining_time": "1:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2596, "total_steps": 3836, "loss": 0.138, "learning_rate": 1.297580567647489e-06, "epoch": 0.6766363665982471, "percentage": 67.67, "elapsed_time": "4:04:50", "remaining_time": "1:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2597, "total_steps": 3836, "loss": 0.1334, "learning_rate": 1.2956913642716157e-06, "epoch": 0.6768970123480924, "percentage": 67.7, "elapsed_time": "4:04:56", "remaining_time": "1:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2598, "total_steps": 3836, "loss": 0.1366, "learning_rate": 1.2938030560147558e-06, "epoch": 0.6771576580979376, "percentage": 67.73, "elapsed_time": "4:05:01", "remaining_time": "1:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2599, "total_steps": 3836, "loss": 0.133, "learning_rate": 1.2919156442804216e-06, "epoch": 0.6774183038477829, "percentage": 67.75, "elapsed_time": "4:05:07", "remaining_time": "1:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 3836, "loss": 0.1325, "learning_rate": 1.2900291304714568e-06, "epoch": 0.6776789495976281, "percentage": 67.78, "elapsed_time": "4:05:12", "remaining_time": "1:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2601, "total_steps": 3836, "loss": 0.1255, "learning_rate": 1.2881435159900396e-06, "epoch": 0.6779395953474734, "percentage": 67.81, "elapsed_time": "4:05:17", "remaining_time": "1:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2602, "total_steps": 3836, "loss": 0.1495, "learning_rate": 1.2862588022376782e-06, "epoch": 0.6782002410973186, "percentage": 67.83, "elapsed_time": "4:05:24", "remaining_time": "1:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2603, "total_steps": 3836, "loss": 0.146, "learning_rate": 1.284374990615213e-06, "epoch": 0.6784608868471639, "percentage": 67.86, "elapsed_time": "4:05:30", "remaining_time": "1:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2604, "total_steps": 3836, "loss": 0.151, "learning_rate": 1.2824920825228132e-06, "epoch": 0.6787215325970091, "percentage": 67.88, "elapsed_time": "4:05:35", "remaining_time": "1:56:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2605, "total_steps": 3836, "loss": 0.1479, "learning_rate": 1.2806100793599758e-06, "epoch": 0.6789821783468544, "percentage": 67.91, "elapsed_time": "4:05:40", "remaining_time": "1:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2606, "total_steps": 3836, "loss": 0.139, "learning_rate": 1.278728982525525e-06, "epoch": 0.6792428240966996, "percentage": 67.94, "elapsed_time": "4:05:45", "remaining_time": "1:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2607, "total_steps": 3836, "loss": 0.1481, "learning_rate": 1.276848793417613e-06, "epoch": 0.6795034698465449, "percentage": 67.96, "elapsed_time": "4:05:52", "remaining_time": "1:55:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2608, "total_steps": 3836, "loss": 0.1367, "learning_rate": 1.2749695134337149e-06, "epoch": 0.67976411559639, "percentage": 67.99, "elapsed_time": "4:05:57", "remaining_time": "1:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2609, "total_steps": 3836, "loss": 0.1519, "learning_rate": 1.2730911439706327e-06, "epoch": 0.6800247613462354, "percentage": 68.01, "elapsed_time": "4:06:02", "remaining_time": "1:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2610, "total_steps": 3836, "loss": 0.15, "learning_rate": 1.2712136864244917e-06, "epoch": 0.6802854070960805, "percentage": 68.04, "elapsed_time": "4:06:08", "remaining_time": "1:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2611, "total_steps": 3836, "loss": 0.1447, "learning_rate": 1.2693371421907342e-06, "epoch": 0.6805460528459257, "percentage": 68.07, "elapsed_time": "4:06:13", "remaining_time": "1:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2612, "total_steps": 3836, "loss": 0.1332, "learning_rate": 1.2674615126641313e-06, "epoch": 0.680806698595771, "percentage": 68.09, "elapsed_time": "4:06:19", "remaining_time": "1:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2613, "total_steps": 3836, "loss": 0.1541, "learning_rate": 1.2655867992387687e-06, "epoch": 0.6810673443456162, "percentage": 68.12, "elapsed_time": "4:06:24", "remaining_time": "1:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2614, "total_steps": 3836, "loss": 0.1408, "learning_rate": 1.2637130033080541e-06, "epoch": 0.6813279900954615, "percentage": 68.14, "elapsed_time": "4:06:29", "remaining_time": "1:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2615, "total_steps": 3836, "loss": 0.1506, "learning_rate": 1.2618401262647111e-06, "epoch": 0.6815886358453067, "percentage": 68.17, "elapsed_time": "4:06:35", "remaining_time": "1:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2616, "total_steps": 3836, "loss": 0.1489, "learning_rate": 1.2599681695007822e-06, "epoch": 0.681849281595152, "percentage": 68.2, "elapsed_time": "4:06:41", "remaining_time": "1:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2617, "total_steps": 3836, "loss": 0.1428, "learning_rate": 1.258097134407625e-06, "epoch": 0.6821099273449972, "percentage": 68.22, "elapsed_time": "4:06:46", "remaining_time": "1:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2618, "total_steps": 3836, "loss": 0.1556, "learning_rate": 1.2562270223759104e-06, "epoch": 0.6823705730948425, "percentage": 68.25, "elapsed_time": "4:06:51", "remaining_time": "1:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2619, "total_steps": 3836, "loss": 0.1463, "learning_rate": 1.2543578347956282e-06, "epoch": 0.6826312188446877, "percentage": 68.27, "elapsed_time": "4:06:57", "remaining_time": "1:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2620, "total_steps": 3836, "loss": 0.131, "learning_rate": 1.2524895730560755e-06, "epoch": 0.682891864594533, "percentage": 68.3, "elapsed_time": "4:07:02", "remaining_time": "1:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2621, "total_steps": 3836, "loss": 0.1238, "learning_rate": 1.250622238545865e-06, "epoch": 0.6831525103443782, "percentage": 68.33, "elapsed_time": "4:07:08", "remaining_time": "1:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2622, "total_steps": 3836, "loss": 0.1558, "learning_rate": 1.2487558326529177e-06, "epoch": 0.6834131560942235, "percentage": 68.35, "elapsed_time": "4:07:14", "remaining_time": "1:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2623, "total_steps": 3836, "loss": 0.1548, "learning_rate": 1.2468903567644661e-06, "epoch": 0.6836738018440687, "percentage": 68.38, "elapsed_time": "4:07:20", "remaining_time": "1:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2624, "total_steps": 3836, "loss": 0.1316, "learning_rate": 1.2450258122670508e-06, "epoch": 0.683934447593914, "percentage": 68.4, "elapsed_time": "4:07:25", "remaining_time": "1:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2625, "total_steps": 3836, "loss": 0.1412, "learning_rate": 1.2431622005465193e-06, "epoch": 0.6841950933437592, "percentage": 68.43, "elapsed_time": "4:07:31", "remaining_time": "1:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2626, "total_steps": 3836, "loss": 0.1478, "learning_rate": 1.2412995229880295e-06, "epoch": 0.6844557390936044, "percentage": 68.46, "elapsed_time": "4:07:36", "remaining_time": "1:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2627, "total_steps": 3836, "loss": 0.1433, "learning_rate": 1.2394377809760396e-06, "epoch": 0.6847163848434497, "percentage": 68.48, "elapsed_time": "4:07:42", "remaining_time": "1:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2628, "total_steps": 3836, "loss": 0.1295, "learning_rate": 1.2375769758943148e-06, "epoch": 0.6849770305932948, "percentage": 68.51, "elapsed_time": "4:07:47", "remaining_time": "1:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2629, "total_steps": 3836, "loss": 0.1498, "learning_rate": 1.2357171091259263e-06, "epoch": 0.6852376763431401, "percentage": 68.53, "elapsed_time": "4:07:53", "remaining_time": "1:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2630, "total_steps": 3836, "loss": 0.1437, "learning_rate": 1.2338581820532442e-06, "epoch": 0.6854983220929853, "percentage": 68.56, "elapsed_time": "4:07:59", "remaining_time": "1:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2631, "total_steps": 3836, "loss": 0.1316, "learning_rate": 1.2320001960579414e-06, "epoch": 0.6857589678428306, "percentage": 68.59, "elapsed_time": "4:08:04", "remaining_time": "1:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2632, "total_steps": 3836, "loss": 0.1468, "learning_rate": 1.2301431525209942e-06, "epoch": 0.6860196135926758, "percentage": 68.61, "elapsed_time": "4:08:09", "remaining_time": "1:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2633, "total_steps": 3836, "loss": 0.1329, "learning_rate": 1.2282870528226731e-06, "epoch": 0.6862802593425211, "percentage": 68.64, "elapsed_time": "4:08:14", "remaining_time": "1:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2634, "total_steps": 3836, "loss": 0.141, "learning_rate": 1.2264318983425498e-06, "epoch": 0.6865409050923663, "percentage": 68.67, "elapsed_time": "4:08:20", "remaining_time": "1:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2635, "total_steps": 3836, "loss": 0.1432, "learning_rate": 1.2245776904594953e-06, "epoch": 0.6868015508422116, "percentage": 68.69, "elapsed_time": "4:08:25", "remaining_time": "1:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2636, "total_steps": 3836, "loss": 0.1461, "learning_rate": 1.222724430551674e-06, "epoch": 0.6870621965920568, "percentage": 68.72, "elapsed_time": "4:08:30", "remaining_time": "1:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2637, "total_steps": 3836, "loss": 0.1329, "learning_rate": 1.2208721199965476e-06, "epoch": 0.6873228423419021, "percentage": 68.74, "elapsed_time": "4:08:36", "remaining_time": "1:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2638, "total_steps": 3836, "loss": 0.1477, "learning_rate": 1.2190207601708707e-06, "epoch": 0.6875834880917473, "percentage": 68.77, "elapsed_time": "4:08:42", "remaining_time": "1:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2639, "total_steps": 3836, "loss": 0.1402, "learning_rate": 1.2171703524506925e-06, "epoch": 0.6878441338415926, "percentage": 68.8, "elapsed_time": "4:08:47", "remaining_time": "1:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2640, "total_steps": 3836, "loss": 0.1561, "learning_rate": 1.215320898211354e-06, "epoch": 0.6881047795914378, "percentage": 68.82, "elapsed_time": "4:08:52", "remaining_time": "1:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2641, "total_steps": 3836, "loss": 0.1575, "learning_rate": 1.2134723988274868e-06, "epoch": 0.688365425341283, "percentage": 68.85, "elapsed_time": "4:08:58", "remaining_time": "1:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2642, "total_steps": 3836, "loss": 0.1394, "learning_rate": 1.2116248556730151e-06, "epoch": 0.6886260710911283, "percentage": 68.87, "elapsed_time": "4:09:03", "remaining_time": "1:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2643, "total_steps": 3836, "loss": 0.1411, "learning_rate": 1.2097782701211511e-06, "epoch": 0.6888867168409735, "percentage": 68.9, "elapsed_time": "4:09:09", "remaining_time": "1:52:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2644, "total_steps": 3836, "loss": 0.1354, "learning_rate": 1.207932643544392e-06, "epoch": 0.6891473625908188, "percentage": 68.93, "elapsed_time": "4:09:15", "remaining_time": "1:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2645, "total_steps": 3836, "loss": 0.146, "learning_rate": 1.2060879773145282e-06, "epoch": 0.689408008340664, "percentage": 68.95, "elapsed_time": "4:09:20", "remaining_time": "1:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2646, "total_steps": 3836, "loss": 0.1471, "learning_rate": 1.2042442728026325e-06, "epoch": 0.6896686540905093, "percentage": 68.98, "elapsed_time": "4:09:25", "remaining_time": "1:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2647, "total_steps": 3836, "loss": 0.1468, "learning_rate": 1.2024015313790632e-06, "epoch": 0.6899292998403544, "percentage": 69.0, "elapsed_time": "4:09:31", "remaining_time": "1:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2648, "total_steps": 3836, "loss": 0.1397, "learning_rate": 1.200559754413464e-06, "epoch": 0.6901899455901997, "percentage": 69.03, "elapsed_time": "4:09:36", "remaining_time": "1:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2649, "total_steps": 3836, "loss": 0.1498, "learning_rate": 1.1987189432747604e-06, "epoch": 0.6904505913400449, "percentage": 69.06, "elapsed_time": "4:09:42", "remaining_time": "1:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 3836, "loss": 0.1377, "learning_rate": 1.1968790993311613e-06, "epoch": 0.6907112370898902, "percentage": 69.08, "elapsed_time": "4:09:47", "remaining_time": "1:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2651, "total_steps": 3836, "loss": 0.1342, "learning_rate": 1.1950402239501547e-06, "epoch": 0.6909718828397354, "percentage": 69.11, "elapsed_time": "4:09:52", "remaining_time": "1:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2652, "total_steps": 3836, "loss": 0.1335, "learning_rate": 1.193202318498512e-06, "epoch": 0.6912325285895807, "percentage": 69.13, "elapsed_time": "4:09:58", "remaining_time": "1:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2653, "total_steps": 3836, "loss": 0.1285, "learning_rate": 1.1913653843422813e-06, "epoch": 0.6914931743394259, "percentage": 69.16, "elapsed_time": "4:10:03", "remaining_time": "1:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2654, "total_steps": 3836, "loss": 0.1376, "learning_rate": 1.1895294228467886e-06, "epoch": 0.6917538200892712, "percentage": 69.19, "elapsed_time": "4:10:08", "remaining_time": "1:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2655, "total_steps": 3836, "loss": 0.1441, "learning_rate": 1.1876944353766382e-06, "epoch": 0.6920144658391164, "percentage": 69.21, "elapsed_time": "4:10:14", "remaining_time": "1:51:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2656, "total_steps": 3836, "loss": 0.144, "learning_rate": 1.1858604232957096e-06, "epoch": 0.6922751115889616, "percentage": 69.24, "elapsed_time": "4:10:20", "remaining_time": "1:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2657, "total_steps": 3836, "loss": 0.15, "learning_rate": 1.1840273879671576e-06, "epoch": 0.6925357573388069, "percentage": 69.26, "elapsed_time": "4:10:25", "remaining_time": "1:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2658, "total_steps": 3836, "loss": 0.1387, "learning_rate": 1.18219533075341e-06, "epoch": 0.6927964030886521, "percentage": 69.29, "elapsed_time": "4:10:31", "remaining_time": "1:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2659, "total_steps": 3836, "loss": 0.1477, "learning_rate": 1.1803642530161715e-06, "epoch": 0.6930570488384974, "percentage": 69.32, "elapsed_time": "4:10:36", "remaining_time": "1:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2660, "total_steps": 3836, "loss": 0.1524, "learning_rate": 1.1785341561164135e-06, "epoch": 0.6933176945883426, "percentage": 69.34, "elapsed_time": "4:10:42", "remaining_time": "1:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2661, "total_steps": 3836, "loss": 0.1378, "learning_rate": 1.1767050414143798e-06, "epoch": 0.6935783403381879, "percentage": 69.37, "elapsed_time": "4:10:47", "remaining_time": "1:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2662, "total_steps": 3836, "loss": 0.1376, "learning_rate": 1.1748769102695882e-06, "epoch": 0.6938389860880331, "percentage": 69.4, "elapsed_time": "4:10:53", "remaining_time": "1:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2663, "total_steps": 3836, "loss": 0.1466, "learning_rate": 1.1730497640408203e-06, "epoch": 0.6940996318378784, "percentage": 69.42, "elapsed_time": "4:10:58", "remaining_time": "1:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2664, "total_steps": 3836, "loss": 0.1439, "learning_rate": 1.1712236040861278e-06, "epoch": 0.6943602775877236, "percentage": 69.45, "elapsed_time": "4:11:03", "remaining_time": "1:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2665, "total_steps": 3836, "loss": 0.1472, "learning_rate": 1.1693984317628314e-06, "epoch": 0.6946209233375689, "percentage": 69.47, "elapsed_time": "4:11:09", "remaining_time": "1:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2666, "total_steps": 3836, "loss": 0.1306, "learning_rate": 1.1675742484275132e-06, "epoch": 0.694881569087414, "percentage": 69.5, "elapsed_time": "4:11:14", "remaining_time": "1:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2667, "total_steps": 3836, "loss": 0.1397, "learning_rate": 1.1657510554360224e-06, "epoch": 0.6951422148372594, "percentage": 69.53, "elapsed_time": "4:11:19", "remaining_time": "1:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2668, "total_steps": 3836, "loss": 0.1428, "learning_rate": 1.1639288541434745e-06, "epoch": 0.6954028605871045, "percentage": 69.55, "elapsed_time": "4:11:25", "remaining_time": "1:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2669, "total_steps": 3836, "loss": 0.1312, "learning_rate": 1.1621076459042447e-06, "epoch": 0.6956635063369498, "percentage": 69.58, "elapsed_time": "4:11:30", "remaining_time": "1:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2670, "total_steps": 3836, "loss": 0.1432, "learning_rate": 1.160287432071971e-06, "epoch": 0.695924152086795, "percentage": 69.6, "elapsed_time": "4:11:35", "remaining_time": "1:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2671, "total_steps": 3836, "loss": 0.1295, "learning_rate": 1.1584682139995527e-06, "epoch": 0.6961847978366402, "percentage": 69.63, "elapsed_time": "4:11:41", "remaining_time": "1:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2672, "total_steps": 3836, "loss": 0.1417, "learning_rate": 1.1566499930391484e-06, "epoch": 0.6964454435864855, "percentage": 69.66, "elapsed_time": "4:11:46", "remaining_time": "1:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2673, "total_steps": 3836, "loss": 0.135, "learning_rate": 1.1548327705421763e-06, "epoch": 0.6967060893363307, "percentage": 69.68, "elapsed_time": "4:11:51", "remaining_time": "1:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2674, "total_steps": 3836, "loss": 0.1408, "learning_rate": 1.153016547859311e-06, "epoch": 0.696966735086176, "percentage": 69.71, "elapsed_time": "4:11:56", "remaining_time": "1:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2675, "total_steps": 3836, "loss": 0.1448, "learning_rate": 1.1512013263404867e-06, "epoch": 0.6972273808360212, "percentage": 69.73, "elapsed_time": "4:12:02", "remaining_time": "1:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2676, "total_steps": 3836, "loss": 0.1438, "learning_rate": 1.1493871073348926e-06, "epoch": 0.6974880265858665, "percentage": 69.76, "elapsed_time": "4:12:08", "remaining_time": "1:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2677, "total_steps": 3836, "loss": 0.1457, "learning_rate": 1.1475738921909682e-06, "epoch": 0.6977486723357117, "percentage": 69.79, "elapsed_time": "4:12:13", "remaining_time": "1:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2678, "total_steps": 3836, "loss": 0.1465, "learning_rate": 1.1457616822564145e-06, "epoch": 0.698009318085557, "percentage": 69.81, "elapsed_time": "4:12:19", "remaining_time": "1:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2679, "total_steps": 3836, "loss": 0.1439, "learning_rate": 1.1439504788781797e-06, "epoch": 0.6982699638354022, "percentage": 69.84, "elapsed_time": "4:12:24", "remaining_time": "1:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2680, "total_steps": 3836, "loss": 0.149, "learning_rate": 1.1421402834024662e-06, "epoch": 0.6985306095852475, "percentage": 69.86, "elapsed_time": "4:12:30", "remaining_time": "1:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2681, "total_steps": 3836, "loss": 0.1429, "learning_rate": 1.1403310971747263e-06, "epoch": 0.6987912553350927, "percentage": 69.89, "elapsed_time": "4:12:35", "remaining_time": "1:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2682, "total_steps": 3836, "loss": 0.1509, "learning_rate": 1.1385229215396638e-06, "epoch": 0.699051901084938, "percentage": 69.92, "elapsed_time": "4:12:41", "remaining_time": "1:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2683, "total_steps": 3836, "loss": 0.1414, "learning_rate": 1.1367157578412288e-06, "epoch": 0.6993125468347832, "percentage": 69.94, "elapsed_time": "4:12:46", "remaining_time": "1:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2684, "total_steps": 3836, "loss": 0.1613, "learning_rate": 1.1349096074226205e-06, "epoch": 0.6995731925846285, "percentage": 69.97, "elapsed_time": "4:12:52", "remaining_time": "1:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2685, "total_steps": 3836, "loss": 0.1403, "learning_rate": 1.1331044716262869e-06, "epoch": 0.6998338383344737, "percentage": 69.99, "elapsed_time": "4:12:58", "remaining_time": "1:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2686, "total_steps": 3836, "loss": 0.1384, "learning_rate": 1.1313003517939189e-06, "epoch": 0.7000944840843188, "percentage": 70.02, "elapsed_time": "4:13:03", "remaining_time": "1:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2687, "total_steps": 3836, "loss": 0.1328, "learning_rate": 1.1294972492664537e-06, "epoch": 0.7003551298341641, "percentage": 70.05, "elapsed_time": "4:13:09", "remaining_time": "1:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2688, "total_steps": 3836, "loss": 0.1417, "learning_rate": 1.127695165384072e-06, "epoch": 0.7006157755840093, "percentage": 70.07, "elapsed_time": "4:13:15", "remaining_time": "1:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2689, "total_steps": 3836, "loss": 0.1427, "learning_rate": 1.125894101486198e-06, "epoch": 0.7008764213338546, "percentage": 70.1, "elapsed_time": "4:13:20", "remaining_time": "1:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2690, "total_steps": 3836, "loss": 0.1548, "learning_rate": 1.1240940589114953e-06, "epoch": 0.7011370670836998, "percentage": 70.13, "elapsed_time": "4:13:25", "remaining_time": "1:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2691, "total_steps": 3836, "loss": 0.1244, "learning_rate": 1.1222950389978735e-06, "epoch": 0.7013977128335451, "percentage": 70.15, "elapsed_time": "4:13:30", "remaining_time": "1:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2692, "total_steps": 3836, "loss": 0.1477, "learning_rate": 1.1204970430824782e-06, "epoch": 0.7016583585833903, "percentage": 70.18, "elapsed_time": "4:13:36", "remaining_time": "1:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2693, "total_steps": 3836, "loss": 0.1336, "learning_rate": 1.118700072501692e-06, "epoch": 0.7019190043332356, "percentage": 70.2, "elapsed_time": "4:13:41", "remaining_time": "1:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2694, "total_steps": 3836, "loss": 0.1515, "learning_rate": 1.1169041285911411e-06, "epoch": 0.7021796500830808, "percentage": 70.23, "elapsed_time": "4:13:46", "remaining_time": "1:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2695, "total_steps": 3836, "loss": 0.1483, "learning_rate": 1.1151092126856845e-06, "epoch": 0.7024402958329261, "percentage": 70.26, "elapsed_time": "4:13:53", "remaining_time": "1:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2696, "total_steps": 3836, "loss": 0.1487, "learning_rate": 1.113315326119418e-06, "epoch": 0.7027009415827713, "percentage": 70.28, "elapsed_time": "4:13:59", "remaining_time": "1:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2697, "total_steps": 3836, "loss": 0.1436, "learning_rate": 1.111522470225672e-06, "epoch": 0.7029615873326166, "percentage": 70.31, "elapsed_time": "4:14:04", "remaining_time": "1:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2698, "total_steps": 3836, "loss": 0.1477, "learning_rate": 1.1097306463370142e-06, "epoch": 0.7032222330824618, "percentage": 70.33, "elapsed_time": "4:14:09", "remaining_time": "1:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2699, "total_steps": 3836, "loss": 0.127, "learning_rate": 1.1079398557852392e-06, "epoch": 0.7034828788323071, "percentage": 70.36, "elapsed_time": "4:14:15", "remaining_time": "1:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 3836, "loss": 0.1387, "learning_rate": 1.1061500999013771e-06, "epoch": 0.7037435245821523, "percentage": 70.39, "elapsed_time": "4:14:19", "remaining_time": "1:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2701, "total_steps": 3836, "loss": 0.1517, "learning_rate": 1.1043613800156905e-06, "epoch": 0.7040041703319975, "percentage": 70.41, "elapsed_time": "4:14:25", "remaining_time": "1:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2702, "total_steps": 3836, "loss": 0.1282, "learning_rate": 1.1025736974576693e-06, "epoch": 0.7042648160818428, "percentage": 70.44, "elapsed_time": "4:14:30", "remaining_time": "1:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2703, "total_steps": 3836, "loss": 0.1364, "learning_rate": 1.1007870535560331e-06, "epoch": 0.704525461831688, "percentage": 70.46, "elapsed_time": "4:14:36", "remaining_time": "1:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2704, "total_steps": 3836, "loss": 0.1291, "learning_rate": 1.0990014496387296e-06, "epoch": 0.7047861075815333, "percentage": 70.49, "elapsed_time": "4:14:42", "remaining_time": "1:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2705, "total_steps": 3836, "loss": 0.1236, "learning_rate": 1.0972168870329337e-06, "epoch": 0.7050467533313785, "percentage": 70.52, "elapsed_time": "4:14:48", "remaining_time": "1:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2706, "total_steps": 3836, "loss": 0.1417, "learning_rate": 1.0954333670650461e-06, "epoch": 0.7053073990812238, "percentage": 70.54, "elapsed_time": "4:14:53", "remaining_time": "1:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2707, "total_steps": 3836, "loss": 0.126, "learning_rate": 1.0936508910606917e-06, "epoch": 0.7055680448310689, "percentage": 70.57, "elapsed_time": "4:14:58", "remaining_time": "1:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2708, "total_steps": 3836, "loss": 0.1521, "learning_rate": 1.0918694603447221e-06, "epoch": 0.7058286905809142, "percentage": 70.59, "elapsed_time": "4:15:04", "remaining_time": "1:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2709, "total_steps": 3836, "loss": 0.1506, "learning_rate": 1.0900890762412106e-06, "epoch": 0.7060893363307594, "percentage": 70.62, "elapsed_time": "4:15:10", "remaining_time": "1:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2710, "total_steps": 3836, "loss": 0.1398, "learning_rate": 1.0883097400734494e-06, "epoch": 0.7063499820806047, "percentage": 70.65, "elapsed_time": "4:15:15", "remaining_time": "1:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2711, "total_steps": 3836, "loss": 0.1431, "learning_rate": 1.086531453163957e-06, "epoch": 0.7066106278304499, "percentage": 70.67, "elapsed_time": "4:15:21", "remaining_time": "1:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2712, "total_steps": 3836, "loss": 0.1403, "learning_rate": 1.0847542168344695e-06, "epoch": 0.7068712735802952, "percentage": 70.7, "elapsed_time": "4:15:26", "remaining_time": "1:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2713, "total_steps": 3836, "loss": 0.148, "learning_rate": 1.0829780324059416e-06, "epoch": 0.7071319193301404, "percentage": 70.72, "elapsed_time": "4:15:31", "remaining_time": "1:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2714, "total_steps": 3836, "loss": 0.1387, "learning_rate": 1.0812029011985472e-06, "epoch": 0.7073925650799857, "percentage": 70.75, "elapsed_time": "4:15:36", "remaining_time": "1:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2715, "total_steps": 3836, "loss": 0.1553, "learning_rate": 1.0794288245316772e-06, "epoch": 0.7076532108298309, "percentage": 70.78, "elapsed_time": "4:15:42", "remaining_time": "1:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2716, "total_steps": 3836, "loss": 0.1416, "learning_rate": 1.0776558037239385e-06, "epoch": 0.7079138565796761, "percentage": 70.8, "elapsed_time": "4:15:48", "remaining_time": "1:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2717, "total_steps": 3836, "loss": 0.1318, "learning_rate": 1.0758838400931524e-06, "epoch": 0.7081745023295214, "percentage": 70.83, "elapsed_time": "4:15:53", "remaining_time": "1:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2718, "total_steps": 3836, "loss": 0.146, "learning_rate": 1.0741129349563567e-06, "epoch": 0.7084351480793666, "percentage": 70.86, "elapsed_time": "4:15:58", "remaining_time": "1:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2719, "total_steps": 3836, "loss": 0.1435, "learning_rate": 1.072343089629801e-06, "epoch": 0.7086957938292119, "percentage": 70.88, "elapsed_time": "4:16:03", "remaining_time": "1:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2720, "total_steps": 3836, "loss": 0.1523, "learning_rate": 1.0705743054289464e-06, "epoch": 0.7089564395790571, "percentage": 70.91, "elapsed_time": "4:16:09", "remaining_time": "1:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2721, "total_steps": 3836, "loss": 0.13, "learning_rate": 1.0688065836684666e-06, "epoch": 0.7092170853289024, "percentage": 70.93, "elapsed_time": "4:16:15", "remaining_time": "1:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2722, "total_steps": 3836, "loss": 0.1367, "learning_rate": 1.0670399256622455e-06, "epoch": 0.7094777310787476, "percentage": 70.96, "elapsed_time": "4:16:20", "remaining_time": "1:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2723, "total_steps": 3836, "loss": 0.1342, "learning_rate": 1.0652743327233744e-06, "epoch": 0.7097383768285929, "percentage": 70.99, "elapsed_time": "4:16:25", "remaining_time": "1:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2724, "total_steps": 3836, "loss": 0.1328, "learning_rate": 1.0635098061641572e-06, "epoch": 0.709999022578438, "percentage": 71.01, "elapsed_time": "4:16:31", "remaining_time": "1:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2725, "total_steps": 3836, "loss": 0.1447, "learning_rate": 1.061746347296102e-06, "epoch": 0.7102596683282834, "percentage": 71.04, "elapsed_time": "4:16:36", "remaining_time": "1:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2726, "total_steps": 3836, "loss": 0.1409, "learning_rate": 1.0599839574299217e-06, "epoch": 0.7105203140781285, "percentage": 71.06, "elapsed_time": "4:16:42", "remaining_time": "1:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2727, "total_steps": 3836, "loss": 0.1424, "learning_rate": 1.0582226378755391e-06, "epoch": 0.7107809598279738, "percentage": 71.09, "elapsed_time": "4:16:47", "remaining_time": "1:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2728, "total_steps": 3836, "loss": 0.1436, "learning_rate": 1.056462389942079e-06, "epoch": 0.711041605577819, "percentage": 71.12, "elapsed_time": "4:16:53", "remaining_time": "1:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2729, "total_steps": 3836, "loss": 0.1529, "learning_rate": 1.0547032149378694e-06, "epoch": 0.7113022513276643, "percentage": 71.14, "elapsed_time": "4:16:59", "remaining_time": "1:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2730, "total_steps": 3836, "loss": 0.1379, "learning_rate": 1.052945114170441e-06, "epoch": 0.7115628970775095, "percentage": 71.17, "elapsed_time": "4:17:05", "remaining_time": "1:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2731, "total_steps": 3836, "loss": 0.1488, "learning_rate": 1.0511880889465284e-06, "epoch": 0.7118235428273547, "percentage": 71.19, "elapsed_time": "4:17:10", "remaining_time": "1:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2732, "total_steps": 3836, "loss": 0.1406, "learning_rate": 1.0494321405720627e-06, "epoch": 0.7120841885772, "percentage": 71.22, "elapsed_time": "4:17:16", "remaining_time": "1:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2733, "total_steps": 3836, "loss": 0.138, "learning_rate": 1.047677270352177e-06, "epoch": 0.7123448343270452, "percentage": 71.25, "elapsed_time": "4:17:21", "remaining_time": "1:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2734, "total_steps": 3836, "loss": 0.1451, "learning_rate": 1.045923479591204e-06, "epoch": 0.7126054800768905, "percentage": 71.27, "elapsed_time": "4:17:27", "remaining_time": "1:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2735, "total_steps": 3836, "loss": 0.1452, "learning_rate": 1.0441707695926726e-06, "epoch": 0.7128661258267357, "percentage": 71.3, "elapsed_time": "4:17:33", "remaining_time": "1:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2736, "total_steps": 3836, "loss": 0.1297, "learning_rate": 1.042419141659308e-06, "epoch": 0.713126771576581, "percentage": 71.32, "elapsed_time": "4:17:38", "remaining_time": "1:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2737, "total_steps": 3836, "loss": 0.1255, "learning_rate": 1.0406685970930325e-06, "epoch": 0.7133874173264262, "percentage": 71.35, "elapsed_time": "4:17:44", "remaining_time": "1:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2738, "total_steps": 3836, "loss": 0.1425, "learning_rate": 1.038919137194962e-06, "epoch": 0.7136480630762715, "percentage": 71.38, "elapsed_time": "4:17:49", "remaining_time": "1:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2739, "total_steps": 3836, "loss": 0.1387, "learning_rate": 1.0371707632654071e-06, "epoch": 0.7139087088261167, "percentage": 71.4, "elapsed_time": "4:17:55", "remaining_time": "1:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2740, "total_steps": 3836, "loss": 0.1294, "learning_rate": 1.0354234766038696e-06, "epoch": 0.714169354575962, "percentage": 71.43, "elapsed_time": "4:18:00", "remaining_time": "1:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2741, "total_steps": 3836, "loss": 0.1364, "learning_rate": 1.0336772785090466e-06, "epoch": 0.7144300003258072, "percentage": 71.45, "elapsed_time": "4:18:06", "remaining_time": "1:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2742, "total_steps": 3836, "loss": 0.15, "learning_rate": 1.0319321702788234e-06, "epoch": 0.7146906460756525, "percentage": 71.48, "elapsed_time": "4:18:12", "remaining_time": "1:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2743, "total_steps": 3836, "loss": 0.1578, "learning_rate": 1.030188153210274e-06, "epoch": 0.7149512918254977, "percentage": 71.51, "elapsed_time": "4:18:17", "remaining_time": "1:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2744, "total_steps": 3836, "loss": 0.1494, "learning_rate": 1.028445228599665e-06, "epoch": 0.715211937575343, "percentage": 71.53, "elapsed_time": "4:18:23", "remaining_time": "1:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2745, "total_steps": 3836, "loss": 0.1367, "learning_rate": 1.0267033977424485e-06, "epoch": 0.7154725833251881, "percentage": 71.56, "elapsed_time": "4:18:29", "remaining_time": "1:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2746, "total_steps": 3836, "loss": 0.1368, "learning_rate": 1.0249626619332642e-06, "epoch": 0.7157332290750335, "percentage": 71.58, "elapsed_time": "4:18:35", "remaining_time": "1:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2747, "total_steps": 3836, "loss": 0.1464, "learning_rate": 1.0232230224659385e-06, "epoch": 0.7159938748248786, "percentage": 71.61, "elapsed_time": "4:18:40", "remaining_time": "1:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2748, "total_steps": 3836, "loss": 0.1398, "learning_rate": 1.0214844806334817e-06, "epoch": 0.7162545205747238, "percentage": 71.64, "elapsed_time": "4:18:45", "remaining_time": "1:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2749, "total_steps": 3836, "loss": 0.1328, "learning_rate": 1.0197470377280888e-06, "epoch": 0.7165151663245691, "percentage": 71.66, "elapsed_time": "4:18:51", "remaining_time": "1:42:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 3836, "loss": 0.1303, "learning_rate": 1.0180106950411397e-06, "epoch": 0.7167758120744143, "percentage": 71.69, "elapsed_time": "4:18:56", "remaining_time": "1:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2751, "total_steps": 3836, "loss": 0.1368, "learning_rate": 1.0162754538631945e-06, "epoch": 0.7170364578242596, "percentage": 71.72, "elapsed_time": "4:19:02", "remaining_time": "1:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2752, "total_steps": 3836, "loss": 0.14, "learning_rate": 1.0145413154839945e-06, "epoch": 0.7172971035741048, "percentage": 71.74, "elapsed_time": "4:19:08", "remaining_time": "1:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2753, "total_steps": 3836, "loss": 0.1381, "learning_rate": 1.0128082811924625e-06, "epoch": 0.7175577493239501, "percentage": 71.77, "elapsed_time": "4:19:13", "remaining_time": "1:41:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2754, "total_steps": 3836, "loss": 0.1447, "learning_rate": 1.0110763522767e-06, "epoch": 0.7178183950737953, "percentage": 71.79, "elapsed_time": "4:19:19", "remaining_time": "1:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2755, "total_steps": 3836, "loss": 0.1404, "learning_rate": 1.0093455300239871e-06, "epoch": 0.7180790408236406, "percentage": 71.82, "elapsed_time": "4:19:25", "remaining_time": "1:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2756, "total_steps": 3836, "loss": 0.1502, "learning_rate": 1.0076158157207801e-06, "epoch": 0.7183396865734858, "percentage": 71.85, "elapsed_time": "4:19:30", "remaining_time": "1:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2757, "total_steps": 3836, "loss": 0.1447, "learning_rate": 1.0058872106527157e-06, "epoch": 0.7186003323233311, "percentage": 71.87, "elapsed_time": "4:19:35", "remaining_time": "1:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2758, "total_steps": 3836, "loss": 0.1399, "learning_rate": 1.0041597161046025e-06, "epoch": 0.7188609780731763, "percentage": 71.9, "elapsed_time": "4:19:40", "remaining_time": "1:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2759, "total_steps": 3836, "loss": 0.1413, "learning_rate": 1.0024333333604225e-06, "epoch": 0.7191216238230216, "percentage": 71.92, "elapsed_time": "4:19:45", "remaining_time": "1:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2760, "total_steps": 3836, "loss": 0.1333, "learning_rate": 1.0007080637033359e-06, "epoch": 0.7193822695728668, "percentage": 71.95, "elapsed_time": "4:19:51", "remaining_time": "1:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2761, "total_steps": 3836, "loss": 0.1426, "learning_rate": 9.989839084156725e-07, "epoch": 0.7196429153227121, "percentage": 71.98, "elapsed_time": "4:19:57", "remaining_time": "1:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2762, "total_steps": 3836, "loss": 0.1345, "learning_rate": 9.972608687789346e-07, "epoch": 0.7199035610725573, "percentage": 72.0, "elapsed_time": "4:20:02", "remaining_time": "1:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2763, "total_steps": 3836, "loss": 0.1348, "learning_rate": 9.95538946073794e-07, "epoch": 0.7201642068224025, "percentage": 72.03, "elapsed_time": "4:20:08", "remaining_time": "1:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2764, "total_steps": 3836, "loss": 0.1404, "learning_rate": 9.938181415800966e-07, "epoch": 0.7204248525722478, "percentage": 72.05, "elapsed_time": "4:20:14", "remaining_time": "1:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2765, "total_steps": 3836, "loss": 0.1571, "learning_rate": 9.92098456576851e-07, "epoch": 0.7206854983220929, "percentage": 72.08, "elapsed_time": "4:20:20", "remaining_time": "1:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2766, "total_steps": 3836, "loss": 0.1332, "learning_rate": 9.903798923422369e-07, "epoch": 0.7209461440719382, "percentage": 72.11, "elapsed_time": "4:20:25", "remaining_time": "1:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2767, "total_steps": 3836, "loss": 0.1326, "learning_rate": 9.886624501536028e-07, "epoch": 0.7212067898217834, "percentage": 72.13, "elapsed_time": "4:20:31", "remaining_time": "1:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2768, "total_steps": 3836, "loss": 0.1542, "learning_rate": 9.869461312874603e-07, "epoch": 0.7214674355716287, "percentage": 72.16, "elapsed_time": "4:20:37", "remaining_time": "1:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2769, "total_steps": 3836, "loss": 0.1247, "learning_rate": 9.852309370194873e-07, "epoch": 0.7217280813214739, "percentage": 72.18, "elapsed_time": "4:20:42", "remaining_time": "1:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2770, "total_steps": 3836, "loss": 0.1231, "learning_rate": 9.835168686245252e-07, "epoch": 0.7219887270713192, "percentage": 72.21, "elapsed_time": "4:20:48", "remaining_time": "1:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2771, "total_steps": 3836, "loss": 0.1387, "learning_rate": 9.818039273765794e-07, "epoch": 0.7222493728211644, "percentage": 72.24, "elapsed_time": "4:20:54", "remaining_time": "1:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2772, "total_steps": 3836, "loss": 0.143, "learning_rate": 9.800921145488171e-07, "epoch": 0.7225100185710097, "percentage": 72.26, "elapsed_time": "4:21:00", "remaining_time": "1:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2773, "total_steps": 3836, "loss": 0.1429, "learning_rate": 9.783814314135656e-07, "epoch": 0.7227706643208549, "percentage": 72.29, "elapsed_time": "4:21:05", "remaining_time": "1:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2774, "total_steps": 3836, "loss": 0.1394, "learning_rate": 9.766718792423159e-07, "epoch": 0.7230313100707002, "percentage": 72.31, "elapsed_time": "4:21:10", "remaining_time": "1:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2775, "total_steps": 3836, "loss": 0.1454, "learning_rate": 9.749634593057159e-07, "epoch": 0.7232919558205454, "percentage": 72.34, "elapsed_time": "4:21:16", "remaining_time": "1:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2776, "total_steps": 3836, "loss": 0.1326, "learning_rate": 9.732561728735698e-07, "epoch": 0.7235526015703907, "percentage": 72.37, "elapsed_time": "4:21:21", "remaining_time": "1:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2777, "total_steps": 3836, "loss": 0.1374, "learning_rate": 9.715500212148444e-07, "epoch": 0.7238132473202359, "percentage": 72.39, "elapsed_time": "4:21:27", "remaining_time": "1:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2778, "total_steps": 3836, "loss": 0.1453, "learning_rate": 9.698450055976596e-07, "epoch": 0.7240738930700811, "percentage": 72.42, "elapsed_time": "4:21:33", "remaining_time": "1:39:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2779, "total_steps": 3836, "loss": 0.1497, "learning_rate": 9.681411272892913e-07, "epoch": 0.7243345388199264, "percentage": 72.45, "elapsed_time": "4:21:39", "remaining_time": "1:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2780, "total_steps": 3836, "loss": 0.1346, "learning_rate": 9.664383875561726e-07, "epoch": 0.7245951845697716, "percentage": 72.47, "elapsed_time": "4:21:45", "remaining_time": "1:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2781, "total_steps": 3836, "loss": 0.1588, "learning_rate": 9.647367876638858e-07, "epoch": 0.7248558303196169, "percentage": 72.5, "elapsed_time": "4:21:51", "remaining_time": "1:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2782, "total_steps": 3836, "loss": 0.1295, "learning_rate": 9.630363288771689e-07, "epoch": 0.7251164760694621, "percentage": 72.52, "elapsed_time": "4:21:56", "remaining_time": "1:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2783, "total_steps": 3836, "loss": 0.1405, "learning_rate": 9.613370124599124e-07, "epoch": 0.7253771218193074, "percentage": 72.55, "elapsed_time": "4:22:01", "remaining_time": "1:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2784, "total_steps": 3836, "loss": 0.1464, "learning_rate": 9.596388396751567e-07, "epoch": 0.7256377675691525, "percentage": 72.58, "elapsed_time": "4:22:07", "remaining_time": "1:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2785, "total_steps": 3836, "loss": 0.1295, "learning_rate": 9.579418117850915e-07, "epoch": 0.7258984133189978, "percentage": 72.6, "elapsed_time": "4:22:12", "remaining_time": "1:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2786, "total_steps": 3836, "loss": 0.1319, "learning_rate": 9.562459300510562e-07, "epoch": 0.726159059068843, "percentage": 72.63, "elapsed_time": "4:22:18", "remaining_time": "1:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2787, "total_steps": 3836, "loss": 0.1433, "learning_rate": 9.545511957335388e-07, "epoch": 0.7264197048186883, "percentage": 72.65, "elapsed_time": "4:22:23", "remaining_time": "1:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2788, "total_steps": 3836, "loss": 0.1332, "learning_rate": 9.528576100921736e-07, "epoch": 0.7266803505685335, "percentage": 72.68, "elapsed_time": "4:22:29", "remaining_time": "1:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2789, "total_steps": 3836, "loss": 0.1389, "learning_rate": 9.511651743857406e-07, "epoch": 0.7269409963183788, "percentage": 72.71, "elapsed_time": "4:22:34", "remaining_time": "1:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2790, "total_steps": 3836, "loss": 0.1332, "learning_rate": 9.494738898721681e-07, "epoch": 0.727201642068224, "percentage": 72.73, "elapsed_time": "4:22:40", "remaining_time": "1:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2791, "total_steps": 3836, "loss": 0.1355, "learning_rate": 9.477837578085261e-07, "epoch": 0.7274622878180693, "percentage": 72.76, "elapsed_time": "4:22:45", "remaining_time": "1:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2792, "total_steps": 3836, "loss": 0.148, "learning_rate": 9.460947794510264e-07, "epoch": 0.7277229335679145, "percentage": 72.78, "elapsed_time": "4:22:50", "remaining_time": "1:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2793, "total_steps": 3836, "loss": 0.1327, "learning_rate": 9.444069560550279e-07, "epoch": 0.7279835793177597, "percentage": 72.81, "elapsed_time": "4:22:55", "remaining_time": "1:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2794, "total_steps": 3836, "loss": 0.1359, "learning_rate": 9.427202888750278e-07, "epoch": 0.728244225067605, "percentage": 72.84, "elapsed_time": "4:23:01", "remaining_time": "1:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2795, "total_steps": 3836, "loss": 0.1412, "learning_rate": 9.410347791646648e-07, "epoch": 0.7285048708174502, "percentage": 72.86, "elapsed_time": "4:23:06", "remaining_time": "1:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2796, "total_steps": 3836, "loss": 0.1412, "learning_rate": 9.393504281767163e-07, "epoch": 0.7287655165672955, "percentage": 72.89, "elapsed_time": "4:23:12", "remaining_time": "1:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2797, "total_steps": 3836, "loss": 0.1406, "learning_rate": 9.376672371631021e-07, "epoch": 0.7290261623171407, "percentage": 72.91, "elapsed_time": "4:23:18", "remaining_time": "1:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2798, "total_steps": 3836, "loss": 0.1377, "learning_rate": 9.359852073748746e-07, "epoch": 0.729286808066986, "percentage": 72.94, "elapsed_time": "4:23:23", "remaining_time": "1:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2799, "total_steps": 3836, "loss": 0.1379, "learning_rate": 9.343043400622256e-07, "epoch": 0.7295474538168312, "percentage": 72.97, "elapsed_time": "4:23:28", "remaining_time": "1:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 3836, "loss": 0.1227, "learning_rate": 9.326246364744845e-07, "epoch": 0.7298080995666765, "percentage": 72.99, "elapsed_time": "4:23:34", "remaining_time": "1:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2801, "total_steps": 3836, "loss": 0.146, "learning_rate": 9.309460978601137e-07, "epoch": 0.7300687453165217, "percentage": 73.02, "elapsed_time": "4:23:40", "remaining_time": "1:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2802, "total_steps": 3836, "loss": 0.1295, "learning_rate": 9.292687254667096e-07, "epoch": 0.730329391066367, "percentage": 73.04, "elapsed_time": "4:23:46", "remaining_time": "1:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2803, "total_steps": 3836, "loss": 0.1513, "learning_rate": 9.27592520541003e-07, "epoch": 0.7305900368162122, "percentage": 73.07, "elapsed_time": "4:23:51", "remaining_time": "1:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2804, "total_steps": 3836, "loss": 0.1473, "learning_rate": 9.259174843288557e-07, "epoch": 0.7308506825660575, "percentage": 73.1, "elapsed_time": "4:23:57", "remaining_time": "1:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2805, "total_steps": 3836, "loss": 0.1441, "learning_rate": 9.242436180752623e-07, "epoch": 0.7311113283159026, "percentage": 73.12, "elapsed_time": "4:24:02", "remaining_time": "1:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2806, "total_steps": 3836, "loss": 0.1417, "learning_rate": 9.225709230243455e-07, "epoch": 0.7313719740657479, "percentage": 73.15, "elapsed_time": "4:24:08", "remaining_time": "1:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2807, "total_steps": 3836, "loss": 0.1242, "learning_rate": 9.208994004193605e-07, "epoch": 0.7316326198155931, "percentage": 73.18, "elapsed_time": "4:24:13", "remaining_time": "1:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2808, "total_steps": 3836, "loss": 0.1545, "learning_rate": 9.192290515026903e-07, "epoch": 0.7318932655654383, "percentage": 73.2, "elapsed_time": "4:24:19", "remaining_time": "1:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2809, "total_steps": 3836, "loss": 0.1358, "learning_rate": 9.175598775158417e-07, "epoch": 0.7321539113152836, "percentage": 73.23, "elapsed_time": "4:24:24", "remaining_time": "1:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2810, "total_steps": 3836, "loss": 0.1462, "learning_rate": 9.158918796994543e-07, "epoch": 0.7324145570651288, "percentage": 73.25, "elapsed_time": "4:24:30", "remaining_time": "1:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2811, "total_steps": 3836, "loss": 0.1402, "learning_rate": 9.142250592932891e-07, "epoch": 0.7326752028149741, "percentage": 73.28, "elapsed_time": "4:24:36", "remaining_time": "1:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2812, "total_steps": 3836, "loss": 0.1425, "learning_rate": 9.125594175362326e-07, "epoch": 0.7329358485648193, "percentage": 73.31, "elapsed_time": "4:24:41", "remaining_time": "1:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2813, "total_steps": 3836, "loss": 0.1547, "learning_rate": 9.108949556662991e-07, "epoch": 0.7331964943146646, "percentage": 73.33, "elapsed_time": "4:24:46", "remaining_time": "1:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2814, "total_steps": 3836, "loss": 0.1437, "learning_rate": 9.092316749206198e-07, "epoch": 0.7334571400645098, "percentage": 73.36, "elapsed_time": "4:24:52", "remaining_time": "1:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2815, "total_steps": 3836, "loss": 0.1386, "learning_rate": 9.075695765354511e-07, "epoch": 0.7337177858143551, "percentage": 73.38, "elapsed_time": "4:24:57", "remaining_time": "1:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2816, "total_steps": 3836, "loss": 0.138, "learning_rate": 9.059086617461723e-07, "epoch": 0.7339784315642003, "percentage": 73.41, "elapsed_time": "4:25:02", "remaining_time": "1:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2817, "total_steps": 3836, "loss": 0.1477, "learning_rate": 9.042489317872807e-07, "epoch": 0.7342390773140456, "percentage": 73.44, "elapsed_time": "4:25:07", "remaining_time": "1:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2818, "total_steps": 3836, "loss": 0.1492, "learning_rate": 9.025903878923934e-07, "epoch": 0.7344997230638908, "percentage": 73.46, "elapsed_time": "4:25:13", "remaining_time": "1:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2819, "total_steps": 3836, "loss": 0.129, "learning_rate": 9.009330312942455e-07, "epoch": 0.7347603688137361, "percentage": 73.49, "elapsed_time": "4:25:18", "remaining_time": "1:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2820, "total_steps": 3836, "loss": 0.1394, "learning_rate": 8.992768632246907e-07, "epoch": 0.7350210145635813, "percentage": 73.51, "elapsed_time": "4:25:23", "remaining_time": "1:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2821, "total_steps": 3836, "loss": 0.1383, "learning_rate": 8.976218849146987e-07, "epoch": 0.7352816603134266, "percentage": 73.54, "elapsed_time": "4:25:29", "remaining_time": "1:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2822, "total_steps": 3836, "loss": 0.1419, "learning_rate": 8.959680975943541e-07, "epoch": 0.7355423060632718, "percentage": 73.57, "elapsed_time": "4:25:34", "remaining_time": "1:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2823, "total_steps": 3836, "loss": 0.1498, "learning_rate": 8.943155024928588e-07, "epoch": 0.735802951813117, "percentage": 73.59, "elapsed_time": "4:25:40", "remaining_time": "1:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2824, "total_steps": 3836, "loss": 0.1177, "learning_rate": 8.926641008385268e-07, "epoch": 0.7360635975629622, "percentage": 73.62, "elapsed_time": "4:25:45", "remaining_time": "1:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2825, "total_steps": 3836, "loss": 0.1298, "learning_rate": 8.910138938587828e-07, "epoch": 0.7363242433128074, "percentage": 73.64, "elapsed_time": "4:25:50", "remaining_time": "1:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2826, "total_steps": 3836, "loss": 0.136, "learning_rate": 8.893648827801685e-07, "epoch": 0.7365848890626527, "percentage": 73.67, "elapsed_time": "4:25:56", "remaining_time": "1:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2827, "total_steps": 3836, "loss": 0.1438, "learning_rate": 8.877170688283332e-07, "epoch": 0.7368455348124979, "percentage": 73.7, "elapsed_time": "4:26:01", "remaining_time": "1:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2828, "total_steps": 3836, "loss": 0.1341, "learning_rate": 8.860704532280373e-07, "epoch": 0.7371061805623432, "percentage": 73.72, "elapsed_time": "4:26:06", "remaining_time": "1:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2829, "total_steps": 3836, "loss": 0.1482, "learning_rate": 8.844250372031504e-07, "epoch": 0.7373668263121884, "percentage": 73.75, "elapsed_time": "4:26:12", "remaining_time": "1:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2830, "total_steps": 3836, "loss": 0.1348, "learning_rate": 8.827808219766513e-07, "epoch": 0.7376274720620337, "percentage": 73.77, "elapsed_time": "4:26:17", "remaining_time": "1:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2831, "total_steps": 3836, "loss": 0.152, "learning_rate": 8.811378087706251e-07, "epoch": 0.7378881178118789, "percentage": 73.8, "elapsed_time": "4:26:22", "remaining_time": "1:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2832, "total_steps": 3836, "loss": 0.1396, "learning_rate": 8.794959988062632e-07, "epoch": 0.7381487635617242, "percentage": 73.83, "elapsed_time": "4:26:27", "remaining_time": "1:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2833, "total_steps": 3836, "loss": 0.1298, "learning_rate": 8.778553933038655e-07, "epoch": 0.7384094093115694, "percentage": 73.85, "elapsed_time": "4:26:33", "remaining_time": "1:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2834, "total_steps": 3836, "loss": 0.1397, "learning_rate": 8.762159934828337e-07, "epoch": 0.7386700550614147, "percentage": 73.88, "elapsed_time": "4:26:39", "remaining_time": "1:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2835, "total_steps": 3836, "loss": 0.155, "learning_rate": 8.745778005616745e-07, "epoch": 0.7389307008112599, "percentage": 73.91, "elapsed_time": "4:26:45", "remaining_time": "1:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2836, "total_steps": 3836, "loss": 0.1448, "learning_rate": 8.729408157579968e-07, "epoch": 0.7391913465611052, "percentage": 73.93, "elapsed_time": "4:26:50", "remaining_time": "1:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2837, "total_steps": 3836, "loss": 0.1364, "learning_rate": 8.713050402885129e-07, "epoch": 0.7394519923109504, "percentage": 73.96, "elapsed_time": "4:26:56", "remaining_time": "1:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2838, "total_steps": 3836, "loss": 0.1343, "learning_rate": 8.696704753690344e-07, "epoch": 0.7397126380607956, "percentage": 73.98, "elapsed_time": "4:27:01", "remaining_time": "1:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2839, "total_steps": 3836, "loss": 0.1354, "learning_rate": 8.680371222144757e-07, "epoch": 0.7399732838106409, "percentage": 74.01, "elapsed_time": "4:27:06", "remaining_time": "1:33:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2840, "total_steps": 3836, "loss": 0.1411, "learning_rate": 8.664049820388492e-07, "epoch": 0.7402339295604861, "percentage": 74.04, "elapsed_time": "4:27:12", "remaining_time": "1:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2841, "total_steps": 3836, "loss": 0.172, "learning_rate": 8.647740560552631e-07, "epoch": 0.7404945753103314, "percentage": 74.06, "elapsed_time": "4:27:18", "remaining_time": "1:33:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2842, "total_steps": 3836, "loss": 0.131, "learning_rate": 8.631443454759283e-07, "epoch": 0.7407552210601765, "percentage": 74.09, "elapsed_time": "4:27:23", "remaining_time": "1:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2843, "total_steps": 3836, "loss": 0.1333, "learning_rate": 8.615158515121486e-07, "epoch": 0.7410158668100219, "percentage": 74.11, "elapsed_time": "4:27:28", "remaining_time": "1:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2844, "total_steps": 3836, "loss": 0.1324, "learning_rate": 8.598885753743247e-07, "epoch": 0.741276512559867, "percentage": 74.14, "elapsed_time": "4:27:34", "remaining_time": "1:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2845, "total_steps": 3836, "loss": 0.1541, "learning_rate": 8.582625182719515e-07, "epoch": 0.7415371583097123, "percentage": 74.17, "elapsed_time": "4:27:39", "remaining_time": "1:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2846, "total_steps": 3836, "loss": 0.1274, "learning_rate": 8.566376814136201e-07, "epoch": 0.7417978040595575, "percentage": 74.19, "elapsed_time": "4:27:44", "remaining_time": "1:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2847, "total_steps": 3836, "loss": 0.1248, "learning_rate": 8.550140660070114e-07, "epoch": 0.7420584498094028, "percentage": 74.22, "elapsed_time": "4:27:50", "remaining_time": "1:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2848, "total_steps": 3836, "loss": 0.1359, "learning_rate": 8.533916732588996e-07, "epoch": 0.742319095559248, "percentage": 74.24, "elapsed_time": "4:27:55", "remaining_time": "1:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2849, "total_steps": 3836, "loss": 0.1349, "learning_rate": 8.517705043751517e-07, "epoch": 0.7425797413090933, "percentage": 74.27, "elapsed_time": "4:28:01", "remaining_time": "1:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 3836, "loss": 0.1381, "learning_rate": 8.501505605607236e-07, "epoch": 0.7428403870589385, "percentage": 74.3, "elapsed_time": "4:28:06", "remaining_time": "1:32:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2851, "total_steps": 3836, "loss": 0.1348, "learning_rate": 8.485318430196604e-07, "epoch": 0.7431010328087838, "percentage": 74.32, "elapsed_time": "4:28:12", "remaining_time": "1:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2852, "total_steps": 3836, "loss": 0.1483, "learning_rate": 8.469143529550968e-07, "epoch": 0.743361678558629, "percentage": 74.35, "elapsed_time": "4:28:18", "remaining_time": "1:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2853, "total_steps": 3836, "loss": 0.1444, "learning_rate": 8.452980915692544e-07, "epoch": 0.7436223243084742, "percentage": 74.37, "elapsed_time": "4:28:24", "remaining_time": "1:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2854, "total_steps": 3836, "loss": 0.1397, "learning_rate": 8.436830600634416e-07, "epoch": 0.7438829700583195, "percentage": 74.4, "elapsed_time": "4:28:30", "remaining_time": "1:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2855, "total_steps": 3836, "loss": 0.1344, "learning_rate": 8.420692596380523e-07, "epoch": 0.7441436158081647, "percentage": 74.43, "elapsed_time": "4:28:35", "remaining_time": "1:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2856, "total_steps": 3836, "loss": 0.1431, "learning_rate": 8.404566914925672e-07, "epoch": 0.74440426155801, "percentage": 74.45, "elapsed_time": "4:28:41", "remaining_time": "1:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2857, "total_steps": 3836, "loss": 0.1335, "learning_rate": 8.388453568255503e-07, "epoch": 0.7446649073078552, "percentage": 74.48, "elapsed_time": "4:28:47", "remaining_time": "1:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2858, "total_steps": 3836, "loss": 0.1374, "learning_rate": 8.372352568346453e-07, "epoch": 0.7449255530577005, "percentage": 74.5, "elapsed_time": "4:28:52", "remaining_time": "1:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2859, "total_steps": 3836, "loss": 0.1482, "learning_rate": 8.356263927165845e-07, "epoch": 0.7451861988075457, "percentage": 74.53, "elapsed_time": "4:28:58", "remaining_time": "1:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2860, "total_steps": 3836, "loss": 0.1346, "learning_rate": 8.340187656671767e-07, "epoch": 0.745446844557391, "percentage": 74.56, "elapsed_time": "4:29:03", "remaining_time": "1:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2861, "total_steps": 3836, "loss": 0.1445, "learning_rate": 8.324123768813133e-07, "epoch": 0.7457074903072362, "percentage": 74.58, "elapsed_time": "4:29:08", "remaining_time": "1:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2862, "total_steps": 3836, "loss": 0.1324, "learning_rate": 8.308072275529652e-07, "epoch": 0.7459681360570815, "percentage": 74.61, "elapsed_time": "4:29:13", "remaining_time": "1:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2863, "total_steps": 3836, "loss": 0.1421, "learning_rate": 8.29203318875181e-07, "epoch": 0.7462287818069266, "percentage": 74.64, "elapsed_time": "4:29:19", "remaining_time": "1:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2864, "total_steps": 3836, "loss": 0.1441, "learning_rate": 8.27600652040089e-07, "epoch": 0.746489427556772, "percentage": 74.66, "elapsed_time": "4:29:24", "remaining_time": "1:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2865, "total_steps": 3836, "loss": 0.1458, "learning_rate": 8.259992282388917e-07, "epoch": 0.7467500733066171, "percentage": 74.69, "elapsed_time": "4:29:30", "remaining_time": "1:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2866, "total_steps": 3836, "loss": 0.1407, "learning_rate": 8.243990486618717e-07, "epoch": 0.7470107190564624, "percentage": 74.71, "elapsed_time": "4:29:36", "remaining_time": "1:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2867, "total_steps": 3836, "loss": 0.1478, "learning_rate": 8.228001144983833e-07, "epoch": 0.7472713648063076, "percentage": 74.74, "elapsed_time": "4:29:41", "remaining_time": "1:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2868, "total_steps": 3836, "loss": 0.1354, "learning_rate": 8.212024269368565e-07, "epoch": 0.7475320105561528, "percentage": 74.77, "elapsed_time": "4:29:47", "remaining_time": "1:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2869, "total_steps": 3836, "loss": 0.1414, "learning_rate": 8.196059871647949e-07, "epoch": 0.7477926563059981, "percentage": 74.79, "elapsed_time": "4:29:53", "remaining_time": "1:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2870, "total_steps": 3836, "loss": 0.1513, "learning_rate": 8.180107963687741e-07, "epoch": 0.7480533020558433, "percentage": 74.82, "elapsed_time": "4:29:59", "remaining_time": "1:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2871, "total_steps": 3836, "loss": 0.1496, "learning_rate": 8.164168557344413e-07, "epoch": 0.7483139478056886, "percentage": 74.84, "elapsed_time": "4:30:05", "remaining_time": "1:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2872, "total_steps": 3836, "loss": 0.1435, "learning_rate": 8.148241664465157e-07, "epoch": 0.7485745935555338, "percentage": 74.87, "elapsed_time": "4:30:10", "remaining_time": "1:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2873, "total_steps": 3836, "loss": 0.1265, "learning_rate": 8.132327296887863e-07, "epoch": 0.7488352393053791, "percentage": 74.9, "elapsed_time": "4:30:16", "remaining_time": "1:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2874, "total_steps": 3836, "loss": 0.1353, "learning_rate": 8.116425466441077e-07, "epoch": 0.7490958850552243, "percentage": 74.92, "elapsed_time": "4:30:21", "remaining_time": "1:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2875, "total_steps": 3836, "loss": 0.1359, "learning_rate": 8.100536184944077e-07, "epoch": 0.7493565308050696, "percentage": 74.95, "elapsed_time": "4:30:26", "remaining_time": "1:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2876, "total_steps": 3836, "loss": 0.1255, "learning_rate": 8.084659464206787e-07, "epoch": 0.7496171765549148, "percentage": 74.97, "elapsed_time": "4:30:32", "remaining_time": "1:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2877, "total_steps": 3836, "loss": 0.1507, "learning_rate": 8.068795316029796e-07, "epoch": 0.7498778223047601, "percentage": 75.0, "elapsed_time": "4:30:38", "remaining_time": "1:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2878, "total_steps": 3836, "loss": 0.1337, "learning_rate": 8.052943752204339e-07, "epoch": 0.7501384680546053, "percentage": 75.03, "elapsed_time": "4:30:43", "remaining_time": "1:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2879, "total_steps": 3836, "loss": 0.1436, "learning_rate": 8.037104784512343e-07, "epoch": 0.7503991138044506, "percentage": 75.05, "elapsed_time": "4:30:49", "remaining_time": "1:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2880, "total_steps": 3836, "loss": 0.1274, "learning_rate": 8.021278424726308e-07, "epoch": 0.7506597595542958, "percentage": 75.08, "elapsed_time": "4:30:54", "remaining_time": "1:29:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2881, "total_steps": 3836, "loss": 0.1473, "learning_rate": 8.005464684609399e-07, "epoch": 0.7509204053041411, "percentage": 75.1, "elapsed_time": "4:31:00", "remaining_time": "1:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2882, "total_steps": 3836, "loss": 0.1267, "learning_rate": 7.989663575915407e-07, "epoch": 0.7511810510539862, "percentage": 75.13, "elapsed_time": "4:31:05", "remaining_time": "1:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2883, "total_steps": 3836, "loss": 0.1431, "learning_rate": 7.97387511038872e-07, "epoch": 0.7514416968038314, "percentage": 75.16, "elapsed_time": "4:31:11", "remaining_time": "1:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2884, "total_steps": 3836, "loss": 0.1427, "learning_rate": 7.958099299764332e-07, "epoch": 0.7517023425536767, "percentage": 75.18, "elapsed_time": "4:31:16", "remaining_time": "1:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2885, "total_steps": 3836, "loss": 0.1312, "learning_rate": 7.942336155767833e-07, "epoch": 0.7519629883035219, "percentage": 75.21, "elapsed_time": "4:31:22", "remaining_time": "1:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2886, "total_steps": 3836, "loss": 0.1388, "learning_rate": 7.926585690115396e-07, "epoch": 0.7522236340533672, "percentage": 75.23, "elapsed_time": "4:31:27", "remaining_time": "1:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2887, "total_steps": 3836, "loss": 0.1484, "learning_rate": 7.910847914513772e-07, "epoch": 0.7524842798032124, "percentage": 75.26, "elapsed_time": "4:31:33", "remaining_time": "1:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2888, "total_steps": 3836, "loss": 0.1422, "learning_rate": 7.895122840660272e-07, "epoch": 0.7527449255530577, "percentage": 75.29, "elapsed_time": "4:31:39", "remaining_time": "1:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2889, "total_steps": 3836, "loss": 0.1288, "learning_rate": 7.879410480242791e-07, "epoch": 0.7530055713029029, "percentage": 75.31, "elapsed_time": "4:31:44", "remaining_time": "1:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2890, "total_steps": 3836, "loss": 0.1261, "learning_rate": 7.863710844939759e-07, "epoch": 0.7532662170527482, "percentage": 75.34, "elapsed_time": "4:31:50", "remaining_time": "1:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2891, "total_steps": 3836, "loss": 0.1453, "learning_rate": 7.848023946420119e-07, "epoch": 0.7535268628025934, "percentage": 75.36, "elapsed_time": "4:31:56", "remaining_time": "1:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2892, "total_steps": 3836, "loss": 0.1455, "learning_rate": 7.8323497963434e-07, "epoch": 0.7537875085524387, "percentage": 75.39, "elapsed_time": "4:32:01", "remaining_time": "1:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2893, "total_steps": 3836, "loss": 0.1389, "learning_rate": 7.816688406359624e-07, "epoch": 0.7540481543022839, "percentage": 75.42, "elapsed_time": "4:32:07", "remaining_time": "1:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2894, "total_steps": 3836, "loss": 0.142, "learning_rate": 7.801039788109332e-07, "epoch": 0.7543088000521292, "percentage": 75.44, "elapsed_time": "4:32:12", "remaining_time": "1:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2895, "total_steps": 3836, "loss": 0.1289, "learning_rate": 7.78540395322358e-07, "epoch": 0.7545694458019744, "percentage": 75.47, "elapsed_time": "4:32:18", "remaining_time": "1:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2896, "total_steps": 3836, "loss": 0.1329, "learning_rate": 7.769780913323916e-07, "epoch": 0.7548300915518197, "percentage": 75.5, "elapsed_time": "4:32:24", "remaining_time": "1:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2897, "total_steps": 3836, "loss": 0.1283, "learning_rate": 7.754170680022369e-07, "epoch": 0.7550907373016649, "percentage": 75.52, "elapsed_time": "4:32:29", "remaining_time": "1:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2898, "total_steps": 3836, "loss": 0.1342, "learning_rate": 7.738573264921481e-07, "epoch": 0.7553513830515101, "percentage": 75.55, "elapsed_time": "4:32:34", "remaining_time": "1:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2899, "total_steps": 3836, "loss": 0.1391, "learning_rate": 7.722988679614238e-07, "epoch": 0.7556120288013554, "percentage": 75.57, "elapsed_time": "4:32:39", "remaining_time": "1:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 3836, "loss": 0.1475, "learning_rate": 7.707416935684092e-07, "epoch": 0.7558726745512006, "percentage": 75.6, "elapsed_time": "4:32:45", "remaining_time": "1:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2901, "total_steps": 3836, "loss": 0.1356, "learning_rate": 7.691858044704964e-07, "epoch": 0.7561333203010459, "percentage": 75.63, "elapsed_time": "4:32:51", "remaining_time": "1:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2902, "total_steps": 3836, "loss": 0.1396, "learning_rate": 7.676312018241211e-07, "epoch": 0.756393966050891, "percentage": 75.65, "elapsed_time": "4:32:57", "remaining_time": "1:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2903, "total_steps": 3836, "loss": 0.1297, "learning_rate": 7.660778867847632e-07, "epoch": 0.7566546118007363, "percentage": 75.68, "elapsed_time": "4:33:02", "remaining_time": "1:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2904, "total_steps": 3836, "loss": 0.1338, "learning_rate": 7.645258605069444e-07, "epoch": 0.7569152575505815, "percentage": 75.7, "elapsed_time": "4:33:08", "remaining_time": "1:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2905, "total_steps": 3836, "loss": 0.1499, "learning_rate": 7.62975124144232e-07, "epoch": 0.7571759033004268, "percentage": 75.73, "elapsed_time": "4:33:14", "remaining_time": "1:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2906, "total_steps": 3836, "loss": 0.1391, "learning_rate": 7.614256788492316e-07, "epoch": 0.757436549050272, "percentage": 75.76, "elapsed_time": "4:33:20", "remaining_time": "1:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2907, "total_steps": 3836, "loss": 0.1338, "learning_rate": 7.598775257735877e-07, "epoch": 0.7576971948001173, "percentage": 75.78, "elapsed_time": "4:33:26", "remaining_time": "1:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2908, "total_steps": 3836, "loss": 0.1453, "learning_rate": 7.583306660679888e-07, "epoch": 0.7579578405499625, "percentage": 75.81, "elapsed_time": "4:33:31", "remaining_time": "1:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2909, "total_steps": 3836, "loss": 0.147, "learning_rate": 7.567851008821586e-07, "epoch": 0.7582184862998078, "percentage": 75.83, "elapsed_time": "4:33:37", "remaining_time": "1:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2910, "total_steps": 3836, "loss": 0.1426, "learning_rate": 7.552408313648602e-07, "epoch": 0.758479132049653, "percentage": 75.86, "elapsed_time": "4:33:42", "remaining_time": "1:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2911, "total_steps": 3836, "loss": 0.1375, "learning_rate": 7.536978586638921e-07, "epoch": 0.7587397777994983, "percentage": 75.89, "elapsed_time": "4:33:48", "remaining_time": "1:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2912, "total_steps": 3836, "loss": 0.1493, "learning_rate": 7.521561839260927e-07, "epoch": 0.7590004235493435, "percentage": 75.91, "elapsed_time": "4:33:54", "remaining_time": "1:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2913, "total_steps": 3836, "loss": 0.1268, "learning_rate": 7.506158082973305e-07, "epoch": 0.7592610692991888, "percentage": 75.94, "elapsed_time": "4:33:59", "remaining_time": "1:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2914, "total_steps": 3836, "loss": 0.138, "learning_rate": 7.49076732922511e-07, "epoch": 0.759521715049034, "percentage": 75.96, "elapsed_time": "4:34:05", "remaining_time": "1:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2915, "total_steps": 3836, "loss": 0.1367, "learning_rate": 7.475389589455748e-07, "epoch": 0.7597823607988792, "percentage": 75.99, "elapsed_time": "4:34:10", "remaining_time": "1:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2916, "total_steps": 3836, "loss": 0.1608, "learning_rate": 7.460024875094926e-07, "epoch": 0.7600430065487245, "percentage": 76.02, "elapsed_time": "4:34:16", "remaining_time": "1:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2917, "total_steps": 3836, "loss": 0.1399, "learning_rate": 7.444673197562682e-07, "epoch": 0.7603036522985697, "percentage": 76.04, "elapsed_time": "4:34:23", "remaining_time": "1:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2918, "total_steps": 3836, "loss": 0.1462, "learning_rate": 7.429334568269364e-07, "epoch": 0.760564298048415, "percentage": 76.07, "elapsed_time": "4:34:27", "remaining_time": "1:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2919, "total_steps": 3836, "loss": 0.1413, "learning_rate": 7.414008998615619e-07, "epoch": 0.7608249437982602, "percentage": 76.09, "elapsed_time": "4:34:34", "remaining_time": "1:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2920, "total_steps": 3836, "loss": 0.1336, "learning_rate": 7.398696499992386e-07, "epoch": 0.7610855895481055, "percentage": 76.12, "elapsed_time": "4:34:39", "remaining_time": "1:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2921, "total_steps": 3836, "loss": 0.1428, "learning_rate": 7.383397083780882e-07, "epoch": 0.7613462352979506, "percentage": 76.15, "elapsed_time": "4:34:45", "remaining_time": "1:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2922, "total_steps": 3836, "loss": 0.1306, "learning_rate": 7.368110761352631e-07, "epoch": 0.761606881047796, "percentage": 76.17, "elapsed_time": "4:34:50", "remaining_time": "1:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2923, "total_steps": 3836, "loss": 0.1463, "learning_rate": 7.3528375440694e-07, "epoch": 0.7618675267976411, "percentage": 76.2, "elapsed_time": "4:34:55", "remaining_time": "1:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2924, "total_steps": 3836, "loss": 0.1488, "learning_rate": 7.337577443283192e-07, "epoch": 0.7621281725474864, "percentage": 76.23, "elapsed_time": "4:35:01", "remaining_time": "1:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2925, "total_steps": 3836, "loss": 0.1495, "learning_rate": 7.322330470336314e-07, "epoch": 0.7623888182973316, "percentage": 76.25, "elapsed_time": "4:35:06", "remaining_time": "1:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2926, "total_steps": 3836, "loss": 0.1335, "learning_rate": 7.307096636561281e-07, "epoch": 0.7626494640471769, "percentage": 76.28, "elapsed_time": "4:35:12", "remaining_time": "1:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2927, "total_steps": 3836, "loss": 0.1353, "learning_rate": 7.291875953280842e-07, "epoch": 0.7629101097970221, "percentage": 76.3, "elapsed_time": "4:35:17", "remaining_time": "1:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2928, "total_steps": 3836, "loss": 0.1416, "learning_rate": 7.276668431808004e-07, "epoch": 0.7631707555468674, "percentage": 76.33, "elapsed_time": "4:35:23", "remaining_time": "1:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2929, "total_steps": 3836, "loss": 0.1351, "learning_rate": 7.261474083445941e-07, "epoch": 0.7634314012967126, "percentage": 76.36, "elapsed_time": "4:35:28", "remaining_time": "1:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2930, "total_steps": 3836, "loss": 0.1398, "learning_rate": 7.246292919488068e-07, "epoch": 0.7636920470465578, "percentage": 76.38, "elapsed_time": "4:35:34", "remaining_time": "1:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2931, "total_steps": 3836, "loss": 0.1519, "learning_rate": 7.231124951218002e-07, "epoch": 0.7639526927964031, "percentage": 76.41, "elapsed_time": "4:35:39", "remaining_time": "1:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2932, "total_steps": 3836, "loss": 0.1298, "learning_rate": 7.215970189909546e-07, "epoch": 0.7642133385462483, "percentage": 76.43, "elapsed_time": "4:35:45", "remaining_time": "1:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2933, "total_steps": 3836, "loss": 0.1313, "learning_rate": 7.20082864682668e-07, "epoch": 0.7644739842960936, "percentage": 76.46, "elapsed_time": "4:35:50", "remaining_time": "1:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2934, "total_steps": 3836, "loss": 0.161, "learning_rate": 7.185700333223564e-07, "epoch": 0.7647346300459388, "percentage": 76.49, "elapsed_time": "4:35:56", "remaining_time": "1:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2935, "total_steps": 3836, "loss": 0.1359, "learning_rate": 7.170585260344528e-07, "epoch": 0.7649952757957841, "percentage": 76.51, "elapsed_time": "4:36:01", "remaining_time": "1:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2936, "total_steps": 3836, "loss": 0.1419, "learning_rate": 7.155483439424058e-07, "epoch": 0.7652559215456293, "percentage": 76.54, "elapsed_time": "4:36:07", "remaining_time": "1:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2937, "total_steps": 3836, "loss": 0.1484, "learning_rate": 7.140394881686785e-07, "epoch": 0.7655165672954746, "percentage": 76.56, "elapsed_time": "4:36:13", "remaining_time": "1:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2938, "total_steps": 3836, "loss": 0.1309, "learning_rate": 7.1253195983475e-07, "epoch": 0.7657772130453198, "percentage": 76.59, "elapsed_time": "4:36:18", "remaining_time": "1:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2939, "total_steps": 3836, "loss": 0.1432, "learning_rate": 7.110257600611117e-07, "epoch": 0.7660378587951651, "percentage": 76.62, "elapsed_time": "4:36:24", "remaining_time": "1:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2940, "total_steps": 3836, "loss": 0.1326, "learning_rate": 7.09520889967265e-07, "epoch": 0.7662985045450103, "percentage": 76.64, "elapsed_time": "4:36:30", "remaining_time": "1:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2941, "total_steps": 3836, "loss": 0.1479, "learning_rate": 7.08017350671728e-07, "epoch": 0.7665591502948556, "percentage": 76.67, "elapsed_time": "4:36:35", "remaining_time": "1:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2942, "total_steps": 3836, "loss": 0.1469, "learning_rate": 7.065151432920258e-07, "epoch": 0.7668197960447007, "percentage": 76.69, "elapsed_time": "4:36:40", "remaining_time": "1:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2943, "total_steps": 3836, "loss": 0.1377, "learning_rate": 7.050142689446951e-07, "epoch": 0.767080441794546, "percentage": 76.72, "elapsed_time": "4:36:47", "remaining_time": "1:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2944, "total_steps": 3836, "loss": 0.135, "learning_rate": 7.035147287452803e-07, "epoch": 0.7673410875443912, "percentage": 76.75, "elapsed_time": "4:36:53", "remaining_time": "1:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2945, "total_steps": 3836, "loss": 0.1311, "learning_rate": 7.020165238083382e-07, "epoch": 0.7676017332942364, "percentage": 76.77, "elapsed_time": "4:36:58", "remaining_time": "1:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2946, "total_steps": 3836, "loss": 0.1272, "learning_rate": 7.005196552474275e-07, "epoch": 0.7678623790440817, "percentage": 76.8, "elapsed_time": "4:37:04", "remaining_time": "1:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2947, "total_steps": 3836, "loss": 0.139, "learning_rate": 6.990241241751167e-07, "epoch": 0.7681230247939269, "percentage": 76.82, "elapsed_time": "4:37:09", "remaining_time": "1:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2948, "total_steps": 3836, "loss": 0.1342, "learning_rate": 6.975299317029813e-07, "epoch": 0.7683836705437722, "percentage": 76.85, "elapsed_time": "4:37:15", "remaining_time": "1:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2949, "total_steps": 3836, "loss": 0.1437, "learning_rate": 6.960370789415999e-07, "epoch": 0.7686443162936174, "percentage": 76.88, "elapsed_time": "4:37:20", "remaining_time": "1:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 3836, "loss": 0.1487, "learning_rate": 6.945455670005558e-07, "epoch": 0.7689049620434627, "percentage": 76.9, "elapsed_time": "4:37:26", "remaining_time": "1:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2951, "total_steps": 3836, "loss": 0.1391, "learning_rate": 6.930553969884354e-07, "epoch": 0.7691656077933079, "percentage": 76.93, "elapsed_time": "4:37:31", "remaining_time": "1:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2952, "total_steps": 3836, "loss": 0.1342, "learning_rate": 6.915665700128291e-07, "epoch": 0.7694262535431532, "percentage": 76.96, "elapsed_time": "4:37:37", "remaining_time": "1:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2953, "total_steps": 3836, "loss": 0.1503, "learning_rate": 6.900790871803273e-07, "epoch": 0.7696868992929984, "percentage": 76.98, "elapsed_time": "4:37:43", "remaining_time": "1:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2954, "total_steps": 3836, "loss": 0.135, "learning_rate": 6.885929495965216e-07, "epoch": 0.7699475450428437, "percentage": 77.01, "elapsed_time": "4:37:49", "remaining_time": "1:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2955, "total_steps": 3836, "loss": 0.128, "learning_rate": 6.871081583660058e-07, "epoch": 0.7702081907926889, "percentage": 77.03, "elapsed_time": "4:37:55", "remaining_time": "1:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2956, "total_steps": 3836, "loss": 0.1384, "learning_rate": 6.856247145923708e-07, "epoch": 0.7704688365425342, "percentage": 77.06, "elapsed_time": "4:37:59", "remaining_time": "1:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2957, "total_steps": 3836, "loss": 0.1363, "learning_rate": 6.841426193782066e-07, "epoch": 0.7707294822923794, "percentage": 77.09, "elapsed_time": "4:38:05", "remaining_time": "1:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2958, "total_steps": 3836, "loss": 0.1312, "learning_rate": 6.82661873825101e-07, "epoch": 0.7709901280422247, "percentage": 77.11, "elapsed_time": "4:38:10", "remaining_time": "1:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2959, "total_steps": 3836, "loss": 0.1372, "learning_rate": 6.811824790336382e-07, "epoch": 0.7712507737920699, "percentage": 77.14, "elapsed_time": "4:38:15", "remaining_time": "1:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2960, "total_steps": 3836, "loss": 0.1406, "learning_rate": 6.797044361033986e-07, "epoch": 0.771511419541915, "percentage": 77.16, "elapsed_time": "4:38:21", "remaining_time": "1:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2961, "total_steps": 3836, "loss": 0.1346, "learning_rate": 6.7822774613296e-07, "epoch": 0.7717720652917603, "percentage": 77.19, "elapsed_time": "4:38:26", "remaining_time": "1:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2962, "total_steps": 3836, "loss": 0.1347, "learning_rate": 6.767524102198903e-07, "epoch": 0.7720327110416055, "percentage": 77.22, "elapsed_time": "4:38:31", "remaining_time": "1:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2963, "total_steps": 3836, "loss": 0.1215, "learning_rate": 6.752784294607531e-07, "epoch": 0.7722933567914508, "percentage": 77.24, "elapsed_time": "4:38:36", "remaining_time": "1:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2964, "total_steps": 3836, "loss": 0.1526, "learning_rate": 6.738058049511067e-07, "epoch": 0.772554002541296, "percentage": 77.27, "elapsed_time": "4:38:42", "remaining_time": "1:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2965, "total_steps": 3836, "loss": 0.1367, "learning_rate": 6.72334537785499e-07, "epoch": 0.7728146482911413, "percentage": 77.29, "elapsed_time": "4:38:47", "remaining_time": "1:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2966, "total_steps": 3836, "loss": 0.139, "learning_rate": 6.708646290574694e-07, "epoch": 0.7730752940409865, "percentage": 77.32, "elapsed_time": "4:38:53", "remaining_time": "1:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2967, "total_steps": 3836, "loss": 0.1566, "learning_rate": 6.693960798595478e-07, "epoch": 0.7733359397908318, "percentage": 77.35, "elapsed_time": "4:38:59", "remaining_time": "1:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2968, "total_steps": 3836, "loss": 0.1279, "learning_rate": 6.679288912832538e-07, "epoch": 0.773596585540677, "percentage": 77.37, "elapsed_time": "4:39:05", "remaining_time": "1:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2969, "total_steps": 3836, "loss": 0.1416, "learning_rate": 6.664630644190953e-07, "epoch": 0.7738572312905223, "percentage": 77.4, "elapsed_time": "4:39:11", "remaining_time": "1:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2970, "total_steps": 3836, "loss": 0.1404, "learning_rate": 6.649986003565678e-07, "epoch": 0.7741178770403675, "percentage": 77.42, "elapsed_time": "4:39:17", "remaining_time": "1:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2971, "total_steps": 3836, "loss": 0.1327, "learning_rate": 6.635355001841559e-07, "epoch": 0.7743785227902128, "percentage": 77.45, "elapsed_time": "4:39:23", "remaining_time": "1:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2972, "total_steps": 3836, "loss": 0.1429, "learning_rate": 6.620737649893291e-07, "epoch": 0.774639168540058, "percentage": 77.48, "elapsed_time": "4:39:28", "remaining_time": "1:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2973, "total_steps": 3836, "loss": 0.1428, "learning_rate": 6.606133958585401e-07, "epoch": 0.7748998142899033, "percentage": 77.5, "elapsed_time": "4:39:34", "remaining_time": "1:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2974, "total_steps": 3836, "loss": 0.1421, "learning_rate": 6.591543938772302e-07, "epoch": 0.7751604600397485, "percentage": 77.53, "elapsed_time": "4:39:39", "remaining_time": "1:21:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2975, "total_steps": 3836, "loss": 0.1387, "learning_rate": 6.576967601298223e-07, "epoch": 0.7754211057895937, "percentage": 77.55, "elapsed_time": "4:39:44", "remaining_time": "1:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2976, "total_steps": 3836, "loss": 0.1407, "learning_rate": 6.562404956997229e-07, "epoch": 0.775681751539439, "percentage": 77.58, "elapsed_time": "4:39:50", "remaining_time": "1:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2977, "total_steps": 3836, "loss": 0.1389, "learning_rate": 6.547856016693193e-07, "epoch": 0.7759423972892842, "percentage": 77.61, "elapsed_time": "4:39:56", "remaining_time": "1:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2978, "total_steps": 3836, "loss": 0.1288, "learning_rate": 6.533320791199848e-07, "epoch": 0.7762030430391295, "percentage": 77.63, "elapsed_time": "4:40:02", "remaining_time": "1:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2979, "total_steps": 3836, "loss": 0.1203, "learning_rate": 6.518799291320671e-07, "epoch": 0.7764636887889746, "percentage": 77.66, "elapsed_time": "4:40:07", "remaining_time": "1:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2980, "total_steps": 3836, "loss": 0.1325, "learning_rate": 6.504291527848972e-07, "epoch": 0.77672433453882, "percentage": 77.69, "elapsed_time": "4:40:12", "remaining_time": "1:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2981, "total_steps": 3836, "loss": 0.1604, "learning_rate": 6.489797511567856e-07, "epoch": 0.7769849802886651, "percentage": 77.71, "elapsed_time": "4:40:17", "remaining_time": "1:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2982, "total_steps": 3836, "loss": 0.1442, "learning_rate": 6.475317253250196e-07, "epoch": 0.7772456260385104, "percentage": 77.74, "elapsed_time": "4:40:23", "remaining_time": "1:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2983, "total_steps": 3836, "loss": 0.1436, "learning_rate": 6.460850763658647e-07, "epoch": 0.7775062717883556, "percentage": 77.76, "elapsed_time": "4:40:28", "remaining_time": "1:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2984, "total_steps": 3836, "loss": 0.1416, "learning_rate": 6.446398053545619e-07, "epoch": 0.7777669175382009, "percentage": 77.79, "elapsed_time": "4:40:34", "remaining_time": "1:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2985, "total_steps": 3836, "loss": 0.1316, "learning_rate": 6.431959133653296e-07, "epoch": 0.7780275632880461, "percentage": 77.82, "elapsed_time": "4:40:39", "remaining_time": "1:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2986, "total_steps": 3836, "loss": 0.1263, "learning_rate": 6.417534014713594e-07, "epoch": 0.7782882090378914, "percentage": 77.84, "elapsed_time": "4:40:44", "remaining_time": "1:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2987, "total_steps": 3836, "loss": 0.1319, "learning_rate": 6.403122707448198e-07, "epoch": 0.7785488547877366, "percentage": 77.87, "elapsed_time": "4:40:49", "remaining_time": "1:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2988, "total_steps": 3836, "loss": 0.1364, "learning_rate": 6.388725222568498e-07, "epoch": 0.7788095005375819, "percentage": 77.89, "elapsed_time": "4:40:55", "remaining_time": "1:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2989, "total_steps": 3836, "loss": 0.1413, "learning_rate": 6.374341570775633e-07, "epoch": 0.7790701462874271, "percentage": 77.92, "elapsed_time": "4:41:01", "remaining_time": "1:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2990, "total_steps": 3836, "loss": 0.1389, "learning_rate": 6.359971762760442e-07, "epoch": 0.7793307920372723, "percentage": 77.95, "elapsed_time": "4:41:07", "remaining_time": "1:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2991, "total_steps": 3836, "loss": 0.1395, "learning_rate": 6.345615809203487e-07, "epoch": 0.7795914377871176, "percentage": 77.97, "elapsed_time": "4:41:12", "remaining_time": "1:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2992, "total_steps": 3836, "loss": 0.134, "learning_rate": 6.331273720775028e-07, "epoch": 0.7798520835369628, "percentage": 78.0, "elapsed_time": "4:41:18", "remaining_time": "1:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2993, "total_steps": 3836, "loss": 0.1495, "learning_rate": 6.316945508135014e-07, "epoch": 0.7801127292868081, "percentage": 78.02, "elapsed_time": "4:41:24", "remaining_time": "1:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2994, "total_steps": 3836, "loss": 0.1391, "learning_rate": 6.302631181933106e-07, "epoch": 0.7803733750366533, "percentage": 78.05, "elapsed_time": "4:41:29", "remaining_time": "1:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2995, "total_steps": 3836, "loss": 0.1464, "learning_rate": 6.288330752808605e-07, "epoch": 0.7806340207864986, "percentage": 78.08, "elapsed_time": "4:41:35", "remaining_time": "1:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2996, "total_steps": 3836, "loss": 0.1392, "learning_rate": 6.274044231390503e-07, "epoch": 0.7808946665363438, "percentage": 78.1, "elapsed_time": "4:41:40", "remaining_time": "1:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2997, "total_steps": 3836, "loss": 0.1436, "learning_rate": 6.259771628297465e-07, "epoch": 0.7811553122861891, "percentage": 78.13, "elapsed_time": "4:41:46", "remaining_time": "1:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2998, "total_steps": 3836, "loss": 0.1451, "learning_rate": 6.245512954137795e-07, "epoch": 0.7814159580360343, "percentage": 78.15, "elapsed_time": "4:41:52", "remaining_time": "1:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2999, "total_steps": 3836, "loss": 0.1453, "learning_rate": 6.23126821950945e-07, "epoch": 0.7816766037858796, "percentage": 78.18, "elapsed_time": "4:41:57", "remaining_time": "1:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 3836, "loss": 0.1442, "learning_rate": 6.217037435000028e-07, "epoch": 0.7819372495357247, "percentage": 78.21, "elapsed_time": "4:42:02", "remaining_time": "1:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 3836, "eval_loss": 0.13870234787464142, "epoch": 0.7819372495357247, "percentage": 78.21, "elapsed_time": "4:42:57", "remaining_time": "1:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3001, "total_steps": 3836, "loss": 0.1429, "learning_rate": 6.20282061118675e-07, "epoch": 0.78219789528557, "percentage": 78.23, "elapsed_time": "4:43:03", "remaining_time": "1:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3002, "total_steps": 3836, "loss": 0.1485, "learning_rate": 6.18861775863647e-07, "epoch": 0.7824585410354152, "percentage": 78.26, "elapsed_time": "4:43:08", "remaining_time": "1:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3003, "total_steps": 3836, "loss": 0.1379, "learning_rate": 6.174428887905648e-07, "epoch": 0.7827191867852605, "percentage": 78.28, "elapsed_time": "4:43:13", "remaining_time": "1:18:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3004, "total_steps": 3836, "loss": 0.1412, "learning_rate": 6.16025400954037e-07, "epoch": 0.7829798325351057, "percentage": 78.31, "elapsed_time": "4:43:19", "remaining_time": "1:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3005, "total_steps": 3836, "loss": 0.139, "learning_rate": 6.146093134076314e-07, "epoch": 0.7832404782849509, "percentage": 78.34, "elapsed_time": "4:43:26", "remaining_time": "1:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3006, "total_steps": 3836, "loss": 0.1311, "learning_rate": 6.131946272038719e-07, "epoch": 0.7835011240347962, "percentage": 78.36, "elapsed_time": "4:43:31", "remaining_time": "1:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3007, "total_steps": 3836, "loss": 0.1294, "learning_rate": 6.11781343394246e-07, "epoch": 0.7837617697846414, "percentage": 78.39, "elapsed_time": "4:43:36", "remaining_time": "1:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3008, "total_steps": 3836, "loss": 0.1483, "learning_rate": 6.103694630291954e-07, "epoch": 0.7840224155344867, "percentage": 78.42, "elapsed_time": "4:43:41", "remaining_time": "1:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3009, "total_steps": 3836, "loss": 0.1382, "learning_rate": 6.089589871581203e-07, "epoch": 0.7842830612843319, "percentage": 78.44, "elapsed_time": "4:43:47", "remaining_time": "1:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3010, "total_steps": 3836, "loss": 0.1462, "learning_rate": 6.07549916829375e-07, "epoch": 0.7845437070341772, "percentage": 78.47, "elapsed_time": "4:43:52", "remaining_time": "1:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3011, "total_steps": 3836, "loss": 0.1384, "learning_rate": 6.061422530902727e-07, "epoch": 0.7848043527840224, "percentage": 78.49, "elapsed_time": "4:43:57", "remaining_time": "1:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3012, "total_steps": 3836, "loss": 0.148, "learning_rate": 6.047359969870773e-07, "epoch": 0.7850649985338677, "percentage": 78.52, "elapsed_time": "4:44:03", "remaining_time": "1:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3013, "total_steps": 3836, "loss": 0.1317, "learning_rate": 6.033311495650074e-07, "epoch": 0.7853256442837129, "percentage": 78.55, "elapsed_time": "4:44:09", "remaining_time": "1:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3014, "total_steps": 3836, "loss": 0.1432, "learning_rate": 6.019277118682371e-07, "epoch": 0.7855862900335582, "percentage": 78.57, "elapsed_time": "4:44:14", "remaining_time": "1:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3015, "total_steps": 3836, "loss": 0.1403, "learning_rate": 6.005256849398899e-07, "epoch": 0.7858469357834034, "percentage": 78.6, "elapsed_time": "4:44:19", "remaining_time": "1:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3016, "total_steps": 3836, "loss": 0.1419, "learning_rate": 5.991250698220416e-07, "epoch": 0.7861075815332487, "percentage": 78.62, "elapsed_time": "4:44:25", "remaining_time": "1:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3017, "total_steps": 3836, "loss": 0.1515, "learning_rate": 5.977258675557191e-07, "epoch": 0.7863682272830939, "percentage": 78.65, "elapsed_time": "4:44:32", "remaining_time": "1:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3018, "total_steps": 3836, "loss": 0.1294, "learning_rate": 5.963280791808984e-07, "epoch": 0.7866288730329392, "percentage": 78.68, "elapsed_time": "4:44:37", "remaining_time": "1:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3019, "total_steps": 3836, "loss": 0.1443, "learning_rate": 5.949317057365042e-07, "epoch": 0.7868895187827843, "percentage": 78.7, "elapsed_time": "4:44:43", "remaining_time": "1:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3020, "total_steps": 3836, "loss": 0.1352, "learning_rate": 5.935367482604124e-07, "epoch": 0.7871501645326295, "percentage": 78.73, "elapsed_time": "4:44:49", "remaining_time": "1:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3021, "total_steps": 3836, "loss": 0.1331, "learning_rate": 5.921432077894429e-07, "epoch": 0.7874108102824748, "percentage": 78.75, "elapsed_time": "4:44:54", "remaining_time": "1:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3022, "total_steps": 3836, "loss": 0.15, "learning_rate": 5.907510853593642e-07, "epoch": 0.78767145603232, "percentage": 78.78, "elapsed_time": "4:45:00", "remaining_time": "1:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3023, "total_steps": 3836, "loss": 0.1444, "learning_rate": 5.89360382004891e-07, "epoch": 0.7879321017821653, "percentage": 78.81, "elapsed_time": "4:45:05", "remaining_time": "1:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3024, "total_steps": 3836, "loss": 0.1359, "learning_rate": 5.879710987596818e-07, "epoch": 0.7881927475320105, "percentage": 78.83, "elapsed_time": "4:45:11", "remaining_time": "1:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3025, "total_steps": 3836, "loss": 0.1482, "learning_rate": 5.865832366563415e-07, "epoch": 0.7884533932818558, "percentage": 78.86, "elapsed_time": "4:45:17", "remaining_time": "1:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3026, "total_steps": 3836, "loss": 0.1478, "learning_rate": 5.851967967264164e-07, "epoch": 0.788714039031701, "percentage": 78.88, "elapsed_time": "4:45:23", "remaining_time": "1:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3027, "total_steps": 3836, "loss": 0.1426, "learning_rate": 5.838117800003995e-07, "epoch": 0.7889746847815463, "percentage": 78.91, "elapsed_time": "4:45:28", "remaining_time": "1:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3028, "total_steps": 3836, "loss": 0.1443, "learning_rate": 5.824281875077212e-07, "epoch": 0.7892353305313915, "percentage": 78.94, "elapsed_time": "4:45:34", "remaining_time": "1:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3029, "total_steps": 3836, "loss": 0.132, "learning_rate": 5.810460202767563e-07, "epoch": 0.7894959762812368, "percentage": 78.96, "elapsed_time": "4:45:39", "remaining_time": "1:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3030, "total_steps": 3836, "loss": 0.1493, "learning_rate": 5.796652793348203e-07, "epoch": 0.789756622031082, "percentage": 78.99, "elapsed_time": "4:45:44", "remaining_time": "1:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3031, "total_steps": 3836, "loss": 0.1325, "learning_rate": 5.78285965708168e-07, "epoch": 0.7900172677809273, "percentage": 79.01, "elapsed_time": "4:45:51", "remaining_time": "1:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3032, "total_steps": 3836, "loss": 0.1493, "learning_rate": 5.769080804219929e-07, "epoch": 0.7902779135307725, "percentage": 79.04, "elapsed_time": "4:45:56", "remaining_time": "1:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3033, "total_steps": 3836, "loss": 0.1437, "learning_rate": 5.755316245004275e-07, "epoch": 0.7905385592806178, "percentage": 79.07, "elapsed_time": "4:46:02", "remaining_time": "1:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3034, "total_steps": 3836, "loss": 0.135, "learning_rate": 5.741565989665413e-07, "epoch": 0.790799205030463, "percentage": 79.09, "elapsed_time": "4:46:07", "remaining_time": "1:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3035, "total_steps": 3836, "loss": 0.143, "learning_rate": 5.72783004842341e-07, "epoch": 0.7910598507803082, "percentage": 79.12, "elapsed_time": "4:46:13", "remaining_time": "1:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3036, "total_steps": 3836, "loss": 0.1235, "learning_rate": 5.714108431487692e-07, "epoch": 0.7913204965301535, "percentage": 79.14, "elapsed_time": "4:46:19", "remaining_time": "1:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3037, "total_steps": 3836, "loss": 0.1382, "learning_rate": 5.70040114905705e-07, "epoch": 0.7915811422799987, "percentage": 79.17, "elapsed_time": "4:46:24", "remaining_time": "1:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3038, "total_steps": 3836, "loss": 0.1429, "learning_rate": 5.68670821131961e-07, "epoch": 0.791841788029844, "percentage": 79.2, "elapsed_time": "4:46:30", "remaining_time": "1:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3039, "total_steps": 3836, "loss": 0.1259, "learning_rate": 5.673029628452819e-07, "epoch": 0.7921024337796891, "percentage": 79.22, "elapsed_time": "4:46:36", "remaining_time": "1:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3040, "total_steps": 3836, "loss": 0.131, "learning_rate": 5.659365410623491e-07, "epoch": 0.7923630795295344, "percentage": 79.25, "elapsed_time": "4:46:41", "remaining_time": "1:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3041, "total_steps": 3836, "loss": 0.1377, "learning_rate": 5.645715567987742e-07, "epoch": 0.7926237252793796, "percentage": 79.28, "elapsed_time": "4:46:47", "remaining_time": "1:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3042, "total_steps": 3836, "loss": 0.1292, "learning_rate": 5.63208011069099e-07, "epoch": 0.7928843710292249, "percentage": 79.3, "elapsed_time": "4:46:53", "remaining_time": "1:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3043, "total_steps": 3836, "loss": 0.1279, "learning_rate": 5.618459048868008e-07, "epoch": 0.7931450167790701, "percentage": 79.33, "elapsed_time": "4:46:58", "remaining_time": "1:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3044, "total_steps": 3836, "loss": 0.1383, "learning_rate": 5.604852392642813e-07, "epoch": 0.7934056625289154, "percentage": 79.35, "elapsed_time": "4:47:04", "remaining_time": "1:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3045, "total_steps": 3836, "loss": 0.1352, "learning_rate": 5.591260152128736e-07, "epoch": 0.7936663082787606, "percentage": 79.38, "elapsed_time": "4:47:09", "remaining_time": "1:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3046, "total_steps": 3836, "loss": 0.1472, "learning_rate": 5.577682337428417e-07, "epoch": 0.7939269540286059, "percentage": 79.41, "elapsed_time": "4:47:15", "remaining_time": "1:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3047, "total_steps": 3836, "loss": 0.1392, "learning_rate": 5.564118958633746e-07, "epoch": 0.7941875997784511, "percentage": 79.43, "elapsed_time": "4:47:20", "remaining_time": "1:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3048, "total_steps": 3836, "loss": 0.1299, "learning_rate": 5.550570025825888e-07, "epoch": 0.7944482455282964, "percentage": 79.46, "elapsed_time": "4:47:26", "remaining_time": "1:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3049, "total_steps": 3836, "loss": 0.1396, "learning_rate": 5.537035549075279e-07, "epoch": 0.7947088912781416, "percentage": 79.48, "elapsed_time": "4:47:32", "remaining_time": "1:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 3836, "loss": 0.1321, "learning_rate": 5.523515538441604e-07, "epoch": 0.7949695370279868, "percentage": 79.51, "elapsed_time": "4:47:37", "remaining_time": "1:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3051, "total_steps": 3836, "loss": 0.1368, "learning_rate": 5.510010003973795e-07, "epoch": 0.7952301827778321, "percentage": 79.54, "elapsed_time": "4:47:42", "remaining_time": "1:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3052, "total_steps": 3836, "loss": 0.1435, "learning_rate": 5.496518955710023e-07, "epoch": 0.7954908285276773, "percentage": 79.56, "elapsed_time": "4:47:48", "remaining_time": "1:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3053, "total_steps": 3836, "loss": 0.143, "learning_rate": 5.483042403677707e-07, "epoch": 0.7957514742775226, "percentage": 79.59, "elapsed_time": "4:47:54", "remaining_time": "1:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3054, "total_steps": 3836, "loss": 0.1383, "learning_rate": 5.469580357893484e-07, "epoch": 0.7960121200273678, "percentage": 79.61, "elapsed_time": "4:47:59", "remaining_time": "1:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3055, "total_steps": 3836, "loss": 0.1391, "learning_rate": 5.456132828363181e-07, "epoch": 0.7962727657772131, "percentage": 79.64, "elapsed_time": "4:48:05", "remaining_time": "1:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3056, "total_steps": 3836, "loss": 0.1429, "learning_rate": 5.442699825081885e-07, "epoch": 0.7965334115270583, "percentage": 79.67, "elapsed_time": "4:48:11", "remaining_time": "1:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3057, "total_steps": 3836, "loss": 0.1342, "learning_rate": 5.429281358033847e-07, "epoch": 0.7967940572769036, "percentage": 79.69, "elapsed_time": "4:48:16", "remaining_time": "1:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3058, "total_steps": 3836, "loss": 0.1395, "learning_rate": 5.415877437192535e-07, "epoch": 0.7970547030267487, "percentage": 79.72, "elapsed_time": "4:48:21", "remaining_time": "1:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3059, "total_steps": 3836, "loss": 0.1309, "learning_rate": 5.402488072520587e-07, "epoch": 0.797315348776594, "percentage": 79.74, "elapsed_time": "4:48:27", "remaining_time": "1:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3060, "total_steps": 3836, "loss": 0.1279, "learning_rate": 5.389113273969857e-07, "epoch": 0.7975759945264392, "percentage": 79.77, "elapsed_time": "4:48:32", "remaining_time": "1:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3061, "total_steps": 3836, "loss": 0.1559, "learning_rate": 5.375753051481324e-07, "epoch": 0.7978366402762845, "percentage": 79.8, "elapsed_time": "4:48:38", "remaining_time": "1:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3062, "total_steps": 3836, "loss": 0.1442, "learning_rate": 5.36240741498516e-07, "epoch": 0.7980972860261297, "percentage": 79.82, "elapsed_time": "4:48:44", "remaining_time": "1:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3063, "total_steps": 3836, "loss": 0.1427, "learning_rate": 5.349076374400708e-07, "epoch": 0.798357931775975, "percentage": 79.85, "elapsed_time": "4:48:50", "remaining_time": "1:12:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3064, "total_steps": 3836, "loss": 0.1349, "learning_rate": 5.33575993963644e-07, "epoch": 0.7986185775258202, "percentage": 79.87, "elapsed_time": "4:48:56", "remaining_time": "1:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3065, "total_steps": 3836, "loss": 0.1464, "learning_rate": 5.32245812058998e-07, "epoch": 0.7988792232756654, "percentage": 79.9, "elapsed_time": "4:49:01", "remaining_time": "1:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3066, "total_steps": 3836, "loss": 0.143, "learning_rate": 5.309170927148088e-07, "epoch": 0.7991398690255107, "percentage": 79.93, "elapsed_time": "4:49:07", "remaining_time": "1:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3067, "total_steps": 3836, "loss": 0.1314, "learning_rate": 5.295898369186655e-07, "epoch": 0.7994005147753559, "percentage": 79.95, "elapsed_time": "4:49:13", "remaining_time": "1:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3068, "total_steps": 3836, "loss": 0.1334, "learning_rate": 5.282640456570692e-07, "epoch": 0.7996611605252012, "percentage": 79.98, "elapsed_time": "4:49:18", "remaining_time": "1:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3069, "total_steps": 3836, "loss": 0.1401, "learning_rate": 5.269397199154319e-07, "epoch": 0.7999218062750464, "percentage": 80.01, "elapsed_time": "4:49:23", "remaining_time": "1:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3070, "total_steps": 3836, "loss": 0.138, "learning_rate": 5.256168606780784e-07, "epoch": 0.8001824520248917, "percentage": 80.03, "elapsed_time": "4:49:28", "remaining_time": "1:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3071, "total_steps": 3836, "loss": 0.1321, "learning_rate": 5.24295468928242e-07, "epoch": 0.8004430977747369, "percentage": 80.06, "elapsed_time": "4:49:33", "remaining_time": "1:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3072, "total_steps": 3836, "loss": 0.1409, "learning_rate": 5.229755456480635e-07, "epoch": 0.8007037435245822, "percentage": 80.08, "elapsed_time": "4:49:39", "remaining_time": "1:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3073, "total_steps": 3836, "loss": 0.1278, "learning_rate": 5.216570918185956e-07, "epoch": 0.8009643892744274, "percentage": 80.11, "elapsed_time": "4:49:44", "remaining_time": "1:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3074, "total_steps": 3836, "loss": 0.1404, "learning_rate": 5.203401084197973e-07, "epoch": 0.8012250350242727, "percentage": 80.14, "elapsed_time": "4:49:49", "remaining_time": "1:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3075, "total_steps": 3836, "loss": 0.1306, "learning_rate": 5.190245964305338e-07, "epoch": 0.8014856807741179, "percentage": 80.16, "elapsed_time": "4:49:55", "remaining_time": "1:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3076, "total_steps": 3836, "loss": 0.1369, "learning_rate": 5.177105568285793e-07, "epoch": 0.8017463265239632, "percentage": 80.19, "elapsed_time": "4:50:00", "remaining_time": "1:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3077, "total_steps": 3836, "loss": 0.1466, "learning_rate": 5.163979905906102e-07, "epoch": 0.8020069722738083, "percentage": 80.21, "elapsed_time": "4:50:05", "remaining_time": "1:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3078, "total_steps": 3836, "loss": 0.1385, "learning_rate": 5.150868986922092e-07, "epoch": 0.8022676180236537, "percentage": 80.24, "elapsed_time": "4:50:10", "remaining_time": "1:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3079, "total_steps": 3836, "loss": 0.1349, "learning_rate": 5.137772821078649e-07, "epoch": 0.8025282637734988, "percentage": 80.27, "elapsed_time": "4:50:16", "remaining_time": "1:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3080, "total_steps": 3836, "loss": 0.1243, "learning_rate": 5.124691418109673e-07, "epoch": 0.802788909523344, "percentage": 80.29, "elapsed_time": "4:50:21", "remaining_time": "1:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3081, "total_steps": 3836, "loss": 0.1385, "learning_rate": 5.111624787738095e-07, "epoch": 0.8030495552731893, "percentage": 80.32, "elapsed_time": "4:50:26", "remaining_time": "1:11:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3082, "total_steps": 3836, "loss": 0.1469, "learning_rate": 5.09857293967587e-07, "epoch": 0.8033102010230345, "percentage": 80.34, "elapsed_time": "4:50:31", "remaining_time": "1:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3083, "total_steps": 3836, "loss": 0.136, "learning_rate": 5.085535883623966e-07, "epoch": 0.8035708467728798, "percentage": 80.37, "elapsed_time": "4:50:37", "remaining_time": "1:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3084, "total_steps": 3836, "loss": 0.145, "learning_rate": 5.072513629272352e-07, "epoch": 0.803831492522725, "percentage": 80.4, "elapsed_time": "4:50:43", "remaining_time": "1:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3085, "total_steps": 3836, "loss": 0.136, "learning_rate": 5.059506186299992e-07, "epoch": 0.8040921382725703, "percentage": 80.42, "elapsed_time": "4:50:48", "remaining_time": "1:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3086, "total_steps": 3836, "loss": 0.136, "learning_rate": 5.046513564374861e-07, "epoch": 0.8043527840224155, "percentage": 80.45, "elapsed_time": "4:50:54", "remaining_time": "1:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3087, "total_steps": 3836, "loss": 0.1363, "learning_rate": 5.033535773153906e-07, "epoch": 0.8046134297722608, "percentage": 80.47, "elapsed_time": "4:50:59", "remaining_time": "1:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3088, "total_steps": 3836, "loss": 0.1313, "learning_rate": 5.020572822283027e-07, "epoch": 0.804874075522106, "percentage": 80.5, "elapsed_time": "4:51:05", "remaining_time": "1:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3089, "total_steps": 3836, "loss": 0.1354, "learning_rate": 5.007624721397139e-07, "epoch": 0.8051347212719513, "percentage": 80.53, "elapsed_time": "4:51:10", "remaining_time": "1:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3090, "total_steps": 3836, "loss": 0.1318, "learning_rate": 4.994691480120086e-07, "epoch": 0.8053953670217965, "percentage": 80.55, "elapsed_time": "4:51:16", "remaining_time": "1:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3091, "total_steps": 3836, "loss": 0.1174, "learning_rate": 4.981773108064683e-07, "epoch": 0.8056560127716418, "percentage": 80.58, "elapsed_time": "4:51:21", "remaining_time": "1:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3092, "total_steps": 3836, "loss": 0.146, "learning_rate": 4.968869614832681e-07, "epoch": 0.805916658521487, "percentage": 80.6, "elapsed_time": "4:51:26", "remaining_time": "1:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3093, "total_steps": 3836, "loss": 0.1325, "learning_rate": 4.955981010014793e-07, "epoch": 0.8061773042713323, "percentage": 80.63, "elapsed_time": "4:51:32", "remaining_time": "1:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3094, "total_steps": 3836, "loss": 0.1376, "learning_rate": 4.943107303190639e-07, "epoch": 0.8064379500211775, "percentage": 80.66, "elapsed_time": "4:51:37", "remaining_time": "1:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3095, "total_steps": 3836, "loss": 0.1319, "learning_rate": 4.930248503928778e-07, "epoch": 0.8066985957710228, "percentage": 80.68, "elapsed_time": "4:51:42", "remaining_time": "1:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3096, "total_steps": 3836, "loss": 0.1283, "learning_rate": 4.917404621786703e-07, "epoch": 0.806959241520868, "percentage": 80.71, "elapsed_time": "4:51:47", "remaining_time": "1:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3097, "total_steps": 3836, "loss": 0.1198, "learning_rate": 4.904575666310798e-07, "epoch": 0.8072198872707131, "percentage": 80.74, "elapsed_time": "4:51:53", "remaining_time": "1:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3098, "total_steps": 3836, "loss": 0.1316, "learning_rate": 4.891761647036364e-07, "epoch": 0.8074805330205584, "percentage": 80.76, "elapsed_time": "4:51:59", "remaining_time": "1:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3099, "total_steps": 3836, "loss": 0.1349, "learning_rate": 4.878962573487598e-07, "epoch": 0.8077411787704036, "percentage": 80.79, "elapsed_time": "4:52:05", "remaining_time": "1:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 3836, "loss": 0.1347, "learning_rate": 4.866178455177584e-07, "epoch": 0.8080018245202489, "percentage": 80.81, "elapsed_time": "4:52:10", "remaining_time": "1:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3101, "total_steps": 3836, "loss": 0.1493, "learning_rate": 4.853409301608297e-07, "epoch": 0.8082624702700941, "percentage": 80.84, "elapsed_time": "4:52:16", "remaining_time": "1:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3102, "total_steps": 3836, "loss": 0.1367, "learning_rate": 4.840655122270582e-07, "epoch": 0.8085231160199394, "percentage": 80.87, "elapsed_time": "4:52:22", "remaining_time": "1:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3103, "total_steps": 3836, "loss": 0.1351, "learning_rate": 4.827915926644169e-07, "epoch": 0.8087837617697846, "percentage": 80.89, "elapsed_time": "4:52:27", "remaining_time": "1:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3104, "total_steps": 3836, "loss": 0.1294, "learning_rate": 4.815191724197634e-07, "epoch": 0.8090444075196299, "percentage": 80.92, "elapsed_time": "4:52:33", "remaining_time": "1:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3105, "total_steps": 3836, "loss": 0.1368, "learning_rate": 4.802482524388418e-07, "epoch": 0.8093050532694751, "percentage": 80.94, "elapsed_time": "4:52:39", "remaining_time": "1:08:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3106, "total_steps": 3836, "loss": 0.1429, "learning_rate": 4.78978833666281e-07, "epoch": 0.8095656990193204, "percentage": 80.97, "elapsed_time": "4:52:44", "remaining_time": "1:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3107, "total_steps": 3836, "loss": 0.1384, "learning_rate": 4.777109170455938e-07, "epoch": 0.8098263447691656, "percentage": 81.0, "elapsed_time": "4:52:50", "remaining_time": "1:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3108, "total_steps": 3836, "loss": 0.1324, "learning_rate": 4.7644450351917617e-07, "epoch": 0.8100869905190109, "percentage": 81.02, "elapsed_time": "4:52:55", "remaining_time": "1:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3109, "total_steps": 3836, "loss": 0.1263, "learning_rate": 4.751795940283094e-07, "epoch": 0.8103476362688561, "percentage": 81.05, "elapsed_time": "4:53:01", "remaining_time": "1:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3110, "total_steps": 3836, "loss": 0.1339, "learning_rate": 4.7391618951315277e-07, "epoch": 0.8106082820187014, "percentage": 81.07, "elapsed_time": "4:53:07", "remaining_time": "1:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3111, "total_steps": 3836, "loss": 0.1256, "learning_rate": 4.7265429091274935e-07, "epoch": 0.8108689277685466, "percentage": 81.1, "elapsed_time": "4:53:12", "remaining_time": "1:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3112, "total_steps": 3836, "loss": 0.1445, "learning_rate": 4.713938991650241e-07, "epoch": 0.8111295735183918, "percentage": 81.13, "elapsed_time": "4:53:18", "remaining_time": "1:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3113, "total_steps": 3836, "loss": 0.1254, "learning_rate": 4.701350152067796e-07, "epoch": 0.8113902192682371, "percentage": 81.15, "elapsed_time": "4:53:23", "remaining_time": "1:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3114, "total_steps": 3836, "loss": 0.1405, "learning_rate": 4.688776399736991e-07, "epoch": 0.8116508650180823, "percentage": 81.18, "elapsed_time": "4:53:29", "remaining_time": "1:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3115, "total_steps": 3836, "loss": 0.1341, "learning_rate": 4.676217744003439e-07, "epoch": 0.8119115107679276, "percentage": 81.2, "elapsed_time": "4:53:34", "remaining_time": "1:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3116, "total_steps": 3836, "loss": 0.1455, "learning_rate": 4.6636741942015314e-07, "epoch": 0.8121721565177727, "percentage": 81.23, "elapsed_time": "4:53:39", "remaining_time": "1:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3117, "total_steps": 3836, "loss": 0.1414, "learning_rate": 4.6511457596544406e-07, "epoch": 0.812432802267618, "percentage": 81.26, "elapsed_time": "4:53:45", "remaining_time": "1:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3118, "total_steps": 3836, "loss": 0.1268, "learning_rate": 4.6386324496740855e-07, "epoch": 0.8126934480174632, "percentage": 81.28, "elapsed_time": "4:53:50", "remaining_time": "1:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3119, "total_steps": 3836, "loss": 0.1301, "learning_rate": 4.626134273561175e-07, "epoch": 0.8129540937673085, "percentage": 81.31, "elapsed_time": "4:53:55", "remaining_time": "1:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3120, "total_steps": 3836, "loss": 0.1404, "learning_rate": 4.6136512406051495e-07, "epoch": 0.8132147395171537, "percentage": 81.33, "elapsed_time": "4:54:01", "remaining_time": "1:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3121, "total_steps": 3836, "loss": 0.1437, "learning_rate": 4.601183360084174e-07, "epoch": 0.813475385266999, "percentage": 81.36, "elapsed_time": "4:54:07", "remaining_time": "1:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3122, "total_steps": 3836, "loss": 0.1308, "learning_rate": 4.5887306412651933e-07, "epoch": 0.8137360310168442, "percentage": 81.39, "elapsed_time": "4:54:12", "remaining_time": "1:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3123, "total_steps": 3836, "loss": 0.135, "learning_rate": 4.576293093403855e-07, "epoch": 0.8139966767666895, "percentage": 81.41, "elapsed_time": "4:54:18", "remaining_time": "1:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3124, "total_steps": 3836, "loss": 0.1221, "learning_rate": 4.563870725744543e-07, "epoch": 0.8142573225165347, "percentage": 81.44, "elapsed_time": "4:54:23", "remaining_time": "1:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3125, "total_steps": 3836, "loss": 0.1408, "learning_rate": 4.551463547520341e-07, "epoch": 0.81451796826638, "percentage": 81.47, "elapsed_time": "4:54:29", "remaining_time": "1:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3126, "total_steps": 3836, "loss": 0.1293, "learning_rate": 4.539071567953077e-07, "epoch": 0.8147786140162252, "percentage": 81.49, "elapsed_time": "4:54:35", "remaining_time": "1:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3127, "total_steps": 3836, "loss": 0.1328, "learning_rate": 4.526694796253242e-07, "epoch": 0.8150392597660704, "percentage": 81.52, "elapsed_time": "4:54:40", "remaining_time": "1:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3128, "total_steps": 3836, "loss": 0.1381, "learning_rate": 4.514333241620045e-07, "epoch": 0.8152999055159157, "percentage": 81.54, "elapsed_time": "4:54:46", "remaining_time": "1:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3129, "total_steps": 3836, "loss": 0.1324, "learning_rate": 4.5019869132413877e-07, "epoch": 0.8155605512657609, "percentage": 81.57, "elapsed_time": "4:54:52", "remaining_time": "1:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3130, "total_steps": 3836, "loss": 0.1317, "learning_rate": 4.4896558202938505e-07, "epoch": 0.8158211970156062, "percentage": 81.6, "elapsed_time": "4:54:57", "remaining_time": "1:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3131, "total_steps": 3836, "loss": 0.1429, "learning_rate": 4.4773399719426816e-07, "epoch": 0.8160818427654514, "percentage": 81.62, "elapsed_time": "4:55:03", "remaining_time": "1:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3132, "total_steps": 3836, "loss": 0.1373, "learning_rate": 4.4650393773418123e-07, "epoch": 0.8163424885152967, "percentage": 81.65, "elapsed_time": "4:55:09", "remaining_time": "1:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3133, "total_steps": 3836, "loss": 0.1356, "learning_rate": 4.4527540456338224e-07, "epoch": 0.8166031342651419, "percentage": 81.67, "elapsed_time": "4:55:15", "remaining_time": "1:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3134, "total_steps": 3836, "loss": 0.1392, "learning_rate": 4.440483985949953e-07, "epoch": 0.8168637800149872, "percentage": 81.7, "elapsed_time": "4:55:20", "remaining_time": "1:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3135, "total_steps": 3836, "loss": 0.1408, "learning_rate": 4.428229207410106e-07, "epoch": 0.8171244257648324, "percentage": 81.73, "elapsed_time": "4:55:26", "remaining_time": "1:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3136, "total_steps": 3836, "loss": 0.1388, "learning_rate": 4.4159897191228096e-07, "epoch": 0.8173850715146777, "percentage": 81.75, "elapsed_time": "4:55:31", "remaining_time": "1:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3137, "total_steps": 3836, "loss": 0.1227, "learning_rate": 4.403765530185228e-07, "epoch": 0.8176457172645228, "percentage": 81.78, "elapsed_time": "4:55:36", "remaining_time": "1:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3138, "total_steps": 3836, "loss": 0.1279, "learning_rate": 4.3915566496831654e-07, "epoch": 0.8179063630143681, "percentage": 81.8, "elapsed_time": "4:55:41", "remaining_time": "1:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3139, "total_steps": 3836, "loss": 0.145, "learning_rate": 4.3793630866910326e-07, "epoch": 0.8181670087642133, "percentage": 81.83, "elapsed_time": "4:55:46", "remaining_time": "1:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3140, "total_steps": 3836, "loss": 0.146, "learning_rate": 4.367184850271872e-07, "epoch": 0.8184276545140586, "percentage": 81.86, "elapsed_time": "4:55:52", "remaining_time": "1:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3141, "total_steps": 3836, "loss": 0.1534, "learning_rate": 4.3550219494773116e-07, "epoch": 0.8186883002639038, "percentage": 81.88, "elapsed_time": "4:55:58", "remaining_time": "1:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3142, "total_steps": 3836, "loss": 0.1413, "learning_rate": 4.3428743933476207e-07, "epoch": 0.818948946013749, "percentage": 81.91, "elapsed_time": "4:56:03", "remaining_time": "1:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3143, "total_steps": 3836, "loss": 0.1308, "learning_rate": 4.330742190911616e-07, "epoch": 0.8192095917635943, "percentage": 81.93, "elapsed_time": "4:56:09", "remaining_time": "1:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3144, "total_steps": 3836, "loss": 0.1327, "learning_rate": 4.3186253511867227e-07, "epoch": 0.8194702375134395, "percentage": 81.96, "elapsed_time": "4:56:14", "remaining_time": "1:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3145, "total_steps": 3836, "loss": 0.127, "learning_rate": 4.306523883178965e-07, "epoch": 0.8197308832632848, "percentage": 81.99, "elapsed_time": "4:56:20", "remaining_time": "1:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3146, "total_steps": 3836, "loss": 0.136, "learning_rate": 4.294437795882919e-07, "epoch": 0.81999152901313, "percentage": 82.01, "elapsed_time": "4:56:25", "remaining_time": "1:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3147, "total_steps": 3836, "loss": 0.1348, "learning_rate": 4.2823670982817365e-07, "epoch": 0.8202521747629753, "percentage": 82.04, "elapsed_time": "4:56:31", "remaining_time": "1:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3148, "total_steps": 3836, "loss": 0.1434, "learning_rate": 4.2703117993471295e-07, "epoch": 0.8205128205128205, "percentage": 82.06, "elapsed_time": "4:56:37", "remaining_time": "1:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3149, "total_steps": 3836, "loss": 0.1365, "learning_rate": 4.258271908039363e-07, "epoch": 0.8207734662626658, "percentage": 82.09, "elapsed_time": "4:56:43", "remaining_time": "1:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 3836, "loss": 0.1401, "learning_rate": 4.2462474333072544e-07, "epoch": 0.821034112012511, "percentage": 82.12, "elapsed_time": "4:56:49", "remaining_time": "1:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3151, "total_steps": 3836, "loss": 0.1427, "learning_rate": 4.2342383840881544e-07, "epoch": 0.8212947577623563, "percentage": 82.14, "elapsed_time": "4:56:54", "remaining_time": "1:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3152, "total_steps": 3836, "loss": 0.1379, "learning_rate": 4.222244769307965e-07, "epoch": 0.8215554035122015, "percentage": 82.17, "elapsed_time": "4:57:00", "remaining_time": "1:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3153, "total_steps": 3836, "loss": 0.1373, "learning_rate": 4.21026659788111e-07, "epoch": 0.8218160492620468, "percentage": 82.19, "elapsed_time": "4:57:06", "remaining_time": "1:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3154, "total_steps": 3836, "loss": 0.137, "learning_rate": 4.198303878710508e-07, "epoch": 0.822076695011892, "percentage": 82.22, "elapsed_time": "4:57:12", "remaining_time": "1:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3155, "total_steps": 3836, "loss": 0.1248, "learning_rate": 4.186356620687637e-07, "epoch": 0.8223373407617373, "percentage": 82.25, "elapsed_time": "4:57:17", "remaining_time": "1:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3156, "total_steps": 3836, "loss": 0.1208, "learning_rate": 4.174424832692453e-07, "epoch": 0.8225979865115824, "percentage": 82.27, "elapsed_time": "4:57:23", "remaining_time": "1:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3157, "total_steps": 3836, "loss": 0.131, "learning_rate": 4.1625085235934225e-07, "epoch": 0.8228586322614276, "percentage": 82.3, "elapsed_time": "4:57:29", "remaining_time": "1:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3158, "total_steps": 3836, "loss": 0.1246, "learning_rate": 4.1506077022475e-07, "epoch": 0.8231192780112729, "percentage": 82.33, "elapsed_time": "4:57:35", "remaining_time": "1:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3159, "total_steps": 3836, "loss": 0.1092, "learning_rate": 4.138722377500154e-07, "epoch": 0.8233799237611181, "percentage": 82.35, "elapsed_time": "4:57:40", "remaining_time": "1:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3160, "total_steps": 3836, "loss": 0.1272, "learning_rate": 4.1268525581853015e-07, "epoch": 0.8236405695109634, "percentage": 82.38, "elapsed_time": "4:57:46", "remaining_time": "1:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3161, "total_steps": 3836, "loss": 0.1243, "learning_rate": 4.1149982531253435e-07, "epoch": 0.8239012152608086, "percentage": 82.4, "elapsed_time": "4:57:51", "remaining_time": "1:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3162, "total_steps": 3836, "loss": 0.1427, "learning_rate": 4.1031594711311686e-07, "epoch": 0.8241618610106539, "percentage": 82.43, "elapsed_time": "4:57:57", "remaining_time": "1:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3163, "total_steps": 3836, "loss": 0.1403, "learning_rate": 4.091336221002112e-07, "epoch": 0.8244225067604991, "percentage": 82.46, "elapsed_time": "4:58:02", "remaining_time": "1:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3164, "total_steps": 3836, "loss": 0.1295, "learning_rate": 4.079528511525968e-07, "epoch": 0.8246831525103444, "percentage": 82.48, "elapsed_time": "4:58:07", "remaining_time": "1:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3165, "total_steps": 3836, "loss": 0.1369, "learning_rate": 4.067736351478979e-07, "epoch": 0.8249437982601896, "percentage": 82.51, "elapsed_time": "4:58:13", "remaining_time": "1:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3166, "total_steps": 3836, "loss": 0.133, "learning_rate": 4.0559597496258263e-07, "epoch": 0.8252044440100349, "percentage": 82.53, "elapsed_time": "4:58:18", "remaining_time": "1:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3167, "total_steps": 3836, "loss": 0.1267, "learning_rate": 4.044198714719633e-07, "epoch": 0.8254650897598801, "percentage": 82.56, "elapsed_time": "4:58:23", "remaining_time": "1:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3168, "total_steps": 3836, "loss": 0.1405, "learning_rate": 4.032453255501956e-07, "epoch": 0.8257257355097254, "percentage": 82.59, "elapsed_time": "4:58:28", "remaining_time": "1:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3169, "total_steps": 3836, "loss": 0.131, "learning_rate": 4.020723380702768e-07, "epoch": 0.8259863812595706, "percentage": 82.61, "elapsed_time": "4:58:34", "remaining_time": "1:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3170, "total_steps": 3836, "loss": 0.1485, "learning_rate": 4.0090090990404563e-07, "epoch": 0.8262470270094159, "percentage": 82.64, "elapsed_time": "4:58:40", "remaining_time": "1:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3171, "total_steps": 3836, "loss": 0.1328, "learning_rate": 3.9973104192218283e-07, "epoch": 0.8265076727592611, "percentage": 82.66, "elapsed_time": "4:58:45", "remaining_time": "1:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3172, "total_steps": 3836, "loss": 0.1211, "learning_rate": 3.9856273499420837e-07, "epoch": 0.8267683185091063, "percentage": 82.69, "elapsed_time": "4:58:50", "remaining_time": "1:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3173, "total_steps": 3836, "loss": 0.1324, "learning_rate": 3.97395989988483e-07, "epoch": 0.8270289642589516, "percentage": 82.72, "elapsed_time": "4:58:56", "remaining_time": "1:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3174, "total_steps": 3836, "loss": 0.1415, "learning_rate": 3.962308077722049e-07, "epoch": 0.8272896100087967, "percentage": 82.74, "elapsed_time": "4:59:02", "remaining_time": "1:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3175, "total_steps": 3836, "loss": 0.1429, "learning_rate": 3.950671892114141e-07, "epoch": 0.827550255758642, "percentage": 82.77, "elapsed_time": "4:59:07", "remaining_time": "1:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3176, "total_steps": 3836, "loss": 0.1246, "learning_rate": 3.9390513517098413e-07, "epoch": 0.8278109015084872, "percentage": 82.79, "elapsed_time": "4:59:13", "remaining_time": "1:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3177, "total_steps": 3836, "loss": 0.1497, "learning_rate": 3.9274464651462786e-07, "epoch": 0.8280715472583325, "percentage": 82.82, "elapsed_time": "4:59:19", "remaining_time": "1:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3178, "total_steps": 3836, "loss": 0.1363, "learning_rate": 3.9158572410489537e-07, "epoch": 0.8283321930081777, "percentage": 82.85, "elapsed_time": "4:59:25", "remaining_time": "1:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3179, "total_steps": 3836, "loss": 0.1389, "learning_rate": 3.904283688031715e-07, "epoch": 0.828592838758023, "percentage": 82.87, "elapsed_time": "4:59:30", "remaining_time": "1:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3180, "total_steps": 3836, "loss": 0.1427, "learning_rate": 3.8927258146967626e-07, "epoch": 0.8288534845078682, "percentage": 82.9, "elapsed_time": "4:59:36", "remaining_time": "1:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3181, "total_steps": 3836, "loss": 0.1362, "learning_rate": 3.8811836296346466e-07, "epoch": 0.8291141302577135, "percentage": 82.92, "elapsed_time": "4:59:41", "remaining_time": "1:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3182, "total_steps": 3836, "loss": 0.1319, "learning_rate": 3.8696571414242546e-07, "epoch": 0.8293747760075587, "percentage": 82.95, "elapsed_time": "4:59:47", "remaining_time": "1:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3183, "total_steps": 3836, "loss": 0.1332, "learning_rate": 3.858146358632811e-07, "epoch": 0.829635421757404, "percentage": 82.98, "elapsed_time": "4:59:53", "remaining_time": "1:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3184, "total_steps": 3836, "loss": 0.1281, "learning_rate": 3.846651289815856e-07, "epoch": 0.8298960675072492, "percentage": 83.0, "elapsed_time": "4:59:58", "remaining_time": "1:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3185, "total_steps": 3836, "loss": 0.1355, "learning_rate": 3.8351719435172685e-07, "epoch": 0.8301567132570945, "percentage": 83.03, "elapsed_time": "5:00:04", "remaining_time": "1:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3186, "total_steps": 3836, "loss": 0.1381, "learning_rate": 3.823708328269232e-07, "epoch": 0.8304173590069397, "percentage": 83.06, "elapsed_time": "5:00:10", "remaining_time": "1:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3187, "total_steps": 3836, "loss": 0.1324, "learning_rate": 3.81226045259222e-07, "epoch": 0.8306780047567849, "percentage": 83.08, "elapsed_time": "5:00:15", "remaining_time": "1:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3188, "total_steps": 3836, "loss": 0.1415, "learning_rate": 3.800828324995043e-07, "epoch": 0.8309386505066302, "percentage": 83.11, "elapsed_time": "5:00:21", "remaining_time": "1:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3189, "total_steps": 3836, "loss": 0.1331, "learning_rate": 3.789411953974778e-07, "epoch": 0.8311992962564754, "percentage": 83.13, "elapsed_time": "5:00:26", "remaining_time": "1:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3190, "total_steps": 3836, "loss": 0.1365, "learning_rate": 3.7780113480167967e-07, "epoch": 0.8314599420063207, "percentage": 83.16, "elapsed_time": "5:00:31", "remaining_time": "1:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3191, "total_steps": 3836, "loss": 0.1426, "learning_rate": 3.7666265155947677e-07, "epoch": 0.8317205877561659, "percentage": 83.19, "elapsed_time": "5:00:37", "remaining_time": "1:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3192, "total_steps": 3836, "loss": 0.1213, "learning_rate": 3.7552574651706253e-07, "epoch": 0.8319812335060112, "percentage": 83.21, "elapsed_time": "5:00:43", "remaining_time": "1:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3193, "total_steps": 3836, "loss": 0.1296, "learning_rate": 3.7439042051945565e-07, "epoch": 0.8322418792558564, "percentage": 83.24, "elapsed_time": "5:00:48", "remaining_time": "1:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3194, "total_steps": 3836, "loss": 0.1391, "learning_rate": 3.7325667441050457e-07, "epoch": 0.8325025250057017, "percentage": 83.26, "elapsed_time": "5:00:54", "remaining_time": "1:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3195, "total_steps": 3836, "loss": 0.1354, "learning_rate": 3.7212450903288094e-07, "epoch": 0.8327631707555468, "percentage": 83.29, "elapsed_time": "5:00:59", "remaining_time": "1:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3196, "total_steps": 3836, "loss": 0.1279, "learning_rate": 3.7099392522808253e-07, "epoch": 0.8330238165053921, "percentage": 83.32, "elapsed_time": "5:01:05", "remaining_time": "1:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3197, "total_steps": 3836, "loss": 0.1339, "learning_rate": 3.698649238364313e-07, "epoch": 0.8332844622552373, "percentage": 83.34, "elapsed_time": "5:01:10", "remaining_time": "1:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3198, "total_steps": 3836, "loss": 0.1294, "learning_rate": 3.6873750569707297e-07, "epoch": 0.8335451080050826, "percentage": 83.37, "elapsed_time": "5:01:16", "remaining_time": "1:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3199, "total_steps": 3836, "loss": 0.1383, "learning_rate": 3.676116716479769e-07, "epoch": 0.8338057537549278, "percentage": 83.39, "elapsed_time": "5:01:21", "remaining_time": "1:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 3836, "loss": 0.1321, "learning_rate": 3.664874225259338e-07, "epoch": 0.8340663995047731, "percentage": 83.42, "elapsed_time": "5:01:26", "remaining_time": "0:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3201, "total_steps": 3836, "loss": 0.1402, "learning_rate": 3.6536475916655907e-07, "epoch": 0.8343270452546183, "percentage": 83.45, "elapsed_time": "5:01:31", "remaining_time": "0:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3202, "total_steps": 3836, "loss": 0.1276, "learning_rate": 3.6424368240428666e-07, "epoch": 0.8345876910044635, "percentage": 83.47, "elapsed_time": "5:01:36", "remaining_time": "0:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3203, "total_steps": 3836, "loss": 0.1586, "learning_rate": 3.6312419307237277e-07, "epoch": 0.8348483367543088, "percentage": 83.5, "elapsed_time": "5:01:42", "remaining_time": "0:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3204, "total_steps": 3836, "loss": 0.1333, "learning_rate": 3.62006292002893e-07, "epoch": 0.835108982504154, "percentage": 83.52, "elapsed_time": "5:01:48", "remaining_time": "0:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3205, "total_steps": 3836, "loss": 0.1269, "learning_rate": 3.6088998002674266e-07, "epoch": 0.8353696282539993, "percentage": 83.55, "elapsed_time": "5:01:53", "remaining_time": "0:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3206, "total_steps": 3836, "loss": 0.1387, "learning_rate": 3.597752579736363e-07, "epoch": 0.8356302740038445, "percentage": 83.58, "elapsed_time": "5:01:59", "remaining_time": "0:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3207, "total_steps": 3836, "loss": 0.1363, "learning_rate": 3.5866212667210576e-07, "epoch": 0.8358909197536898, "percentage": 83.6, "elapsed_time": "5:02:05", "remaining_time": "0:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3208, "total_steps": 3836, "loss": 0.1432, "learning_rate": 3.57550586949503e-07, "epoch": 0.836151565503535, "percentage": 83.63, "elapsed_time": "5:02:11", "remaining_time": "0:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3209, "total_steps": 3836, "loss": 0.1217, "learning_rate": 3.564406396319936e-07, "epoch": 0.8364122112533803, "percentage": 83.65, "elapsed_time": "5:02:16", "remaining_time": "0:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3210, "total_steps": 3836, "loss": 0.1409, "learning_rate": 3.5533228554456095e-07, "epoch": 0.8366728570032255, "percentage": 83.68, "elapsed_time": "5:02:21", "remaining_time": "0:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3211, "total_steps": 3836, "loss": 0.1493, "learning_rate": 3.5422552551100607e-07, "epoch": 0.8369335027530708, "percentage": 83.71, "elapsed_time": "5:02:27", "remaining_time": "0:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3212, "total_steps": 3836, "loss": 0.1444, "learning_rate": 3.5312036035394263e-07, "epoch": 0.837194148502916, "percentage": 83.73, "elapsed_time": "5:02:33", "remaining_time": "0:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3213, "total_steps": 3836, "loss": 0.1466, "learning_rate": 3.520167908948002e-07, "epoch": 0.8374547942527613, "percentage": 83.76, "elapsed_time": "5:02:39", "remaining_time": "0:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3214, "total_steps": 3836, "loss": 0.1274, "learning_rate": 3.5091481795382216e-07, "epoch": 0.8377154400026064, "percentage": 83.79, "elapsed_time": "5:02:45", "remaining_time": "0:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3215, "total_steps": 3836, "loss": 0.136, "learning_rate": 3.4981444235006464e-07, "epoch": 0.8379760857524517, "percentage": 83.81, "elapsed_time": "5:02:50", "remaining_time": "0:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3216, "total_steps": 3836, "loss": 0.1228, "learning_rate": 3.487156649013973e-07, "epoch": 0.8382367315022969, "percentage": 83.84, "elapsed_time": "5:02:56", "remaining_time": "0:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3217, "total_steps": 3836, "loss": 0.1233, "learning_rate": 3.476184864245011e-07, "epoch": 0.8384973772521421, "percentage": 83.86, "elapsed_time": "5:03:02", "remaining_time": "0:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3218, "total_steps": 3836, "loss": 0.1386, "learning_rate": 3.4652290773487003e-07, "epoch": 0.8387580230019874, "percentage": 83.89, "elapsed_time": "5:03:07", "remaining_time": "0:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3219, "total_steps": 3836, "loss": 0.1347, "learning_rate": 3.4542892964680804e-07, "epoch": 0.8390186687518326, "percentage": 83.92, "elapsed_time": "5:03:13", "remaining_time": "0:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3220, "total_steps": 3836, "loss": 0.1287, "learning_rate": 3.44336552973428e-07, "epoch": 0.8392793145016779, "percentage": 83.94, "elapsed_time": "5:03:19", "remaining_time": "0:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3221, "total_steps": 3836, "loss": 0.1391, "learning_rate": 3.432457785266552e-07, "epoch": 0.8395399602515231, "percentage": 83.97, "elapsed_time": "5:03:24", "remaining_time": "0:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3222, "total_steps": 3836, "loss": 0.1409, "learning_rate": 3.4215660711722276e-07, "epoch": 0.8398006060013684, "percentage": 83.99, "elapsed_time": "5:03:30", "remaining_time": "0:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3223, "total_steps": 3836, "loss": 0.1241, "learning_rate": 3.410690395546717e-07, "epoch": 0.8400612517512136, "percentage": 84.02, "elapsed_time": "5:03:35", "remaining_time": "0:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3224, "total_steps": 3836, "loss": 0.1319, "learning_rate": 3.399830766473525e-07, "epoch": 0.8403218975010589, "percentage": 84.05, "elapsed_time": "5:03:41", "remaining_time": "0:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3225, "total_steps": 3836, "loss": 0.1345, "learning_rate": 3.3889871920242235e-07, "epoch": 0.8405825432509041, "percentage": 84.07, "elapsed_time": "5:03:46", "remaining_time": "0:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3226, "total_steps": 3836, "loss": 0.1543, "learning_rate": 3.378159680258428e-07, "epoch": 0.8408431890007494, "percentage": 84.1, "elapsed_time": "5:03:52", "remaining_time": "0:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3227, "total_steps": 3836, "loss": 0.1277, "learning_rate": 3.3673482392238584e-07, "epoch": 0.8411038347505946, "percentage": 84.12, "elapsed_time": "5:03:58", "remaining_time": "0:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3228, "total_steps": 3836, "loss": 0.1272, "learning_rate": 3.356552876956257e-07, "epoch": 0.8413644805004399, "percentage": 84.15, "elapsed_time": "5:04:04", "remaining_time": "0:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3229, "total_steps": 3836, "loss": 0.1447, "learning_rate": 3.345773601479427e-07, "epoch": 0.8416251262502851, "percentage": 84.18, "elapsed_time": "5:04:10", "remaining_time": "0:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3230, "total_steps": 3836, "loss": 0.1597, "learning_rate": 3.3350104208052153e-07, "epoch": 0.8418857720001304, "percentage": 84.2, "elapsed_time": "5:04:15", "remaining_time": "0:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3231, "total_steps": 3836, "loss": 0.1241, "learning_rate": 3.3242633429335034e-07, "epoch": 0.8421464177499756, "percentage": 84.23, "elapsed_time": "5:04:21", "remaining_time": "0:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3232, "total_steps": 3836, "loss": 0.1347, "learning_rate": 3.3135323758522047e-07, "epoch": 0.8424070634998208, "percentage": 84.25, "elapsed_time": "5:04:26", "remaining_time": "0:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3233, "total_steps": 3836, "loss": 0.1373, "learning_rate": 3.302817527537255e-07, "epoch": 0.842667709249666, "percentage": 84.28, "elapsed_time": "5:04:31", "remaining_time": "0:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3234, "total_steps": 3836, "loss": 0.1413, "learning_rate": 3.292118805952621e-07, "epoch": 0.8429283549995112, "percentage": 84.31, "elapsed_time": "5:04:37", "remaining_time": "0:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3235, "total_steps": 3836, "loss": 0.1298, "learning_rate": 3.281436219050274e-07, "epoch": 0.8431890007493565, "percentage": 84.33, "elapsed_time": "5:04:41", "remaining_time": "0:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3236, "total_steps": 3836, "loss": 0.1275, "learning_rate": 3.2707697747701913e-07, "epoch": 0.8434496464992017, "percentage": 84.36, "elapsed_time": "5:04:46", "remaining_time": "0:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3237, "total_steps": 3836, "loss": 0.1393, "learning_rate": 3.260119481040355e-07, "epoch": 0.843710292249047, "percentage": 84.38, "elapsed_time": "5:04:51", "remaining_time": "0:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3238, "total_steps": 3836, "loss": 0.1321, "learning_rate": 3.249485345776743e-07, "epoch": 0.8439709379988922, "percentage": 84.41, "elapsed_time": "5:04:57", "remaining_time": "0:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3239, "total_steps": 3836, "loss": 0.1269, "learning_rate": 3.2388673768833226e-07, "epoch": 0.8442315837487375, "percentage": 84.44, "elapsed_time": "5:05:03", "remaining_time": "0:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3240, "total_steps": 3836, "loss": 0.1377, "learning_rate": 3.228265582252041e-07, "epoch": 0.8444922294985827, "percentage": 84.46, "elapsed_time": "5:05:09", "remaining_time": "0:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3241, "total_steps": 3836, "loss": 0.1354, "learning_rate": 3.2176799697628434e-07, "epoch": 0.844752875248428, "percentage": 84.49, "elapsed_time": "5:05:14", "remaining_time": "0:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3242, "total_steps": 3836, "loss": 0.1432, "learning_rate": 3.2071105472836207e-07, "epoch": 0.8450135209982732, "percentage": 84.52, "elapsed_time": "5:05:19", "remaining_time": "0:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3243, "total_steps": 3836, "loss": 0.1416, "learning_rate": 3.196557322670235e-07, "epoch": 0.8452741667481185, "percentage": 84.54, "elapsed_time": "5:05:25", "remaining_time": "0:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3244, "total_steps": 3836, "loss": 0.1376, "learning_rate": 3.186020303766532e-07, "epoch": 0.8455348124979637, "percentage": 84.57, "elapsed_time": "5:05:31", "remaining_time": "0:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3245, "total_steps": 3836, "loss": 0.1372, "learning_rate": 3.175499498404291e-07, "epoch": 0.845795458247809, "percentage": 84.59, "elapsed_time": "5:05:37", "remaining_time": "0:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3246, "total_steps": 3836, "loss": 0.1376, "learning_rate": 3.164994914403241e-07, "epoch": 0.8460561039976542, "percentage": 84.62, "elapsed_time": "5:05:43", "remaining_time": "0:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3247, "total_steps": 3836, "loss": 0.1487, "learning_rate": 3.154506559571066e-07, "epoch": 0.8463167497474994, "percentage": 84.65, "elapsed_time": "5:05:48", "remaining_time": "0:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3248, "total_steps": 3836, "loss": 0.1416, "learning_rate": 3.1440344417033754e-07, "epoch": 0.8465773954973447, "percentage": 84.67, "elapsed_time": "5:05:53", "remaining_time": "0:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3249, "total_steps": 3836, "loss": 0.1392, "learning_rate": 3.1335785685837117e-07, "epoch": 0.8468380412471899, "percentage": 84.7, "elapsed_time": "5:05:59", "remaining_time": "0:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 3836, "loss": 0.1302, "learning_rate": 3.123138947983556e-07, "epoch": 0.8470986869970352, "percentage": 84.72, "elapsed_time": "5:06:04", "remaining_time": "0:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3251, "total_steps": 3836, "loss": 0.1453, "learning_rate": 3.1127155876622986e-07, "epoch": 0.8473593327468804, "percentage": 84.75, "elapsed_time": "5:06:11", "remaining_time": "0:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3252, "total_steps": 3836, "loss": 0.1306, "learning_rate": 3.102308495367243e-07, "epoch": 0.8476199784967257, "percentage": 84.78, "elapsed_time": "5:06:16", "remaining_time": "0:55:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3253, "total_steps": 3836, "loss": 0.1296, "learning_rate": 3.091917678833603e-07, "epoch": 0.8478806242465708, "percentage": 84.8, "elapsed_time": "5:06:21", "remaining_time": "0:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3254, "total_steps": 3836, "loss": 0.1391, "learning_rate": 3.081543145784499e-07, "epoch": 0.8481412699964161, "percentage": 84.83, "elapsed_time": "5:06:27", "remaining_time": "0:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3255, "total_steps": 3836, "loss": 0.1301, "learning_rate": 3.071184903930946e-07, "epoch": 0.8484019157462613, "percentage": 84.85, "elapsed_time": "5:06:33", "remaining_time": "0:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3256, "total_steps": 3836, "loss": 0.1406, "learning_rate": 3.060842960971844e-07, "epoch": 0.8486625614961066, "percentage": 84.88, "elapsed_time": "5:06:38", "remaining_time": "0:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3257, "total_steps": 3836, "loss": 0.1376, "learning_rate": 3.050517324593996e-07, "epoch": 0.8489232072459518, "percentage": 84.91, "elapsed_time": "5:06:44", "remaining_time": "0:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3258, "total_steps": 3836, "loss": 0.1458, "learning_rate": 3.0402080024720724e-07, "epoch": 0.8491838529957971, "percentage": 84.93, "elapsed_time": "5:06:49", "remaining_time": "0:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3259, "total_steps": 3836, "loss": 0.1325, "learning_rate": 3.029915002268605e-07, "epoch": 0.8494444987456423, "percentage": 84.96, "elapsed_time": "5:06:54", "remaining_time": "0:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3260, "total_steps": 3836, "loss": 0.1367, "learning_rate": 3.0196383316340226e-07, "epoch": 0.8497051444954876, "percentage": 84.98, "elapsed_time": "5:07:00", "remaining_time": "0:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3261, "total_steps": 3836, "loss": 0.1206, "learning_rate": 3.0093779982065973e-07, "epoch": 0.8499657902453328, "percentage": 85.01, "elapsed_time": "5:07:05", "remaining_time": "0:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3262, "total_steps": 3836, "loss": 0.1303, "learning_rate": 2.9991340096124644e-07, "epoch": 0.850226435995178, "percentage": 85.04, "elapsed_time": "5:07:11", "remaining_time": "0:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3263, "total_steps": 3836, "loss": 0.137, "learning_rate": 2.988906373465608e-07, "epoch": 0.8504870817450233, "percentage": 85.06, "elapsed_time": "5:07:16", "remaining_time": "0:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3264, "total_steps": 3836, "loss": 0.1423, "learning_rate": 2.978695097367862e-07, "epoch": 0.8507477274948685, "percentage": 85.09, "elapsed_time": "5:07:22", "remaining_time": "0:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3265, "total_steps": 3836, "loss": 0.1372, "learning_rate": 2.968500188908899e-07, "epoch": 0.8510083732447138, "percentage": 85.11, "elapsed_time": "5:07:27", "remaining_time": "0:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3266, "total_steps": 3836, "loss": 0.133, "learning_rate": 2.958321655666219e-07, "epoch": 0.851269018994559, "percentage": 85.14, "elapsed_time": "5:07:33", "remaining_time": "0:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3267, "total_steps": 3836, "loss": 0.1293, "learning_rate": 2.948159505205164e-07, "epoch": 0.8515296647444043, "percentage": 85.17, "elapsed_time": "5:07:38", "remaining_time": "0:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3268, "total_steps": 3836, "loss": 0.1282, "learning_rate": 2.938013745078899e-07, "epoch": 0.8517903104942495, "percentage": 85.19, "elapsed_time": "5:07:44", "remaining_time": "0:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3269, "total_steps": 3836, "loss": 0.1403, "learning_rate": 2.9278843828283803e-07, "epoch": 0.8520509562440948, "percentage": 85.22, "elapsed_time": "5:07:50", "remaining_time": "0:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3270, "total_steps": 3836, "loss": 0.127, "learning_rate": 2.917771425982413e-07, "epoch": 0.85231160199394, "percentage": 85.25, "elapsed_time": "5:07:55", "remaining_time": "0:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3271, "total_steps": 3836, "loss": 0.129, "learning_rate": 2.9076748820575875e-07, "epoch": 0.8525722477437853, "percentage": 85.27, "elapsed_time": "5:08:01", "remaining_time": "0:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3272, "total_steps": 3836, "loss": 0.1378, "learning_rate": 2.897594758558298e-07, "epoch": 0.8528328934936305, "percentage": 85.3, "elapsed_time": "5:08:06", "remaining_time": "0:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3273, "total_steps": 3836, "loss": 0.1357, "learning_rate": 2.8875310629767314e-07, "epoch": 0.8530935392434758, "percentage": 85.32, "elapsed_time": "5:08:11", "remaining_time": "0:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3274, "total_steps": 3836, "loss": 0.1287, "learning_rate": 2.8774838027928854e-07, "epoch": 0.8533541849933209, "percentage": 85.35, "elapsed_time": "5:08:17", "remaining_time": "0:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3275, "total_steps": 3836, "loss": 0.1349, "learning_rate": 2.867452985474503e-07, "epoch": 0.8536148307431662, "percentage": 85.38, "elapsed_time": "5:08:22", "remaining_time": "0:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3276, "total_steps": 3836, "loss": 0.135, "learning_rate": 2.857438618477135e-07, "epoch": 0.8538754764930114, "percentage": 85.4, "elapsed_time": "5:08:28", "remaining_time": "0:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3277, "total_steps": 3836, "loss": 0.1395, "learning_rate": 2.8474407092441035e-07, "epoch": 0.8541361222428567, "percentage": 85.43, "elapsed_time": "5:08:34", "remaining_time": "0:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3278, "total_steps": 3836, "loss": 0.13, "learning_rate": 2.837459265206491e-07, "epoch": 0.8543967679927019, "percentage": 85.45, "elapsed_time": "5:08:39", "remaining_time": "0:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3279, "total_steps": 3836, "loss": 0.1366, "learning_rate": 2.8274942937831393e-07, "epoch": 0.8546574137425471, "percentage": 85.48, "elapsed_time": "5:08:45", "remaining_time": "0:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3280, "total_steps": 3836, "loss": 0.1303, "learning_rate": 2.817545802380653e-07, "epoch": 0.8549180594923924, "percentage": 85.51, "elapsed_time": "5:08:50", "remaining_time": "0:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3281, "total_steps": 3836, "loss": 0.137, "learning_rate": 2.8076137983933856e-07, "epoch": 0.8551787052422376, "percentage": 85.53, "elapsed_time": "5:08:56", "remaining_time": "0:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3282, "total_steps": 3836, "loss": 0.1231, "learning_rate": 2.797698289203432e-07, "epoch": 0.8554393509920829, "percentage": 85.56, "elapsed_time": "5:09:02", "remaining_time": "0:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3283, "total_steps": 3836, "loss": 0.132, "learning_rate": 2.7877992821806394e-07, "epoch": 0.8556999967419281, "percentage": 85.58, "elapsed_time": "5:09:08", "remaining_time": "0:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3284, "total_steps": 3836, "loss": 0.1397, "learning_rate": 2.7779167846825797e-07, "epoch": 0.8559606424917734, "percentage": 85.61, "elapsed_time": "5:09:13", "remaining_time": "0:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3285, "total_steps": 3836, "loss": 0.1368, "learning_rate": 2.768050804054551e-07, "epoch": 0.8562212882416186, "percentage": 85.64, "elapsed_time": "5:09:19", "remaining_time": "0:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3286, "total_steps": 3836, "loss": 0.1379, "learning_rate": 2.7582013476295826e-07, "epoch": 0.8564819339914639, "percentage": 85.66, "elapsed_time": "5:09:25", "remaining_time": "0:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3287, "total_steps": 3836, "loss": 0.1414, "learning_rate": 2.7483684227284204e-07, "epoch": 0.8567425797413091, "percentage": 85.69, "elapsed_time": "5:09:30", "remaining_time": "0:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3288, "total_steps": 3836, "loss": 0.1276, "learning_rate": 2.738552036659517e-07, "epoch": 0.8570032254911544, "percentage": 85.71, "elapsed_time": "5:09:37", "remaining_time": "0:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3289, "total_steps": 3836, "loss": 0.1392, "learning_rate": 2.728752196719034e-07, "epoch": 0.8572638712409996, "percentage": 85.74, "elapsed_time": "5:09:42", "remaining_time": "0:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3290, "total_steps": 3836, "loss": 0.1334, "learning_rate": 2.718968910190853e-07, "epoch": 0.8575245169908449, "percentage": 85.77, "elapsed_time": "5:09:49", "remaining_time": "0:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3291, "total_steps": 3836, "loss": 0.1538, "learning_rate": 2.709202184346524e-07, "epoch": 0.85778516274069, "percentage": 85.79, "elapsed_time": "5:09:54", "remaining_time": "0:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3292, "total_steps": 3836, "loss": 0.1278, "learning_rate": 2.6994520264452957e-07, "epoch": 0.8580458084905354, "percentage": 85.82, "elapsed_time": "5:10:00", "remaining_time": "0:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3293, "total_steps": 3836, "loss": 0.1421, "learning_rate": 2.689718443734121e-07, "epoch": 0.8583064542403805, "percentage": 85.84, "elapsed_time": "5:10:06", "remaining_time": "0:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3294, "total_steps": 3836, "loss": 0.1333, "learning_rate": 2.6800014434476137e-07, "epoch": 0.8585670999902257, "percentage": 85.87, "elapsed_time": "5:10:11", "remaining_time": "0:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3295, "total_steps": 3836, "loss": 0.1466, "learning_rate": 2.6703010328080675e-07, "epoch": 0.858827745740071, "percentage": 85.9, "elapsed_time": "5:10:16", "remaining_time": "0:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3296, "total_steps": 3836, "loss": 0.1348, "learning_rate": 2.6606172190254467e-07, "epoch": 0.8590883914899162, "percentage": 85.92, "elapsed_time": "5:10:22", "remaining_time": "0:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3297, "total_steps": 3836, "loss": 0.1322, "learning_rate": 2.650950009297382e-07, "epoch": 0.8593490372397615, "percentage": 85.95, "elapsed_time": "5:10:27", "remaining_time": "0:50:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3298, "total_steps": 3836, "loss": 0.1413, "learning_rate": 2.6412994108091586e-07, "epoch": 0.8596096829896067, "percentage": 85.97, "elapsed_time": "5:10:33", "remaining_time": "0:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3299, "total_steps": 3836, "loss": 0.1403, "learning_rate": 2.6316654307337126e-07, "epoch": 0.859870328739452, "percentage": 86.0, "elapsed_time": "5:10:38", "remaining_time": "0:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 3836, "loss": 0.14, "learning_rate": 2.6220480762316396e-07, "epoch": 0.8601309744892972, "percentage": 86.03, "elapsed_time": "5:10:44", "remaining_time": "0:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3301, "total_steps": 3836, "loss": 0.1377, "learning_rate": 2.612447354451175e-07, "epoch": 0.8603916202391425, "percentage": 86.05, "elapsed_time": "5:10:49", "remaining_time": "0:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3302, "total_steps": 3836, "loss": 0.1345, "learning_rate": 2.6028632725281723e-07, "epoch": 0.8606522659889877, "percentage": 86.08, "elapsed_time": "5:10:55", "remaining_time": "0:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3303, "total_steps": 3836, "loss": 0.1296, "learning_rate": 2.593295837586146e-07, "epoch": 0.860912911738833, "percentage": 86.11, "elapsed_time": "5:11:01", "remaining_time": "0:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3304, "total_steps": 3836, "loss": 0.1403, "learning_rate": 2.58374505673622e-07, "epoch": 0.8611735574886782, "percentage": 86.13, "elapsed_time": "5:11:06", "remaining_time": "0:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3305, "total_steps": 3836, "loss": 0.1377, "learning_rate": 2.5742109370771427e-07, "epoch": 0.8614342032385235, "percentage": 86.16, "elapsed_time": "5:11:12", "remaining_time": "0:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3306, "total_steps": 3836, "loss": 0.1217, "learning_rate": 2.56469348569528e-07, "epoch": 0.8616948489883687, "percentage": 86.18, "elapsed_time": "5:11:18", "remaining_time": "0:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3307, "total_steps": 3836, "loss": 0.1378, "learning_rate": 2.555192709664617e-07, "epoch": 0.861955494738214, "percentage": 86.21, "elapsed_time": "5:11:23", "remaining_time": "0:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3308, "total_steps": 3836, "loss": 0.1472, "learning_rate": 2.5457086160467187e-07, "epoch": 0.8622161404880592, "percentage": 86.24, "elapsed_time": "5:11:28", "remaining_time": "0:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3309, "total_steps": 3836, "loss": 0.143, "learning_rate": 2.5362412118907886e-07, "epoch": 0.8624767862379044, "percentage": 86.26, "elapsed_time": "5:11:34", "remaining_time": "0:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3310, "total_steps": 3836, "loss": 0.1472, "learning_rate": 2.526790504233592e-07, "epoch": 0.8627374319877497, "percentage": 86.29, "elapsed_time": "5:11:40", "remaining_time": "0:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3311, "total_steps": 3836, "loss": 0.1336, "learning_rate": 2.5173565000995047e-07, "epoch": 0.8629980777375948, "percentage": 86.31, "elapsed_time": "5:11:45", "remaining_time": "0:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3312, "total_steps": 3836, "loss": 0.1431, "learning_rate": 2.507939206500479e-07, "epoch": 0.8632587234874401, "percentage": 86.34, "elapsed_time": "5:11:50", "remaining_time": "0:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3313, "total_steps": 3836, "loss": 0.1362, "learning_rate": 2.498538630436048e-07, "epoch": 0.8635193692372853, "percentage": 86.37, "elapsed_time": "5:11:56", "remaining_time": "0:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3314, "total_steps": 3836, "loss": 0.1424, "learning_rate": 2.4891547788933185e-07, "epoch": 0.8637800149871306, "percentage": 86.39, "elapsed_time": "5:12:01", "remaining_time": "0:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3315, "total_steps": 3836, "loss": 0.1433, "learning_rate": 2.479787658846963e-07, "epoch": 0.8640406607369758, "percentage": 86.42, "elapsed_time": "5:12:06", "remaining_time": "0:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3316, "total_steps": 3836, "loss": 0.1376, "learning_rate": 2.4704372772592326e-07, "epoch": 0.8643013064868211, "percentage": 86.44, "elapsed_time": "5:12:12", "remaining_time": "0:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3317, "total_steps": 3836, "loss": 0.1388, "learning_rate": 2.4611036410799233e-07, "epoch": 0.8645619522366663, "percentage": 86.47, "elapsed_time": "5:12:18", "remaining_time": "0:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3318, "total_steps": 3836, "loss": 0.1363, "learning_rate": 2.4517867572463884e-07, "epoch": 0.8648225979865116, "percentage": 86.5, "elapsed_time": "5:12:24", "remaining_time": "0:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3319, "total_steps": 3836, "loss": 0.1279, "learning_rate": 2.44248663268353e-07, "epoch": 0.8650832437363568, "percentage": 86.52, "elapsed_time": "5:12:30", "remaining_time": "0:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3320, "total_steps": 3836, "loss": 0.1262, "learning_rate": 2.433203274303794e-07, "epoch": 0.8653438894862021, "percentage": 86.55, "elapsed_time": "5:12:35", "remaining_time": "0:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3321, "total_steps": 3836, "loss": 0.1375, "learning_rate": 2.423936689007167e-07, "epoch": 0.8656045352360473, "percentage": 86.57, "elapsed_time": "5:12:40", "remaining_time": "0:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3322, "total_steps": 3836, "loss": 0.1415, "learning_rate": 2.414686883681158e-07, "epoch": 0.8658651809858926, "percentage": 86.6, "elapsed_time": "5:12:46", "remaining_time": "0:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3323, "total_steps": 3836, "loss": 0.1417, "learning_rate": 2.4054538652008295e-07, "epoch": 0.8661258267357378, "percentage": 86.63, "elapsed_time": "5:12:51", "remaining_time": "0:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3324, "total_steps": 3836, "loss": 0.1447, "learning_rate": 2.3962376404287365e-07, "epoch": 0.866386472485583, "percentage": 86.65, "elapsed_time": "5:12:57", "remaining_time": "0:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3325, "total_steps": 3836, "loss": 0.1455, "learning_rate": 2.3870382162149627e-07, "epoch": 0.8666471182354283, "percentage": 86.68, "elapsed_time": "5:13:03", "remaining_time": "0:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3326, "total_steps": 3836, "loss": 0.1366, "learning_rate": 2.3778555993971164e-07, "epoch": 0.8669077639852735, "percentage": 86.7, "elapsed_time": "5:13:09", "remaining_time": "0:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3327, "total_steps": 3836, "loss": 0.1303, "learning_rate": 2.3686897968002998e-07, "epoch": 0.8671684097351188, "percentage": 86.73, "elapsed_time": "5:13:14", "remaining_time": "0:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3328, "total_steps": 3836, "loss": 0.1399, "learning_rate": 2.359540815237124e-07, "epoch": 0.867429055484964, "percentage": 86.76, "elapsed_time": "5:13:20", "remaining_time": "0:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3329, "total_steps": 3836, "loss": 0.1471, "learning_rate": 2.350408661507697e-07, "epoch": 0.8676897012348093, "percentage": 86.78, "elapsed_time": "5:13:26", "remaining_time": "0:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3330, "total_steps": 3836, "loss": 0.129, "learning_rate": 2.3412933423996114e-07, "epoch": 0.8679503469846545, "percentage": 86.81, "elapsed_time": "5:13:31", "remaining_time": "0:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3331, "total_steps": 3836, "loss": 0.1391, "learning_rate": 2.3321948646879616e-07, "epoch": 0.8682109927344998, "percentage": 86.84, "elapsed_time": "5:13:37", "remaining_time": "0:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3332, "total_steps": 3836, "loss": 0.1449, "learning_rate": 2.3231132351353075e-07, "epoch": 0.8684716384843449, "percentage": 86.86, "elapsed_time": "5:13:42", "remaining_time": "0:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3333, "total_steps": 3836, "loss": 0.1526, "learning_rate": 2.314048460491708e-07, "epoch": 0.8687322842341902, "percentage": 86.89, "elapsed_time": "5:13:47", "remaining_time": "0:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3334, "total_steps": 3836, "loss": 0.1314, "learning_rate": 2.305000547494679e-07, "epoch": 0.8689929299840354, "percentage": 86.91, "elapsed_time": "5:13:53", "remaining_time": "0:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3335, "total_steps": 3836, "loss": 0.1286, "learning_rate": 2.295969502869194e-07, "epoch": 0.8692535757338807, "percentage": 86.94, "elapsed_time": "5:13:58", "remaining_time": "0:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3336, "total_steps": 3836, "loss": 0.1271, "learning_rate": 2.2869553333277145e-07, "epoch": 0.8695142214837259, "percentage": 86.97, "elapsed_time": "5:14:04", "remaining_time": "0:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3337, "total_steps": 3836, "loss": 0.1322, "learning_rate": 2.2779580455701444e-07, "epoch": 0.8697748672335712, "percentage": 86.99, "elapsed_time": "5:14:10", "remaining_time": "0:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3338, "total_steps": 3836, "loss": 0.1307, "learning_rate": 2.2689776462838348e-07, "epoch": 0.8700355129834164, "percentage": 87.02, "elapsed_time": "5:14:15", "remaining_time": "0:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3339, "total_steps": 3836, "loss": 0.1268, "learning_rate": 2.2600141421436017e-07, "epoch": 0.8702961587332616, "percentage": 87.04, "elapsed_time": "5:14:20", "remaining_time": "0:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3340, "total_steps": 3836, "loss": 0.1381, "learning_rate": 2.251067539811691e-07, "epoch": 0.8705568044831069, "percentage": 87.07, "elapsed_time": "5:14:25", "remaining_time": "0:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3341, "total_steps": 3836, "loss": 0.1375, "learning_rate": 2.242137845937778e-07, "epoch": 0.8708174502329521, "percentage": 87.1, "elapsed_time": "5:14:30", "remaining_time": "0:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3342, "total_steps": 3836, "loss": 0.134, "learning_rate": 2.233225067158995e-07, "epoch": 0.8710780959827974, "percentage": 87.12, "elapsed_time": "5:14:36", "remaining_time": "0:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3343, "total_steps": 3836, "loss": 0.1372, "learning_rate": 2.2243292100998792e-07, "epoch": 0.8713387417326426, "percentage": 87.15, "elapsed_time": "5:14:41", "remaining_time": "0:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3344, "total_steps": 3836, "loss": 0.1309, "learning_rate": 2.2154502813724026e-07, "epoch": 0.8715993874824879, "percentage": 87.17, "elapsed_time": "5:14:46", "remaining_time": "0:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3345, "total_steps": 3836, "loss": 0.1313, "learning_rate": 2.2065882875759532e-07, "epoch": 0.8718600332323331, "percentage": 87.2, "elapsed_time": "5:14:51", "remaining_time": "0:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3346, "total_steps": 3836, "loss": 0.1383, "learning_rate": 2.1977432352973226e-07, "epoch": 0.8721206789821784, "percentage": 87.23, "elapsed_time": "5:14:56", "remaining_time": "0:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3347, "total_steps": 3836, "loss": 0.1398, "learning_rate": 2.188915131110725e-07, "epoch": 0.8723813247320236, "percentage": 87.25, "elapsed_time": "5:15:02", "remaining_time": "0:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3348, "total_steps": 3836, "loss": 0.1368, "learning_rate": 2.1801039815777637e-07, "epoch": 0.8726419704818689, "percentage": 87.28, "elapsed_time": "5:15:07", "remaining_time": "0:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3349, "total_steps": 3836, "loss": 0.1281, "learning_rate": 2.1713097932474586e-07, "epoch": 0.8729026162317141, "percentage": 87.3, "elapsed_time": "5:15:13", "remaining_time": "0:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 3836, "loss": 0.1311, "learning_rate": 2.1625325726562009e-07, "epoch": 0.8731632619815594, "percentage": 87.33, "elapsed_time": "5:15:18", "remaining_time": "0:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3351, "total_steps": 3836, "loss": 0.1381, "learning_rate": 2.1537723263277883e-07, "epoch": 0.8734239077314045, "percentage": 87.36, "elapsed_time": "5:15:24", "remaining_time": "0:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3352, "total_steps": 3836, "loss": 0.1421, "learning_rate": 2.1450290607733903e-07, "epoch": 0.8736845534812498, "percentage": 87.38, "elapsed_time": "5:15:30", "remaining_time": "0:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3353, "total_steps": 3836, "loss": 0.1365, "learning_rate": 2.136302782491559e-07, "epoch": 0.873945199231095, "percentage": 87.41, "elapsed_time": "5:15:36", "remaining_time": "0:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3354, "total_steps": 3836, "loss": 0.1226, "learning_rate": 2.127593497968225e-07, "epoch": 0.8742058449809402, "percentage": 87.43, "elapsed_time": "5:15:41", "remaining_time": "0:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3355, "total_steps": 3836, "loss": 0.1408, "learning_rate": 2.1189012136766774e-07, "epoch": 0.8744664907307855, "percentage": 87.46, "elapsed_time": "5:15:46", "remaining_time": "0:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3356, "total_steps": 3836, "loss": 0.1341, "learning_rate": 2.1102259360775895e-07, "epoch": 0.8747271364806307, "percentage": 87.49, "elapsed_time": "5:15:52", "remaining_time": "0:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3357, "total_steps": 3836, "loss": 0.1342, "learning_rate": 2.1015676716189703e-07, "epoch": 0.874987782230476, "percentage": 87.51, "elapsed_time": "5:15:58", "remaining_time": "0:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3358, "total_steps": 3836, "loss": 0.1373, "learning_rate": 2.0929264267361888e-07, "epoch": 0.8752484279803212, "percentage": 87.54, "elapsed_time": "5:16:03", "remaining_time": "0:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3359, "total_steps": 3836, "loss": 0.1374, "learning_rate": 2.0843022078519848e-07, "epoch": 0.8755090737301665, "percentage": 87.57, "elapsed_time": "5:16:08", "remaining_time": "0:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3360, "total_steps": 3836, "loss": 0.1408, "learning_rate": 2.07569502137642e-07, "epoch": 0.8757697194800117, "percentage": 87.59, "elapsed_time": "5:16:14", "remaining_time": "0:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3361, "total_steps": 3836, "loss": 0.1196, "learning_rate": 2.067104873706907e-07, "epoch": 0.876030365229857, "percentage": 87.62, "elapsed_time": "5:16:19", "remaining_time": "0:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3362, "total_steps": 3836, "loss": 0.1407, "learning_rate": 2.0585317712281866e-07, "epoch": 0.8762910109797022, "percentage": 87.64, "elapsed_time": "5:16:25", "remaining_time": "0:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3363, "total_steps": 3836, "loss": 0.1308, "learning_rate": 2.0499757203123416e-07, "epoch": 0.8765516567295475, "percentage": 87.67, "elapsed_time": "5:16:31", "remaining_time": "0:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3364, "total_steps": 3836, "loss": 0.1317, "learning_rate": 2.0414367273187713e-07, "epoch": 0.8768123024793927, "percentage": 87.7, "elapsed_time": "5:16:36", "remaining_time": "0:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3365, "total_steps": 3836, "loss": 0.1283, "learning_rate": 2.032914798594196e-07, "epoch": 0.877072948229238, "percentage": 87.72, "elapsed_time": "5:16:41", "remaining_time": "0:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3366, "total_steps": 3836, "loss": 0.1375, "learning_rate": 2.0244099404726686e-07, "epoch": 0.8773335939790832, "percentage": 87.75, "elapsed_time": "5:16:47", "remaining_time": "0:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3367, "total_steps": 3836, "loss": 0.1498, "learning_rate": 2.015922159275538e-07, "epoch": 0.8775942397289285, "percentage": 87.77, "elapsed_time": "5:16:52", "remaining_time": "0:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3368, "total_steps": 3836, "loss": 0.1326, "learning_rate": 2.007451461311455e-07, "epoch": 0.8778548854787737, "percentage": 87.8, "elapsed_time": "5:16:57", "remaining_time": "0:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3369, "total_steps": 3836, "loss": 0.1328, "learning_rate": 1.9989978528763915e-07, "epoch": 0.8781155312286189, "percentage": 87.83, "elapsed_time": "5:17:02", "remaining_time": "0:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3370, "total_steps": 3836, "loss": 0.1369, "learning_rate": 1.990561340253608e-07, "epoch": 0.8783761769784642, "percentage": 87.85, "elapsed_time": "5:17:08", "remaining_time": "0:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3371, "total_steps": 3836, "loss": 0.1186, "learning_rate": 1.9821419297136546e-07, "epoch": 0.8786368227283093, "percentage": 87.88, "elapsed_time": "5:17:14", "remaining_time": "0:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3372, "total_steps": 3836, "loss": 0.1357, "learning_rate": 1.9737396275143816e-07, "epoch": 0.8788974684781546, "percentage": 87.9, "elapsed_time": "5:17:20", "remaining_time": "0:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3373, "total_steps": 3836, "loss": 0.1451, "learning_rate": 1.9653544399009183e-07, "epoch": 0.8791581142279998, "percentage": 87.93, "elapsed_time": "5:17:25", "remaining_time": "0:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3374, "total_steps": 3836, "loss": 0.1409, "learning_rate": 1.9569863731056544e-07, "epoch": 0.8794187599778451, "percentage": 87.96, "elapsed_time": "5:17:31", "remaining_time": "0:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3375, "total_steps": 3836, "loss": 0.1401, "learning_rate": 1.9486354333482866e-07, "epoch": 0.8796794057276903, "percentage": 87.98, "elapsed_time": "5:17:36", "remaining_time": "0:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3376, "total_steps": 3836, "loss": 0.1357, "learning_rate": 1.940301626835761e-07, "epoch": 0.8799400514775356, "percentage": 88.01, "elapsed_time": "5:17:41", "remaining_time": "0:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3377, "total_steps": 3836, "loss": 0.1348, "learning_rate": 1.9319849597622954e-07, "epoch": 0.8802006972273808, "percentage": 88.03, "elapsed_time": "5:17:46", "remaining_time": "0:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3378, "total_steps": 3836, "loss": 0.1429, "learning_rate": 1.9236854383093668e-07, "epoch": 0.8804613429772261, "percentage": 88.06, "elapsed_time": "5:17:53", "remaining_time": "0:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3379, "total_steps": 3836, "loss": 0.1307, "learning_rate": 1.9154030686457077e-07, "epoch": 0.8807219887270713, "percentage": 88.09, "elapsed_time": "5:17:58", "remaining_time": "0:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3380, "total_steps": 3836, "loss": 0.1305, "learning_rate": 1.9071378569273047e-07, "epoch": 0.8809826344769166, "percentage": 88.11, "elapsed_time": "5:18:04", "remaining_time": "0:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3381, "total_steps": 3836, "loss": 0.1321, "learning_rate": 1.8988898092973885e-07, "epoch": 0.8812432802267618, "percentage": 88.14, "elapsed_time": "5:18:10", "remaining_time": "0:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3382, "total_steps": 3836, "loss": 0.1239, "learning_rate": 1.8906589318864384e-07, "epoch": 0.8815039259766071, "percentage": 88.16, "elapsed_time": "5:18:15", "remaining_time": "0:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3383, "total_steps": 3836, "loss": 0.1475, "learning_rate": 1.882445230812166e-07, "epoch": 0.8817645717264523, "percentage": 88.19, "elapsed_time": "5:18:20", "remaining_time": "0:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3384, "total_steps": 3836, "loss": 0.1281, "learning_rate": 1.8742487121795188e-07, "epoch": 0.8820252174762975, "percentage": 88.22, "elapsed_time": "5:18:25", "remaining_time": "0:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3385, "total_steps": 3836, "loss": 0.1375, "learning_rate": 1.866069382080671e-07, "epoch": 0.8822858632261428, "percentage": 88.24, "elapsed_time": "5:18:31", "remaining_time": "0:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3386, "total_steps": 3836, "loss": 0.1356, "learning_rate": 1.8579072465950197e-07, "epoch": 0.882546508975988, "percentage": 88.27, "elapsed_time": "5:18:37", "remaining_time": "0:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3387, "total_steps": 3836, "loss": 0.1437, "learning_rate": 1.849762311789191e-07, "epoch": 0.8828071547258333, "percentage": 88.3, "elapsed_time": "5:18:42", "remaining_time": "0:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3388, "total_steps": 3836, "loss": 0.134, "learning_rate": 1.8416345837170114e-07, "epoch": 0.8830678004756785, "percentage": 88.32, "elapsed_time": "5:18:47", "remaining_time": "0:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3389, "total_steps": 3836, "loss": 0.1292, "learning_rate": 1.8335240684195427e-07, "epoch": 0.8833284462255238, "percentage": 88.35, "elapsed_time": "5:18:53", "remaining_time": "0:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3390, "total_steps": 3836, "loss": 0.1296, "learning_rate": 1.8254307719250214e-07, "epoch": 0.883589091975369, "percentage": 88.37, "elapsed_time": "5:18:58", "remaining_time": "0:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3391, "total_steps": 3836, "loss": 0.1382, "learning_rate": 1.8173547002489024e-07, "epoch": 0.8838497377252142, "percentage": 88.4, "elapsed_time": "5:19:04", "remaining_time": "0:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3392, "total_steps": 3836, "loss": 0.1407, "learning_rate": 1.8092958593938476e-07, "epoch": 0.8841103834750594, "percentage": 88.43, "elapsed_time": "5:19:09", "remaining_time": "0:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3393, "total_steps": 3836, "loss": 0.1363, "learning_rate": 1.8012542553496964e-07, "epoch": 0.8843710292249047, "percentage": 88.45, "elapsed_time": "5:19:14", "remaining_time": "0:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3394, "total_steps": 3836, "loss": 0.1237, "learning_rate": 1.793229894093479e-07, "epoch": 0.8846316749747499, "percentage": 88.48, "elapsed_time": "5:19:20", "remaining_time": "0:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3395, "total_steps": 3836, "loss": 0.1235, "learning_rate": 1.7852227815894242e-07, "epoch": 0.8848923207245952, "percentage": 88.5, "elapsed_time": "5:19:26", "remaining_time": "0:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3396, "total_steps": 3836, "loss": 0.1399, "learning_rate": 1.7772329237889158e-07, "epoch": 0.8851529664744404, "percentage": 88.53, "elapsed_time": "5:19:31", "remaining_time": "0:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3397, "total_steps": 3836, "loss": 0.1345, "learning_rate": 1.769260326630526e-07, "epoch": 0.8854136122242857, "percentage": 88.56, "elapsed_time": "5:19:36", "remaining_time": "0:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3398, "total_steps": 3836, "loss": 0.1336, "learning_rate": 1.7613049960400057e-07, "epoch": 0.8856742579741309, "percentage": 88.58, "elapsed_time": "5:19:41", "remaining_time": "0:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3399, "total_steps": 3836, "loss": 0.1233, "learning_rate": 1.753366937930262e-07, "epoch": 0.8859349037239761, "percentage": 88.61, "elapsed_time": "5:19:46", "remaining_time": "0:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 3836, "loss": 0.1305, "learning_rate": 1.7454461582013665e-07, "epoch": 0.8861955494738214, "percentage": 88.63, "elapsed_time": "5:19:51", "remaining_time": "0:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3401, "total_steps": 3836, "loss": 0.1448, "learning_rate": 1.7375426627405433e-07, "epoch": 0.8864561952236666, "percentage": 88.66, "elapsed_time": "5:19:57", "remaining_time": "0:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3402, "total_steps": 3836, "loss": 0.1402, "learning_rate": 1.7296564574221796e-07, "epoch": 0.8867168409735119, "percentage": 88.69, "elapsed_time": "5:20:02", "remaining_time": "0:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3403, "total_steps": 3836, "loss": 0.1313, "learning_rate": 1.7217875481078034e-07, "epoch": 0.8869774867233571, "percentage": 88.71, "elapsed_time": "5:20:08", "remaining_time": "0:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3404, "total_steps": 3836, "loss": 0.1368, "learning_rate": 1.7139359406460888e-07, "epoch": 0.8872381324732024, "percentage": 88.74, "elapsed_time": "5:20:14", "remaining_time": "0:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3405, "total_steps": 3836, "loss": 0.1347, "learning_rate": 1.7061016408728537e-07, "epoch": 0.8874987782230476, "percentage": 88.76, "elapsed_time": "5:20:20", "remaining_time": "0:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3406, "total_steps": 3836, "loss": 0.1281, "learning_rate": 1.698284654611057e-07, "epoch": 0.8877594239728929, "percentage": 88.79, "elapsed_time": "5:20:25", "remaining_time": "0:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3407, "total_steps": 3836, "loss": 0.1444, "learning_rate": 1.6904849876707653e-07, "epoch": 0.8880200697227381, "percentage": 88.82, "elapsed_time": "5:20:30", "remaining_time": "0:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3408, "total_steps": 3836, "loss": 0.1371, "learning_rate": 1.6827026458492018e-07, "epoch": 0.8882807154725834, "percentage": 88.84, "elapsed_time": "5:20:36", "remaining_time": "0:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3409, "total_steps": 3836, "loss": 0.1373, "learning_rate": 1.6749376349306957e-07, "epoch": 0.8885413612224285, "percentage": 88.87, "elapsed_time": "5:20:41", "remaining_time": "0:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3410, "total_steps": 3836, "loss": 0.1408, "learning_rate": 1.6671899606866966e-07, "epoch": 0.8888020069722739, "percentage": 88.89, "elapsed_time": "5:20:47", "remaining_time": "0:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3411, "total_steps": 3836, "loss": 0.1266, "learning_rate": 1.6594596288757702e-07, "epoch": 0.889062652722119, "percentage": 88.92, "elapsed_time": "5:20:52", "remaining_time": "0:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3412, "total_steps": 3836, "loss": 0.1291, "learning_rate": 1.651746645243596e-07, "epoch": 0.8893232984719643, "percentage": 88.95, "elapsed_time": "5:20:58", "remaining_time": "0:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3413, "total_steps": 3836, "loss": 0.137, "learning_rate": 1.6440510155229544e-07, "epoch": 0.8895839442218095, "percentage": 88.97, "elapsed_time": "5:21:03", "remaining_time": "0:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3414, "total_steps": 3836, "loss": 0.1428, "learning_rate": 1.6363727454337202e-07, "epoch": 0.8898445899716547, "percentage": 89.0, "elapsed_time": "5:21:09", "remaining_time": "0:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3415, "total_steps": 3836, "loss": 0.1368, "learning_rate": 1.6287118406828868e-07, "epoch": 0.8901052357215, "percentage": 89.03, "elapsed_time": "5:21:14", "remaining_time": "0:39:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3416, "total_steps": 3836, "loss": 0.1253, "learning_rate": 1.6210683069645212e-07, "epoch": 0.8903658814713452, "percentage": 89.05, "elapsed_time": "5:21:20", "remaining_time": "0:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3417, "total_steps": 3836, "loss": 0.1353, "learning_rate": 1.6134421499597874e-07, "epoch": 0.8906265272211905, "percentage": 89.08, "elapsed_time": "5:21:26", "remaining_time": "0:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3418, "total_steps": 3836, "loss": 0.1422, "learning_rate": 1.6058333753369265e-07, "epoch": 0.8908871729710357, "percentage": 89.1, "elapsed_time": "5:21:31", "remaining_time": "0:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3419, "total_steps": 3836, "loss": 0.1325, "learning_rate": 1.59824198875127e-07, "epoch": 0.891147818720881, "percentage": 89.13, "elapsed_time": "5:21:37", "remaining_time": "0:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3420, "total_steps": 3836, "loss": 0.1371, "learning_rate": 1.5906679958452215e-07, "epoch": 0.8914084644707262, "percentage": 89.16, "elapsed_time": "5:21:42", "remaining_time": "0:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3421, "total_steps": 3836, "loss": 0.1472, "learning_rate": 1.583111402248247e-07, "epoch": 0.8916691102205715, "percentage": 89.18, "elapsed_time": "5:21:48", "remaining_time": "0:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3422, "total_steps": 3836, "loss": 0.1349, "learning_rate": 1.5755722135769036e-07, "epoch": 0.8919297559704167, "percentage": 89.21, "elapsed_time": "5:21:53", "remaining_time": "0:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3423, "total_steps": 3836, "loss": 0.1357, "learning_rate": 1.5680504354347868e-07, "epoch": 0.892190401720262, "percentage": 89.23, "elapsed_time": "5:21:59", "remaining_time": "0:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3424, "total_steps": 3836, "loss": 0.1375, "learning_rate": 1.5605460734125582e-07, "epoch": 0.8924510474701072, "percentage": 89.26, "elapsed_time": "5:22:05", "remaining_time": "0:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3425, "total_steps": 3836, "loss": 0.1444, "learning_rate": 1.5530591330879502e-07, "epoch": 0.8927116932199525, "percentage": 89.29, "elapsed_time": "5:22:10", "remaining_time": "0:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3426, "total_steps": 3836, "loss": 0.1447, "learning_rate": 1.545589620025731e-07, "epoch": 0.8929723389697977, "percentage": 89.31, "elapsed_time": "5:22:15", "remaining_time": "0:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3427, "total_steps": 3836, "loss": 0.1269, "learning_rate": 1.5381375397777122e-07, "epoch": 0.893232984719643, "percentage": 89.34, "elapsed_time": "5:22:21", "remaining_time": "0:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3428, "total_steps": 3836, "loss": 0.1333, "learning_rate": 1.530702897882766e-07, "epoch": 0.8934936304694882, "percentage": 89.36, "elapsed_time": "5:22:26", "remaining_time": "0:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3429, "total_steps": 3836, "loss": 0.1233, "learning_rate": 1.5232856998667862e-07, "epoch": 0.8937542762193333, "percentage": 89.39, "elapsed_time": "5:22:32", "remaining_time": "0:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3430, "total_steps": 3836, "loss": 0.1287, "learning_rate": 1.5158859512427044e-07, "epoch": 0.8940149219691786, "percentage": 89.42, "elapsed_time": "5:22:37", "remaining_time": "0:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3431, "total_steps": 3836, "loss": 0.1403, "learning_rate": 1.5085036575104906e-07, "epoch": 0.8942755677190238, "percentage": 89.44, "elapsed_time": "5:22:42", "remaining_time": "0:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3432, "total_steps": 3836, "loss": 0.1472, "learning_rate": 1.501138824157139e-07, "epoch": 0.8945362134688691, "percentage": 89.47, "elapsed_time": "5:22:47", "remaining_time": "0:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3433, "total_steps": 3836, "loss": 0.1318, "learning_rate": 1.4937914566566596e-07, "epoch": 0.8947968592187143, "percentage": 89.49, "elapsed_time": "5:22:52", "remaining_time": "0:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3434, "total_steps": 3836, "loss": 0.1342, "learning_rate": 1.4864615604700872e-07, "epoch": 0.8950575049685596, "percentage": 89.52, "elapsed_time": "5:22:58", "remaining_time": "0:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3435, "total_steps": 3836, "loss": 0.1378, "learning_rate": 1.4791491410454633e-07, "epoch": 0.8953181507184048, "percentage": 89.55, "elapsed_time": "5:23:04", "remaining_time": "0:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3436, "total_steps": 3836, "loss": 0.1457, "learning_rate": 1.471854203817852e-07, "epoch": 0.8955787964682501, "percentage": 89.57, "elapsed_time": "5:23:09", "remaining_time": "0:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3437, "total_steps": 3836, "loss": 0.1406, "learning_rate": 1.4645767542093042e-07, "epoch": 0.8958394422180953, "percentage": 89.6, "elapsed_time": "5:23:15", "remaining_time": "0:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3438, "total_steps": 3836, "loss": 0.136, "learning_rate": 1.4573167976288994e-07, "epoch": 0.8961000879679406, "percentage": 89.62, "elapsed_time": "5:23:21", "remaining_time": "0:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3439, "total_steps": 3836, "loss": 0.1519, "learning_rate": 1.4500743394726956e-07, "epoch": 0.8963607337177858, "percentage": 89.65, "elapsed_time": "5:23:26", "remaining_time": "0:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3440, "total_steps": 3836, "loss": 0.1296, "learning_rate": 1.4428493851237403e-07, "epoch": 0.8966213794676311, "percentage": 89.68, "elapsed_time": "5:23:32", "remaining_time": "0:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3441, "total_steps": 3836, "loss": 0.1426, "learning_rate": 1.4356419399520928e-07, "epoch": 0.8968820252174763, "percentage": 89.7, "elapsed_time": "5:23:38", "remaining_time": "0:37:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3442, "total_steps": 3836, "loss": 0.1345, "learning_rate": 1.4284520093147818e-07, "epoch": 0.8971426709673216, "percentage": 89.73, "elapsed_time": "5:23:44", "remaining_time": "0:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3443, "total_steps": 3836, "loss": 0.1425, "learning_rate": 1.421279598555822e-07, "epoch": 0.8974033167171668, "percentage": 89.75, "elapsed_time": "5:23:49", "remaining_time": "0:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3444, "total_steps": 3836, "loss": 0.14, "learning_rate": 1.4141247130062069e-07, "epoch": 0.8976639624670121, "percentage": 89.78, "elapsed_time": "5:23:55", "remaining_time": "0:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3445, "total_steps": 3836, "loss": 0.1343, "learning_rate": 1.4069873579839023e-07, "epoch": 0.8979246082168573, "percentage": 89.81, "elapsed_time": "5:24:00", "remaining_time": "0:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3446, "total_steps": 3836, "loss": 0.138, "learning_rate": 1.3998675387938476e-07, "epoch": 0.8981852539667025, "percentage": 89.83, "elapsed_time": "5:24:06", "remaining_time": "0:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3447, "total_steps": 3836, "loss": 0.1168, "learning_rate": 1.3927652607279434e-07, "epoch": 0.8984458997165478, "percentage": 89.86, "elapsed_time": "5:24:11", "remaining_time": "0:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3448, "total_steps": 3836, "loss": 0.1291, "learning_rate": 1.3856805290650644e-07, "epoch": 0.898706545466393, "percentage": 89.89, "elapsed_time": "5:24:16", "remaining_time": "0:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3449, "total_steps": 3836, "loss": 0.1568, "learning_rate": 1.3786133490710284e-07, "epoch": 0.8989671912162382, "percentage": 89.91, "elapsed_time": "5:24:22", "remaining_time": "0:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3450, "total_steps": 3836, "loss": 0.143, "learning_rate": 1.3715637259986147e-07, "epoch": 0.8992278369660834, "percentage": 89.94, "elapsed_time": "5:24:28", "remaining_time": "0:36:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3451, "total_steps": 3836, "loss": 0.1285, "learning_rate": 1.364531665087554e-07, "epoch": 0.8994884827159287, "percentage": 89.96, "elapsed_time": "5:24:33", "remaining_time": "0:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3452, "total_steps": 3836, "loss": 0.1319, "learning_rate": 1.3575171715645235e-07, "epoch": 0.8997491284657739, "percentage": 89.99, "elapsed_time": "5:24:39", "remaining_time": "0:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3453, "total_steps": 3836, "loss": 0.1463, "learning_rate": 1.350520250643142e-07, "epoch": 0.9000097742156192, "percentage": 90.02, "elapsed_time": "5:24:45", "remaining_time": "0:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3454, "total_steps": 3836, "loss": 0.1444, "learning_rate": 1.343540907523963e-07, "epoch": 0.9002704199654644, "percentage": 90.04, "elapsed_time": "5:24:50", "remaining_time": "0:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3455, "total_steps": 3836, "loss": 0.1352, "learning_rate": 1.3365791473944928e-07, "epoch": 0.9005310657153097, "percentage": 90.07, "elapsed_time": "5:24:55", "remaining_time": "0:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3456, "total_steps": 3836, "loss": 0.1427, "learning_rate": 1.3296349754291366e-07, "epoch": 0.9007917114651549, "percentage": 90.09, "elapsed_time": "5:25:01", "remaining_time": "0:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3457, "total_steps": 3836, "loss": 0.1501, "learning_rate": 1.32270839678926e-07, "epoch": 0.9010523572150002, "percentage": 90.12, "elapsed_time": "5:25:07", "remaining_time": "0:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3458, "total_steps": 3836, "loss": 0.1322, "learning_rate": 1.3157994166231342e-07, "epoch": 0.9013130029648454, "percentage": 90.15, "elapsed_time": "5:25:12", "remaining_time": "0:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3459, "total_steps": 3836, "loss": 0.1303, "learning_rate": 1.3089080400659538e-07, "epoch": 0.9015736487146907, "percentage": 90.17, "elapsed_time": "5:25:18", "remaining_time": "0:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3460, "total_steps": 3836, "loss": 0.1312, "learning_rate": 1.3020342722398273e-07, "epoch": 0.9018342944645359, "percentage": 90.2, "elapsed_time": "5:25:24", "remaining_time": "0:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3461, "total_steps": 3836, "loss": 0.1376, "learning_rate": 1.295178118253787e-07, "epoch": 0.9020949402143811, "percentage": 90.22, "elapsed_time": "5:25:29", "remaining_time": "0:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3462, "total_steps": 3836, "loss": 0.1413, "learning_rate": 1.2883395832037516e-07, "epoch": 0.9023555859642264, "percentage": 90.25, "elapsed_time": "5:25:35", "remaining_time": "0:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3463, "total_steps": 3836, "loss": 0.146, "learning_rate": 1.2815186721725603e-07, "epoch": 0.9026162317140716, "percentage": 90.28, "elapsed_time": "5:25:41", "remaining_time": "0:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3464, "total_steps": 3836, "loss": 0.1425, "learning_rate": 1.2747153902299524e-07, "epoch": 0.9028768774639169, "percentage": 90.3, "elapsed_time": "5:25:46", "remaining_time": "0:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3465, "total_steps": 3836, "loss": 0.1337, "learning_rate": 1.2679297424325608e-07, "epoch": 0.9031375232137621, "percentage": 90.33, "elapsed_time": "5:25:51", "remaining_time": "0:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3466, "total_steps": 3836, "loss": 0.1269, "learning_rate": 1.2611617338239097e-07, "epoch": 0.9033981689636074, "percentage": 90.35, "elapsed_time": "5:25:57", "remaining_time": "0:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3467, "total_steps": 3836, "loss": 0.1416, "learning_rate": 1.254411369434419e-07, "epoch": 0.9036588147134526, "percentage": 90.38, "elapsed_time": "5:26:02", "remaining_time": "0:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3468, "total_steps": 3836, "loss": 0.1299, "learning_rate": 1.247678654281384e-07, "epoch": 0.9039194604632979, "percentage": 90.41, "elapsed_time": "5:26:08", "remaining_time": "0:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3469, "total_steps": 3836, "loss": 0.135, "learning_rate": 1.2409635933689934e-07, "epoch": 0.904180106213143, "percentage": 90.43, "elapsed_time": "5:26:14", "remaining_time": "0:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3470, "total_steps": 3836, "loss": 0.1467, "learning_rate": 1.234266191688302e-07, "epoch": 0.9044407519629883, "percentage": 90.46, "elapsed_time": "5:26:19", "remaining_time": "0:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3471, "total_steps": 3836, "loss": 0.1288, "learning_rate": 1.2275864542172556e-07, "epoch": 0.9047013977128335, "percentage": 90.48, "elapsed_time": "5:26:25", "remaining_time": "0:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3472, "total_steps": 3836, "loss": 0.1413, "learning_rate": 1.2209243859206577e-07, "epoch": 0.9049620434626788, "percentage": 90.51, "elapsed_time": "5:26:30", "remaining_time": "0:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3473, "total_steps": 3836, "loss": 0.1186, "learning_rate": 1.214279991750178e-07, "epoch": 0.905222689212524, "percentage": 90.54, "elapsed_time": "5:26:36", "remaining_time": "0:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3474, "total_steps": 3836, "loss": 0.1317, "learning_rate": 1.2076532766443578e-07, "epoch": 0.9054833349623693, "percentage": 90.56, "elapsed_time": "5:26:42", "remaining_time": "0:34:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3475, "total_steps": 3836, "loss": 0.1236, "learning_rate": 1.201044245528596e-07, "epoch": 0.9057439807122145, "percentage": 90.59, "elapsed_time": "5:26:48", "remaining_time": "0:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3476, "total_steps": 3836, "loss": 0.1366, "learning_rate": 1.1944529033151436e-07, "epoch": 0.9060046264620597, "percentage": 90.62, "elapsed_time": "5:26:53", "remaining_time": "0:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3477, "total_steps": 3836, "loss": 0.1232, "learning_rate": 1.1878792549031071e-07, "epoch": 0.906265272211905, "percentage": 90.64, "elapsed_time": "5:26:59", "remaining_time": "0:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3478, "total_steps": 3836, "loss": 0.1337, "learning_rate": 1.1813233051784417e-07, "epoch": 0.9065259179617502, "percentage": 90.67, "elapsed_time": "5:27:04", "remaining_time": "0:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3479, "total_steps": 3836, "loss": 0.1276, "learning_rate": 1.1747850590139497e-07, "epoch": 0.9067865637115955, "percentage": 90.69, "elapsed_time": "5:27:09", "remaining_time": "0:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3480, "total_steps": 3836, "loss": 0.1351, "learning_rate": 1.1682645212692634e-07, "epoch": 0.9070472094614407, "percentage": 90.72, "elapsed_time": "5:27:15", "remaining_time": "0:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3481, "total_steps": 3836, "loss": 0.152, "learning_rate": 1.1617616967908751e-07, "epoch": 0.907307855211286, "percentage": 90.75, "elapsed_time": "5:27:20", "remaining_time": "0:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3482, "total_steps": 3836, "loss": 0.1307, "learning_rate": 1.1552765904120966e-07, "epoch": 0.9075685009611312, "percentage": 90.77, "elapsed_time": "5:27:26", "remaining_time": "0:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3483, "total_steps": 3836, "loss": 0.1364, "learning_rate": 1.1488092069530666e-07, "epoch": 0.9078291467109765, "percentage": 90.8, "elapsed_time": "5:27:32", "remaining_time": "0:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3484, "total_steps": 3836, "loss": 0.1316, "learning_rate": 1.1423595512207591e-07, "epoch": 0.9080897924608217, "percentage": 90.82, "elapsed_time": "5:27:36", "remaining_time": "0:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3485, "total_steps": 3836, "loss": 0.1289, "learning_rate": 1.1359276280089731e-07, "epoch": 0.908350438210667, "percentage": 90.85, "elapsed_time": "5:27:42", "remaining_time": "0:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3486, "total_steps": 3836, "loss": 0.1296, "learning_rate": 1.1295134420983179e-07, "epoch": 0.9086110839605122, "percentage": 90.88, "elapsed_time": "5:27:48", "remaining_time": "0:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3487, "total_steps": 3836, "loss": 0.1387, "learning_rate": 1.1231169982562324e-07, "epoch": 0.9088717297103575, "percentage": 90.9, "elapsed_time": "5:27:54", "remaining_time": "0:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3488, "total_steps": 3836, "loss": 0.1274, "learning_rate": 1.1167383012369609e-07, "epoch": 0.9091323754602026, "percentage": 90.93, "elapsed_time": "5:27:59", "remaining_time": "0:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3489, "total_steps": 3836, "loss": 0.1344, "learning_rate": 1.1103773557815528e-07, "epoch": 0.909393021210048, "percentage": 90.95, "elapsed_time": "5:28:04", "remaining_time": "0:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3490, "total_steps": 3836, "loss": 0.1278, "learning_rate": 1.1040341666178733e-07, "epoch": 0.9096536669598931, "percentage": 90.98, "elapsed_time": "5:28:10", "remaining_time": "0:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3491, "total_steps": 3836, "loss": 0.1401, "learning_rate": 1.0977087384605845e-07, "epoch": 0.9099143127097383, "percentage": 91.01, "elapsed_time": "5:28:16", "remaining_time": "0:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3492, "total_steps": 3836, "loss": 0.1532, "learning_rate": 1.0914010760111476e-07, "epoch": 0.9101749584595836, "percentage": 91.03, "elapsed_time": "5:28:22", "remaining_time": "0:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3493, "total_steps": 3836, "loss": 0.1261, "learning_rate": 1.0851111839578182e-07, "epoch": 0.9104356042094288, "percentage": 91.06, "elapsed_time": "5:28:27", "remaining_time": "0:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3494, "total_steps": 3836, "loss": 0.1346, "learning_rate": 1.078839066975651e-07, "epoch": 0.9106962499592741, "percentage": 91.08, "elapsed_time": "5:28:32", "remaining_time": "0:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3495, "total_steps": 3836, "loss": 0.1286, "learning_rate": 1.072584729726478e-07, "epoch": 0.9109568957091193, "percentage": 91.11, "elapsed_time": "5:28:38", "remaining_time": "0:32:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3496, "total_steps": 3836, "loss": 0.1345, "learning_rate": 1.0663481768589196e-07, "epoch": 0.9112175414589646, "percentage": 91.14, "elapsed_time": "5:28:43", "remaining_time": "0:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3497, "total_steps": 3836, "loss": 0.1302, "learning_rate": 1.0601294130083845e-07, "epoch": 0.9114781872088098, "percentage": 91.16, "elapsed_time": "5:28:48", "remaining_time": "0:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3498, "total_steps": 3836, "loss": 0.1433, "learning_rate": 1.0539284427970559e-07, "epoch": 0.9117388329586551, "percentage": 91.19, "elapsed_time": "5:28:54", "remaining_time": "0:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3499, "total_steps": 3836, "loss": 0.1456, "learning_rate": 1.0477452708338886e-07, "epoch": 0.9119994787085003, "percentage": 91.21, "elapsed_time": "5:29:00", "remaining_time": "0:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 3836, "loss": 0.13, "learning_rate": 1.0415799017146094e-07, "epoch": 0.9122601244583456, "percentage": 91.24, "elapsed_time": "5:29:05", "remaining_time": "0:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 3836, "eval_loss": 0.13526123762130737, "epoch": 0.9122601244583456, "percentage": 91.24, "elapsed_time": "5:30:00", "remaining_time": "0:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3501, "total_steps": 3836, "loss": 0.1447, "learning_rate": 1.0354323400217136e-07, "epoch": 0.9125207702081908, "percentage": 91.27, "elapsed_time": "5:30:06", "remaining_time": "0:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3502, "total_steps": 3836, "loss": 0.1367, "learning_rate": 1.029302590324463e-07, "epoch": 0.9127814159580361, "percentage": 91.29, "elapsed_time": "5:30:11", "remaining_time": "0:31:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3503, "total_steps": 3836, "loss": 0.1359, "learning_rate": 1.0231906571788769e-07, "epoch": 0.9130420617078813, "percentage": 91.32, "elapsed_time": "5:30:17", "remaining_time": "0:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3504, "total_steps": 3836, "loss": 0.1406, "learning_rate": 1.0170965451277382e-07, "epoch": 0.9133027074577266, "percentage": 91.35, "elapsed_time": "5:30:23", "remaining_time": "0:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3505, "total_steps": 3836, "loss": 0.1341, "learning_rate": 1.0110202587005763e-07, "epoch": 0.9135633532075718, "percentage": 91.37, "elapsed_time": "5:30:28", "remaining_time": "0:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3506, "total_steps": 3836, "loss": 0.1335, "learning_rate": 1.0049618024136703e-07, "epoch": 0.913823998957417, "percentage": 91.4, "elapsed_time": "5:30:34", "remaining_time": "0:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3507, "total_steps": 3836, "loss": 0.1246, "learning_rate": 9.9892118077006e-08, "epoch": 0.9140846447072623, "percentage": 91.42, "elapsed_time": "5:30:39", "remaining_time": "0:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3508, "total_steps": 3836, "loss": 0.1486, "learning_rate": 9.928983982595175e-08, "epoch": 0.9143452904571074, "percentage": 91.45, "elapsed_time": "5:30:46", "remaining_time": "0:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3509, "total_steps": 3836, "loss": 0.1359, "learning_rate": 9.868934593585594e-08, "epoch": 0.9146059362069527, "percentage": 91.48, "elapsed_time": "5:30:52", "remaining_time": "0:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3510, "total_steps": 3836, "loss": 0.1333, "learning_rate": 9.809063685304376e-08, "epoch": 0.9148665819567979, "percentage": 91.5, "elapsed_time": "5:30:57", "remaining_time": "0:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3511, "total_steps": 3836, "loss": 0.1432, "learning_rate": 9.749371302251398e-08, "epoch": 0.9151272277066432, "percentage": 91.53, "elapsed_time": "5:31:03", "remaining_time": "0:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3512, "total_steps": 3836, "loss": 0.1283, "learning_rate": 9.689857488793891e-08, "epoch": 0.9153878734564884, "percentage": 91.55, "elapsed_time": "5:31:09", "remaining_time": "0:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3513, "total_steps": 3836, "loss": 0.1404, "learning_rate": 9.63052228916625e-08, "epoch": 0.9156485192063337, "percentage": 91.58, "elapsed_time": "5:31:14", "remaining_time": "0:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3514, "total_steps": 3836, "loss": 0.1411, "learning_rate": 9.571365747470251e-08, "epoch": 0.9159091649561789, "percentage": 91.61, "elapsed_time": "5:31:20", "remaining_time": "0:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3515, "total_steps": 3836, "loss": 0.1277, "learning_rate": 9.51238790767478e-08, "epoch": 0.9161698107060242, "percentage": 91.63, "elapsed_time": "5:31:25", "remaining_time": "0:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3516, "total_steps": 3836, "loss": 0.1253, "learning_rate": 9.45358881361591e-08, "epoch": 0.9164304564558694, "percentage": 91.66, "elapsed_time": "5:31:30", "remaining_time": "0:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3517, "total_steps": 3836, "loss": 0.1387, "learning_rate": 9.394968508996905e-08, "epoch": 0.9166911022057147, "percentage": 91.68, "elapsed_time": "5:31:36", "remaining_time": "0:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3518, "total_steps": 3836, "loss": 0.1271, "learning_rate": 9.336527037388132e-08, "epoch": 0.9169517479555599, "percentage": 91.71, "elapsed_time": "5:31:41", "remaining_time": "0:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3519, "total_steps": 3836, "loss": 0.1446, "learning_rate": 9.278264442226931e-08, "epoch": 0.9172123937054052, "percentage": 91.74, "elapsed_time": "5:31:47", "remaining_time": "0:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3520, "total_steps": 3836, "loss": 0.1371, "learning_rate": 9.22018076681791e-08, "epoch": 0.9174730394552504, "percentage": 91.76, "elapsed_time": "5:31:53", "remaining_time": "0:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3521, "total_steps": 3836, "loss": 0.1277, "learning_rate": 9.162276054332509e-08, "epoch": 0.9177336852050956, "percentage": 91.79, "elapsed_time": "5:31:58", "remaining_time": "0:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3522, "total_steps": 3836, "loss": 0.1333, "learning_rate": 9.10455034780916e-08, "epoch": 0.9179943309549409, "percentage": 91.81, "elapsed_time": "5:32:04", "remaining_time": "0:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3523, "total_steps": 3836, "loss": 0.1373, "learning_rate": 9.047003690153322e-08, "epoch": 0.9182549767047861, "percentage": 91.84, "elapsed_time": "5:32:10", "remaining_time": "0:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3524, "total_steps": 3836, "loss": 0.1344, "learning_rate": 8.989636124137363e-08, "epoch": 0.9185156224546314, "percentage": 91.87, "elapsed_time": "5:32:15", "remaining_time": "0:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3525, "total_steps": 3836, "loss": 0.1302, "learning_rate": 8.932447692400509e-08, "epoch": 0.9187762682044766, "percentage": 91.89, "elapsed_time": "5:32:21", "remaining_time": "0:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3526, "total_steps": 3836, "loss": 0.1328, "learning_rate": 8.875438437448813e-08, "epoch": 0.9190369139543219, "percentage": 91.92, "elapsed_time": "5:32:26", "remaining_time": "0:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3527, "total_steps": 3836, "loss": 0.1341, "learning_rate": 8.818608401655243e-08, "epoch": 0.919297559704167, "percentage": 91.94, "elapsed_time": "5:32:31", "remaining_time": "0:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3528, "total_steps": 3836, "loss": 0.1342, "learning_rate": 8.761957627259509e-08, "epoch": 0.9195582054540123, "percentage": 91.97, "elapsed_time": "5:32:36", "remaining_time": "0:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3529, "total_steps": 3836, "loss": 0.1299, "learning_rate": 8.705486156367987e-08, "epoch": 0.9198188512038575, "percentage": 92.0, "elapsed_time": "5:32:42", "remaining_time": "0:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3530, "total_steps": 3836, "loss": 0.1276, "learning_rate": 8.649194030953989e-08, "epoch": 0.9200794969537028, "percentage": 92.02, "elapsed_time": "5:32:48", "remaining_time": "0:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3531, "total_steps": 3836, "loss": 0.15, "learning_rate": 8.59308129285738e-08, "epoch": 0.920340142703548, "percentage": 92.05, "elapsed_time": "5:32:53", "remaining_time": "0:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3532, "total_steps": 3836, "loss": 0.1247, "learning_rate": 8.537147983784716e-08, "epoch": 0.9206007884533933, "percentage": 92.08, "elapsed_time": "5:32:59", "remaining_time": "0:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3533, "total_steps": 3836, "loss": 0.1367, "learning_rate": 8.481394145309213e-08, "epoch": 0.9208614342032385, "percentage": 92.1, "elapsed_time": "5:33:04", "remaining_time": "0:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3534, "total_steps": 3836, "loss": 0.1373, "learning_rate": 8.425819818870667e-08, "epoch": 0.9211220799530838, "percentage": 92.13, "elapsed_time": "5:33:09", "remaining_time": "0:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3535, "total_steps": 3836, "loss": 0.1486, "learning_rate": 8.370425045775454e-08, "epoch": 0.921382725702929, "percentage": 92.15, "elapsed_time": "5:33:15", "remaining_time": "0:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3536, "total_steps": 3836, "loss": 0.1225, "learning_rate": 8.3152098671965e-08, "epoch": 0.9216433714527742, "percentage": 92.18, "elapsed_time": "5:33:20", "remaining_time": "0:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3537, "total_steps": 3836, "loss": 0.1336, "learning_rate": 8.260174324173336e-08, "epoch": 0.9219040172026195, "percentage": 92.21, "elapsed_time": "5:33:26", "remaining_time": "0:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3538, "total_steps": 3836, "loss": 0.1327, "learning_rate": 8.205318457611772e-08, "epoch": 0.9221646629524647, "percentage": 92.23, "elapsed_time": "5:33:32", "remaining_time": "0:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3539, "total_steps": 3836, "loss": 0.1316, "learning_rate": 8.150642308284218e-08, "epoch": 0.92242530870231, "percentage": 92.26, "elapsed_time": "5:33:37", "remaining_time": "0:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3540, "total_steps": 3836, "loss": 0.1394, "learning_rate": 8.096145916829529e-08, "epoch": 0.9226859544521552, "percentage": 92.28, "elapsed_time": "5:33:43", "remaining_time": "0:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3541, "total_steps": 3836, "loss": 0.1284, "learning_rate": 8.041829323752858e-08, "epoch": 0.9229466002020005, "percentage": 92.31, "elapsed_time": "5:33:49", "remaining_time": "0:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3542, "total_steps": 3836, "loss": 0.1328, "learning_rate": 7.98769256942572e-08, "epoch": 0.9232072459518457, "percentage": 92.34, "elapsed_time": "5:33:55", "remaining_time": "0:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3543, "total_steps": 3836, "loss": 0.1371, "learning_rate": 7.933735694086147e-08, "epoch": 0.923467891701691, "percentage": 92.36, "elapsed_time": "5:34:00", "remaining_time": "0:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3544, "total_steps": 3836, "loss": 0.1444, "learning_rate": 7.879958737838201e-08, "epoch": 0.9237285374515362, "percentage": 92.39, "elapsed_time": "5:34:06", "remaining_time": "0:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3545, "total_steps": 3836, "loss": 0.1293, "learning_rate": 7.826361740652321e-08, "epoch": 0.9239891832013815, "percentage": 92.41, "elapsed_time": "5:34:12", "remaining_time": "0:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3546, "total_steps": 3836, "loss": 0.1269, "learning_rate": 7.77294474236534e-08, "epoch": 0.9242498289512266, "percentage": 92.44, "elapsed_time": "5:34:17", "remaining_time": "0:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3547, "total_steps": 3836, "loss": 0.1306, "learning_rate": 7.719707782680108e-08, "epoch": 0.924510474701072, "percentage": 92.47, "elapsed_time": "5:34:22", "remaining_time": "0:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3548, "total_steps": 3836, "loss": 0.1393, "learning_rate": 7.66665090116575e-08, "epoch": 0.9247711204509171, "percentage": 92.49, "elapsed_time": "5:34:28", "remaining_time": "0:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3549, "total_steps": 3836, "loss": 0.1426, "learning_rate": 7.613774137257502e-08, "epoch": 0.9250317662007624, "percentage": 92.52, "elapsed_time": "5:34:34", "remaining_time": "0:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3550, "total_steps": 3836, "loss": 0.1227, "learning_rate": 7.561077530256755e-08, "epoch": 0.9252924119506076, "percentage": 92.54, "elapsed_time": "5:34:39", "remaining_time": "0:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3551, "total_steps": 3836, "loss": 0.1393, "learning_rate": 7.508561119331014e-08, "epoch": 0.9255530577004528, "percentage": 92.57, "elapsed_time": "5:34:45", "remaining_time": "0:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3552, "total_steps": 3836, "loss": 0.1328, "learning_rate": 7.456224943513779e-08, "epoch": 0.9258137034502981, "percentage": 92.6, "elapsed_time": "5:34:50", "remaining_time": "0:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3553, "total_steps": 3836, "loss": 0.1239, "learning_rate": 7.404069041704682e-08, "epoch": 0.9260743492001433, "percentage": 92.62, "elapsed_time": "5:34:56", "remaining_time": "0:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3554, "total_steps": 3836, "loss": 0.1441, "learning_rate": 7.352093452669324e-08, "epoch": 0.9263349949499886, "percentage": 92.65, "elapsed_time": "5:35:02", "remaining_time": "0:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3555, "total_steps": 3836, "loss": 0.1299, "learning_rate": 7.30029821503922e-08, "epoch": 0.9265956406998338, "percentage": 92.67, "elapsed_time": "5:35:07", "remaining_time": "0:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3556, "total_steps": 3836, "loss": 0.1362, "learning_rate": 7.248683367311937e-08, "epoch": 0.9268562864496791, "percentage": 92.7, "elapsed_time": "5:35:13", "remaining_time": "0:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3557, "total_steps": 3836, "loss": 0.1248, "learning_rate": 7.1972489478509e-08, "epoch": 0.9271169321995243, "percentage": 92.73, "elapsed_time": "5:35:18", "remaining_time": "0:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3558, "total_steps": 3836, "loss": 0.1341, "learning_rate": 7.145994994885497e-08, "epoch": 0.9273775779493696, "percentage": 92.75, "elapsed_time": "5:35:23", "remaining_time": "0:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3559, "total_steps": 3836, "loss": 0.1493, "learning_rate": 7.094921546510896e-08, "epoch": 0.9276382236992148, "percentage": 92.78, "elapsed_time": "5:35:29", "remaining_time": "0:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3560, "total_steps": 3836, "loss": 0.1392, "learning_rate": 7.044028640688122e-08, "epoch": 0.9278988694490601, "percentage": 92.81, "elapsed_time": "5:35:34", "remaining_time": "0:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3561, "total_steps": 3836, "loss": 0.1262, "learning_rate": 6.993316315244081e-08, "epoch": 0.9281595151989053, "percentage": 92.83, "elapsed_time": "5:35:40", "remaining_time": "0:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3562, "total_steps": 3836, "loss": 0.1301, "learning_rate": 6.942784607871373e-08, "epoch": 0.9284201609487506, "percentage": 92.86, "elapsed_time": "5:35:45", "remaining_time": "0:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3563, "total_steps": 3836, "loss": 0.1388, "learning_rate": 6.892433556128425e-08, "epoch": 0.9286808066985958, "percentage": 92.88, "elapsed_time": "5:35:50", "remaining_time": "0:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3564, "total_steps": 3836, "loss": 0.1381, "learning_rate": 6.842263197439303e-08, "epoch": 0.9289414524484411, "percentage": 92.91, "elapsed_time": "5:35:57", "remaining_time": "0:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3565, "total_steps": 3836, "loss": 0.1351, "learning_rate": 6.792273569093843e-08, "epoch": 0.9292020981982863, "percentage": 92.94, "elapsed_time": "5:36:02", "remaining_time": "0:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3566, "total_steps": 3836, "loss": 0.1315, "learning_rate": 6.742464708247548e-08, "epoch": 0.9294627439481314, "percentage": 92.96, "elapsed_time": "5:36:08", "remaining_time": "0:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3567, "total_steps": 3836, "loss": 0.1448, "learning_rate": 6.692836651921498e-08, "epoch": 0.9297233896979767, "percentage": 92.99, "elapsed_time": "5:36:14", "remaining_time": "0:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3568, "total_steps": 3836, "loss": 0.1473, "learning_rate": 6.643389437002462e-08, "epoch": 0.9299840354478219, "percentage": 93.01, "elapsed_time": "5:36:19", "remaining_time": "0:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3569, "total_steps": 3836, "loss": 0.1416, "learning_rate": 6.594123100242738e-08, "epoch": 0.9302446811976672, "percentage": 93.04, "elapsed_time": "5:36:25", "remaining_time": "0:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3570, "total_steps": 3836, "loss": 0.1361, "learning_rate": 6.545037678260257e-08, "epoch": 0.9305053269475124, "percentage": 93.07, "elapsed_time": "5:36:31", "remaining_time": "0:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3571, "total_steps": 3836, "loss": 0.1494, "learning_rate": 6.496133207538392e-08, "epoch": 0.9307659726973577, "percentage": 93.09, "elapsed_time": "5:36:36", "remaining_time": "0:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3572, "total_steps": 3836, "loss": 0.1347, "learning_rate": 6.447409724426063e-08, "epoch": 0.9310266184472029, "percentage": 93.12, "elapsed_time": "5:36:41", "remaining_time": "0:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3573, "total_steps": 3836, "loss": 0.1352, "learning_rate": 6.398867265137693e-08, "epoch": 0.9312872641970482, "percentage": 93.14, "elapsed_time": "5:36:47", "remaining_time": "0:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3574, "total_steps": 3836, "loss": 0.1357, "learning_rate": 6.350505865753142e-08, "epoch": 0.9315479099468934, "percentage": 93.17, "elapsed_time": "5:36:52", "remaining_time": "0:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3575, "total_steps": 3836, "loss": 0.1262, "learning_rate": 6.302325562217632e-08, "epoch": 0.9318085556967387, "percentage": 93.2, "elapsed_time": "5:36:58", "remaining_time": "0:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3576, "total_steps": 3836, "loss": 0.1315, "learning_rate": 6.254326390341958e-08, "epoch": 0.9320692014465839, "percentage": 93.22, "elapsed_time": "5:37:04", "remaining_time": "0:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3577, "total_steps": 3836, "loss": 0.1249, "learning_rate": 6.206508385802057e-08, "epoch": 0.9323298471964292, "percentage": 93.25, "elapsed_time": "5:37:10", "remaining_time": "0:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3578, "total_steps": 3836, "loss": 0.1464, "learning_rate": 6.158871584139303e-08, "epoch": 0.9325904929462744, "percentage": 93.27, "elapsed_time": "5:37:15", "remaining_time": "0:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3579, "total_steps": 3836, "loss": 0.1343, "learning_rate": 6.111416020760513e-08, "epoch": 0.9328511386961197, "percentage": 93.3, "elapsed_time": "5:37:21", "remaining_time": "0:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3580, "total_steps": 3836, "loss": 0.1231, "learning_rate": 6.06414173093764e-08, "epoch": 0.9331117844459649, "percentage": 93.33, "elapsed_time": "5:37:27", "remaining_time": "0:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3581, "total_steps": 3836, "loss": 0.1127, "learning_rate": 6.017048749807935e-08, "epoch": 0.9333724301958101, "percentage": 93.35, "elapsed_time": "5:37:32", "remaining_time": "0:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3582, "total_steps": 3836, "loss": 0.1392, "learning_rate": 5.970137112373903e-08, "epoch": 0.9336330759456554, "percentage": 93.38, "elapsed_time": "5:37:37", "remaining_time": "0:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3583, "total_steps": 3836, "loss": 0.1376, "learning_rate": 5.923406853503288e-08, "epoch": 0.9338937216955006, "percentage": 93.4, "elapsed_time": "5:37:42", "remaining_time": "0:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3584, "total_steps": 3836, "loss": 0.1371, "learning_rate": 5.876858007929004e-08, "epoch": 0.9341543674453459, "percentage": 93.43, "elapsed_time": "5:37:48", "remaining_time": "0:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3585, "total_steps": 3836, "loss": 0.1357, "learning_rate": 5.830490610249068e-08, "epoch": 0.934415013195191, "percentage": 93.46, "elapsed_time": "5:37:54", "remaining_time": "0:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3586, "total_steps": 3836, "loss": 0.1323, "learning_rate": 5.784304694926773e-08, "epoch": 0.9346756589450363, "percentage": 93.48, "elapsed_time": "5:37:59", "remaining_time": "0:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3587, "total_steps": 3836, "loss": 0.1419, "learning_rate": 5.738300296290411e-08, "epoch": 0.9349363046948815, "percentage": 93.51, "elapsed_time": "5:38:05", "remaining_time": "0:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3588, "total_steps": 3836, "loss": 0.1306, "learning_rate": 5.692477448533351e-08, "epoch": 0.9351969504447268, "percentage": 93.53, "elapsed_time": "5:38:09", "remaining_time": "0:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3589, "total_steps": 3836, "loss": 0.1473, "learning_rate": 5.6468361857140716e-08, "epoch": 0.935457596194572, "percentage": 93.56, "elapsed_time": "5:38:16", "remaining_time": "0:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3590, "total_steps": 3836, "loss": 0.1332, "learning_rate": 5.601376541756076e-08, "epoch": 0.9357182419444173, "percentage": 93.59, "elapsed_time": "5:38:21", "remaining_time": "0:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3591, "total_steps": 3836, "loss": 0.1364, "learning_rate": 5.5560985504478916e-08, "epoch": 0.9359788876942625, "percentage": 93.61, "elapsed_time": "5:38:27", "remaining_time": "0:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3592, "total_steps": 3836, "loss": 0.1204, "learning_rate": 5.511002245442987e-08, "epoch": 0.9362395334441078, "percentage": 93.64, "elapsed_time": "5:38:33", "remaining_time": "0:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3593, "total_steps": 3836, "loss": 0.132, "learning_rate": 5.4660876602598e-08, "epoch": 0.936500179193953, "percentage": 93.67, "elapsed_time": "5:38:38", "remaining_time": "0:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3594, "total_steps": 3836, "loss": 0.1404, "learning_rate": 5.4213548282817664e-08, "epoch": 0.9367608249437983, "percentage": 93.69, "elapsed_time": "5:38:44", "remaining_time": "0:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3595, "total_steps": 3836, "loss": 0.1442, "learning_rate": 5.376803782757095e-08, "epoch": 0.9370214706936435, "percentage": 93.72, "elapsed_time": "5:38:50", "remaining_time": "0:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3596, "total_steps": 3836, "loss": 0.1276, "learning_rate": 5.3324345567990485e-08, "epoch": 0.9372821164434887, "percentage": 93.74, "elapsed_time": "5:38:55", "remaining_time": "0:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3597, "total_steps": 3836, "loss": 0.1331, "learning_rate": 5.288247183385664e-08, "epoch": 0.937542762193334, "percentage": 93.77, "elapsed_time": "5:39:00", "remaining_time": "0:22:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3598, "total_steps": 3836, "loss": 0.1276, "learning_rate": 5.244241695359753e-08, "epoch": 0.9378034079431792, "percentage": 93.8, "elapsed_time": "5:39:06", "remaining_time": "0:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3599, "total_steps": 3836, "loss": 0.1284, "learning_rate": 5.200418125429069e-08, "epoch": 0.9380640536930245, "percentage": 93.82, "elapsed_time": "5:39:12", "remaining_time": "0:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3600, "total_steps": 3836, "loss": 0.1302, "learning_rate": 5.156776506166028e-08, "epoch": 0.9383246994428697, "percentage": 93.85, "elapsed_time": "5:39:17", "remaining_time": "0:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3601, "total_steps": 3836, "loss": 0.1285, "learning_rate": 5.1133168700078785e-08, "epoch": 0.938585345192715, "percentage": 93.87, "elapsed_time": "5:39:23", "remaining_time": "0:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3602, "total_steps": 3836, "loss": 0.1475, "learning_rate": 5.070039249256642e-08, "epoch": 0.9388459909425602, "percentage": 93.9, "elapsed_time": "5:39:28", "remaining_time": "0:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3603, "total_steps": 3836, "loss": 0.1241, "learning_rate": 5.026943676078977e-08, "epoch": 0.9391066366924055, "percentage": 93.93, "elapsed_time": "5:39:34", "remaining_time": "0:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3604, "total_steps": 3836, "loss": 0.1362, "learning_rate": 4.984030182506233e-08, "epoch": 0.9393672824422507, "percentage": 93.95, "elapsed_time": "5:39:40", "remaining_time": "0:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3605, "total_steps": 3836, "loss": 0.1334, "learning_rate": 4.94129880043448e-08, "epoch": 0.939627928192096, "percentage": 93.98, "elapsed_time": "5:39:45", "remaining_time": "0:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3606, "total_steps": 3836, "loss": 0.1244, "learning_rate": 4.89874956162445e-08, "epoch": 0.9398885739419411, "percentage": 94.0, "elapsed_time": "5:39:51", "remaining_time": "0:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3607, "total_steps": 3836, "loss": 0.1402, "learning_rate": 4.856382497701373e-08, "epoch": 0.9401492196917864, "percentage": 94.03, "elapsed_time": "5:39:56", "remaining_time": "0:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3608, "total_steps": 3836, "loss": 0.1287, "learning_rate": 4.814197640155199e-08, "epoch": 0.9404098654416316, "percentage": 94.06, "elapsed_time": "5:40:01", "remaining_time": "0:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3609, "total_steps": 3836, "loss": 0.1433, "learning_rate": 4.772195020340431e-08, "epoch": 0.9406705111914769, "percentage": 94.08, "elapsed_time": "5:40:07", "remaining_time": "0:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3610, "total_steps": 3836, "loss": 0.1449, "learning_rate": 4.73037466947604e-08, "epoch": 0.9409311569413221, "percentage": 94.11, "elapsed_time": "5:40:13", "remaining_time": "0:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3611, "total_steps": 3836, "loss": 0.1308, "learning_rate": 4.6887366186456065e-08, "epoch": 0.9411918026911673, "percentage": 94.13, "elapsed_time": "5:40:18", "remaining_time": "0:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3612, "total_steps": 3836, "loss": 0.1285, "learning_rate": 4.64728089879718e-08, "epoch": 0.9414524484410126, "percentage": 94.16, "elapsed_time": "5:40:23", "remaining_time": "0:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3613, "total_steps": 3836, "loss": 0.1255, "learning_rate": 4.606007540743307e-08, "epoch": 0.9417130941908578, "percentage": 94.19, "elapsed_time": "5:40:29", "remaining_time": "0:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3614, "total_steps": 3836, "loss": 0.124, "learning_rate": 4.564916575160977e-08, "epoch": 0.9419737399407031, "percentage": 94.21, "elapsed_time": "5:40:35", "remaining_time": "0:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3615, "total_steps": 3836, "loss": 0.1416, "learning_rate": 4.52400803259162e-08, "epoch": 0.9422343856905483, "percentage": 94.24, "elapsed_time": "5:40:40", "remaining_time": "0:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3616, "total_steps": 3836, "loss": 0.14, "learning_rate": 4.4832819434410535e-08, "epoch": 0.9424950314403936, "percentage": 94.26, "elapsed_time": "5:40:47", "remaining_time": "0:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3617, "total_steps": 3836, "loss": 0.1366, "learning_rate": 4.442738337979535e-08, "epoch": 0.9427556771902388, "percentage": 94.29, "elapsed_time": "5:40:52", "remaining_time": "0:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3618, "total_steps": 3836, "loss": 0.1425, "learning_rate": 4.402377246341627e-08, "epoch": 0.9430163229400841, "percentage": 94.32, "elapsed_time": "5:40:57", "remaining_time": "0:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3619, "total_steps": 3836, "loss": 0.1297, "learning_rate": 4.362198698526304e-08, "epoch": 0.9432769686899293, "percentage": 94.34, "elapsed_time": "5:41:03", "remaining_time": "0:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3620, "total_steps": 3836, "loss": 0.1339, "learning_rate": 4.322202724396818e-08, "epoch": 0.9435376144397746, "percentage": 94.37, "elapsed_time": "5:41:09", "remaining_time": "0:20:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3621, "total_steps": 3836, "loss": 0.1466, "learning_rate": 4.282389353680666e-08, "epoch": 0.9437982601896198, "percentage": 94.4, "elapsed_time": "5:41:14", "remaining_time": "0:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3622, "total_steps": 3836, "loss": 0.13, "learning_rate": 4.2427586159697886e-08, "epoch": 0.9440589059394651, "percentage": 94.42, "elapsed_time": "5:41:20", "remaining_time": "0:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3623, "total_steps": 3836, "loss": 0.1315, "learning_rate": 4.203310540720207e-08, "epoch": 0.9443195516893103, "percentage": 94.45, "elapsed_time": "5:41:26", "remaining_time": "0:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3624, "total_steps": 3836, "loss": 0.1365, "learning_rate": 4.164045157252272e-08, "epoch": 0.9445801974391556, "percentage": 94.47, "elapsed_time": "5:41:31", "remaining_time": "0:19:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3625, "total_steps": 3836, "loss": 0.1386, "learning_rate": 4.1249624947505006e-08, "epoch": 0.9448408431890007, "percentage": 94.5, "elapsed_time": "5:41:36", "remaining_time": "0:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3626, "total_steps": 3836, "loss": 0.1311, "learning_rate": 4.086062582263656e-08, "epoch": 0.945101488938846, "percentage": 94.53, "elapsed_time": "5:41:41", "remaining_time": "0:19:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3627, "total_steps": 3836, "loss": 0.1237, "learning_rate": 4.0473454487046374e-08, "epoch": 0.9453621346886912, "percentage": 94.55, "elapsed_time": "5:41:46", "remaining_time": "0:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3628, "total_steps": 3836, "loss": 0.1238, "learning_rate": 4.008811122850426e-08, "epoch": 0.9456227804385364, "percentage": 94.58, "elapsed_time": "5:41:52", "remaining_time": "0:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3629, "total_steps": 3836, "loss": 0.1231, "learning_rate": 3.9704596333422497e-08, "epoch": 0.9458834261883817, "percentage": 94.6, "elapsed_time": "5:41:58", "remaining_time": "0:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3630, "total_steps": 3836, "loss": 0.131, "learning_rate": 3.9322910086853625e-08, "epoch": 0.9461440719382269, "percentage": 94.63, "elapsed_time": "5:42:04", "remaining_time": "0:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3631, "total_steps": 3836, "loss": 0.1294, "learning_rate": 3.894305277249155e-08, "epoch": 0.9464047176880722, "percentage": 94.66, "elapsed_time": "5:42:09", "remaining_time": "0:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3632, "total_steps": 3836, "loss": 0.1259, "learning_rate": 3.856502467266987e-08, "epoch": 0.9466653634379174, "percentage": 94.68, "elapsed_time": "5:42:14", "remaining_time": "0:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3633, "total_steps": 3836, "loss": 0.1305, "learning_rate": 3.818882606836355e-08, "epoch": 0.9469260091877627, "percentage": 94.71, "elapsed_time": "5:42:20", "remaining_time": "0:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3634, "total_steps": 3836, "loss": 0.1304, "learning_rate": 3.7814457239187255e-08, "epoch": 0.9471866549376079, "percentage": 94.73, "elapsed_time": "5:42:25", "remaining_time": "0:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3635, "total_steps": 3836, "loss": 0.1228, "learning_rate": 3.7441918463395896e-08, "epoch": 0.9474473006874532, "percentage": 94.76, "elapsed_time": "5:42:31", "remaining_time": "0:18:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3636, "total_steps": 3836, "loss": 0.1393, "learning_rate": 3.707121001788438e-08, "epoch": 0.9477079464372984, "percentage": 94.79, "elapsed_time": "5:42:37", "remaining_time": "0:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3637, "total_steps": 3836, "loss": 0.1439, "learning_rate": 3.67023321781862e-08, "epoch": 0.9479685921871437, "percentage": 94.81, "elapsed_time": "5:42:43", "remaining_time": "0:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3638, "total_steps": 3836, "loss": 0.1275, "learning_rate": 3.633528521847507e-08, "epoch": 0.9482292379369889, "percentage": 94.84, "elapsed_time": "5:42:47", "remaining_time": "0:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3639, "total_steps": 3836, "loss": 0.1355, "learning_rate": 3.5970069411564166e-08, "epoch": 0.9484898836868342, "percentage": 94.86, "elapsed_time": "5:42:53", "remaining_time": "0:18:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3640, "total_steps": 3836, "loss": 0.1306, "learning_rate": 3.5606685028904686e-08, "epoch": 0.9487505294366794, "percentage": 94.89, "elapsed_time": "5:42:58", "remaining_time": "0:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3641, "total_steps": 3836, "loss": 0.1381, "learning_rate": 3.524513234058724e-08, "epoch": 0.9490111751865247, "percentage": 94.92, "elapsed_time": "5:43:04", "remaining_time": "0:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3642, "total_steps": 3836, "loss": 0.1369, "learning_rate": 3.4885411615341034e-08, "epoch": 0.9492718209363699, "percentage": 94.94, "elapsed_time": "5:43:09", "remaining_time": "0:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3643, "total_steps": 3836, "loss": 0.1338, "learning_rate": 3.452752312053331e-08, "epoch": 0.949532466686215, "percentage": 94.97, "elapsed_time": "5:43:15", "remaining_time": "0:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3644, "total_steps": 3836, "loss": 0.1352, "learning_rate": 3.4171467122169344e-08, "epoch": 0.9497931124360603, "percentage": 94.99, "elapsed_time": "5:43:20", "remaining_time": "0:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3645, "total_steps": 3836, "loss": 0.1398, "learning_rate": 3.381724388489327e-08, "epoch": 0.9500537581859055, "percentage": 95.02, "elapsed_time": "5:43:25", "remaining_time": "0:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3646, "total_steps": 3836, "loss": 0.1296, "learning_rate": 3.346485367198588e-08, "epoch": 0.9503144039357508, "percentage": 95.05, "elapsed_time": "5:43:30", "remaining_time": "0:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3647, "total_steps": 3836, "loss": 0.1267, "learning_rate": 3.311429674536654e-08, "epoch": 0.950575049685596, "percentage": 95.07, "elapsed_time": "5:43:36", "remaining_time": "0:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3648, "total_steps": 3836, "loss": 0.1288, "learning_rate": 3.2765573365591e-08, "epoch": 0.9508356954354413, "percentage": 95.1, "elapsed_time": "5:43:41", "remaining_time": "0:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3649, "total_steps": 3836, "loss": 0.1297, "learning_rate": 3.2418683791853034e-08, "epoch": 0.9510963411852865, "percentage": 95.13, "elapsed_time": "5:43:46", "remaining_time": "0:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3650, "total_steps": 3836, "loss": 0.1466, "learning_rate": 3.207362828198307e-08, "epoch": 0.9513569869351318, "percentage": 95.15, "elapsed_time": "5:43:52", "remaining_time": "0:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3651, "total_steps": 3836, "loss": 0.1265, "learning_rate": 3.173040709244818e-08, "epoch": 0.951617632684977, "percentage": 95.18, "elapsed_time": "5:43:58", "remaining_time": "0:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3652, "total_steps": 3836, "loss": 0.126, "learning_rate": 3.138902047835263e-08, "epoch": 0.9518782784348223, "percentage": 95.2, "elapsed_time": "5:44:03", "remaining_time": "0:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3653, "total_steps": 3836, "loss": 0.1395, "learning_rate": 3.1049468693436776e-08, "epoch": 0.9521389241846675, "percentage": 95.23, "elapsed_time": "5:44:09", "remaining_time": "0:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3654, "total_steps": 3836, "loss": 0.1418, "learning_rate": 3.071175199007653e-08, "epoch": 0.9523995699345128, "percentage": 95.26, "elapsed_time": "5:44:15", "remaining_time": "0:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3655, "total_steps": 3836, "loss": 0.1323, "learning_rate": 3.0375870619284983e-08, "epoch": 0.952660215684358, "percentage": 95.28, "elapsed_time": "5:44:21", "remaining_time": "0:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3656, "total_steps": 3836, "loss": 0.1275, "learning_rate": 3.00418248307105e-08, "epoch": 0.9529208614342033, "percentage": 95.31, "elapsed_time": "5:44:27", "remaining_time": "0:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3657, "total_steps": 3836, "loss": 0.1343, "learning_rate": 2.9709614872637237e-08, "epoch": 0.9531815071840485, "percentage": 95.33, "elapsed_time": "5:44:33", "remaining_time": "0:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3658, "total_steps": 3836, "loss": 0.1281, "learning_rate": 2.9379240991984635e-08, "epoch": 0.9534421529338937, "percentage": 95.36, "elapsed_time": "5:44:38", "remaining_time": "0:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3659, "total_steps": 3836, "loss": 0.1283, "learning_rate": 2.9050703434308214e-08, "epoch": 0.953702798683739, "percentage": 95.39, "elapsed_time": "5:44:44", "remaining_time": "0:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3660, "total_steps": 3836, "loss": 0.1215, "learning_rate": 2.8724002443797083e-08, "epoch": 0.9539634444335842, "percentage": 95.41, "elapsed_time": "5:44:50", "remaining_time": "0:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3661, "total_steps": 3836, "loss": 0.1411, "learning_rate": 2.839913826327728e-08, "epoch": 0.9542240901834295, "percentage": 95.44, "elapsed_time": "5:44:55", "remaining_time": "0:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3662, "total_steps": 3836, "loss": 0.134, "learning_rate": 2.807611113420816e-08, "epoch": 0.9544847359332747, "percentage": 95.46, "elapsed_time": "5:45:01", "remaining_time": "0:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3663, "total_steps": 3836, "loss": 0.1377, "learning_rate": 2.775492129668378e-08, "epoch": 0.95474538168312, "percentage": 95.49, "elapsed_time": "5:45:07", "remaining_time": "0:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3664, "total_steps": 3836, "loss": 0.1171, "learning_rate": 2.743556898943345e-08, "epoch": 0.9550060274329651, "percentage": 95.52, "elapsed_time": "5:45:12", "remaining_time": "0:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3665, "total_steps": 3836, "loss": 0.1327, "learning_rate": 2.7118054449820075e-08, "epoch": 0.9552666731828104, "percentage": 95.54, "elapsed_time": "5:45:18", "remaining_time": "0:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3666, "total_steps": 3836, "loss": 0.1421, "learning_rate": 2.680237791384044e-08, "epoch": 0.9555273189326556, "percentage": 95.57, "elapsed_time": "5:45:24", "remaining_time": "0:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3667, "total_steps": 3836, "loss": 0.1265, "learning_rate": 2.6488539616125464e-08, "epoch": 0.9557879646825009, "percentage": 95.59, "elapsed_time": "5:45:30", "remaining_time": "0:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3668, "total_steps": 3836, "loss": 0.1321, "learning_rate": 2.6176539789939947e-08, "epoch": 0.9560486104323461, "percentage": 95.62, "elapsed_time": "5:45:36", "remaining_time": "0:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3669, "total_steps": 3836, "loss": 0.1333, "learning_rate": 2.5866378667182557e-08, "epoch": 0.9563092561821914, "percentage": 95.65, "elapsed_time": "5:45:42", "remaining_time": "0:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3670, "total_steps": 3836, "loss": 0.1384, "learning_rate": 2.5558056478383887e-08, "epoch": 0.9565699019320366, "percentage": 95.67, "elapsed_time": "5:45:48", "remaining_time": "0:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3671, "total_steps": 3836, "loss": 0.1333, "learning_rate": 2.5251573452709232e-08, "epoch": 0.9568305476818819, "percentage": 95.7, "elapsed_time": "5:45:53", "remaining_time": "0:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3672, "total_steps": 3836, "loss": 0.139, "learning_rate": 2.4946929817956376e-08, "epoch": 0.9570911934317271, "percentage": 95.72, "elapsed_time": "5:45:58", "remaining_time": "0:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3673, "total_steps": 3836, "loss": 0.1448, "learning_rate": 2.4644125800555583e-08, "epoch": 0.9573518391815723, "percentage": 95.75, "elapsed_time": "5:46:04", "remaining_time": "0:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3674, "total_steps": 3836, "loss": 0.1347, "learning_rate": 2.4343161625570433e-08, "epoch": 0.9576124849314176, "percentage": 95.78, "elapsed_time": "5:46:10", "remaining_time": "0:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3675, "total_steps": 3836, "loss": 0.1327, "learning_rate": 2.4044037516696704e-08, "epoch": 0.9578731306812628, "percentage": 95.8, "elapsed_time": "5:46:16", "remaining_time": "0:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3676, "total_steps": 3836, "loss": 0.1313, "learning_rate": 2.3746753696262113e-08, "epoch": 0.9581337764311081, "percentage": 95.83, "elapsed_time": "5:46:21", "remaining_time": "0:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3677, "total_steps": 3836, "loss": 0.1287, "learning_rate": 2.3451310385227132e-08, "epoch": 0.9583944221809533, "percentage": 95.86, "elapsed_time": "5:46:26", "remaining_time": "0:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3678, "total_steps": 3836, "loss": 0.1411, "learning_rate": 2.3157707803184438e-08, "epoch": 0.9586550679307986, "percentage": 95.88, "elapsed_time": "5:46:32", "remaining_time": "0:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3679, "total_steps": 3836, "loss": 0.1389, "learning_rate": 2.28659461683578e-08, "epoch": 0.9589157136806438, "percentage": 95.91, "elapsed_time": "5:46:37", "remaining_time": "0:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3680, "total_steps": 3836, "loss": 0.1415, "learning_rate": 2.2576025697603198e-08, "epoch": 0.9591763594304891, "percentage": 95.93, "elapsed_time": "5:46:44", "remaining_time": "0:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3681, "total_steps": 3836, "loss": 0.1321, "learning_rate": 2.2287946606407983e-08, "epoch": 0.9594370051803343, "percentage": 95.96, "elapsed_time": "5:46:50", "remaining_time": "0:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3682, "total_steps": 3836, "loss": 0.1395, "learning_rate": 2.2001709108891155e-08, "epoch": 0.9596976509301796, "percentage": 95.99, "elapsed_time": "5:46:55", "remaining_time": "0:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3683, "total_steps": 3836, "loss": 0.122, "learning_rate": 2.1717313417802534e-08, "epoch": 0.9599582966800247, "percentage": 96.01, "elapsed_time": "5:47:01", "remaining_time": "0:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3684, "total_steps": 3836, "loss": 0.1548, "learning_rate": 2.143475974452275e-08, "epoch": 0.96021894242987, "percentage": 96.04, "elapsed_time": "5:47:06", "remaining_time": "0:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3685, "total_steps": 3836, "loss": 0.1372, "learning_rate": 2.115404829906437e-08, "epoch": 0.9604795881797152, "percentage": 96.06, "elapsed_time": "5:47:12", "remaining_time": "0:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3686, "total_steps": 3836, "loss": 0.1363, "learning_rate": 2.0875179290069934e-08, "epoch": 0.9607402339295605, "percentage": 96.09, "elapsed_time": "5:47:18", "remaining_time": "0:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3687, "total_steps": 3836, "loss": 0.127, "learning_rate": 2.0598152924812266e-08, "epoch": 0.9610008796794057, "percentage": 96.12, "elapsed_time": "5:47:23", "remaining_time": "0:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3688, "total_steps": 3836, "loss": 0.1304, "learning_rate": 2.032296940919526e-08, "epoch": 0.9612615254292509, "percentage": 96.14, "elapsed_time": "5:47:29", "remaining_time": "0:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3689, "total_steps": 3836, "loss": 0.1378, "learning_rate": 2.004962894775281e-08, "epoch": 0.9615221711790962, "percentage": 96.17, "elapsed_time": "5:47:34", "remaining_time": "0:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3690, "total_steps": 3836, "loss": 0.1405, "learning_rate": 1.9778131743649064e-08, "epoch": 0.9617828169289414, "percentage": 96.19, "elapsed_time": "5:47:40", "remaining_time": "0:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3691, "total_steps": 3836, "loss": 0.1353, "learning_rate": 1.9508477998678442e-08, "epoch": 0.9620434626787867, "percentage": 96.22, "elapsed_time": "5:47:46", "remaining_time": "0:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3692, "total_steps": 3836, "loss": 0.1256, "learning_rate": 1.9240667913264233e-08, "epoch": 0.9623041084286319, "percentage": 96.25, "elapsed_time": "5:47:52", "remaining_time": "0:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3693, "total_steps": 3836, "loss": 0.1404, "learning_rate": 1.8974701686459985e-08, "epoch": 0.9625647541784772, "percentage": 96.27, "elapsed_time": "5:47:57", "remaining_time": "0:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3694, "total_steps": 3836, "loss": 0.1374, "learning_rate": 1.8710579515948957e-08, "epoch": 0.9628253999283224, "percentage": 96.3, "elapsed_time": "5:48:03", "remaining_time": "0:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3695, "total_steps": 3836, "loss": 0.1294, "learning_rate": 1.8448301598043838e-08, "epoch": 0.9630860456781677, "percentage": 96.32, "elapsed_time": "5:48:08", "remaining_time": "0:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3696, "total_steps": 3836, "loss": 0.1412, "learning_rate": 1.8187868127685914e-08, "epoch": 0.9633466914280129, "percentage": 96.35, "elapsed_time": "5:48:14", "remaining_time": "0:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3697, "total_steps": 3836, "loss": 0.1237, "learning_rate": 1.7929279298446177e-08, "epoch": 0.9636073371778582, "percentage": 96.38, "elapsed_time": "5:48:19", "remaining_time": "0:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3698, "total_steps": 3836, "loss": 0.1368, "learning_rate": 1.767253530252422e-08, "epoch": 0.9638679829277034, "percentage": 96.4, "elapsed_time": "5:48:25", "remaining_time": "0:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3699, "total_steps": 3836, "loss": 0.133, "learning_rate": 1.74176363307485e-08, "epoch": 0.9641286286775487, "percentage": 96.43, "elapsed_time": "5:48:31", "remaining_time": "0:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3700, "total_steps": 3836, "loss": 0.133, "learning_rate": 1.716458257257636e-08, "epoch": 0.9643892744273939, "percentage": 96.45, "elapsed_time": "5:48:36", "remaining_time": "0:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3701, "total_steps": 3836, "loss": 0.1378, "learning_rate": 1.6913374216093458e-08, "epoch": 0.9646499201772392, "percentage": 96.48, "elapsed_time": "5:48:42", "remaining_time": "0:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3702, "total_steps": 3836, "loss": 0.1315, "learning_rate": 1.666401144801405e-08, "epoch": 0.9649105659270844, "percentage": 96.51, "elapsed_time": "5:48:47", "remaining_time": "0:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3703, "total_steps": 3836, "loss": 0.1411, "learning_rate": 1.6416494453680156e-08, "epoch": 0.9651712116769295, "percentage": 96.53, "elapsed_time": "5:48:52", "remaining_time": "0:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3704, "total_steps": 3836, "loss": 0.1442, "learning_rate": 1.6170823417062386e-08, "epoch": 0.9654318574267748, "percentage": 96.56, "elapsed_time": "5:48:57", "remaining_time": "0:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3705, "total_steps": 3836, "loss": 0.1216, "learning_rate": 1.592699852075885e-08, "epoch": 0.96569250317662, "percentage": 96.58, "elapsed_time": "5:49:02", "remaining_time": "0:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3706, "total_steps": 3836, "loss": 0.1446, "learning_rate": 1.568501994599625e-08, "epoch": 0.9659531489264653, "percentage": 96.61, "elapsed_time": "5:49:08", "remaining_time": "0:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3707, "total_steps": 3836, "loss": 0.1384, "learning_rate": 1.5444887872627934e-08, "epoch": 0.9662137946763105, "percentage": 96.64, "elapsed_time": "5:49:14", "remaining_time": "0:12:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3708, "total_steps": 3836, "loss": 0.135, "learning_rate": 1.5206602479135857e-08, "epoch": 0.9664744404261558, "percentage": 96.66, "elapsed_time": "5:49:20", "remaining_time": "0:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3709, "total_steps": 3836, "loss": 0.1246, "learning_rate": 1.4970163942628623e-08, "epoch": 0.966735086176001, "percentage": 96.69, "elapsed_time": "5:49:26", "remaining_time": "0:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3710, "total_steps": 3836, "loss": 0.1341, "learning_rate": 1.4735572438842605e-08, "epoch": 0.9669957319258463, "percentage": 96.72, "elapsed_time": "5:49:31", "remaining_time": "0:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3711, "total_steps": 3836, "loss": 0.1392, "learning_rate": 1.45028281421411e-08, "epoch": 0.9672563776756915, "percentage": 96.74, "elapsed_time": "5:49:36", "remaining_time": "0:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3712, "total_steps": 3836, "loss": 0.13, "learning_rate": 1.4271931225514624e-08, "epoch": 0.9675170234255368, "percentage": 96.77, "elapsed_time": "5:49:42", "remaining_time": "0:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3713, "total_steps": 3836, "loss": 0.1321, "learning_rate": 1.4042881860580338e-08, "epoch": 0.967777669175382, "percentage": 96.79, "elapsed_time": "5:49:47", "remaining_time": "0:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3714, "total_steps": 3836, "loss": 0.1363, "learning_rate": 1.381568021758234e-08, "epoch": 0.9680383149252273, "percentage": 96.82, "elapsed_time": "5:49:53", "remaining_time": "0:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3715, "total_steps": 3836, "loss": 0.1353, "learning_rate": 1.3590326465391656e-08, "epoch": 0.9682989606750725, "percentage": 96.85, "elapsed_time": "5:49:59", "remaining_time": "0:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3716, "total_steps": 3836, "loss": 0.1441, "learning_rate": 1.336682077150514e-08, "epoch": 0.9685596064249178, "percentage": 96.87, "elapsed_time": "5:50:05", "remaining_time": "0:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3717, "total_steps": 3836, "loss": 0.1329, "learning_rate": 1.3145163302046849e-08, "epoch": 0.968820252174763, "percentage": 96.9, "elapsed_time": "5:50:11", "remaining_time": "0:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3718, "total_steps": 3836, "loss": 0.1373, "learning_rate": 1.2925354221766661e-08, "epoch": 0.9690808979246082, "percentage": 96.92, "elapsed_time": "5:50:16", "remaining_time": "0:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3719, "total_steps": 3836, "loss": 0.1255, "learning_rate": 1.2707393694040838e-08, "epoch": 0.9693415436744535, "percentage": 96.95, "elapsed_time": "5:50:21", "remaining_time": "0:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3720, "total_steps": 3836, "loss": 0.1268, "learning_rate": 1.2491281880871175e-08, "epoch": 0.9696021894242987, "percentage": 96.98, "elapsed_time": "5:50:27", "remaining_time": "0:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3721, "total_steps": 3836, "loss": 0.1337, "learning_rate": 1.2277018942885855e-08, "epoch": 0.969862835174144, "percentage": 97.0, "elapsed_time": "5:50:32", "remaining_time": "0:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3722, "total_steps": 3836, "loss": 0.1272, "learning_rate": 1.206460503933915e-08, "epoch": 0.9701234809239891, "percentage": 97.03, "elapsed_time": "5:50:38", "remaining_time": "0:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3723, "total_steps": 3836, "loss": 0.1389, "learning_rate": 1.185404032811005e-08, "epoch": 0.9703841266738344, "percentage": 97.05, "elapsed_time": "5:50:43", "remaining_time": "0:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3724, "total_steps": 3836, "loss": 0.1356, "learning_rate": 1.1645324965704473e-08, "epoch": 0.9706447724236796, "percentage": 97.08, "elapsed_time": "5:50:48", "remaining_time": "0:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3725, "total_steps": 3836, "loss": 0.1383, "learning_rate": 1.143845910725222e-08, "epoch": 0.9709054181735249, "percentage": 97.11, "elapsed_time": "5:50:54", "remaining_time": "0:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3726, "total_steps": 3836, "loss": 0.1426, "learning_rate": 1.1233442906509462e-08, "epoch": 0.9711660639233701, "percentage": 97.13, "elapsed_time": "5:50:59", "remaining_time": "0:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3727, "total_steps": 3836, "loss": 0.1379, "learning_rate": 1.1030276515857364e-08, "epoch": 0.9714267096732154, "percentage": 97.16, "elapsed_time": "5:51:05", "remaining_time": "0:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3728, "total_steps": 3836, "loss": 0.1302, "learning_rate": 1.0828960086302075e-08, "epoch": 0.9716873554230606, "percentage": 97.18, "elapsed_time": "5:51:11", "remaining_time": "0:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3729, "total_steps": 3836, "loss": 0.131, "learning_rate": 1.0629493767475019e-08, "epoch": 0.9719480011729059, "percentage": 97.21, "elapsed_time": "5:51:17", "remaining_time": "0:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3730, "total_steps": 3836, "loss": 0.1285, "learning_rate": 1.0431877707632043e-08, "epoch": 0.9722086469227511, "percentage": 97.24, "elapsed_time": "5:51:23", "remaining_time": "0:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3731, "total_steps": 3836, "loss": 0.1396, "learning_rate": 1.0236112053654267e-08, "epoch": 0.9724692926725964, "percentage": 97.26, "elapsed_time": "5:51:29", "remaining_time": "0:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3732, "total_steps": 3836, "loss": 0.1376, "learning_rate": 1.0042196951046968e-08, "epoch": 0.9727299384224416, "percentage": 97.29, "elapsed_time": "5:51:34", "remaining_time": "0:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3733, "total_steps": 3836, "loss": 0.1327, "learning_rate": 9.850132543940127e-09, "epoch": 0.9729905841722868, "percentage": 97.31, "elapsed_time": "5:51:39", "remaining_time": "0:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3734, "total_steps": 3836, "loss": 0.1424, "learning_rate": 9.659918975088444e-09, "epoch": 0.9732512299221321, "percentage": 97.34, "elapsed_time": "5:51:45", "remaining_time": "0:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3735, "total_steps": 3836, "loss": 0.1339, "learning_rate": 9.47155638587105e-09, "epoch": 0.9735118756719773, "percentage": 97.37, "elapsed_time": "5:51:51", "remaining_time": "0:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3736, "total_steps": 3836, "loss": 0.1428, "learning_rate": 9.285044916290675e-09, "epoch": 0.9737725214218226, "percentage": 97.39, "elapsed_time": "5:51:57", "remaining_time": "0:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3737, "total_steps": 3836, "loss": 0.1243, "learning_rate": 9.100384704974486e-09, "epoch": 0.9740331671716678, "percentage": 97.42, "elapsed_time": "5:52:02", "remaining_time": "0:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3738, "total_steps": 3836, "loss": 0.1356, "learning_rate": 8.91757588917408e-09, "epoch": 0.9742938129215131, "percentage": 97.45, "elapsed_time": "5:52:08", "remaining_time": "0:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3739, "total_steps": 3836, "loss": 0.1359, "learning_rate": 8.73661860476438e-09, "epoch": 0.9745544586713583, "percentage": 97.47, "elapsed_time": "5:52:14", "remaining_time": "0:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3740, "total_steps": 3836, "loss": 0.1312, "learning_rate": 8.557512986244464e-09, "epoch": 0.9748151044212036, "percentage": 97.5, "elapsed_time": "5:52:19", "remaining_time": "0:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3741, "total_steps": 3836, "loss": 0.1351, "learning_rate": 8.380259166736738e-09, "epoch": 0.9750757501710487, "percentage": 97.52, "elapsed_time": "5:52:24", "remaining_time": "0:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3742, "total_steps": 3836, "loss": 0.1383, "learning_rate": 8.20485727798831e-09, "epoch": 0.975336395920894, "percentage": 97.55, "elapsed_time": "5:52:30", "remaining_time": "0:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3743, "total_steps": 3836, "loss": 0.131, "learning_rate": 8.031307450368232e-09, "epoch": 0.9755970416707392, "percentage": 97.58, "elapsed_time": "5:52:35", "remaining_time": "0:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3744, "total_steps": 3836, "loss": 0.1351, "learning_rate": 7.85960981287026e-09, "epoch": 0.9758576874205845, "percentage": 97.6, "elapsed_time": "5:52:41", "remaining_time": "0:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3745, "total_steps": 3836, "loss": 0.1422, "learning_rate": 7.68976449311093e-09, "epoch": 0.9761183331704297, "percentage": 97.63, "elapsed_time": "5:52:46", "remaining_time": "0:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3746, "total_steps": 3836, "loss": 0.129, "learning_rate": 7.521771617330365e-09, "epoch": 0.976378978920275, "percentage": 97.65, "elapsed_time": "5:52:52", "remaining_time": "0:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3747, "total_steps": 3836, "loss": 0.1345, "learning_rate": 7.3556313103911865e-09, "epoch": 0.9766396246701202, "percentage": 97.68, "elapsed_time": "5:52:58", "remaining_time": "0:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3748, "total_steps": 3836, "loss": 0.1359, "learning_rate": 7.191343695779618e-09, "epoch": 0.9769002704199654, "percentage": 97.71, "elapsed_time": "5:53:04", "remaining_time": "0:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3749, "total_steps": 3836, "loss": 0.1214, "learning_rate": 7.028908895604647e-09, "epoch": 0.9771609161698107, "percentage": 97.73, "elapsed_time": "5:53:09", "remaining_time": "0:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3750, "total_steps": 3836, "loss": 0.1272, "learning_rate": 6.86832703059831e-09, "epoch": 0.9774215619196559, "percentage": 97.76, "elapsed_time": "5:53:15", "remaining_time": "0:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3751, "total_steps": 3836, "loss": 0.143, "learning_rate": 6.709598220115132e-09, "epoch": 0.9776822076695012, "percentage": 97.78, "elapsed_time": "5:53:21", "remaining_time": "0:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3752, "total_steps": 3836, "loss": 0.13, "learning_rate": 6.552722582132687e-09, "epoch": 0.9779428534193464, "percentage": 97.81, "elapsed_time": "5:53:27", "remaining_time": "0:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3753, "total_steps": 3836, "loss": 0.1238, "learning_rate": 6.397700233250759e-09, "epoch": 0.9782034991691917, "percentage": 97.84, "elapsed_time": "5:53:33", "remaining_time": "0:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3754, "total_steps": 3836, "loss": 0.1351, "learning_rate": 6.24453128869218e-09, "epoch": 0.9784641449190369, "percentage": 97.86, "elapsed_time": "5:53:38", "remaining_time": "0:07:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3755, "total_steps": 3836, "loss": 0.1472, "learning_rate": 6.0932158623014385e-09, "epoch": 0.9787247906688822, "percentage": 97.89, "elapsed_time": "5:53:44", "remaining_time": "0:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3756, "total_steps": 3836, "loss": 0.1287, "learning_rate": 5.94375406654607e-09, "epoch": 0.9789854364187274, "percentage": 97.91, "elapsed_time": "5:53:50", "remaining_time": "0:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3757, "total_steps": 3836, "loss": 0.1339, "learning_rate": 5.796146012515824e-09, "epoch": 0.9792460821685727, "percentage": 97.94, "elapsed_time": "5:53:56", "remaining_time": "0:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3758, "total_steps": 3836, "loss": 0.1279, "learning_rate": 5.650391809922107e-09, "epoch": 0.9795067279184179, "percentage": 97.97, "elapsed_time": "5:54:01", "remaining_time": "0:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3759, "total_steps": 3836, "loss": 0.1303, "learning_rate": 5.506491567098537e-09, "epoch": 0.9797673736682632, "percentage": 97.99, "elapsed_time": "5:54:07", "remaining_time": "0:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3760, "total_steps": 3836, "loss": 0.1354, "learning_rate": 5.364445391001228e-09, "epoch": 0.9800280194181084, "percentage": 98.02, "elapsed_time": "5:54:13", "remaining_time": "0:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3761, "total_steps": 3836, "loss": 0.1374, "learning_rate": 5.2242533872082225e-09, "epoch": 0.9802886651679537, "percentage": 98.04, "elapsed_time": "5:54:18", "remaining_time": "0:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3762, "total_steps": 3836, "loss": 0.1423, "learning_rate": 5.085915659918672e-09, "epoch": 0.9805493109177988, "percentage": 98.07, "elapsed_time": "5:54:24", "remaining_time": "0:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3763, "total_steps": 3836, "loss": 0.1285, "learning_rate": 4.949432311954494e-09, "epoch": 0.980809956667644, "percentage": 98.1, "elapsed_time": "5:54:30", "remaining_time": "0:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3764, "total_steps": 3836, "loss": 0.1341, "learning_rate": 4.814803444758431e-09, "epoch": 0.9810706024174893, "percentage": 98.12, "elapsed_time": "5:54:35", "remaining_time": "0:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3765, "total_steps": 3836, "loss": 0.1327, "learning_rate": 4.68202915839544e-09, "epoch": 0.9813312481673345, "percentage": 98.15, "elapsed_time": "5:54:41", "remaining_time": "0:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3766, "total_steps": 3836, "loss": 0.1322, "learning_rate": 4.551109551551581e-09, "epoch": 0.9815918939171798, "percentage": 98.18, "elapsed_time": "5:54:45", "remaining_time": "0:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3767, "total_steps": 3836, "loss": 0.1446, "learning_rate": 4.422044721534846e-09, "epoch": 0.981852539667025, "percentage": 98.2, "elapsed_time": "5:54:51", "remaining_time": "0:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3768, "total_steps": 3836, "loss": 0.1394, "learning_rate": 4.294834764274614e-09, "epoch": 0.9821131854168703, "percentage": 98.23, "elapsed_time": "5:54:56", "remaining_time": "0:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3769, "total_steps": 3836, "loss": 0.1215, "learning_rate": 4.1694797743210835e-09, "epoch": 0.9823738311667155, "percentage": 98.25, "elapsed_time": "5:55:02", "remaining_time": "0:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3770, "total_steps": 3836, "loss": 0.1308, "learning_rate": 4.04597984484667e-09, "epoch": 0.9826344769165608, "percentage": 98.28, "elapsed_time": "5:55:08", "remaining_time": "0:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3771, "total_steps": 3836, "loss": 0.1252, "learning_rate": 3.924335067643781e-09, "epoch": 0.982895122666406, "percentage": 98.31, "elapsed_time": "5:55:13", "remaining_time": "0:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3772, "total_steps": 3836, "loss": 0.1271, "learning_rate": 3.804545533126758e-09, "epoch": 0.9831557684162513, "percentage": 98.33, "elapsed_time": "5:55:20", "remaining_time": "0:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3773, "total_steps": 3836, "loss": 0.1325, "learning_rate": 3.6866113303307696e-09, "epoch": 0.9834164141660965, "percentage": 98.36, "elapsed_time": "5:55:25", "remaining_time": "0:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3774, "total_steps": 3836, "loss": 0.1337, "learning_rate": 3.5705325469123644e-09, "epoch": 0.9836770599159418, "percentage": 98.38, "elapsed_time": "5:55:30", "remaining_time": "0:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3775, "total_steps": 3836, "loss": 0.1311, "learning_rate": 3.456309269148361e-09, "epoch": 0.983937705665787, "percentage": 98.41, "elapsed_time": "5:55:36", "remaining_time": "0:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3776, "total_steps": 3836, "loss": 0.1362, "learning_rate": 3.3439415819369604e-09, "epoch": 0.9841983514156323, "percentage": 98.44, "elapsed_time": "5:55:42", "remaining_time": "0:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3777, "total_steps": 3836, "loss": 0.1284, "learning_rate": 3.2334295687969084e-09, "epoch": 0.9844589971654775, "percentage": 98.46, "elapsed_time": "5:55:47", "remaining_time": "0:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3778, "total_steps": 3836, "loss": 0.1356, "learning_rate": 3.124773311867779e-09, "epoch": 0.9847196429153227, "percentage": 98.49, "elapsed_time": "5:55:53", "remaining_time": "0:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3779, "total_steps": 3836, "loss": 0.1299, "learning_rate": 3.0179728919099703e-09, "epoch": 0.984980288665168, "percentage": 98.51, "elapsed_time": "5:55:58", "remaining_time": "0:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3780, "total_steps": 3836, "loss": 0.1311, "learning_rate": 2.9130283883044285e-09, "epoch": 0.9852409344150131, "percentage": 98.54, "elapsed_time": "5:56:04", "remaining_time": "0:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3781, "total_steps": 3836, "loss": 0.1225, "learning_rate": 2.8099398790520926e-09, "epoch": 0.9855015801648584, "percentage": 98.57, "elapsed_time": "5:56:10", "remaining_time": "0:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3782, "total_steps": 3836, "loss": 0.1346, "learning_rate": 2.70870744077556e-09, "epoch": 0.9857622259147036, "percentage": 98.59, "elapsed_time": "5:56:15", "remaining_time": "0:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3783, "total_steps": 3836, "loss": 0.1189, "learning_rate": 2.6093311487168647e-09, "epoch": 0.9860228716645489, "percentage": 98.62, "elapsed_time": "5:56:21", "remaining_time": "0:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3784, "total_steps": 3836, "loss": 0.1331, "learning_rate": 2.5118110767388682e-09, "epoch": 0.9862835174143941, "percentage": 98.64, "elapsed_time": "5:56:26", "remaining_time": "0:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3785, "total_steps": 3836, "loss": 0.1254, "learning_rate": 2.4161472973247004e-09, "epoch": 0.9865441631642394, "percentage": 98.67, "elapsed_time": "5:56:32", "remaining_time": "0:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3786, "total_steps": 3836, "loss": 0.136, "learning_rate": 2.322339881577762e-09, "epoch": 0.9868048089140846, "percentage": 98.7, "elapsed_time": "5:56:38", "remaining_time": "0:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3787, "total_steps": 3836, "loss": 0.1341, "learning_rate": 2.2303888992220026e-09, "epoch": 0.9870654546639299, "percentage": 98.72, "elapsed_time": "5:56:43", "remaining_time": "0:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3788, "total_steps": 3836, "loss": 0.1209, "learning_rate": 2.140294418600808e-09, "epoch": 0.9873261004137751, "percentage": 98.75, "elapsed_time": "5:56:49", "remaining_time": "0:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3789, "total_steps": 3836, "loss": 0.1263, "learning_rate": 2.0520565066783905e-09, "epoch": 0.9875867461636204, "percentage": 98.77, "elapsed_time": "5:56:54", "remaining_time": "0:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3790, "total_steps": 3836, "loss": 0.1314, "learning_rate": 1.965675229038677e-09, "epoch": 0.9878473919134656, "percentage": 98.8, "elapsed_time": "5:57:00", "remaining_time": "0:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3791, "total_steps": 3836, "loss": 0.1276, "learning_rate": 1.881150649886143e-09, "epoch": 0.9881080376633109, "percentage": 98.83, "elapsed_time": "5:57:05", "remaining_time": "0:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3792, "total_steps": 3836, "loss": 0.1408, "learning_rate": 1.7984828320444236e-09, "epoch": 0.9883686834131561, "percentage": 98.85, "elapsed_time": "5:57:11", "remaining_time": "0:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3793, "total_steps": 3836, "loss": 0.1443, "learning_rate": 1.7176718369574242e-09, "epoch": 0.9886293291630014, "percentage": 98.88, "elapsed_time": "5:57:16", "remaining_time": "0:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3794, "total_steps": 3836, "loss": 0.1338, "learning_rate": 1.6387177246893205e-09, "epoch": 0.9888899749128466, "percentage": 98.91, "elapsed_time": "5:57:21", "remaining_time": "0:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3795, "total_steps": 3836, "loss": 0.1212, "learning_rate": 1.5616205539240038e-09, "epoch": 0.9891506206626918, "percentage": 98.93, "elapsed_time": "5:57:27", "remaining_time": "0:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3796, "total_steps": 3836, "loss": 0.1388, "learning_rate": 1.486380381964525e-09, "epoch": 0.9894112664125371, "percentage": 98.96, "elapsed_time": "5:57:32", "remaining_time": "0:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3797, "total_steps": 3836, "loss": 0.1386, "learning_rate": 1.4129972647344836e-09, "epoch": 0.9896719121623823, "percentage": 98.98, "elapsed_time": "5:57:38", "remaining_time": "0:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3798, "total_steps": 3836, "loss": 0.1331, "learning_rate": 1.3414712567769161e-09, "epoch": 0.9899325579122276, "percentage": 99.01, "elapsed_time": "5:57:44", "remaining_time": "0:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3799, "total_steps": 3836, "loss": 0.1246, "learning_rate": 1.271802411254297e-09, "epoch": 0.9901932036620728, "percentage": 99.04, "elapsed_time": "5:57:49", "remaining_time": "0:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3800, "total_steps": 3836, "loss": 0.1286, "learning_rate": 1.2039907799490935e-09, "epoch": 0.990453849411918, "percentage": 99.06, "elapsed_time": "5:57:55", "remaining_time": "0:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3801, "total_steps": 3836, "loss": 0.1484, "learning_rate": 1.138036413263488e-09, "epoch": 0.9907144951617632, "percentage": 99.09, "elapsed_time": "5:58:00", "remaining_time": "0:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3802, "total_steps": 3836, "loss": 0.1272, "learning_rate": 1.0739393602185454e-09, "epoch": 0.9909751409116085, "percentage": 99.11, "elapsed_time": "5:58:06", "remaining_time": "0:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3803, "total_steps": 3836, "loss": 0.1333, "learning_rate": 1.0116996684556014e-09, "epoch": 0.9912357866614537, "percentage": 99.14, "elapsed_time": "5:58:13", "remaining_time": "0:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3804, "total_steps": 3836, "loss": 0.1303, "learning_rate": 9.513173842348732e-10, "epoch": 0.991496432411299, "percentage": 99.17, "elapsed_time": "5:58:19", "remaining_time": "0:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3805, "total_steps": 3836, "loss": 0.1291, "learning_rate": 8.927925524365721e-10, "epoch": 0.9917570781611442, "percentage": 99.19, "elapsed_time": "5:58:25", "remaining_time": "0:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3806, "total_steps": 3836, "loss": 0.1215, "learning_rate": 8.361252165597911e-10, "epoch": 0.9920177239109895, "percentage": 99.22, "elapsed_time": "5:58:29", "remaining_time": "0:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3807, "total_steps": 3836, "loss": 0.1318, "learning_rate": 7.813154187236161e-10, "epoch": 0.9922783696608347, "percentage": 99.24, "elapsed_time": "5:58:34", "remaining_time": "0:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3808, "total_steps": 3836, "loss": 0.142, "learning_rate": 7.283631996662933e-10, "epoch": 0.99253901541068, "percentage": 99.27, "elapsed_time": "5:58:40", "remaining_time": "0:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3809, "total_steps": 3836, "loss": 0.1272, "learning_rate": 6.772685987449512e-10, "epoch": 0.9927996611605252, "percentage": 99.3, "elapsed_time": "5:58:46", "remaining_time": "0:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3810, "total_steps": 3836, "loss": 0.1379, "learning_rate": 6.28031653936434e-10, "epoch": 0.9930603069103704, "percentage": 99.32, "elapsed_time": "5:58:51", "remaining_time": "0:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3811, "total_steps": 3836, "loss": 0.1275, "learning_rate": 5.806524018367454e-10, "epoch": 0.9933209526602157, "percentage": 99.35, "elapsed_time": "5:58:58", "remaining_time": "0:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3812, "total_steps": 3836, "loss": 0.1286, "learning_rate": 5.351308776613273e-10, "epoch": 0.9935815984100609, "percentage": 99.37, "elapsed_time": "5:59:03", "remaining_time": "0:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3813, "total_steps": 3836, "loss": 0.1551, "learning_rate": 4.914671152447814e-10, "epoch": 0.9938422441599062, "percentage": 99.4, "elapsed_time": "5:59:08", "remaining_time": "0:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3814, "total_steps": 3836, "loss": 0.1256, "learning_rate": 4.49661147040592e-10, "epoch": 0.9941028899097514, "percentage": 99.43, "elapsed_time": "5:59:15", "remaining_time": "0:02:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3815, "total_steps": 3836, "loss": 0.1332, "learning_rate": 4.0971300412140367e-10, "epoch": 0.9943635356595967, "percentage": 99.45, "elapsed_time": "5:59:21", "remaining_time": "0:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3816, "total_steps": 3836, "loss": 0.1395, "learning_rate": 3.7162271617985357e-10, "epoch": 0.9946241814094419, "percentage": 99.48, "elapsed_time": "5:59:26", "remaining_time": "0:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3817, "total_steps": 3836, "loss": 0.1345, "learning_rate": 3.3539031152635125e-10, "epoch": 0.9948848271592872, "percentage": 99.5, "elapsed_time": "5:59:32", "remaining_time": "0:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3818, "total_steps": 3836, "loss": 0.1372, "learning_rate": 3.0101581709185424e-10, "epoch": 0.9951454729091324, "percentage": 99.53, "elapsed_time": "5:59:38", "remaining_time": "0:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3819, "total_steps": 3836, "loss": 0.1323, "learning_rate": 2.684992584250923e-10, "epoch": 0.9954061186589777, "percentage": 99.56, "elapsed_time": "5:59:43", "remaining_time": "0:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3820, "total_steps": 3836, "loss": 0.129, "learning_rate": 2.3784065969451043e-10, "epoch": 0.9956667644088228, "percentage": 99.58, "elapsed_time": "5:59:49", "remaining_time": "0:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3821, "total_steps": 3836, "loss": 0.12, "learning_rate": 2.0904004368799136e-10, "epoch": 0.9959274101586681, "percentage": 99.61, "elapsed_time": "5:59:54", "remaining_time": "0:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3822, "total_steps": 3836, "loss": 0.1318, "learning_rate": 1.8209743181146766e-10, "epoch": 0.9961880559085133, "percentage": 99.64, "elapsed_time": "5:59:59", "remaining_time": "0:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3823, "total_steps": 3836, "loss": 0.1352, "learning_rate": 1.570128440908647e-10, "epoch": 0.9964487016583586, "percentage": 99.66, "elapsed_time": "6:00:05", "remaining_time": "0:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3824, "total_steps": 3836, "loss": 0.1392, "learning_rate": 1.3378629917015772e-10, "epoch": 0.9967093474082038, "percentage": 99.69, "elapsed_time": "6:00:11", "remaining_time": "0:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3825, "total_steps": 3836, "loss": 0.1437, "learning_rate": 1.1241781431303723e-10, "epoch": 0.996969993158049, "percentage": 99.71, "elapsed_time": "6:00:17", "remaining_time": "0:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3826, "total_steps": 3836, "loss": 0.1359, "learning_rate": 9.290740540207621e-11, "epoch": 0.9972306389078943, "percentage": 99.74, "elapsed_time": "6:00:22", "remaining_time": "0:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3827, "total_steps": 3836, "loss": 0.1285, "learning_rate": 7.525508693845274e-11, "epoch": 0.9974912846577395, "percentage": 99.77, "elapsed_time": "6:00:27", "remaining_time": "0:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3828, "total_steps": 3836, "loss": 0.1358, "learning_rate": 5.94608720427825e-11, "epoch": 0.9977519304075848, "percentage": 99.79, "elapsed_time": "6:00:33", "remaining_time": "0:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3829, "total_steps": 3836, "loss": 0.1397, "learning_rate": 4.5524772453731103e-11, "epoch": 0.99801257615743, "percentage": 99.82, "elapsed_time": "6:00:39", "remaining_time": "0:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3830, "total_steps": 3836, "loss": 0.1386, "learning_rate": 3.344679853023447e-11, "epoch": 0.9982732219072753, "percentage": 99.84, "elapsed_time": "6:00:44", "remaining_time": "0:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3831, "total_steps": 3836, "loss": 0.1268, "learning_rate": 2.322695924900087e-11, "epoch": 0.9985338676571205, "percentage": 99.87, "elapsed_time": "6:00:49", "remaining_time": "0:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3832, "total_steps": 3836, "loss": 0.1479, "learning_rate": 1.4865262205898678e-11, "epoch": 0.9987945134069658, "percentage": 99.9, "elapsed_time": "6:00:54", "remaining_time": "0:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3833, "total_steps": 3836, "loss": 0.1109, "learning_rate": 8.361713616233946e-12, "epoch": 0.999055159156811, "percentage": 99.92, "elapsed_time": "6:01:00", "remaining_time": "0:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3834, "total_steps": 3836, "loss": 0.1413, "learning_rate": 3.716318313640166e-12, "epoch": 0.9993158049066563, "percentage": 99.95, "elapsed_time": "6:01:05", "remaining_time": "0:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3835, "total_steps": 3836, "loss": 0.1332, "learning_rate": 9.290797511884998e-13, "epoch": 0.9995764506565015, "percentage": 99.97, "elapsed_time": "6:01:10", "remaining_time": "0:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3836, "total_steps": 3836, "loss": 0.1303, "learning_rate": 0.0, "epoch": 0.9998370964063468, "percentage": 100.0, "elapsed_time": "6:01:16", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3836, "total_steps": 3836, "epoch": 0.9998370964063468, "percentage": 100.0, "elapsed_time": "6:01:16", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}