{"current_steps": 10, "total_steps": 410, "loss": 3.6679, "learning_rate": 1.2195121951219513e-05, "epoch": 0.02437538086532602, "percentage": 2.44, "elapsed_time": "0:02:03", "remaining_time": "1:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 410, "loss": 3.5098, "learning_rate": 2.4390243902439026e-05, "epoch": 0.04875076173065204, "percentage": 4.88, "elapsed_time": "0:04:06", "remaining_time": "1:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 410, "loss": 3.3353, "learning_rate": 3.6585365853658535e-05, "epoch": 0.07312614259597806, "percentage": 7.32, "elapsed_time": "0:06:08", "remaining_time": "1:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 410, "loss": 3.2341, "learning_rate": 4.878048780487805e-05, "epoch": 0.09750152346130408, "percentage": 9.76, "elapsed_time": "0:08:11", "remaining_time": "1:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 410, "loss": 3.1812, "learning_rate": 4.992664502959351e-05, "epoch": 0.1218769043266301, "percentage": 12.2, "elapsed_time": "0:10:14", "remaining_time": "1:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 410, "loss": 3.1662, "learning_rate": 4.967362490933723e-05, "epoch": 0.14625228519195613, "percentage": 14.63, "elapsed_time": "0:12:17", "remaining_time": "1:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 410, "loss": 3.0648, "learning_rate": 4.924186648858207e-05, "epoch": 0.17062766605728213, "percentage": 17.07, "elapsed_time": "0:14:19", "remaining_time": "1:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 410, "loss": 3.0025, "learning_rate": 4.863449747015384e-05, "epoch": 0.19500304692260817, "percentage": 19.51, "elapsed_time": "0:16:22", "remaining_time": "1:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 410, "loss": 2.9753, "learning_rate": 4.7855917698280054e-05, "epoch": 0.21937842778793418, "percentage": 21.95, "elapsed_time": "0:18:25", "remaining_time": "1:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 410, "loss": 3.0006, "learning_rate": 4.691176728566159e-05, "epoch": 0.2437538086532602, "percentage": 24.39, "elapsed_time": "0:20:28", "remaining_time": "1:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 410, "loss": 2.923, "learning_rate": 4.580888575591068e-05, "epoch": 0.2681291895185862, "percentage": 26.83, "elapsed_time": "0:22:30", "remaining_time": "1:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 410, "loss": 2.8956, "learning_rate": 4.455526249733178e-05, "epoch": 0.29250457038391225, "percentage": 29.27, "elapsed_time": "0:24:33", "remaining_time": "0:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 410, "loss": 2.8836, "learning_rate": 4.3159978886963226e-05, "epoch": 0.3168799512492383, "percentage": 31.71, "elapsed_time": "0:26:36", "remaining_time": "0:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 410, "loss": 2.8863, "learning_rate": 4.163314250413913e-05, "epoch": 0.34125533211456427, "percentage": 34.15, "elapsed_time": "0:28:39", "remaining_time": "0:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 410, "loss": 2.9099, "learning_rate": 3.9985813910135304e-05, "epoch": 0.3656307129798903, "percentage": 36.59, "elapsed_time": "0:30:41", "remaining_time": "0:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 410, "loss": 2.8218, "learning_rate": 3.8229926524315016e-05, "epoch": 0.39000609384521634, "percentage": 39.02, "elapsed_time": "0:32:44", "remaining_time": "0:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 410, "loss": 2.7813, "learning_rate": 3.6378200177200224e-05, "epoch": 0.4143814747105424, "percentage": 41.46, "elapsed_time": "0:34:47", "remaining_time": "0:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 410, "loss": 2.8867, "learning_rate": 3.444404896669865e-05, "epoch": 0.43875685557586835, "percentage": 43.9, "elapsed_time": "0:36:49", "remaining_time": "0:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 410, "loss": 2.8076, "learning_rate": 3.2441484084985865e-05, "epoch": 0.4631322364411944, "percentage": 46.34, "elapsed_time": "0:38:52", "remaining_time": "0:45:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 410, "loss": 2.8486, "learning_rate": 3.0385012319974537e-05, "epoch": 0.4875076173065204, "percentage": 48.78, "elapsed_time": "0:40:55", "remaining_time": "0:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 410, "loss": 2.7986, "learning_rate": 2.8289530966636625e-05, "epoch": 0.5118829981718465, "percentage": 51.22, "elapsed_time": "0:42:58", "remaining_time": "0:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 410, "loss": 2.792, "learning_rate": 2.617021990945197e-05, "epoch": 0.5362583790371724, "percentage": 53.66, "elapsed_time": "0:45:00", "remaining_time": "0:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 410, "loss": 2.836, "learning_rate": 2.4042431657749117e-05, "epoch": 0.5606337599024985, "percentage": 56.1, "elapsed_time": "0:47:03", "remaining_time": "0:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 410, "loss": 2.7748, "learning_rate": 2.1921580130533827e-05, "epoch": 0.5850091407678245, "percentage": 58.54, "elapsed_time": "0:49:06", "remaining_time": "0:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 410, "loss": 2.7994, "learning_rate": 1.9823028996459486e-05, "epoch": 0.6093845216331505, "percentage": 60.98, "elapsed_time": "0:51:09", "remaining_time": "0:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 410, "loss": 2.7459, "learning_rate": 1.7761980377816287e-05, "epoch": 0.6337599024984766, "percentage": 63.41, "elapsed_time": "0:53:11", "remaining_time": "0:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 410, "loss": 2.8381, "learning_rate": 1.5753364724779092e-05, "epoch": 0.6581352833638026, "percentage": 65.85, "elapsed_time": "0:55:14", "remaining_time": "0:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 410, "loss": 2.7299, "learning_rate": 1.381173265767623e-05, "epoch": 0.6825106642291285, "percentage": 68.29, "elapsed_time": "0:57:17", "remaining_time": "0:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 410, "loss": 2.7464, "learning_rate": 1.1951149560785167e-05, "epoch": 0.7068860450944546, "percentage": 70.73, "elapsed_time": "0:59:20", "remaining_time": "0:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 410, "loss": 2.7119, "learning_rate": 1.0185093691228534e-05, "epoch": 0.7312614259597806, "percentage": 73.17, "elapsed_time": "1:01:22", "remaining_time": "0:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 410, "loss": 2.6856, "learning_rate": 8.526358541080173e-06, "epoch": 0.7556368068251066, "percentage": 75.61, "elapsed_time": "1:03:25", "remaining_time": "0:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 410, "loss": 2.71, "learning_rate": 6.986960159980327e-06, "epoch": 0.7800121876904327, "percentage": 78.05, "elapsed_time": "1:05:28", "remaining_time": "0:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 410, "loss": 3.6679, "learning_rate": 1.2195121951219513e-05, "epoch": 0.02437538086532602, "percentage": 2.44, "elapsed_time": "0:02:04", "remaining_time": "1:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 410, "loss": 3.5098, "learning_rate": 2.4390243902439026e-05, "epoch": 0.04875076173065204, "percentage": 4.88, "elapsed_time": "0:04:09", "remaining_time": "1:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 410, "loss": 3.3353, "learning_rate": 3.6585365853658535e-05, "epoch": 0.07312614259597806, "percentage": 7.32, "elapsed_time": "0:06:13", "remaining_time": "1:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 410, "loss": 3.2342, "learning_rate": 4.878048780487805e-05, "epoch": 0.09750152346130408, "percentage": 9.76, "elapsed_time": "0:08:18", "remaining_time": "1:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 410, "loss": 3.1812, "learning_rate": 4.992664502959351e-05, "epoch": 0.1218769043266301, "percentage": 12.2, "elapsed_time": "0:10:22", "remaining_time": "1:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 410, "loss": 3.1661, "learning_rate": 4.967362490933723e-05, "epoch": 0.14625228519195613, "percentage": 14.63, "elapsed_time": "0:12:27", "remaining_time": "1:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 410, "loss": 3.0649, "learning_rate": 4.924186648858207e-05, "epoch": 0.17062766605728213, "percentage": 17.07, "elapsed_time": "0:14:32", "remaining_time": "1:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 410, "loss": 3.0024, "learning_rate": 4.863449747015384e-05, "epoch": 0.19500304692260817, "percentage": 19.51, "elapsed_time": "0:16:36", "remaining_time": "1:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 410, "loss": 2.9751, "learning_rate": 4.7855917698280054e-05, "epoch": 0.21937842778793418, "percentage": 21.95, "elapsed_time": "0:18:41", "remaining_time": "1:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 410, "loss": 3.0007, "learning_rate": 4.691176728566159e-05, "epoch": 0.2437538086532602, "percentage": 24.39, "elapsed_time": "0:20:45", "remaining_time": "1:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 410, "loss": 2.9229, "learning_rate": 4.580888575591068e-05, "epoch": 0.2681291895185862, "percentage": 26.83, "elapsed_time": "0:22:50", "remaining_time": "1:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 410, "loss": 2.8955, "learning_rate": 4.455526249733178e-05, "epoch": 0.29250457038391225, "percentage": 29.27, "elapsed_time": "0:24:54", "remaining_time": "1:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 410, "loss": 2.8837, "learning_rate": 4.3159978886963226e-05, "epoch": 0.3168799512492383, "percentage": 31.71, "elapsed_time": "0:26:59", "remaining_time": "0:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 410, "loss": 2.8862, "learning_rate": 4.163314250413913e-05, "epoch": 0.34125533211456427, "percentage": 34.15, "elapsed_time": "0:29:04", "remaining_time": "0:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 410, "loss": 2.9099, "learning_rate": 3.9985813910135304e-05, "epoch": 0.3656307129798903, "percentage": 36.59, "elapsed_time": "0:31:08", "remaining_time": "0:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 410, "loss": 2.8219, "learning_rate": 3.8229926524315016e-05, "epoch": 0.39000609384521634, "percentage": 39.02, "elapsed_time": "0:33:13", "remaining_time": "0:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 410, "loss": 2.7811, "learning_rate": 3.6378200177200224e-05, "epoch": 0.4143814747105424, "percentage": 41.46, "elapsed_time": "0:35:17", "remaining_time": "0:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 410, "loss": 2.8869, "learning_rate": 3.444404896669865e-05, "epoch": 0.43875685557586835, "percentage": 43.9, "elapsed_time": "0:37:22", "remaining_time": "0:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 410, "loss": 2.8078, "learning_rate": 3.2441484084985865e-05, "epoch": 0.4631322364411944, "percentage": 46.34, "elapsed_time": "0:39:27", "remaining_time": "0:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 410, "loss": 2.8488, "learning_rate": 3.0385012319974537e-05, "epoch": 0.4875076173065204, "percentage": 48.78, "elapsed_time": "0:41:31", "remaining_time": "0:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 410, "loss": 2.7989, "learning_rate": 2.8289530966636625e-05, "epoch": 0.5118829981718465, "percentage": 51.22, "elapsed_time": "0:43:36", "remaining_time": "0:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 410, "loss": 2.7921, "learning_rate": 2.617021990945197e-05, "epoch": 0.5362583790371724, "percentage": 53.66, "elapsed_time": "0:45:40", "remaining_time": "0:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 410, "loss": 2.8359, "learning_rate": 2.4042431657749117e-05, "epoch": 0.5606337599024985, "percentage": 56.1, "elapsed_time": "0:47:45", "remaining_time": "0:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 410, "loss": 2.7748, "learning_rate": 2.1921580130533827e-05, "epoch": 0.5850091407678245, "percentage": 58.54, "elapsed_time": "0:49:50", "remaining_time": "0:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 410, "loss": 2.7994, "learning_rate": 1.9823028996459486e-05, "epoch": 0.6093845216331505, "percentage": 60.98, "elapsed_time": "0:51:54", "remaining_time": "0:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 410, "loss": 2.7459, "learning_rate": 1.7761980377816287e-05, "epoch": 0.6337599024984766, "percentage": 63.41, "elapsed_time": "0:53:59", "remaining_time": "0:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 410, "loss": 2.838, "learning_rate": 1.5753364724779092e-05, "epoch": 0.6581352833638026, "percentage": 65.85, "elapsed_time": "0:56:03", "remaining_time": "0:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 410, "loss": 2.7298, "learning_rate": 1.381173265767623e-05, "epoch": 0.6825106642291285, "percentage": 68.29, "elapsed_time": "0:58:08", "remaining_time": "0:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 410, "loss": 2.7464, "learning_rate": 1.1951149560785167e-05, "epoch": 0.7068860450944546, "percentage": 70.73, "elapsed_time": "1:00:12", "remaining_time": "0:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 410, "loss": 2.7118, "learning_rate": 1.0185093691228534e-05, "epoch": 0.7312614259597806, "percentage": 73.17, "elapsed_time": "1:02:17", "remaining_time": "0:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 410, "loss": 2.6857, "learning_rate": 8.526358541080173e-06, "epoch": 0.7556368068251066, "percentage": 75.61, "elapsed_time": "1:04:21", "remaining_time": "0:20:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 410, "loss": 2.71, "learning_rate": 6.986960159980327e-06, "epoch": 0.7800121876904327, "percentage": 78.05, "elapsed_time": "1:06:26", "remaining_time": "0:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 410, "loss": 2.8041, "learning_rate": 5.578050109624511e-06, "epoch": 0.8043875685557587, "percentage": 80.49, "elapsed_time": "1:08:31", "remaining_time": "0:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 410, "loss": 2.6818, "learning_rate": 4.309834680692832e-06, "epoch": 0.8287629494210847, "percentage": 82.93, "elapsed_time": "1:10:35", "remaining_time": "0:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 410, "loss": 2.6666, "learning_rate": 3.1915009574206262e-06, "epoch": 0.8531383302864107, "percentage": 85.37, "elapsed_time": "1:12:40", "remaining_time": "0:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 410, "loss": 2.7277, "learning_rate": 2.231150265406512e-06, "epoch": 0.8775137111517367, "percentage": 87.8, "elapsed_time": "1:14:44", "remaining_time": "0:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 410, "loss": 2.7256, "learning_rate": 1.435739484768603e-06, "epoch": 0.9018890920170628, "percentage": 90.24, "elapsed_time": "1:16:49", "remaining_time": "0:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 410, "loss": 2.7143, "learning_rate": 8.110306537826601e-07, "epoch": 0.9262644728823888, "percentage": 92.68, "elapsed_time": "1:18:54", "remaining_time": "0:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 410, "loss": 2.7688, "learning_rate": 3.6154922807863643e-07, "epoch": 0.9506398537477148, "percentage": 95.12, "elapsed_time": "1:20:58", "remaining_time": "0:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 410, "loss": 2.7355, "learning_rate": 9.055129777021665e-08, "epoch": 0.9750152346130408, "percentage": 97.56, "elapsed_time": "1:23:03", "remaining_time": "0:02:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 410, "loss": 2.751, "learning_rate": 0.0, "epoch": 0.9993906154783668, "percentage": 100.0, "elapsed_time": "1:25:07", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 410, "epoch": 0.9993906154783668, "percentage": 100.0, "elapsed_time": "1:25:09", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}