{"current_steps": 5, "total_steps": 350, "loss": 0.9685, "learning_rate": 1.4285714285714285e-05, "epoch": 0.028429282160625444, "percentage": 1.43, "elapsed_time": "0:05:46", "remaining_time": "6:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 350, "loss": 0.5325, "learning_rate": 2.857142857142857e-05, "epoch": 0.05685856432125089, "percentage": 2.86, "elapsed_time": "0:11:34", "remaining_time": "6:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 350, "loss": 0.2362, "learning_rate": 4.2857142857142856e-05, "epoch": 0.08528784648187633, "percentage": 4.29, "elapsed_time": "0:17:22", "remaining_time": "6:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 350, "loss": 0.2163, "learning_rate": 5.714285714285714e-05, "epoch": 0.11371712864250177, "percentage": 5.71, "elapsed_time": "0:23:11", "remaining_time": "6:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 350, "loss": 0.2204, "learning_rate": 7.142857142857143e-05, "epoch": 0.14214641080312723, "percentage": 7.14, "elapsed_time": "0:29:00", "remaining_time": "6:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 350, "loss": 0.2098, "learning_rate": 8.571428571428571e-05, "epoch": 0.17057569296375266, "percentage": 8.57, "elapsed_time": "0:34:49", "remaining_time": "6:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 350, "loss": 0.1803, "learning_rate": 0.0001, "epoch": 0.19900497512437812, "percentage": 10.0, "elapsed_time": "0:40:37", "remaining_time": "6:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 350, "eval_loss": 0.16817478835582733, "epoch": 0.19900497512437812, "percentage": 10.0, "elapsed_time": "0:45:55", "remaining_time": "6:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 350, "loss": 0.1843, "learning_rate": 9.993784606094612e-05, "epoch": 0.22743425728500355, "percentage": 11.43, "elapsed_time": "0:51:49", "remaining_time": "6:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 350, "loss": 0.1751, "learning_rate": 9.975153876827008e-05, "epoch": 0.255863539445629, "percentage": 12.86, "elapsed_time": "0:57:37", "remaining_time": "6:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 350, "loss": 0.1722, "learning_rate": 9.944154131125642e-05, "epoch": 0.28429282160625446, "percentage": 14.29, "elapsed_time": "1:03:25", "remaining_time": "6:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 350, "loss": 0.165, "learning_rate": 9.900862439242719e-05, "epoch": 0.31272210376687987, "percentage": 15.71, "elapsed_time": "1:09:15", "remaining_time": "6:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 350, "loss": 0.1734, "learning_rate": 9.84538643114539e-05, "epoch": 0.3411513859275053, "percentage": 17.14, "elapsed_time": "1:15:06", "remaining_time": "6:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 350, "loss": 0.1476, "learning_rate": 9.777864028930705e-05, "epoch": 0.3695806680881308, "percentage": 18.57, "elapsed_time": "1:20:54", "remaining_time": "5:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 350, "loss": 0.1583, "learning_rate": 9.698463103929542e-05, "epoch": 0.39800995024875624, "percentage": 20.0, "elapsed_time": "1:26:41", "remaining_time": "5:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 350, "eval_loss": 0.15481097996234894, "epoch": 0.39800995024875624, "percentage": 20.0, "elapsed_time": "1:31:59", "remaining_time": "6:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 350, "loss": 0.1632, "learning_rate": 9.607381059352038e-05, "epoch": 0.42643923240938164, "percentage": 21.43, "elapsed_time": "1:37:50", "remaining_time": "5:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 350, "loss": 0.1503, "learning_rate": 9.504844339512095e-05, "epoch": 0.4548685145700071, "percentage": 22.86, "elapsed_time": "1:43:41", "remaining_time": "5:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 350, "loss": 0.1527, "learning_rate": 9.391107866851143e-05, "epoch": 0.48329779673063256, "percentage": 24.29, "elapsed_time": "1:49:28", "remaining_time": "5:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 350, "loss": 0.1523, "learning_rate": 9.266454408160779e-05, "epoch": 0.511727078891258, "percentage": 25.71, "elapsed_time": "1:55:17", "remaining_time": "5:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 350, "loss": 0.1512, "learning_rate": 9.131193871579975e-05, "epoch": 0.5401563610518835, "percentage": 27.14, "elapsed_time": "2:01:03", "remaining_time": "5:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 350, "loss": 0.1485, "learning_rate": 8.985662536114613e-05, "epoch": 0.5685856432125089, "percentage": 28.57, "elapsed_time": "2:06:52", "remaining_time": "5:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 350, "loss": 0.1439, "learning_rate": 8.83022221559489e-05, "epoch": 0.5970149253731343, "percentage": 30.0, "elapsed_time": "2:12:39", "remaining_time": "5:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 350, "eval_loss": 0.14900080859661102, "epoch": 0.5970149253731343, "percentage": 30.0, "elapsed_time": "2:17:57", "remaining_time": "5:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 350, "loss": 0.1459, "learning_rate": 8.665259359149132e-05, "epoch": 0.6254442075337597, "percentage": 31.43, "elapsed_time": "2:23:48", "remaining_time": "5:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 350, "loss": 0.1367, "learning_rate": 8.491184090430364e-05, "epoch": 0.6538734896943852, "percentage": 32.86, "elapsed_time": "2:29:37", "remaining_time": "5:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 350, "loss": 0.1468, "learning_rate": 8.308429187984297e-05, "epoch": 0.6823027718550106, "percentage": 34.29, "elapsed_time": "2:35:26", "remaining_time": "4:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 350, "loss": 0.1349, "learning_rate": 8.117449009293668e-05, "epoch": 0.7107320540156361, "percentage": 35.71, "elapsed_time": "2:41:13", "remaining_time": "4:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 350, "loss": 0.1411, "learning_rate": 7.91871836117395e-05, "epoch": 0.7391613361762616, "percentage": 37.14, "elapsed_time": "2:47:03", "remaining_time": "4:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 350, "loss": 0.1663, "learning_rate": 7.712731319328798e-05, "epoch": 0.767590618336887, "percentage": 38.57, "elapsed_time": "2:52:52", "remaining_time": "4:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 350, "loss": 0.1488, "learning_rate": 7.500000000000001e-05, "epoch": 0.7960199004975125, "percentage": 40.0, "elapsed_time": "2:58:42", "remaining_time": "4:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 350, "eval_loss": 0.13560061156749725, "epoch": 0.7960199004975125, "percentage": 40.0, "elapsed_time": "3:03:58", "remaining_time": "4:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 350, "loss": 0.1426, "learning_rate": 7.281053286765815e-05, "epoch": 0.8244491826581379, "percentage": 41.43, "elapsed_time": "3:09:48", "remaining_time": "4:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 350, "loss": 0.1542, "learning_rate": 7.056435515653059e-05, "epoch": 0.8528784648187633, "percentage": 42.86, "elapsed_time": "3:15:35", "remaining_time": "4:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 350, "loss": 0.1455, "learning_rate": 6.826705121831976e-05, "epoch": 0.8813077469793887, "percentage": 44.29, "elapsed_time": "3:21:25", "remaining_time": "4:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 350, "loss": 0.1376, "learning_rate": 6.592433251258423e-05, "epoch": 0.9097370291400142, "percentage": 45.71, "elapsed_time": "3:27:12", "remaining_time": "4:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 350, "loss": 0.1352, "learning_rate": 6.354202340715026e-05, "epoch": 0.9381663113006397, "percentage": 47.14, "elapsed_time": "3:32:59", "remaining_time": "3:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 350, "loss": 0.1402, "learning_rate": 6.112604669781572e-05, "epoch": 0.9665955934612651, "percentage": 48.57, "elapsed_time": "3:38:48", "remaining_time": "3:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 350, "loss": 0.1385, "learning_rate": 5.868240888334653e-05, "epoch": 0.9950248756218906, "percentage": 50.0, "elapsed_time": "3:44:37", "remaining_time": "3:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 350, "eval_loss": 0.136678546667099, "epoch": 0.9950248756218906, "percentage": 50.0, "elapsed_time": "3:49:55", "remaining_time": "3:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 350, "loss": 0.1232, "learning_rate": 5.621718523237427e-05, "epoch": 1.023454157782516, "percentage": 51.43, "elapsed_time": "3:55:40", "remaining_time": "3:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 350, "loss": 0.1148, "learning_rate": 5.373650467932122e-05, "epoch": 1.0518834399431414, "percentage": 52.86, "elapsed_time": "4:01:30", "remaining_time": "3:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 350, "loss": 0.1272, "learning_rate": 5.124653458690365e-05, "epoch": 1.080312722103767, "percentage": 54.29, "elapsed_time": "4:07:18", "remaining_time": "3:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 350, "loss": 0.111, "learning_rate": 4.875346541309637e-05, "epoch": 1.1087420042643923, "percentage": 55.71, "elapsed_time": "4:13:07", "remaining_time": "3:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 350, "loss": 0.1284, "learning_rate": 4.626349532067879e-05, "epoch": 1.1371712864250179, "percentage": 57.14, "elapsed_time": "4:18:54", "remaining_time": "3:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 350, "loss": 0.1214, "learning_rate": 4.378281476762576e-05, "epoch": 1.1656005685856432, "percentage": 58.57, "elapsed_time": "4:24:42", "remaining_time": "3:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 350, "loss": 0.1092, "learning_rate": 4.131759111665349e-05, "epoch": 1.1940298507462686, "percentage": 60.0, "elapsed_time": "4:30:29", "remaining_time": "3:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 350, "eval_loss": 0.13155004382133484, "epoch": 1.1940298507462686, "percentage": 60.0, "elapsed_time": "4:35:48", "remaining_time": "3:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 350, "loss": 0.1128, "learning_rate": 3.887395330218429e-05, "epoch": 1.2224591329068941, "percentage": 61.43, "elapsed_time": "4:41:38", "remaining_time": "2:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 350, "loss": 0.1064, "learning_rate": 3.6457976592849754e-05, "epoch": 1.2508884150675195, "percentage": 62.86, "elapsed_time": "4:47:26", "remaining_time": "2:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 350, "loss": 0.1146, "learning_rate": 3.4075667487415785e-05, "epoch": 1.279317697228145, "percentage": 64.29, "elapsed_time": "4:53:14", "remaining_time": "2:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 350, "loss": 0.1118, "learning_rate": 3.173294878168025e-05, "epoch": 1.3077469793887704, "percentage": 65.71, "elapsed_time": "4:59:02", "remaining_time": "2:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 350, "loss": 0.1183, "learning_rate": 2.9435644843469436e-05, "epoch": 1.336176261549396, "percentage": 67.14, "elapsed_time": "5:04:51", "remaining_time": "2:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 350, "loss": 0.1248, "learning_rate": 2.718946713234185e-05, "epoch": 1.3646055437100213, "percentage": 68.57, "elapsed_time": "5:10:40", "remaining_time": "2:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 350, "loss": 0.1282, "learning_rate": 2.500000000000001e-05, "epoch": 1.3930348258706466, "percentage": 70.0, "elapsed_time": "5:16:27", "remaining_time": "2:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 350, "eval_loss": 0.12762804329395294, "epoch": 1.3930348258706466, "percentage": 70.0, "elapsed_time": "5:21:43", "remaining_time": "2:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 350, "loss": 0.1147, "learning_rate": 2.2872686806712035e-05, "epoch": 1.4214641080312722, "percentage": 71.43, "elapsed_time": "5:27:34", "remaining_time": "2:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 350, "loss": 0.1116, "learning_rate": 2.0812816388260518e-05, "epoch": 1.4498933901918978, "percentage": 72.86, "elapsed_time": "5:33:21", "remaining_time": "2:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 350, "loss": 0.0991, "learning_rate": 1.8825509907063327e-05, "epoch": 1.4783226723525231, "percentage": 74.29, "elapsed_time": "5:39:09", "remaining_time": "1:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 350, "loss": 0.1137, "learning_rate": 1.691570812015704e-05, "epoch": 1.5067519545131485, "percentage": 75.71, "elapsed_time": "5:44:58", "remaining_time": "1:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 350, "loss": 0.12, "learning_rate": 1.5088159095696363e-05, "epoch": 1.535181236673774, "percentage": 77.14, "elapsed_time": "5:50:46", "remaining_time": "1:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 350, "loss": 0.1055, "learning_rate": 1.3347406408508695e-05, "epoch": 1.5636105188343994, "percentage": 78.57, "elapsed_time": "5:56:34", "remaining_time": "1:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 350, "loss": 0.1135, "learning_rate": 1.1697777844051105e-05, "epoch": 1.5920398009950247, "percentage": 80.0, "elapsed_time": "6:02:21", "remaining_time": "1:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 350, "eval_loss": 0.1305658519268036, "epoch": 1.5920398009950247, "percentage": 80.0, "elapsed_time": "6:07:39", "remaining_time": "1:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 350, "loss": 0.1153, "learning_rate": 1.0143374638853891e-05, "epoch": 1.6204690831556503, "percentage": 81.43, "elapsed_time": "6:13:33", "remaining_time": "1:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 350, "loss": 0.1137, "learning_rate": 8.688061284200266e-06, "epoch": 1.6488983653162759, "percentage": 82.86, "elapsed_time": "6:19:20", "remaining_time": "1:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 350, "loss": 0.1002, "learning_rate": 7.33545591839222e-06, "epoch": 1.6773276474769012, "percentage": 84.29, "elapsed_time": "6:25:09", "remaining_time": "1:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 350, "loss": 0.1159, "learning_rate": 6.088921331488568e-06, "epoch": 1.7057569296375266, "percentage": 85.71, "elapsed_time": "6:30:57", "remaining_time": "1:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 350, "loss": 0.1151, "learning_rate": 4.951556604879048e-06, "epoch": 1.7341862117981521, "percentage": 87.14, "elapsed_time": "6:36:44", "remaining_time": "0:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 350, "loss": 0.0968, "learning_rate": 3.9261894064796135e-06, "epoch": 1.7626154939587777, "percentage": 88.57, "elapsed_time": "6:42:35", "remaining_time": "0:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 350, "loss": 0.1071, "learning_rate": 3.0153689607045845e-06, "epoch": 1.7910447761194028, "percentage": 90.0, "elapsed_time": "6:48:23", "remaining_time": "0:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 350, "eval_loss": 0.13068035244941711, "epoch": 1.7910447761194028, "percentage": 90.0, "elapsed_time": "6:53:41", "remaining_time": "0:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 350, "loss": 0.1052, "learning_rate": 2.221359710692961e-06, "epoch": 1.8194740582800284, "percentage": 91.43, "elapsed_time": "6:59:32", "remaining_time": "0:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 350, "loss": 0.1098, "learning_rate": 1.5461356885461075e-06, "epoch": 1.847903340440654, "percentage": 92.86, "elapsed_time": "7:05:19", "remaining_time": "0:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 350, "loss": 0.1062, "learning_rate": 9.913756075728087e-07, "epoch": 1.8763326226012793, "percentage": 94.29, "elapsed_time": "7:11:06", "remaining_time": "0:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 350, "loss": 0.12, "learning_rate": 5.584586887435739e-07, "epoch": 1.9047619047619047, "percentage": 95.71, "elapsed_time": "7:16:54", "remaining_time": "0:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 350, "loss": 0.1109, "learning_rate": 2.4846123172992954e-07, "epoch": 1.9331911869225302, "percentage": 97.14, "elapsed_time": "7:22:44", "remaining_time": "0:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 350, "loss": 0.1168, "learning_rate": 6.215393905388278e-08, "epoch": 1.9616204690831558, "percentage": 98.57, "elapsed_time": "7:28:33", "remaining_time": "0:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 350, "loss": 0.1075, "learning_rate": 0.0, "epoch": 1.9900497512437811, "percentage": 100.0, "elapsed_time": "7:34:22", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 350, "eval_loss": 0.1294924020767212, "epoch": 1.9900497512437811, "percentage": 100.0, "elapsed_time": "7:39:38", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 350, "epoch": 1.9900497512437811, "percentage": 100.0, "elapsed_time": "7:39:41", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}