sedrickkeh's picture
Training in progress, epoch 2
37c3f3a verified
{"current_steps": 10, "total_steps": 705, "loss": 0.7812, "lr": 5e-06, "epoch": 0.04239533651298357, "percentage": 1.42, "elapsed_time": "0:05:25", "remaining_time": "6:17:11"}
{"current_steps": 20, "total_steps": 705, "loss": 0.7056, "lr": 5e-06, "epoch": 0.08479067302596714, "percentage": 2.84, "elapsed_time": "0:10:45", "remaining_time": "6:08:39"}
{"current_steps": 30, "total_steps": 705, "loss": 0.6864, "lr": 5e-06, "epoch": 0.1271860095389507, "percentage": 4.26, "elapsed_time": "0:16:03", "remaining_time": "6:01:20"}
{"current_steps": 40, "total_steps": 705, "loss": 0.667, "lr": 5e-06, "epoch": 0.16958134605193428, "percentage": 5.67, "elapsed_time": "0:21:23", "remaining_time": "5:55:40"}
{"current_steps": 50, "total_steps": 705, "loss": 0.6614, "lr": 5e-06, "epoch": 0.21197668256491786, "percentage": 7.09, "elapsed_time": "0:26:40", "remaining_time": "5:49:31"}
{"current_steps": 60, "total_steps": 705, "loss": 0.6494, "lr": 5e-06, "epoch": 0.2543720190779014, "percentage": 8.51, "elapsed_time": "0:31:58", "remaining_time": "5:43:39"}
{"current_steps": 70, "total_steps": 705, "loss": 0.6484, "lr": 5e-06, "epoch": 0.296767355590885, "percentage": 9.93, "elapsed_time": "0:37:17", "remaining_time": "5:38:15"}
{"current_steps": 80, "total_steps": 705, "loss": 0.6363, "lr": 5e-06, "epoch": 0.33916269210386857, "percentage": 11.35, "elapsed_time": "0:42:33", "remaining_time": "5:32:28"}
{"current_steps": 90, "total_steps": 705, "loss": 0.6235, "lr": 5e-06, "epoch": 0.3815580286168522, "percentage": 12.77, "elapsed_time": "0:47:50", "remaining_time": "5:26:54"}
{"current_steps": 100, "total_steps": 705, "loss": 0.6281, "lr": 5e-06, "epoch": 0.4239533651298357, "percentage": 14.18, "elapsed_time": "0:53:09", "remaining_time": "5:21:38"}
{"current_steps": 110, "total_steps": 705, "loss": 0.6178, "lr": 5e-06, "epoch": 0.4663487016428193, "percentage": 15.6, "elapsed_time": "0:58:29", "remaining_time": "5:16:23"}
{"current_steps": 120, "total_steps": 705, "loss": 0.6124, "lr": 5e-06, "epoch": 0.5087440381558028, "percentage": 17.02, "elapsed_time": "1:03:50", "remaining_time": "5:11:11"}
{"current_steps": 130, "total_steps": 705, "loss": 0.6141, "lr": 5e-06, "epoch": 0.5511393746687865, "percentage": 18.44, "elapsed_time": "1:09:07", "remaining_time": "5:05:46"}
{"current_steps": 140, "total_steps": 705, "loss": 0.6075, "lr": 5e-06, "epoch": 0.59353471118177, "percentage": 19.86, "elapsed_time": "1:14:27", "remaining_time": "5:00:28"}
{"current_steps": 150, "total_steps": 705, "loss": 0.6058, "lr": 5e-06, "epoch": 0.6359300476947536, "percentage": 21.28, "elapsed_time": "1:19:48", "remaining_time": "4:55:17"}
{"current_steps": 160, "total_steps": 705, "loss": 0.6085, "lr": 5e-06, "epoch": 0.6783253842077371, "percentage": 22.7, "elapsed_time": "1:25:07", "remaining_time": "4:49:56"}
{"current_steps": 170, "total_steps": 705, "loss": 0.6041, "lr": 5e-06, "epoch": 0.7207207207207207, "percentage": 24.11, "elapsed_time": "1:30:25", "remaining_time": "4:44:34"}
{"current_steps": 180, "total_steps": 705, "loss": 0.5979, "lr": 5e-06, "epoch": 0.7631160572337043, "percentage": 25.53, "elapsed_time": "1:35:43", "remaining_time": "4:39:12"}
{"current_steps": 190, "total_steps": 705, "loss": 0.6059, "lr": 5e-06, "epoch": 0.8055113937466879, "percentage": 26.95, "elapsed_time": "1:41:05", "remaining_time": "4:33:59"}
{"current_steps": 200, "total_steps": 705, "loss": 0.6003, "lr": 5e-06, "epoch": 0.8479067302596714, "percentage": 28.37, "elapsed_time": "1:46:26", "remaining_time": "4:28:45"}
{"current_steps": 210, "total_steps": 705, "loss": 0.603, "lr": 5e-06, "epoch": 0.890302066772655, "percentage": 29.79, "elapsed_time": "1:51:45", "remaining_time": "4:23:25"}
{"current_steps": 220, "total_steps": 705, "loss": 0.5992, "lr": 5e-06, "epoch": 0.9326974032856385, "percentage": 31.21, "elapsed_time": "1:57:05", "remaining_time": "4:18:08"}
{"current_steps": 230, "total_steps": 705, "loss": 0.5889, "lr": 5e-06, "epoch": 0.9750927397986221, "percentage": 32.62, "elapsed_time": "2:02:25", "remaining_time": "4:12:50"}
{"current_steps": 235, "total_steps": 705, "eval_loss": 0.6008393168449402, "epoch": 0.9962904080551139, "percentage": 33.33, "elapsed_time": "2:07:53", "remaining_time": "4:15:46"}
{"current_steps": 240, "total_steps": 705, "loss": 0.6229, "lr": 5e-06, "epoch": 1.0206677265500794, "percentage": 34.04, "elapsed_time": "2:11:40", "remaining_time": "4:15:07"}
{"current_steps": 250, "total_steps": 705, "loss": 0.5427, "lr": 5e-06, "epoch": 1.063063063063063, "percentage": 35.46, "elapsed_time": "2:17:01", "remaining_time": "4:09:23"}
{"current_steps": 260, "total_steps": 705, "loss": 0.539, "lr": 5e-06, "epoch": 1.1054583995760465, "percentage": 36.88, "elapsed_time": "2:22:21", "remaining_time": "4:03:39"}
{"current_steps": 270, "total_steps": 705, "loss": 0.5482, "lr": 5e-06, "epoch": 1.1478537360890302, "percentage": 38.3, "elapsed_time": "2:27:42", "remaining_time": "3:57:58"}
{"current_steps": 280, "total_steps": 705, "loss": 0.5468, "lr": 5e-06, "epoch": 1.1902490726020138, "percentage": 39.72, "elapsed_time": "2:33:03", "remaining_time": "3:52:19"}
{"current_steps": 290, "total_steps": 705, "loss": 0.5423, "lr": 5e-06, "epoch": 1.2326444091149973, "percentage": 41.13, "elapsed_time": "2:38:24", "remaining_time": "3:46:41"}
{"current_steps": 300, "total_steps": 705, "loss": 0.5456, "lr": 5e-06, "epoch": 1.275039745627981, "percentage": 42.55, "elapsed_time": "2:43:41", "remaining_time": "3:40:59"}
{"current_steps": 310, "total_steps": 705, "loss": 0.5459, "lr": 5e-06, "epoch": 1.3174350821409644, "percentage": 43.97, "elapsed_time": "2:49:01", "remaining_time": "3:35:22"}
{"current_steps": 320, "total_steps": 705, "loss": 0.5489, "lr": 5e-06, "epoch": 1.359830418653948, "percentage": 45.39, "elapsed_time": "2:54:22", "remaining_time": "3:29:47"}
{"current_steps": 330, "total_steps": 705, "loss": 0.543, "lr": 5e-06, "epoch": 1.4022257551669317, "percentage": 46.81, "elapsed_time": "2:59:39", "remaining_time": "3:24:09"}
{"current_steps": 340, "total_steps": 705, "loss": 0.5441, "lr": 5e-06, "epoch": 1.4446210916799151, "percentage": 48.23, "elapsed_time": "3:04:56", "remaining_time": "3:18:32"}
{"current_steps": 350, "total_steps": 705, "loss": 0.5439, "lr": 5e-06, "epoch": 1.4870164281928988, "percentage": 49.65, "elapsed_time": "3:10:17", "remaining_time": "3:13:00"}
{"current_steps": 360, "total_steps": 705, "loss": 0.5354, "lr": 5e-06, "epoch": 1.5294117647058822, "percentage": 51.06, "elapsed_time": "3:15:37", "remaining_time": "3:07:28"}
{"current_steps": 370, "total_steps": 705, "loss": 0.5399, "lr": 5e-06, "epoch": 1.571807101218866, "percentage": 52.48, "elapsed_time": "3:20:58", "remaining_time": "3:01:57"}
{"current_steps": 380, "total_steps": 705, "loss": 0.5481, "lr": 5e-06, "epoch": 1.6142024377318496, "percentage": 53.9, "elapsed_time": "3:26:18", "remaining_time": "2:56:27"}
{"current_steps": 390, "total_steps": 705, "loss": 0.5411, "lr": 5e-06, "epoch": 1.6565977742448332, "percentage": 55.32, "elapsed_time": "3:31:39", "remaining_time": "2:50:56"}
{"current_steps": 400, "total_steps": 705, "loss": 0.5459, "lr": 5e-06, "epoch": 1.6989931107578167, "percentage": 56.74, "elapsed_time": "3:36:59", "remaining_time": "2:45:27"}
{"current_steps": 410, "total_steps": 705, "loss": 0.5402, "lr": 5e-06, "epoch": 1.7413884472708, "percentage": 58.16, "elapsed_time": "3:42:17", "remaining_time": "2:39:56"}
{"current_steps": 420, "total_steps": 705, "loss": 0.5364, "lr": 5e-06, "epoch": 1.7837837837837838, "percentage": 59.57, "elapsed_time": "3:47:36", "remaining_time": "2:34:27"}
{"current_steps": 430, "total_steps": 705, "loss": 0.5339, "lr": 5e-06, "epoch": 1.8261791202967674, "percentage": 60.99, "elapsed_time": "3:52:57", "remaining_time": "2:28:58"}
{"current_steps": 440, "total_steps": 705, "loss": 0.5395, "lr": 5e-06, "epoch": 1.8685744568097509, "percentage": 62.41, "elapsed_time": "3:58:17", "remaining_time": "2:23:31"}
{"current_steps": 450, "total_steps": 705, "loss": 0.5362, "lr": 5e-06, "epoch": 1.9109697933227345, "percentage": 63.83, "elapsed_time": "4:03:36", "remaining_time": "2:18:02"}
{"current_steps": 460, "total_steps": 705, "loss": 0.5468, "lr": 5e-06, "epoch": 1.953365129835718, "percentage": 65.25, "elapsed_time": "4:08:56", "remaining_time": "2:12:35"}
{"current_steps": 470, "total_steps": 705, "loss": 0.5378, "lr": 5e-06, "epoch": 1.9957604663487016, "percentage": 66.67, "elapsed_time": "4:14:17", "remaining_time": "2:07:08"}
{"current_steps": 470, "total_steps": 705, "eval_loss": 0.5872675180435181, "epoch": 1.9957604663487016, "percentage": 66.67, "elapsed_time": "4:17:10", "remaining_time": "2:08:35"}
{"current_steps": 480, "total_steps": 705, "loss": 0.5322, "lr": 5e-06, "epoch": 2.041335453100159, "percentage": 68.09, "elapsed_time": "4:23:40", "remaining_time": "2:03:35"}
{"current_steps": 490, "total_steps": 705, "loss": 0.4803, "lr": 5e-06, "epoch": 2.0837307896131425, "percentage": 69.5, "elapsed_time": "4:29:00", "remaining_time": "1:58:01"}
{"current_steps": 500, "total_steps": 705, "loss": 0.4798, "lr": 5e-06, "epoch": 2.126126126126126, "percentage": 70.92, "elapsed_time": "4:34:17", "remaining_time": "1:52:27"}
{"current_steps": 510, "total_steps": 705, "loss": 0.4835, "lr": 5e-06, "epoch": 2.16852146263911, "percentage": 72.34, "elapsed_time": "4:39:35", "remaining_time": "1:46:54"}
{"current_steps": 520, "total_steps": 705, "loss": 0.4882, "lr": 5e-06, "epoch": 2.210916799152093, "percentage": 73.76, "elapsed_time": "4:44:54", "remaining_time": "1:41:21"}
{"current_steps": 530, "total_steps": 705, "loss": 0.4915, "lr": 5e-06, "epoch": 2.2533121356650767, "percentage": 75.18, "elapsed_time": "4:50:14", "remaining_time": "1:35:50"}
{"current_steps": 540, "total_steps": 705, "loss": 0.4829, "lr": 5e-06, "epoch": 2.2957074721780604, "percentage": 76.6, "elapsed_time": "4:55:34", "remaining_time": "1:30:18"}
{"current_steps": 550, "total_steps": 705, "loss": 0.4853, "lr": 5e-06, "epoch": 2.338102808691044, "percentage": 78.01, "elapsed_time": "5:00:52", "remaining_time": "1:24:47"}
{"current_steps": 560, "total_steps": 705, "loss": 0.4841, "lr": 5e-06, "epoch": 2.3804981452040277, "percentage": 79.43, "elapsed_time": "5:06:12", "remaining_time": "1:19:17"}
{"current_steps": 570, "total_steps": 705, "loss": 0.4821, "lr": 5e-06, "epoch": 2.4228934817170114, "percentage": 80.85, "elapsed_time": "5:11:31", "remaining_time": "1:13:47"}
{"current_steps": 580, "total_steps": 705, "loss": 0.4951, "lr": 5e-06, "epoch": 2.4652888182299946, "percentage": 82.27, "elapsed_time": "5:16:50", "remaining_time": "1:08:17"}
{"current_steps": 590, "total_steps": 705, "loss": 0.4808, "lr": 5e-06, "epoch": 2.5076841547429782, "percentage": 83.69, "elapsed_time": "5:22:10", "remaining_time": "1:02:47"}
{"current_steps": 600, "total_steps": 705, "loss": 0.4858, "lr": 5e-06, "epoch": 2.550079491255962, "percentage": 85.11, "elapsed_time": "5:27:30", "remaining_time": "0:57:18"}
{"current_steps": 610, "total_steps": 705, "loss": 0.4862, "lr": 5e-06, "epoch": 2.5924748277689456, "percentage": 86.52, "elapsed_time": "5:32:49", "remaining_time": "0:51:50"}
{"current_steps": 620, "total_steps": 705, "loss": 0.4837, "lr": 5e-06, "epoch": 2.6348701642819288, "percentage": 87.94, "elapsed_time": "5:38:08", "remaining_time": "0:46:21"}
{"current_steps": 630, "total_steps": 705, "loss": 0.4863, "lr": 5e-06, "epoch": 2.6772655007949124, "percentage": 89.36, "elapsed_time": "5:43:26", "remaining_time": "0:40:53"}
{"current_steps": 640, "total_steps": 705, "loss": 0.4851, "lr": 5e-06, "epoch": 2.719660837307896, "percentage": 90.78, "elapsed_time": "5:48:43", "remaining_time": "0:35:25"}
{"current_steps": 650, "total_steps": 705, "loss": 0.4834, "lr": 5e-06, "epoch": 2.7620561738208798, "percentage": 92.2, "elapsed_time": "5:54:01", "remaining_time": "0:29:57"}
{"current_steps": 660, "total_steps": 705, "loss": 0.4813, "lr": 5e-06, "epoch": 2.8044515103338634, "percentage": 93.62, "elapsed_time": "5:59:20", "remaining_time": "0:24:30"}
{"current_steps": 670, "total_steps": 705, "loss": 0.4839, "lr": 5e-06, "epoch": 2.846846846846847, "percentage": 95.04, "elapsed_time": "6:04:41", "remaining_time": "0:19:03"}
{"current_steps": 680, "total_steps": 705, "loss": 0.4889, "lr": 5e-06, "epoch": 2.8892421833598303, "percentage": 96.45, "elapsed_time": "6:10:01", "remaining_time": "0:13:36"}
{"current_steps": 690, "total_steps": 705, "loss": 0.4859, "lr": 5e-06, "epoch": 2.931637519872814, "percentage": 97.87, "elapsed_time": "6:15:20", "remaining_time": "0:08:09"}
{"current_steps": 700, "total_steps": 705, "loss": 0.4895, "lr": 5e-06, "epoch": 2.9740328563857976, "percentage": 99.29, "elapsed_time": "6:20:41", "remaining_time": "0:02:43"}
{"current_steps": 705, "total_steps": 705, "eval_loss": 0.586609423160553, "epoch": 2.9952305246422894, "percentage": 100.0, "elapsed_time": "6:27:23", "remaining_time": "0:00:00"}
{"current_steps": 705, "total_steps": 705, "epoch": 2.9952305246422894, "percentage": 100.0, "elapsed_time": "6:28:59", "remaining_time": "0:00:00"}