|
{"current_steps": 1, "total_steps": 855, "loss": 0.057, "lr": 1.1627906976744186e-06, "epoch": 0.005822416302765648, "percentage": 0.12, "elapsed_time": "0:00:11", "remaining_time": "2:49:14"} |
|
{"current_steps": 2, "total_steps": 855, "loss": 0.0549, "lr": 2.325581395348837e-06, "epoch": 0.011644832605531296, "percentage": 0.23, "elapsed_time": "0:00:22", "remaining_time": "2:37:16"} |
|
{"current_steps": 3, "total_steps": 855, "loss": 0.0583, "lr": 3.488372093023256e-06, "epoch": 0.017467248908296942, "percentage": 0.35, "elapsed_time": "0:00:32", "remaining_time": "2:34:14"} |
|
{"current_steps": 4, "total_steps": 855, "loss": 0.0543, "lr": 4.651162790697674e-06, "epoch": 0.023289665211062592, "percentage": 0.47, "elapsed_time": "0:00:42", "remaining_time": "2:31:44"} |
|
{"current_steps": 5, "total_steps": 855, "loss": 0.0536, "lr": 5.8139534883720935e-06, "epoch": 0.02911208151382824, "percentage": 0.58, "elapsed_time": "0:00:53", "remaining_time": "2:30:43"} |
|
{"current_steps": 5, "total_steps": 855, "eval_loss": 0.05216066539287567, "epoch": 0.02911208151382824, "percentage": 0.58, "elapsed_time": "0:00:58", "remaining_time": "2:46:34"} |
|
{"current_steps": 6, "total_steps": 855, "loss": 0.0538, "lr": 6.976744186046512e-06, "epoch": 0.034934497816593885, "percentage": 0.7, "elapsed_time": "0:01:09", "remaining_time": "2:43:00"} |
|
{"current_steps": 7, "total_steps": 855, "loss": 0.0524, "lr": 8.139534883720931e-06, "epoch": 0.040756914119359534, "percentage": 0.82, "elapsed_time": "0:01:19", "remaining_time": "2:40:27"} |
|
{"current_steps": 8, "total_steps": 855, "loss": 0.0461, "lr": 9.302325581395349e-06, "epoch": 0.046579330422125184, "percentage": 0.94, "elapsed_time": "0:01:30", "remaining_time": "2:39:12"} |
|
{"current_steps": 9, "total_steps": 855, "loss": 0.0422, "lr": 1.0465116279069768e-05, "epoch": 0.05240174672489083, "percentage": 1.05, "elapsed_time": "0:01:40", "remaining_time": "2:37:41"} |
|
{"current_steps": 10, "total_steps": 855, "loss": 0.0383, "lr": 1.1627906976744187e-05, "epoch": 0.05822416302765648, "percentage": 1.17, "elapsed_time": "0:01:50", "remaining_time": "2:36:04"} |
|
{"current_steps": 10, "total_steps": 855, "eval_loss": 0.03332599997520447, "epoch": 0.05822416302765648, "percentage": 1.17, "elapsed_time": "0:01:56", "remaining_time": "2:43:55"} |
|
{"current_steps": 11, "total_steps": 855, "loss": 0.0335, "lr": 1.2790697674418606e-05, "epoch": 0.06404657933042213, "percentage": 1.29, "elapsed_time": "0:02:06", "remaining_time": "2:42:17"} |
|
{"current_steps": 12, "total_steps": 855, "loss": 0.0298, "lr": 1.3953488372093024e-05, "epoch": 0.06986899563318777, "percentage": 1.4, "elapsed_time": "0:02:17", "remaining_time": "2:40:53"} |
|
{"current_steps": 13, "total_steps": 855, "loss": 0.0285, "lr": 1.5116279069767441e-05, "epoch": 0.07569141193595343, "percentage": 1.52, "elapsed_time": "0:02:27", "remaining_time": "2:39:33"} |
|
{"current_steps": 14, "total_steps": 855, "loss": 0.0234, "lr": 1.6279069767441862e-05, "epoch": 0.08151382823871907, "percentage": 1.64, "elapsed_time": "0:02:38", "remaining_time": "2:38:18"} |
|
{"current_steps": 15, "total_steps": 855, "loss": 0.0217, "lr": 1.744186046511628e-05, "epoch": 0.08733624454148471, "percentage": 1.75, "elapsed_time": "0:02:48", "remaining_time": "2:37:14"} |
|
{"current_steps": 15, "total_steps": 855, "eval_loss": 0.021105380728840828, "epoch": 0.08733624454148471, "percentage": 1.75, "elapsed_time": "0:02:54", "remaining_time": "2:42:27"} |
|
{"current_steps": 16, "total_steps": 855, "loss": 0.0218, "lr": 1.8604651162790697e-05, "epoch": 0.09315866084425037, "percentage": 1.87, "elapsed_time": "0:03:04", "remaining_time": "2:41:13"} |
|
{"current_steps": 17, "total_steps": 855, "loss": 0.0207, "lr": 1.9767441860465116e-05, "epoch": 0.09898107714701601, "percentage": 1.99, "elapsed_time": "0:03:14", "remaining_time": "2:40:05"} |
|
{"current_steps": 18, "total_steps": 855, "loss": 0.0201, "lr": 2.0930232558139536e-05, "epoch": 0.10480349344978165, "percentage": 2.11, "elapsed_time": "0:03:25", "remaining_time": "2:39:00"} |
|
{"current_steps": 19, "total_steps": 855, "loss": 0.0205, "lr": 2.2093023255813955e-05, "epoch": 0.11062590975254731, "percentage": 2.22, "elapsed_time": "0:03:35", "remaining_time": "2:38:03"} |
|
{"current_steps": 20, "total_steps": 855, "loss": 0.0192, "lr": 2.3255813953488374e-05, "epoch": 0.11644832605531295, "percentage": 2.34, "elapsed_time": "0:03:46", "remaining_time": "2:37:18"} |
|
{"current_steps": 20, "total_steps": 855, "eval_loss": 0.015968428924679756, "epoch": 0.11644832605531295, "percentage": 2.34, "elapsed_time": "0:03:51", "remaining_time": "2:41:17"} |
|
{"current_steps": 21, "total_steps": 855, "loss": 0.0169, "lr": 2.441860465116279e-05, "epoch": 0.1222707423580786, "percentage": 2.46, "elapsed_time": "0:04:02", "remaining_time": "2:40:17"} |
|
{"current_steps": 22, "total_steps": 855, "loss": 0.0158, "lr": 2.5581395348837212e-05, "epoch": 0.12809315866084425, "percentage": 2.57, "elapsed_time": "0:04:12", "remaining_time": "2:39:18"} |
|
{"current_steps": 23, "total_steps": 855, "loss": 0.0147, "lr": 2.674418604651163e-05, "epoch": 0.1339155749636099, "percentage": 2.69, "elapsed_time": "0:04:22", "remaining_time": "2:38:30"} |
|
{"current_steps": 24, "total_steps": 855, "loss": 0.0148, "lr": 2.7906976744186048e-05, "epoch": 0.13973799126637554, "percentage": 2.81, "elapsed_time": "0:04:33", "remaining_time": "2:37:45"} |
|
{"current_steps": 25, "total_steps": 855, "loss": 0.0144, "lr": 2.9069767441860467e-05, "epoch": 0.14556040756914118, "percentage": 2.92, "elapsed_time": "0:04:43", "remaining_time": "2:37:03"} |
|
{"current_steps": 25, "total_steps": 855, "eval_loss": 0.013340415433049202, "epoch": 0.14556040756914118, "percentage": 2.92, "elapsed_time": "0:04:49", "remaining_time": "2:40:10"} |
|
{"current_steps": 26, "total_steps": 855, "loss": 0.0144, "lr": 3.0232558139534883e-05, "epoch": 0.15138282387190685, "percentage": 3.04, "elapsed_time": "0:04:59", "remaining_time": "2:39:15"} |
|
{"current_steps": 27, "total_steps": 855, "loss": 0.0147, "lr": 3.13953488372093e-05, "epoch": 0.1572052401746725, "percentage": 3.16, "elapsed_time": "0:05:10", "remaining_time": "2:38:28"} |
|
{"current_steps": 28, "total_steps": 855, "loss": 0.0132, "lr": 3.2558139534883724e-05, "epoch": 0.16302765647743814, "percentage": 3.27, "elapsed_time": "0:05:20", "remaining_time": "2:37:46"} |
|
{"current_steps": 29, "total_steps": 855, "loss": 0.0131, "lr": 3.372093023255814e-05, "epoch": 0.16885007278020378, "percentage": 3.39, "elapsed_time": "0:05:30", "remaining_time": "2:37:06"} |
|
{"current_steps": 30, "total_steps": 855, "loss": 0.0127, "lr": 3.488372093023256e-05, "epoch": 0.17467248908296942, "percentage": 3.51, "elapsed_time": "0:05:41", "remaining_time": "2:36:26"} |
|
{"current_steps": 30, "total_steps": 855, "eval_loss": 0.011912389658391476, "epoch": 0.17467248908296942, "percentage": 3.51, "elapsed_time": "0:05:46", "remaining_time": "2:39:00"} |
|
{"current_steps": 31, "total_steps": 855, "loss": 0.0136, "lr": 3.604651162790698e-05, "epoch": 0.1804949053857351, "percentage": 3.63, "elapsed_time": "0:05:57", "remaining_time": "2:38:18"} |
|
{"current_steps": 32, "total_steps": 855, "loss": 0.013, "lr": 3.7209302325581394e-05, "epoch": 0.18631732168850074, "percentage": 3.74, "elapsed_time": "0:06:07", "remaining_time": "2:37:35"} |
|
{"current_steps": 33, "total_steps": 855, "loss": 0.0137, "lr": 3.837209302325582e-05, "epoch": 0.19213973799126638, "percentage": 3.86, "elapsed_time": "0:06:17", "remaining_time": "2:36:55"} |
|
{"current_steps": 34, "total_steps": 855, "loss": 0.0127, "lr": 3.953488372093023e-05, "epoch": 0.19796215429403202, "percentage": 3.98, "elapsed_time": "0:06:28", "remaining_time": "2:36:15"} |
|
{"current_steps": 35, "total_steps": 855, "loss": 0.0113, "lr": 4.0697674418604655e-05, "epoch": 0.20378457059679767, "percentage": 4.09, "elapsed_time": "0:06:38", "remaining_time": "2:35:43"} |
|
{"current_steps": 35, "total_steps": 855, "eval_loss": 0.010942057706415653, "epoch": 0.20378457059679767, "percentage": 4.09, "elapsed_time": "0:06:44", "remaining_time": "2:37:54"} |
|
{"current_steps": 36, "total_steps": 855, "loss": 0.0124, "lr": 4.186046511627907e-05, "epoch": 0.2096069868995633, "percentage": 4.21, "elapsed_time": "0:06:54", "remaining_time": "2:37:19"} |
|
{"current_steps": 37, "total_steps": 855, "loss": 0.0116, "lr": 4.302325581395349e-05, "epoch": 0.21542940320232898, "percentage": 4.33, "elapsed_time": "0:07:05", "remaining_time": "2:36:41"} |
|
{"current_steps": 38, "total_steps": 855, "loss": 0.0126, "lr": 4.418604651162791e-05, "epoch": 0.22125181950509462, "percentage": 4.44, "elapsed_time": "0:07:15", "remaining_time": "2:36:08"} |
|
{"current_steps": 39, "total_steps": 855, "loss": 0.0126, "lr": 4.5348837209302326e-05, "epoch": 0.22707423580786026, "percentage": 4.56, "elapsed_time": "0:07:26", "remaining_time": "2:35:35"} |
|
{"current_steps": 40, "total_steps": 855, "loss": 0.0115, "lr": 4.651162790697675e-05, "epoch": 0.2328966521106259, "percentage": 4.68, "elapsed_time": "0:07:36", "remaining_time": "2:35:03"} |
|
{"current_steps": 40, "total_steps": 855, "eval_loss": 0.010366181842982769, "epoch": 0.2328966521106259, "percentage": 4.68, "elapsed_time": "0:07:42", "remaining_time": "2:36:59"} |
|
{"current_steps": 41, "total_steps": 855, "loss": 0.0106, "lr": 4.7674418604651164e-05, "epoch": 0.23871906841339155, "percentage": 4.8, "elapsed_time": "0:07:52", "remaining_time": "2:36:25"} |
|
{"current_steps": 42, "total_steps": 855, "loss": 0.0112, "lr": 4.883720930232558e-05, "epoch": 0.2445414847161572, "percentage": 4.91, "elapsed_time": "0:08:03", "remaining_time": "2:35:52"} |
|
{"current_steps": 43, "total_steps": 855, "loss": 0.0119, "lr": 5e-05, "epoch": 0.25036390101892286, "percentage": 5.03, "elapsed_time": "0:08:13", "remaining_time": "2:35:22"} |
|
{"current_steps": 44, "total_steps": 855, "loss": 0.011, "lr": 5.1162790697674425e-05, "epoch": 0.2561863173216885, "percentage": 5.15, "elapsed_time": "0:08:23", "remaining_time": "2:34:48"} |
|
{"current_steps": 45, "total_steps": 855, "loss": 0.0105, "lr": 5.232558139534884e-05, "epoch": 0.26200873362445415, "percentage": 5.26, "elapsed_time": "0:08:34", "remaining_time": "2:34:18"} |
|
{"current_steps": 45, "total_steps": 855, "eval_loss": 0.009811058640480042, "epoch": 0.26200873362445415, "percentage": 5.26, "elapsed_time": "0:08:39", "remaining_time": "2:35:59"} |
|
{"current_steps": 46, "total_steps": 855, "loss": 0.0103, "lr": 5.348837209302326e-05, "epoch": 0.2678311499272198, "percentage": 5.38, "elapsed_time": "0:08:50", "remaining_time": "2:35:27"} |
|
{"current_steps": 47, "total_steps": 855, "loss": 0.0112, "lr": 5.465116279069767e-05, "epoch": 0.27365356622998543, "percentage": 5.5, "elapsed_time": "0:09:00", "remaining_time": "2:34:52"} |
|
{"current_steps": 48, "total_steps": 855, "loss": 0.0094, "lr": 5.5813953488372095e-05, "epoch": 0.2794759825327511, "percentage": 5.61, "elapsed_time": "0:09:11", "remaining_time": "2:34:24"} |
|
{"current_steps": 49, "total_steps": 855, "loss": 0.0106, "lr": 5.697674418604652e-05, "epoch": 0.2852983988355167, "percentage": 5.73, "elapsed_time": "0:09:21", "remaining_time": "2:33:57"} |
|
{"current_steps": 50, "total_steps": 855, "loss": 0.0099, "lr": 5.8139534883720933e-05, "epoch": 0.29112081513828236, "percentage": 5.85, "elapsed_time": "0:09:32", "remaining_time": "2:33:30"} |
|
{"current_steps": 50, "total_steps": 855, "eval_loss": 0.009307770058512688, "epoch": 0.29112081513828236, "percentage": 5.85, "elapsed_time": "0:09:37", "remaining_time": "2:35:01"} |
|
{"current_steps": 51, "total_steps": 855, "loss": 0.0103, "lr": 5.9302325581395356e-05, "epoch": 0.29694323144104806, "percentage": 5.96, "elapsed_time": "0:10:14", "remaining_time": "2:41:21"} |
|
{"current_steps": 52, "total_steps": 855, "loss": 0.0096, "lr": 6.0465116279069765e-05, "epoch": 0.3027656477438137, "percentage": 6.08, "elapsed_time": "0:10:24", "remaining_time": "2:40:45"} |
|
{"current_steps": 53, "total_steps": 855, "loss": 0.009, "lr": 6.162790697674418e-05, "epoch": 0.30858806404657935, "percentage": 6.2, "elapsed_time": "0:10:34", "remaining_time": "2:40:06"} |
|
{"current_steps": 54, "total_steps": 855, "loss": 0.01, "lr": 6.27906976744186e-05, "epoch": 0.314410480349345, "percentage": 6.32, "elapsed_time": "0:10:45", "remaining_time": "2:39:30"} |
|
{"current_steps": 55, "total_steps": 855, "loss": 0.0102, "lr": 6.395348837209303e-05, "epoch": 0.32023289665211063, "percentage": 6.43, "elapsed_time": "0:10:55", "remaining_time": "2:38:57"} |
|
{"current_steps": 55, "total_steps": 855, "eval_loss": 0.009018822573125362, "epoch": 0.32023289665211063, "percentage": 6.43, "elapsed_time": "0:11:01", "remaining_time": "2:40:18"} |
|
{"current_steps": 56, "total_steps": 855, "loss": 0.0088, "lr": 6.511627906976745e-05, "epoch": 0.3260553129548763, "percentage": 6.55, "elapsed_time": "0:11:11", "remaining_time": "2:39:41"} |
|
{"current_steps": 57, "total_steps": 855, "loss": 0.0096, "lr": 6.627906976744186e-05, "epoch": 0.3318777292576419, "percentage": 6.67, "elapsed_time": "0:11:21", "remaining_time": "2:39:04"} |
|
{"current_steps": 58, "total_steps": 855, "loss": 0.0092, "lr": 6.744186046511628e-05, "epoch": 0.33770014556040756, "percentage": 6.78, "elapsed_time": "0:11:32", "remaining_time": "2:38:30"} |
|
{"current_steps": 59, "total_steps": 855, "loss": 0.0098, "lr": 6.86046511627907e-05, "epoch": 0.3435225618631732, "percentage": 6.9, "elapsed_time": "0:11:42", "remaining_time": "2:37:57"} |
|
{"current_steps": 60, "total_steps": 855, "loss": 0.0092, "lr": 6.976744186046513e-05, "epoch": 0.34934497816593885, "percentage": 7.02, "elapsed_time": "0:11:52", "remaining_time": "2:37:23"} |
|
{"current_steps": 60, "total_steps": 855, "eval_loss": 0.008659596554934978, "epoch": 0.34934497816593885, "percentage": 7.02, "elapsed_time": "0:11:58", "remaining_time": "2:38:39"} |
|
{"current_steps": 61, "total_steps": 855, "loss": 0.009, "lr": 7.093023255813955e-05, "epoch": 0.3551673944687045, "percentage": 7.13, "elapsed_time": "0:12:08", "remaining_time": "2:38:03"} |
|
{"current_steps": 62, "total_steps": 855, "loss": 0.0087, "lr": 7.209302325581396e-05, "epoch": 0.3609898107714702, "percentage": 7.25, "elapsed_time": "0:12:19", "remaining_time": "2:37:32"} |
|
{"current_steps": 63, "total_steps": 855, "loss": 0.0096, "lr": 7.325581395348837e-05, "epoch": 0.36681222707423583, "percentage": 7.37, "elapsed_time": "0:12:29", "remaining_time": "2:37:01"} |
|
{"current_steps": 64, "total_steps": 855, "loss": 0.0095, "lr": 7.441860465116279e-05, "epoch": 0.3726346433770015, "percentage": 7.49, "elapsed_time": "0:12:39", "remaining_time": "2:36:30"} |
|
{"current_steps": 65, "total_steps": 855, "loss": 0.0093, "lr": 7.558139534883721e-05, "epoch": 0.3784570596797671, "percentage": 7.6, "elapsed_time": "0:12:50", "remaining_time": "2:36:00"} |
|
{"current_steps": 65, "total_steps": 855, "eval_loss": 0.0085279056802392, "epoch": 0.3784570596797671, "percentage": 7.6, "elapsed_time": "0:12:55", "remaining_time": "2:37:08"} |
|
{"current_steps": 66, "total_steps": 855, "loss": 0.0093, "lr": 7.674418604651163e-05, "epoch": 0.38427947598253276, "percentage": 7.72, "elapsed_time": "0:13:06", "remaining_time": "2:36:38"} |
|
{"current_steps": 67, "total_steps": 855, "loss": 0.0095, "lr": 7.790697674418606e-05, "epoch": 0.3901018922852984, "percentage": 7.84, "elapsed_time": "0:13:16", "remaining_time": "2:36:08"} |
|
{"current_steps": 68, "total_steps": 855, "loss": 0.0089, "lr": 7.906976744186047e-05, "epoch": 0.39592430858806404, "percentage": 7.95, "elapsed_time": "0:13:26", "remaining_time": "2:35:39"} |
|
{"current_steps": 69, "total_steps": 855, "loss": 0.0096, "lr": 8.023255813953489e-05, "epoch": 0.4017467248908297, "percentage": 8.07, "elapsed_time": "0:13:37", "remaining_time": "2:35:10"} |
|
{"current_steps": 70, "total_steps": 855, "loss": 0.0084, "lr": 8.139534883720931e-05, "epoch": 0.40756914119359533, "percentage": 8.19, "elapsed_time": "0:13:47", "remaining_time": "2:34:43"} |
|
{"current_steps": 70, "total_steps": 855, "eval_loss": 0.008337407372891903, "epoch": 0.40756914119359533, "percentage": 8.19, "elapsed_time": "0:13:53", "remaining_time": "2:35:46"} |
|
{"current_steps": 71, "total_steps": 855, "loss": 0.0084, "lr": 8.255813953488373e-05, "epoch": 0.413391557496361, "percentage": 8.3, "elapsed_time": "0:14:03", "remaining_time": "2:35:19"} |
|
{"current_steps": 72, "total_steps": 855, "loss": 0.0086, "lr": 8.372093023255814e-05, "epoch": 0.4192139737991266, "percentage": 8.42, "elapsed_time": "0:14:14", "remaining_time": "2:34:51"} |
|
{"current_steps": 73, "total_steps": 855, "loss": 0.0091, "lr": 8.488372093023255e-05, "epoch": 0.42503639010189226, "percentage": 8.54, "elapsed_time": "0:14:24", "remaining_time": "2:34:22"} |
|
{"current_steps": 74, "total_steps": 855, "loss": 0.0088, "lr": 8.604651162790697e-05, "epoch": 0.43085880640465796, "percentage": 8.65, "elapsed_time": "0:14:35", "remaining_time": "2:33:55"} |
|
{"current_steps": 75, "total_steps": 855, "loss": 0.0088, "lr": 8.72093023255814e-05, "epoch": 0.4366812227074236, "percentage": 8.77, "elapsed_time": "0:14:45", "remaining_time": "2:33:30"} |
|
{"current_steps": 75, "total_steps": 855, "eval_loss": 0.008286843076348305, "epoch": 0.4366812227074236, "percentage": 8.77, "elapsed_time": "0:14:51", "remaining_time": "2:34:29"} |
|
{"current_steps": 76, "total_steps": 855, "loss": 0.0096, "lr": 8.837209302325582e-05, "epoch": 0.44250363901018924, "percentage": 8.89, "elapsed_time": "0:15:01", "remaining_time": "2:34:03"} |
|
{"current_steps": 77, "total_steps": 855, "loss": 0.0084, "lr": 8.953488372093024e-05, "epoch": 0.4483260553129549, "percentage": 9.01, "elapsed_time": "0:15:12", "remaining_time": "2:33:37"} |
|
{"current_steps": 78, "total_steps": 855, "loss": 0.0079, "lr": 9.069767441860465e-05, "epoch": 0.45414847161572053, "percentage": 9.12, "elapsed_time": "0:15:22", "remaining_time": "2:33:12"} |
|
{"current_steps": 79, "total_steps": 855, "loss": 0.0094, "lr": 9.186046511627907e-05, "epoch": 0.45997088791848617, "percentage": 9.24, "elapsed_time": "0:15:33", "remaining_time": "2:32:48"} |
|
{"current_steps": 80, "total_steps": 855, "loss": 0.0084, "lr": 9.30232558139535e-05, "epoch": 0.4657933042212518, "percentage": 9.36, "elapsed_time": "0:15:44", "remaining_time": "2:32:25"} |
|
{"current_steps": 80, "total_steps": 855, "eval_loss": 0.007919220253825188, "epoch": 0.4657933042212518, "percentage": 9.36, "elapsed_time": "0:15:49", "remaining_time": "2:33:20"} |
|
{"current_steps": 81, "total_steps": 855, "loss": 0.0086, "lr": 9.418604651162792e-05, "epoch": 0.47161572052401746, "percentage": 9.47, "elapsed_time": "0:16:00", "remaining_time": "2:32:56"} |
|
{"current_steps": 82, "total_steps": 855, "loss": 0.0089, "lr": 9.534883720930233e-05, "epoch": 0.4774381368267831, "percentage": 9.59, "elapsed_time": "0:16:10", "remaining_time": "2:32:31"} |
|
{"current_steps": 83, "total_steps": 855, "loss": 0.0086, "lr": 9.651162790697675e-05, "epoch": 0.48326055312954874, "percentage": 9.71, "elapsed_time": "0:16:21", "remaining_time": "2:32:07"} |
|
{"current_steps": 84, "total_steps": 855, "loss": 0.0087, "lr": 9.767441860465116e-05, "epoch": 0.4890829694323144, "percentage": 9.82, "elapsed_time": "0:16:31", "remaining_time": "2:31:42"} |
|
{"current_steps": 85, "total_steps": 855, "loss": 0.0086, "lr": 9.883720930232558e-05, "epoch": 0.4949053857350801, "percentage": 9.94, "elapsed_time": "0:16:42", "remaining_time": "2:31:17"} |
|
{"current_steps": 85, "total_steps": 855, "eval_loss": 0.0079297861084342, "epoch": 0.4949053857350801, "percentage": 9.94, "elapsed_time": "0:16:47", "remaining_time": "2:32:07"} |
|
{"current_steps": 86, "total_steps": 855, "loss": 0.0089, "lr": 0.0001, "epoch": 0.5007278020378457, "percentage": 10.06, "elapsed_time": "0:16:57", "remaining_time": "2:31:41"} |
|
{"current_steps": 87, "total_steps": 855, "loss": 0.0087, "lr": 9.999958275948725e-05, "epoch": 0.5065502183406113, "percentage": 10.18, "elapsed_time": "0:17:08", "remaining_time": "2:31:15"} |
|
{"current_steps": 88, "total_steps": 855, "loss": 0.0088, "lr": 9.999833104491258e-05, "epoch": 0.512372634643377, "percentage": 10.29, "elapsed_time": "0:17:18", "remaining_time": "2:30:50"} |
|
{"current_steps": 89, "total_steps": 855, "loss": 0.0088, "lr": 9.999624487716665e-05, "epoch": 0.5181950509461426, "percentage": 10.41, "elapsed_time": "0:17:28", "remaining_time": "2:30:26"} |
|
{"current_steps": 90, "total_steps": 855, "loss": 0.0079, "lr": 9.99933242910668e-05, "epoch": 0.5240174672489083, "percentage": 10.53, "elapsed_time": "0:17:39", "remaining_time": "2:30:04"} |
|
{"current_steps": 90, "total_steps": 855, "eval_loss": 0.0078043341636657715, "epoch": 0.5240174672489083, "percentage": 10.53, "elapsed_time": "0:17:44", "remaining_time": "2:30:51"} |
|
{"current_steps": 91, "total_steps": 855, "loss": 0.0082, "lr": 9.998956933535648e-05, "epoch": 0.529839883551674, "percentage": 10.64, "elapsed_time": "0:17:55", "remaining_time": "2:30:25"} |
|
{"current_steps": 92, "total_steps": 855, "loss": 0.0083, "lr": 9.99849800727045e-05, "epoch": 0.5356622998544396, "percentage": 10.76, "elapsed_time": "0:18:05", "remaining_time": "2:30:02"} |
|
{"current_steps": 93, "total_steps": 855, "loss": 0.0079, "lr": 9.99795565797039e-05, "epoch": 0.5414847161572053, "percentage": 10.88, "elapsed_time": "0:18:15", "remaining_time": "2:29:39"} |
|
{"current_steps": 94, "total_steps": 855, "loss": 0.0077, "lr": 9.997329894687073e-05, "epoch": 0.5473071324599709, "percentage": 10.99, "elapsed_time": "0:18:26", "remaining_time": "2:29:16"} |
|
{"current_steps": 95, "total_steps": 855, "loss": 0.0083, "lr": 9.996620727864252e-05, "epoch": 0.5531295487627366, "percentage": 11.11, "elapsed_time": "0:18:36", "remaining_time": "2:28:53"} |
|
{"current_steps": 95, "total_steps": 855, "eval_loss": 0.007659674622118473, "epoch": 0.5531295487627366, "percentage": 11.11, "elapsed_time": "0:18:42", "remaining_time": "2:29:38"} |
|
{"current_steps": 96, "total_steps": 855, "loss": 0.0087, "lr": 9.995828169337649e-05, "epoch": 0.5589519650655022, "percentage": 11.23, "elapsed_time": "0:18:52", "remaining_time": "2:29:17"} |
|
{"current_steps": 97, "total_steps": 855, "loss": 0.0084, "lr": 9.994952232334766e-05, "epoch": 0.5647743813682679, "percentage": 11.35, "elapsed_time": "0:19:03", "remaining_time": "2:28:56"} |
|
{"current_steps": 98, "total_steps": 855, "loss": 0.0088, "lr": 9.993992931474662e-05, "epoch": 0.5705967976710334, "percentage": 11.46, "elapsed_time": "0:19:13", "remaining_time": "2:28:33"} |
|
{"current_steps": 99, "total_steps": 855, "loss": 0.0082, "lr": 9.9929502827677e-05, "epoch": 0.5764192139737991, "percentage": 11.58, "elapsed_time": "0:19:24", "remaining_time": "2:28:10"} |
|
{"current_steps": 100, "total_steps": 855, "loss": 0.0086, "lr": 9.991824303615293e-05, "epoch": 0.5822416302765647, "percentage": 11.7, "elapsed_time": "0:19:34", "remaining_time": "2:27:49"} |
|
{"current_steps": 100, "total_steps": 855, "eval_loss": 0.007812130730599165, "epoch": 0.5822416302765647, "percentage": 11.7, "elapsed_time": "0:19:40", "remaining_time": "2:28:32"} |
|
{"current_steps": 101, "total_steps": 855, "loss": 0.0079, "lr": 9.990615012809607e-05, "epoch": 0.5880640465793304, "percentage": 11.81, "elapsed_time": "0:20:33", "remaining_time": "2:33:31"} |
|
{"current_steps": 102, "total_steps": 855, "loss": 0.0079, "lr": 9.989322430533246e-05, "epoch": 0.5938864628820961, "percentage": 11.93, "elapsed_time": "0:20:44", "remaining_time": "2:33:05"} |
|
{"current_steps": 103, "total_steps": 855, "loss": 0.0077, "lr": 9.987946578358917e-05, "epoch": 0.5997088791848617, "percentage": 12.05, "elapsed_time": "0:20:54", "remaining_time": "2:32:40"} |
|
{"current_steps": 104, "total_steps": 855, "loss": 0.0086, "lr": 9.986487479249072e-05, "epoch": 0.6055312954876274, "percentage": 12.16, "elapsed_time": "0:21:04", "remaining_time": "2:32:14"} |
|
{"current_steps": 105, "total_steps": 855, "loss": 0.0089, "lr": 9.98494515755552e-05, "epoch": 0.611353711790393, "percentage": 12.28, "elapsed_time": "0:21:15", "remaining_time": "2:31:48"} |
|
{"current_steps": 105, "total_steps": 855, "eval_loss": 0.007567914668470621, "epoch": 0.611353711790393, "percentage": 12.28, "elapsed_time": "0:21:20", "remaining_time": "2:32:28"} |
|
{"current_steps": 106, "total_steps": 855, "loss": 0.0081, "lr": 9.983319639019025e-05, "epoch": 0.6171761280931587, "percentage": 12.4, "elapsed_time": "0:21:31", "remaining_time": "2:32:05"} |
|
{"current_steps": 107, "total_steps": 855, "loss": 0.0082, "lr": 9.981610950768873e-05, "epoch": 0.6229985443959243, "percentage": 12.51, "elapsed_time": "0:21:41", "remaining_time": "2:31:41"} |
|
{"current_steps": 108, "total_steps": 855, "loss": 0.0094, "lr": 9.979819121322427e-05, "epoch": 0.62882096069869, "percentage": 12.63, "elapsed_time": "0:21:52", "remaining_time": "2:31:17"} |
|
{"current_steps": 109, "total_steps": 855, "loss": 0.008, "lr": 9.977944180584636e-05, "epoch": 0.6346433770014556, "percentage": 12.75, "elapsed_time": "0:22:02", "remaining_time": "2:30:53"} |
|
{"current_steps": 110, "total_steps": 855, "loss": 0.0075, "lr": 9.975986159847553e-05, "epoch": 0.6404657933042213, "percentage": 12.87, "elapsed_time": "0:22:13", "remaining_time": "2:30:29"} |
|
{"current_steps": 110, "total_steps": 855, "eval_loss": 0.007617466617375612, "epoch": 0.6404657933042213, "percentage": 12.87, "elapsed_time": "0:22:18", "remaining_time": "2:31:07"} |
|
{"current_steps": 111, "total_steps": 855, "loss": 0.0095, "lr": 9.973945091789795e-05, "epoch": 0.6462882096069869, "percentage": 12.98, "elapsed_time": "0:22:29", "remaining_time": "2:30:43"} |
|
{"current_steps": 112, "total_steps": 855, "loss": 0.0082, "lr": 9.97182101047602e-05, "epoch": 0.6521106259097526, "percentage": 13.1, "elapsed_time": "0:22:39", "remaining_time": "2:30:19"} |
|
{"current_steps": 113, "total_steps": 855, "loss": 0.0081, "lr": 9.969613951356338e-05, "epoch": 0.6579330422125182, "percentage": 13.22, "elapsed_time": "0:22:49", "remaining_time": "2:29:54"} |
|
{"current_steps": 114, "total_steps": 855, "loss": 0.0081, "lr": 9.967323951265726e-05, "epoch": 0.6637554585152838, "percentage": 13.33, "elapsed_time": "0:23:00", "remaining_time": "2:29:31"} |
|
{"current_steps": 115, "total_steps": 855, "loss": 0.0078, "lr": 9.964951048423416e-05, "epoch": 0.6695778748180495, "percentage": 13.45, "elapsed_time": "0:23:10", "remaining_time": "2:29:07"} |
|
{"current_steps": 115, "total_steps": 855, "eval_loss": 0.0075353775173425674, "epoch": 0.6695778748180495, "percentage": 13.45, "elapsed_time": "0:23:16", "remaining_time": "2:29:43"} |
|
{"current_steps": 116, "total_steps": 855, "loss": 0.0082, "lr": 9.962495282432256e-05, "epoch": 0.6754002911208151, "percentage": 13.57, "elapsed_time": "0:23:26", "remaining_time": "2:29:20"} |
|
{"current_steps": 117, "total_steps": 855, "loss": 0.0076, "lr": 9.959956694278052e-05, "epoch": 0.6812227074235808, "percentage": 13.68, "elapsed_time": "0:23:37", "remaining_time": "2:28:58"} |
|
{"current_steps": 118, "total_steps": 855, "loss": 0.0095, "lr": 9.957335326328874e-05, "epoch": 0.6870451237263464, "percentage": 13.8, "elapsed_time": "0:23:47", "remaining_time": "2:28:36"} |
|
{"current_steps": 119, "total_steps": 855, "loss": 0.0078, "lr": 9.954631222334357e-05, "epoch": 0.6928675400291121, "percentage": 13.92, "elapsed_time": "0:23:58", "remaining_time": "2:28:14"} |
|
{"current_steps": 120, "total_steps": 855, "loss": 0.0079, "lr": 9.951844427424973e-05, "epoch": 0.6986899563318777, "percentage": 14.04, "elapsed_time": "0:24:08", "remaining_time": "2:27:52"} |
|
{"current_steps": 120, "total_steps": 855, "eval_loss": 0.007408523932099342, "epoch": 0.6986899563318777, "percentage": 14.04, "elapsed_time": "0:24:14", "remaining_time": "2:28:27"} |
|
{"current_steps": 121, "total_steps": 855, "loss": 0.008, "lr": 9.948974988111271e-05, "epoch": 0.7045123726346434, "percentage": 14.15, "elapsed_time": "0:24:24", "remaining_time": "2:28:05"} |
|
{"current_steps": 122, "total_steps": 855, "loss": 0.0079, "lr": 9.946022952283105e-05, "epoch": 0.710334788937409, "percentage": 14.27, "elapsed_time": "0:24:35", "remaining_time": "2:27:44"} |
|
{"current_steps": 123, "total_steps": 855, "loss": 0.0083, "lr": 9.94298836920883e-05, "epoch": 0.7161572052401747, "percentage": 14.39, "elapsed_time": "0:24:45", "remaining_time": "2:27:22"} |
|
{"current_steps": 124, "total_steps": 855, "loss": 0.0077, "lr": 9.939871289534487e-05, "epoch": 0.7219796215429404, "percentage": 14.5, "elapsed_time": "0:24:56", "remaining_time": "2:26:59"} |
|
{"current_steps": 125, "total_steps": 855, "loss": 0.0078, "lr": 9.936671765282956e-05, "epoch": 0.727802037845706, "percentage": 14.62, "elapsed_time": "0:25:06", "remaining_time": "2:26:37"} |
|
{"current_steps": 125, "total_steps": 855, "eval_loss": 0.0072646611370146275, "epoch": 0.727802037845706, "percentage": 14.62, "elapsed_time": "0:25:12", "remaining_time": "2:27:10"} |
|
{"current_steps": 126, "total_steps": 855, "loss": 0.0072, "lr": 9.933389849853079e-05, "epoch": 0.7336244541484717, "percentage": 14.74, "elapsed_time": "0:25:22", "remaining_time": "2:26:48"} |
|
{"current_steps": 127, "total_steps": 855, "loss": 0.0075, "lr": 9.93002559801878e-05, "epoch": 0.7394468704512372, "percentage": 14.85, "elapsed_time": "0:25:32", "remaining_time": "2:26:26"} |
|
{"current_steps": 128, "total_steps": 855, "loss": 0.0075, "lr": 9.926579065928145e-05, "epoch": 0.745269286754003, "percentage": 14.97, "elapsed_time": "0:25:43", "remaining_time": "2:26:04"} |
|
{"current_steps": 129, "total_steps": 855, "loss": 0.0077, "lr": 9.923050311102487e-05, "epoch": 0.7510917030567685, "percentage": 15.09, "elapsed_time": "0:25:53", "remaining_time": "2:25:43"} |
|
{"current_steps": 130, "total_steps": 855, "loss": 0.008, "lr": 9.919439392435386e-05, "epoch": 0.7569141193595342, "percentage": 15.2, "elapsed_time": "0:26:04", "remaining_time": "2:25:23"} |
|
{"current_steps": 130, "total_steps": 855, "eval_loss": 0.0071721505373716354, "epoch": 0.7569141193595342, "percentage": 15.2, "elapsed_time": "0:26:09", "remaining_time": "2:25:54"} |
|
{"current_steps": 131, "total_steps": 855, "loss": 0.0075, "lr": 9.915746370191702e-05, "epoch": 0.7627365356622998, "percentage": 15.32, "elapsed_time": "0:26:20", "remaining_time": "2:25:33"} |
|
{"current_steps": 132, "total_steps": 855, "loss": 0.0084, "lr": 9.911971306006577e-05, "epoch": 0.7685589519650655, "percentage": 15.44, "elapsed_time": "0:26:30", "remaining_time": "2:25:11"} |
|
{"current_steps": 133, "total_steps": 855, "loss": 0.0073, "lr": 9.908114262884398e-05, "epoch": 0.7743813682678311, "percentage": 15.56, "elapsed_time": "0:26:40", "remaining_time": "2:24:50"} |
|
{"current_steps": 134, "total_steps": 855, "loss": 0.0075, "lr": 9.904175305197751e-05, "epoch": 0.7802037845705968, "percentage": 15.67, "elapsed_time": "0:26:51", "remaining_time": "2:24:29"} |
|
{"current_steps": 135, "total_steps": 855, "loss": 0.0077, "lr": 9.900154498686348e-05, "epoch": 0.7860262008733624, "percentage": 15.79, "elapsed_time": "0:27:01", "remaining_time": "2:24:07"} |
|
{"current_steps": 135, "total_steps": 855, "eval_loss": 0.007017082534730434, "epoch": 0.7860262008733624, "percentage": 15.79, "elapsed_time": "0:27:07", "remaining_time": "2:24:37"} |
|
{"current_steps": 136, "total_steps": 855, "loss": 0.0075, "lr": 9.89605191045592e-05, "epoch": 0.7918486171761281, "percentage": 15.91, "elapsed_time": "0:27:17", "remaining_time": "2:24:17"} |
|
{"current_steps": 137, "total_steps": 855, "loss": 0.0073, "lr": 9.89186760897711e-05, "epoch": 0.7976710334788938, "percentage": 16.02, "elapsed_time": "0:27:27", "remaining_time": "2:23:56"} |
|
{"current_steps": 138, "total_steps": 855, "loss": 0.008, "lr": 9.887601664084321e-05, "epoch": 0.8034934497816594, "percentage": 16.14, "elapsed_time": "0:27:38", "remaining_time": "2:23:36"} |
|
{"current_steps": 139, "total_steps": 855, "loss": 0.0086, "lr": 9.883254146974554e-05, "epoch": 0.8093158660844251, "percentage": 16.26, "elapsed_time": "0:27:48", "remaining_time": "2:23:16"} |
|
{"current_steps": 140, "total_steps": 855, "loss": 0.0079, "lr": 9.87882513020622e-05, "epoch": 0.8151382823871907, "percentage": 16.37, "elapsed_time": "0:27:59", "remaining_time": "2:22:56"} |
|
{"current_steps": 140, "total_steps": 855, "eval_loss": 0.0069827428087592125, "epoch": 0.8151382823871907, "percentage": 16.37, "elapsed_time": "0:28:05", "remaining_time": "2:23:25"} |
|
{"current_steps": 141, "total_steps": 855, "loss": 0.0075, "lr": 9.874314687697927e-05, "epoch": 0.8209606986899564, "percentage": 16.49, "elapsed_time": "0:28:15", "remaining_time": "2:23:05"} |
|
{"current_steps": 142, "total_steps": 855, "loss": 0.0074, "lr": 9.869722894727252e-05, "epoch": 0.826783114992722, "percentage": 16.61, "elapsed_time": "0:28:25", "remaining_time": "2:22:44"} |
|
{"current_steps": 143, "total_steps": 855, "loss": 0.0078, "lr": 9.865049827929475e-05, "epoch": 0.8326055312954876, "percentage": 16.73, "elapsed_time": "0:28:36", "remaining_time": "2:22:25"} |
|
{"current_steps": 144, "total_steps": 855, "loss": 0.0075, "lr": 9.860295565296307e-05, "epoch": 0.8384279475982532, "percentage": 16.84, "elapsed_time": "0:28:46", "remaining_time": "2:22:04"} |
|
{"current_steps": 145, "total_steps": 855, "loss": 0.0071, "lr": 9.855460186174587e-05, "epoch": 0.8442503639010189, "percentage": 16.96, "elapsed_time": "0:28:56", "remaining_time": "2:21:44"} |
|
{"current_steps": 145, "total_steps": 855, "eval_loss": 0.006980584003031254, "epoch": 0.8442503639010189, "percentage": 16.96, "elapsed_time": "0:29:02", "remaining_time": "2:22:11"} |
|
{"current_steps": 146, "total_steps": 855, "loss": 0.0073, "lr": 9.850543771264959e-05, "epoch": 0.8500727802037845, "percentage": 17.08, "elapsed_time": "0:29:12", "remaining_time": "2:21:51"} |
|
{"current_steps": 147, "total_steps": 855, "loss": 0.008, "lr": 9.845546402620523e-05, "epoch": 0.8558951965065502, "percentage": 17.19, "elapsed_time": "0:29:22", "remaining_time": "2:21:31"} |
|
{"current_steps": 148, "total_steps": 855, "loss": 0.0077, "lr": 9.840468163645463e-05, "epoch": 0.8617176128093159, "percentage": 17.31, "elapsed_time": "0:29:33", "remaining_time": "2:21:11"} |
|
{"current_steps": 149, "total_steps": 855, "loss": 0.0072, "lr": 9.835309139093659e-05, "epoch": 0.8675400291120815, "percentage": 17.43, "elapsed_time": "0:29:43", "remaining_time": "2:20:51"} |
|
{"current_steps": 150, "total_steps": 855, "loss": 0.0072, "lr": 9.830069415067275e-05, "epoch": 0.8733624454148472, "percentage": 17.54, "elapsed_time": "0:29:54", "remaining_time": "2:20:31"} |
|
{"current_steps": 150, "total_steps": 855, "eval_loss": 0.0071106115356087685, "epoch": 0.8733624454148472, "percentage": 17.54, "elapsed_time": "0:29:59", "remaining_time": "2:20:58"} |
|
{"current_steps": 151, "total_steps": 855, "loss": 0.0075, "lr": 9.824749079015318e-05, "epoch": 0.8791848617176128, "percentage": 17.66, "elapsed_time": "0:30:37", "remaining_time": "2:22:49"} |
|
{"current_steps": 152, "total_steps": 855, "loss": 0.0072, "lr": 9.819348219732177e-05, "epoch": 0.8850072780203785, "percentage": 17.78, "elapsed_time": "0:30:48", "remaining_time": "2:22:29"} |
|
{"current_steps": 153, "total_steps": 855, "loss": 0.0072, "lr": 9.813866927356142e-05, "epoch": 0.8908296943231441, "percentage": 17.89, "elapsed_time": "0:30:58", "remaining_time": "2:22:08"} |
|
{"current_steps": 154, "total_steps": 855, "loss": 0.007, "lr": 9.808305293367905e-05, "epoch": 0.8966521106259098, "percentage": 18.01, "elapsed_time": "0:31:09", "remaining_time": "2:21:49"} |
|
{"current_steps": 155, "total_steps": 855, "loss": 0.0076, "lr": 9.802663410589023e-05, "epoch": 0.9024745269286754, "percentage": 18.13, "elapsed_time": "0:31:19", "remaining_time": "2:21:29"} |
|
{"current_steps": 155, "total_steps": 855, "eval_loss": 0.006998821161687374, "epoch": 0.9024745269286754, "percentage": 18.13, "elapsed_time": "0:31:25", "remaining_time": "2:21:54"} |
|
{"current_steps": 156, "total_steps": 855, "loss": 0.0073, "lr": 9.796941373180385e-05, "epoch": 0.9082969432314411, "percentage": 18.25, "elapsed_time": "0:31:35", "remaining_time": "2:21:34"} |
|
{"current_steps": 157, "total_steps": 855, "loss": 0.0075, "lr": 9.791139276640615e-05, "epoch": 0.9141193595342066, "percentage": 18.36, "elapsed_time": "0:31:46", "remaining_time": "2:21:14"} |
|
{"current_steps": 158, "total_steps": 855, "loss": 0.0076, "lr": 9.78525721780451e-05, "epoch": 0.9199417758369723, "percentage": 18.48, "elapsed_time": "0:31:56", "remaining_time": "2:20:53"} |
|
{"current_steps": 159, "total_steps": 855, "loss": 0.0069, "lr": 9.779295294841397e-05, "epoch": 0.925764192139738, "percentage": 18.6, "elapsed_time": "0:32:06", "remaining_time": "2:20:35"} |
|
{"current_steps": 160, "total_steps": 855, "loss": 0.0075, "lr": 9.773253607253507e-05, "epoch": 0.9315866084425036, "percentage": 18.71, "elapsed_time": "0:32:17", "remaining_time": "2:20:14"} |
|
{"current_steps": 160, "total_steps": 855, "eval_loss": 0.0070083122700452805, "epoch": 0.9315866084425036, "percentage": 18.71, "elapsed_time": "0:32:22", "remaining_time": "2:20:39"} |
|
{"current_steps": 161, "total_steps": 855, "loss": 0.0068, "lr": 9.767132255874315e-05, "epoch": 0.9374090247452693, "percentage": 18.83, "elapsed_time": "0:32:33", "remaining_time": "2:20:20"} |
|
{"current_steps": 162, "total_steps": 855, "loss": 0.0073, "lr": 9.76093134286685e-05, "epoch": 0.9432314410480349, "percentage": 18.95, "elapsed_time": "0:32:43", "remaining_time": "2:20:00"} |
|
{"current_steps": 163, "total_steps": 855, "loss": 0.0071, "lr": 9.754650971722e-05, "epoch": 0.9490538573508006, "percentage": 19.06, "elapsed_time": "0:32:53", "remaining_time": "2:19:40"} |
|
{"current_steps": 164, "total_steps": 855, "loss": 0.0071, "lr": 9.748291247256773e-05, "epoch": 0.9548762736535662, "percentage": 19.18, "elapsed_time": "0:33:04", "remaining_time": "2:19:20"} |
|
{"current_steps": 165, "total_steps": 855, "loss": 0.0074, "lr": 9.74185227561256e-05, "epoch": 0.9606986899563319, "percentage": 19.3, "elapsed_time": "0:33:14", "remaining_time": "2:19:01"} |
|
{"current_steps": 165, "total_steps": 855, "eval_loss": 0.006897931452840567, "epoch": 0.9606986899563319, "percentage": 19.3, "elapsed_time": "0:33:20", "remaining_time": "2:19:24"} |
|
{"current_steps": 166, "total_steps": 855, "loss": 0.007, "lr": 9.735334164253352e-05, "epoch": 0.9665211062590975, "percentage": 19.42, "elapsed_time": "0:33:30", "remaining_time": "2:19:04"} |
|
{"current_steps": 167, "total_steps": 855, "loss": 0.0076, "lr": 9.728737021963954e-05, "epoch": 0.9723435225618632, "percentage": 19.53, "elapsed_time": "0:33:41", "remaining_time": "2:18:46"} |
|
{"current_steps": 168, "total_steps": 855, "loss": 0.0072, "lr": 9.722060958848168e-05, "epoch": 0.9781659388646288, "percentage": 19.65, "elapsed_time": "0:33:51", "remaining_time": "2:18:26"} |
|
{"current_steps": 169, "total_steps": 855, "loss": 0.0071, "lr": 9.715306086326954e-05, "epoch": 0.9839883551673945, "percentage": 19.77, "elapsed_time": "0:34:01", "remaining_time": "2:18:07"} |
|
{"current_steps": 170, "total_steps": 855, "loss": 0.0073, "lr": 9.70847251713657e-05, "epoch": 0.9898107714701602, "percentage": 19.88, "elapsed_time": "0:34:12", "remaining_time": "2:17:48"} |
|
{"current_steps": 170, "total_steps": 855, "eval_loss": 0.006916682235896587, "epoch": 0.9898107714701602, "percentage": 19.88, "elapsed_time": "0:34:17", "remaining_time": "2:18:11"} |
|
{"current_steps": 171, "total_steps": 855, "loss": 0.0074, "lr": 9.701560365326695e-05, "epoch": 0.9956331877729258, "percentage": 20.0, "elapsed_time": "0:34:28", "remaining_time": "2:17:52"} |
|
{"current_steps": 172, "total_steps": 855, "loss": 0.0092, "lr": 9.694569746258515e-05, "epoch": 1.0014556040756915, "percentage": 20.12, "elapsed_time": "0:34:38", "remaining_time": "2:17:34"} |
|
{"current_steps": 173, "total_steps": 855, "loss": 0.0067, "lr": 9.687500776602813e-05, "epoch": 1.007278020378457, "percentage": 20.23, "elapsed_time": "0:34:49", "remaining_time": "2:17:15"} |
|
{"current_steps": 174, "total_steps": 855, "loss": 0.0074, "lr": 9.680353574338011e-05, "epoch": 1.0131004366812226, "percentage": 20.35, "elapsed_time": "0:34:59", "remaining_time": "2:16:57"} |
|
{"current_steps": 175, "total_steps": 855, "loss": 0.007, "lr": 9.6731282587482e-05, "epoch": 1.0189228529839884, "percentage": 20.47, "elapsed_time": "0:35:09", "remaining_time": "2:16:38"} |
|
{"current_steps": 175, "total_steps": 855, "eval_loss": 0.006880656350404024, "epoch": 1.0189228529839884, "percentage": 20.47, "elapsed_time": "0:35:15", "remaining_time": "2:16:59"} |
|
{"current_steps": 176, "total_steps": 855, "loss": 0.0078, "lr": 9.665824950421156e-05, "epoch": 1.024745269286754, "percentage": 20.58, "elapsed_time": "0:35:25", "remaining_time": "2:16:41"} |
|
{"current_steps": 177, "total_steps": 855, "loss": 0.007, "lr": 9.658443771246322e-05, "epoch": 1.0305676855895196, "percentage": 20.7, "elapsed_time": "0:35:36", "remaining_time": "2:16:22"} |
|
{"current_steps": 178, "total_steps": 855, "loss": 0.0071, "lr": 9.650984844412779e-05, "epoch": 1.0363901018922852, "percentage": 20.82, "elapsed_time": "0:35:46", "remaining_time": "2:16:04"} |
|
{"current_steps": 179, "total_steps": 855, "loss": 0.0067, "lr": 9.643448294407186e-05, "epoch": 1.042212518195051, "percentage": 20.94, "elapsed_time": "0:35:56", "remaining_time": "2:15:45"} |
|
{"current_steps": 180, "total_steps": 855, "loss": 0.0072, "lr": 9.635834247011702e-05, "epoch": 1.0480349344978166, "percentage": 21.05, "elapsed_time": "0:36:07", "remaining_time": "2:15:27"} |
|
{"current_steps": 180, "total_steps": 855, "eval_loss": 0.006873424164950848, "epoch": 1.0480349344978166, "percentage": 21.05, "elapsed_time": "0:36:13", "remaining_time": "2:15:49"} |
|
{"current_steps": 181, "total_steps": 855, "loss": 0.0068, "lr": 9.628142829301886e-05, "epoch": 1.0538573508005822, "percentage": 21.17, "elapsed_time": "0:36:23", "remaining_time": "2:15:30"} |
|
{"current_steps": 182, "total_steps": 855, "loss": 0.0062, "lr": 9.620374169644584e-05, "epoch": 1.059679767103348, "percentage": 21.29, "elapsed_time": "0:36:33", "remaining_time": "2:15:12"} |
|
{"current_steps": 183, "total_steps": 855, "loss": 0.0071, "lr": 9.612528397695777e-05, "epoch": 1.0655021834061136, "percentage": 21.4, "elapsed_time": "0:36:44", "remaining_time": "2:14:54"} |
|
{"current_steps": 184, "total_steps": 855, "loss": 0.007, "lr": 9.60460564439842e-05, "epoch": 1.0713245997088792, "percentage": 21.52, "elapsed_time": "0:36:54", "remaining_time": "2:14:36"} |
|
{"current_steps": 185, "total_steps": 855, "loss": 0.0068, "lr": 9.59660604198026e-05, "epoch": 1.0771470160116448, "percentage": 21.64, "elapsed_time": "0:37:05", "remaining_time": "2:14:19"} |
|
{"current_steps": 185, "total_steps": 855, "eval_loss": 0.006770225707441568, "epoch": 1.0771470160116448, "percentage": 21.64, "elapsed_time": "0:37:10", "remaining_time": "2:14:39"} |
|
{"current_steps": 186, "total_steps": 855, "loss": 0.0075, "lr": 9.588529723951625e-05, "epoch": 1.0829694323144106, "percentage": 21.75, "elapsed_time": "0:37:21", "remaining_time": "2:14:21"} |
|
{"current_steps": 187, "total_steps": 855, "loss": 0.0062, "lr": 9.5803768251032e-05, "epoch": 1.0887918486171762, "percentage": 21.87, "elapsed_time": "0:37:31", "remaining_time": "2:14:03"} |
|
{"current_steps": 188, "total_steps": 855, "loss": 0.007, "lr": 9.57214748150377e-05, "epoch": 1.0946142649199417, "percentage": 21.99, "elapsed_time": "0:37:42", "remaining_time": "2:13:46"} |
|
{"current_steps": 189, "total_steps": 855, "loss": 0.0068, "lr": 9.563841830497957e-05, "epoch": 1.1004366812227073, "percentage": 22.11, "elapsed_time": "0:37:52", "remaining_time": "2:13:28"} |
|
{"current_steps": 190, "total_steps": 855, "loss": 0.0067, "lr": 9.555460010703927e-05, "epoch": 1.1062590975254731, "percentage": 22.22, "elapsed_time": "0:38:03", "remaining_time": "2:13:11"} |
|
{"current_steps": 190, "total_steps": 855, "eval_loss": 0.006855105049908161, "epoch": 1.1062590975254731, "percentage": 22.22, "elapsed_time": "0:38:08", "remaining_time": "2:13:30"} |
|
{"current_steps": 191, "total_steps": 855, "loss": 0.0069, "lr": 9.54700216201107e-05, "epoch": 1.1120815138282387, "percentage": 22.34, "elapsed_time": "0:38:19", "remaining_time": "2:13:12"} |
|
{"current_steps": 192, "total_steps": 855, "loss": 0.007, "lr": 9.53846842557767e-05, "epoch": 1.1179039301310043, "percentage": 22.46, "elapsed_time": "0:38:29", "remaining_time": "2:12:55"} |
|
{"current_steps": 193, "total_steps": 855, "loss": 0.0068, "lr": 9.529858943828549e-05, "epoch": 1.1237263464337701, "percentage": 22.57, "elapsed_time": "0:38:40", "remaining_time": "2:12:38"} |
|
{"current_steps": 194, "total_steps": 855, "loss": 0.0071, "lr": 9.521173860452694e-05, "epoch": 1.1295487627365357, "percentage": 22.69, "elapsed_time": "0:38:50", "remaining_time": "2:12:20"} |
|
{"current_steps": 195, "total_steps": 855, "loss": 0.0075, "lr": 9.512413320400847e-05, "epoch": 1.1353711790393013, "percentage": 22.81, "elapsed_time": "0:39:01", "remaining_time": "2:12:03"} |
|
{"current_steps": 195, "total_steps": 855, "eval_loss": 0.006784664932638407, "epoch": 1.1353711790393013, "percentage": 22.81, "elapsed_time": "0:39:06", "remaining_time": "2:12:22"} |
|
{"current_steps": 196, "total_steps": 855, "loss": 0.0073, "lr": 9.503577469883098e-05, "epoch": 1.1411935953420669, "percentage": 22.92, "elapsed_time": "0:39:17", "remaining_time": "2:12:04"} |
|
{"current_steps": 197, "total_steps": 855, "loss": 0.007, "lr": 9.494666456366442e-05, "epoch": 1.1470160116448327, "percentage": 23.04, "elapsed_time": "0:39:27", "remaining_time": "2:11:47"} |
|
{"current_steps": 198, "total_steps": 855, "loss": 0.0064, "lr": 9.485680428572308e-05, "epoch": 1.1528384279475983, "percentage": 23.16, "elapsed_time": "0:39:38", "remaining_time": "2:11:31"} |
|
{"current_steps": 199, "total_steps": 855, "loss": 0.0067, "lr": 9.476619536474091e-05, "epoch": 1.1586608442503639, "percentage": 23.27, "elapsed_time": "0:39:48", "remaining_time": "2:11:14"} |
|
{"current_steps": 200, "total_steps": 855, "loss": 0.0072, "lr": 9.467483931294644e-05, "epoch": 1.1644832605531295, "percentage": 23.39, "elapsed_time": "0:39:58", "remaining_time": "2:10:56"} |
|
{"current_steps": 200, "total_steps": 855, "eval_loss": 0.006834269501268864, "epoch": 1.1644832605531295, "percentage": 23.39, "elapsed_time": "0:40:04", "remaining_time": "2:11:15"} |
|
{"current_steps": 201, "total_steps": 855, "loss": 0.0067, "lr": 9.458273765503749e-05, "epoch": 1.1703056768558953, "percentage": 23.51, "elapsed_time": "0:40:42", "remaining_time": "2:12:27"} |
|
{"current_steps": 202, "total_steps": 855, "loss": 0.0071, "lr": 9.448989192815579e-05, "epoch": 1.1761280931586608, "percentage": 23.63, "elapsed_time": "0:40:52", "remaining_time": "2:12:09"} |
|
{"current_steps": 203, "total_steps": 855, "loss": 0.0069, "lr": 9.439630368186126e-05, "epoch": 1.1819505094614264, "percentage": 23.74, "elapsed_time": "0:41:03", "remaining_time": "2:11:51"} |
|
{"current_steps": 204, "total_steps": 855, "loss": 0.0068, "lr": 9.430197447810624e-05, "epoch": 1.1877729257641922, "percentage": 23.86, "elapsed_time": "0:41:13", "remaining_time": "2:11:33"} |
|
{"current_steps": 205, "total_steps": 855, "loss": 0.0075, "lr": 9.420690589120934e-05, "epoch": 1.1935953420669578, "percentage": 23.98, "elapsed_time": "0:41:24", "remaining_time": "2:11:16"} |
|
{"current_steps": 205, "total_steps": 855, "eval_loss": 0.006762022618204355, "epoch": 1.1935953420669578, "percentage": 23.98, "elapsed_time": "0:41:29", "remaining_time": "2:11:34"} |
|
{"current_steps": 206, "total_steps": 855, "loss": 0.0069, "lr": 9.411109950782919e-05, "epoch": 1.1994177583697234, "percentage": 24.09, "elapsed_time": "0:41:40", "remaining_time": "2:11:16"} |
|
{"current_steps": 207, "total_steps": 855, "loss": 0.0065, "lr": 9.401455692693798e-05, "epoch": 1.205240174672489, "percentage": 24.21, "elapsed_time": "0:41:50", "remaining_time": "2:10:58"} |
|
{"current_steps": 208, "total_steps": 855, "loss": 0.0068, "lr": 9.391727975979475e-05, "epoch": 1.2110625909752548, "percentage": 24.33, "elapsed_time": "0:42:00", "remaining_time": "2:10:41"} |
|
{"current_steps": 209, "total_steps": 855, "loss": 0.0069, "lr": 9.381926962991847e-05, "epoch": 1.2168850072780204, "percentage": 24.44, "elapsed_time": "0:42:11", "remaining_time": "2:10:23"} |
|
{"current_steps": 210, "total_steps": 855, "loss": 0.0066, "lr": 9.372052817306106e-05, "epoch": 1.222707423580786, "percentage": 24.56, "elapsed_time": "0:42:21", "remaining_time": "2:10:06"} |
|
{"current_steps": 210, "total_steps": 855, "eval_loss": 0.006686727050691843, "epoch": 1.222707423580786, "percentage": 24.56, "elapsed_time": "0:42:27", "remaining_time": "2:10:23"} |
|
{"current_steps": 211, "total_steps": 855, "loss": 0.0069, "lr": 9.362105703717996e-05, "epoch": 1.2285298398835516, "percentage": 24.68, "elapsed_time": "0:42:37", "remaining_time": "2:10:05"} |
|
{"current_steps": 212, "total_steps": 855, "loss": 0.0069, "lr": 9.352085788241064e-05, "epoch": 1.2343522561863174, "percentage": 24.8, "elapsed_time": "0:42:47", "remaining_time": "2:09:48"} |
|
{"current_steps": 213, "total_steps": 855, "loss": 0.0071, "lr": 9.3419932381039e-05, "epoch": 1.240174672489083, "percentage": 24.91, "elapsed_time": "0:42:58", "remaining_time": "2:09:30"} |
|
{"current_steps": 214, "total_steps": 855, "loss": 0.0067, "lr": 9.331828221747335e-05, "epoch": 1.2459970887918486, "percentage": 25.03, "elapsed_time": "0:43:08", "remaining_time": "2:09:14"} |
|
{"current_steps": 215, "total_steps": 855, "loss": 0.0068, "lr": 9.321590908821635e-05, "epoch": 1.2518195050946144, "percentage": 25.15, "elapsed_time": "0:43:19", "remaining_time": "2:08:57"} |
|
{"current_steps": 215, "total_steps": 855, "eval_loss": 0.006763411220163107, "epoch": 1.2518195050946144, "percentage": 25.15, "elapsed_time": "0:43:24", "remaining_time": "2:09:14"} |
|
{"current_steps": 216, "total_steps": 855, "loss": 0.0065, "lr": 9.311281470183667e-05, "epoch": 1.25764192139738, "percentage": 25.26, "elapsed_time": "0:43:35", "remaining_time": "2:08:57"} |
|
{"current_steps": 217, "total_steps": 855, "loss": 0.0071, "lr": 9.30090007789405e-05, "epoch": 1.2634643377001455, "percentage": 25.38, "elapsed_time": "0:43:45", "remaining_time": "2:08:40"} |
|
{"current_steps": 218, "total_steps": 855, "loss": 0.0072, "lr": 9.29044690521428e-05, "epoch": 1.2692867540029111, "percentage": 25.5, "elapsed_time": "0:43:56", "remaining_time": "2:08:23"} |
|
{"current_steps": 219, "total_steps": 855, "loss": 0.0065, "lr": 9.279922126603845e-05, "epoch": 1.2751091703056767, "percentage": 25.61, "elapsed_time": "0:44:06", "remaining_time": "2:08:06"} |
|
{"current_steps": 220, "total_steps": 855, "loss": 0.007, "lr": 9.269325917717307e-05, "epoch": 1.2809315866084425, "percentage": 25.73, "elapsed_time": "0:44:17", "remaining_time": "2:07:49"} |
|
{"current_steps": 220, "total_steps": 855, "eval_loss": 0.006922724656760693, "epoch": 1.2809315866084425, "percentage": 25.73, "elapsed_time": "0:44:22", "remaining_time": "2:08:05"} |
|
{"current_steps": 221, "total_steps": 855, "loss": 0.0069, "lr": 9.258658455401366e-05, "epoch": 1.2867540029112081, "percentage": 25.85, "elapsed_time": "0:44:33", "remaining_time": "2:07:49"} |
|
{"current_steps": 222, "total_steps": 855, "loss": 0.0066, "lr": 9.247919917691923e-05, "epoch": 1.2925764192139737, "percentage": 25.96, "elapsed_time": "0:44:43", "remaining_time": "2:07:32"} |
|
{"current_steps": 223, "total_steps": 855, "loss": 0.0072, "lr": 9.237110483811096e-05, "epoch": 1.2983988355167395, "percentage": 26.08, "elapsed_time": "0:44:54", "remaining_time": "2:07:15"} |
|
{"current_steps": 224, "total_steps": 855, "loss": 0.0066, "lr": 9.226230334164236e-05, "epoch": 1.304221251819505, "percentage": 26.2, "elapsed_time": "0:45:04", "remaining_time": "2:06:58"} |
|
{"current_steps": 225, "total_steps": 855, "loss": 0.0065, "lr": 9.215279650336911e-05, "epoch": 1.3100436681222707, "percentage": 26.32, "elapsed_time": "0:45:14", "remaining_time": "2:06:41"} |
|
{"current_steps": 225, "total_steps": 855, "eval_loss": 0.006786634214222431, "epoch": 1.3100436681222707, "percentage": 26.32, "elapsed_time": "0:45:20", "remaining_time": "2:06:56"} |
|
{"current_steps": 226, "total_steps": 855, "loss": 0.0066, "lr": 9.204258615091879e-05, "epoch": 1.3158660844250365, "percentage": 26.43, "elapsed_time": "0:45:30", "remaining_time": "2:06:39"} |
|
{"current_steps": 227, "total_steps": 855, "loss": 0.0064, "lr": 9.193167412366035e-05, "epoch": 1.321688500727802, "percentage": 26.55, "elapsed_time": "0:45:40", "remaining_time": "2:06:21"} |
|
{"current_steps": 228, "total_steps": 855, "loss": 0.007, "lr": 9.182006227267344e-05, "epoch": 1.3275109170305677, "percentage": 26.67, "elapsed_time": "0:45:50", "remaining_time": "2:06:05"} |
|
{"current_steps": 229, "total_steps": 855, "loss": 0.0071, "lr": 9.170775246071748e-05, "epoch": 1.3333333333333333, "percentage": 26.78, "elapsed_time": "0:46:01", "remaining_time": "2:05:48"} |
|
{"current_steps": 230, "total_steps": 855, "loss": 0.0063, "lr": 9.159474656220063e-05, "epoch": 1.3391557496360988, "percentage": 26.9, "elapsed_time": "0:46:11", "remaining_time": "2:05:31"} |
|
{"current_steps": 230, "total_steps": 855, "eval_loss": 0.006848746910691261, "epoch": 1.3391557496360988, "percentage": 26.9, "elapsed_time": "0:46:17", "remaining_time": "2:05:46"} |
|
{"current_steps": 231, "total_steps": 855, "loss": 0.0074, "lr": 9.148104646314845e-05, "epoch": 1.3449781659388647, "percentage": 27.02, "elapsed_time": "0:46:27", "remaining_time": "2:05:29"} |
|
{"current_steps": 232, "total_steps": 855, "loss": 0.0065, "lr": 9.136665406117244e-05, "epoch": 1.3508005822416302, "percentage": 27.13, "elapsed_time": "0:46:37", "remaining_time": "2:05:12"} |
|
{"current_steps": 233, "total_steps": 855, "loss": 0.0071, "lr": 9.125157126543838e-05, "epoch": 1.3566229985443958, "percentage": 27.25, "elapsed_time": "0:46:48", "remaining_time": "2:04:56"} |
|
{"current_steps": 234, "total_steps": 855, "loss": 0.0069, "lr": 9.113579999663446e-05, "epoch": 1.3624454148471616, "percentage": 27.37, "elapsed_time": "0:46:58", "remaining_time": "2:04:39"} |
|
{"current_steps": 235, "total_steps": 855, "loss": 0.0068, "lr": 9.101934218693923e-05, "epoch": 1.3682678311499272, "percentage": 27.49, "elapsed_time": "0:47:08", "remaining_time": "2:04:22"} |
|
{"current_steps": 235, "total_steps": 855, "eval_loss": 0.00672443863004446, "epoch": 1.3682678311499272, "percentage": 27.49, "elapsed_time": "0:47:14", "remaining_time": "2:04:37"} |
|
{"current_steps": 236, "total_steps": 855, "loss": 0.0071, "lr": 9.090219977998932e-05, "epoch": 1.3740902474526928, "percentage": 27.6, "elapsed_time": "0:47:24", "remaining_time": "2:04:21"} |
|
{"current_steps": 237, "total_steps": 855, "loss": 0.0074, "lr": 9.078437473084706e-05, "epoch": 1.3799126637554586, "percentage": 27.72, "elapsed_time": "0:47:35", "remaining_time": "2:04:05"} |
|
{"current_steps": 238, "total_steps": 855, "loss": 0.0067, "lr": 9.066586900596781e-05, "epoch": 1.3857350800582242, "percentage": 27.84, "elapsed_time": "0:47:45", "remaining_time": "2:03:48"} |
|
{"current_steps": 239, "total_steps": 855, "loss": 0.0065, "lr": 9.054668458316713e-05, "epoch": 1.3915574963609898, "percentage": 27.95, "elapsed_time": "0:47:55", "remaining_time": "2:03:32"} |
|
{"current_steps": 240, "total_steps": 855, "loss": 0.0066, "lr": 9.042682345158782e-05, "epoch": 1.3973799126637554, "percentage": 28.07, "elapsed_time": "0:48:06", "remaining_time": "2:03:16"} |
|
{"current_steps": 240, "total_steps": 855, "eval_loss": 0.006713456474244595, "epoch": 1.3973799126637554, "percentage": 28.07, "elapsed_time": "0:48:11", "remaining_time": "2:03:30"} |
|
{"current_steps": 241, "total_steps": 855, "loss": 0.0067, "lr": 9.030628761166669e-05, "epoch": 1.403202328966521, "percentage": 28.19, "elapsed_time": "0:48:22", "remaining_time": "2:03:14"} |
|
{"current_steps": 242, "total_steps": 855, "loss": 0.0073, "lr": 9.018507907510114e-05, "epoch": 1.4090247452692868, "percentage": 28.3, "elapsed_time": "0:48:32", "remaining_time": "2:02:58"} |
|
{"current_steps": 243, "total_steps": 855, "loss": 0.0067, "lr": 9.006319986481568e-05, "epoch": 1.4148471615720524, "percentage": 28.42, "elapsed_time": "0:48:43", "remaining_time": "2:02:42"} |
|
{"current_steps": 244, "total_steps": 855, "loss": 0.0066, "lr": 8.994065201492803e-05, "epoch": 1.420669577874818, "percentage": 28.54, "elapsed_time": "0:48:53", "remaining_time": "2:02:25"} |
|
{"current_steps": 245, "total_steps": 855, "loss": 0.0063, "lr": 8.981743757071536e-05, "epoch": 1.4264919941775838, "percentage": 28.65, "elapsed_time": "0:49:03", "remaining_time": "2:02:09"} |
|
{"current_steps": 245, "total_steps": 855, "eval_loss": 0.006786659825593233, "epoch": 1.4264919941775838, "percentage": 28.65, "elapsed_time": "0:49:09", "remaining_time": "2:02:23"} |
|
{"current_steps": 246, "total_steps": 855, "loss": 0.0072, "lr": 8.969355858857994e-05, "epoch": 1.4323144104803494, "percentage": 28.77, "elapsed_time": "0:49:19", "remaining_time": "2:02:07"} |
|
{"current_steps": 247, "total_steps": 855, "loss": 0.0066, "lr": 8.956901713601499e-05, "epoch": 1.438136826783115, "percentage": 28.89, "elapsed_time": "0:49:30", "remaining_time": "2:01:51"} |
|
{"current_steps": 248, "total_steps": 855, "loss": 0.0066, "lr": 8.944381529157009e-05, "epoch": 1.4439592430858808, "percentage": 29.01, "elapsed_time": "0:49:40", "remaining_time": "2:01:35"} |
|
{"current_steps": 249, "total_steps": 855, "loss": 0.0063, "lr": 8.93179551448165e-05, "epoch": 1.4497816593886463, "percentage": 29.12, "elapsed_time": "0:49:51", "remaining_time": "2:01:19"} |
|
{"current_steps": 250, "total_steps": 855, "loss": 0.0069, "lr": 8.919143879631231e-05, "epoch": 1.455604075691412, "percentage": 29.24, "elapsed_time": "0:50:01", "remaining_time": "2:01:03"} |
|
{"current_steps": 250, "total_steps": 855, "eval_loss": 0.006825124844908714, "epoch": 1.455604075691412, "percentage": 29.24, "elapsed_time": "0:50:07", "remaining_time": "2:01:17"} |
|
{"current_steps": 251, "total_steps": 855, "loss": 0.007, "lr": 8.906426835756736e-05, "epoch": 1.4614264919941775, "percentage": 29.36, "elapsed_time": "0:50:44", "remaining_time": "2:02:07"} |
|
{"current_steps": 252, "total_steps": 855, "loss": 0.0065, "lr": 8.893644595100803e-05, "epoch": 1.467248908296943, "percentage": 29.47, "elapsed_time": "0:50:55", "remaining_time": "2:01:50"} |
|
{"current_steps": 253, "total_steps": 855, "loss": 0.0068, "lr": 8.880797370994178e-05, "epoch": 1.473071324599709, "percentage": 29.59, "elapsed_time": "0:51:05", "remaining_time": "2:01:34"} |
|
{"current_steps": 254, "total_steps": 855, "loss": 0.0071, "lr": 8.867885377852155e-05, "epoch": 1.4788937409024745, "percentage": 29.71, "elapsed_time": "0:51:16", "remaining_time": "2:01:18"} |
|
{"current_steps": 255, "total_steps": 855, "loss": 0.0068, "lr": 8.854908831170998e-05, "epoch": 1.48471615720524, "percentage": 29.82, "elapsed_time": "0:51:26", "remaining_time": "2:01:02"} |
|
{"current_steps": 255, "total_steps": 855, "eval_loss": 0.0067093223333358765, "epoch": 1.48471615720524, "percentage": 29.82, "elapsed_time": "0:51:32", "remaining_time": "2:01:15"} |
|
{"current_steps": 256, "total_steps": 855, "loss": 0.0071, "lr": 8.841867947524349e-05, "epoch": 1.490538573508006, "percentage": 29.94, "elapsed_time": "0:51:42", "remaining_time": "2:00:59"} |
|
{"current_steps": 257, "total_steps": 855, "loss": 0.0068, "lr": 8.828762944559606e-05, "epoch": 1.4963609898107715, "percentage": 30.06, "elapsed_time": "0:51:53", "remaining_time": "2:00:43"} |
|
{"current_steps": 258, "total_steps": 855, "loss": 0.0066, "lr": 8.815594040994295e-05, "epoch": 1.502183406113537, "percentage": 30.18, "elapsed_time": "0:52:03", "remaining_time": "2:00:27"} |
|
{"current_steps": 259, "total_steps": 855, "loss": 0.0068, "lr": 8.802361456612421e-05, "epoch": 1.5080058224163029, "percentage": 30.29, "elapsed_time": "0:52:13", "remaining_time": "2:00:11"} |
|
{"current_steps": 260, "total_steps": 855, "loss": 0.0067, "lr": 8.789065412260793e-05, "epoch": 1.5138282387190685, "percentage": 30.41, "elapsed_time": "0:52:24", "remaining_time": "1:59:55"} |
|
{"current_steps": 260, "total_steps": 855, "eval_loss": 0.006685526110231876, "epoch": 1.5138282387190685, "percentage": 30.41, "elapsed_time": "0:52:29", "remaining_time": "2:00:08"} |
|
{"current_steps": 261, "total_steps": 855, "loss": 0.0068, "lr": 8.775706129845348e-05, "epoch": 1.519650655021834, "percentage": 30.53, "elapsed_time": "0:52:40", "remaining_time": "1:59:52"} |
|
{"current_steps": 262, "total_steps": 855, "loss": 0.0068, "lr": 8.762283832327436e-05, "epoch": 1.5254730713245999, "percentage": 30.64, "elapsed_time": "0:52:50", "remaining_time": "1:59:36"} |
|
{"current_steps": 263, "total_steps": 855, "loss": 0.0068, "lr": 8.748798743720115e-05, "epoch": 1.5312954876273652, "percentage": 30.76, "elapsed_time": "0:53:01", "remaining_time": "1:59:20"} |
|
{"current_steps": 264, "total_steps": 855, "loss": 0.0062, "lr": 8.735251089084391e-05, "epoch": 1.537117903930131, "percentage": 30.88, "elapsed_time": "0:53:11", "remaining_time": "1:59:04"} |
|
{"current_steps": 265, "total_steps": 855, "loss": 0.0063, "lr": 8.721641094525481e-05, "epoch": 1.5429403202328966, "percentage": 30.99, "elapsed_time": "0:53:21", "remaining_time": "1:58:48"} |
|
{"current_steps": 265, "total_steps": 855, "eval_loss": 0.006542210932821035, "epoch": 1.5429403202328966, "percentage": 30.99, "elapsed_time": "0:53:27", "remaining_time": "1:59:00"} |
|
{"current_steps": 266, "total_steps": 855, "loss": 0.007, "lr": 8.707968987189028e-05, "epoch": 1.5487627365356622, "percentage": 31.11, "elapsed_time": "0:53:37", "remaining_time": "1:58:44"} |
|
{"current_steps": 267, "total_steps": 855, "loss": 0.0064, "lr": 8.694234995257318e-05, "epoch": 1.554585152838428, "percentage": 31.23, "elapsed_time": "0:53:48", "remaining_time": "1:58:29"} |
|
{"current_steps": 268, "total_steps": 855, "loss": 0.0064, "lr": 8.680439347945459e-05, "epoch": 1.5604075691411936, "percentage": 31.35, "elapsed_time": "0:53:58", "remaining_time": "1:58:13"} |
|
{"current_steps": 269, "total_steps": 855, "loss": 0.0067, "lr": 8.666582275497576e-05, "epoch": 1.5662299854439592, "percentage": 31.46, "elapsed_time": "0:54:08", "remaining_time": "1:57:57"} |
|
{"current_steps": 270, "total_steps": 855, "loss": 0.0066, "lr": 8.652664009182945e-05, "epoch": 1.572052401746725, "percentage": 31.58, "elapsed_time": "0:54:19", "remaining_time": "1:57:42"} |
|
{"current_steps": 270, "total_steps": 855, "eval_loss": 0.006687200628221035, "epoch": 1.572052401746725, "percentage": 31.58, "elapsed_time": "0:54:25", "remaining_time": "1:57:54"} |
|
{"current_steps": 271, "total_steps": 855, "loss": 0.0065, "lr": 8.638684781292151e-05, "epoch": 1.5778748180494906, "percentage": 31.7, "elapsed_time": "0:54:35", "remaining_time": "1:57:38"} |
|
{"current_steps": 272, "total_steps": 855, "loss": 0.0067, "lr": 8.624644825133201e-05, "epoch": 1.5836972343522562, "percentage": 31.81, "elapsed_time": "0:54:45", "remaining_time": "1:57:22"} |
|
{"current_steps": 273, "total_steps": 855, "loss": 0.0065, "lr": 8.610544375027635e-05, "epoch": 1.589519650655022, "percentage": 31.93, "elapsed_time": "0:54:56", "remaining_time": "1:57:07"} |
|
{"current_steps": 274, "total_steps": 855, "loss": 0.0066, "lr": 8.596383666306617e-05, "epoch": 1.5953420669577874, "percentage": 32.05, "elapsed_time": "0:55:06", "remaining_time": "1:56:51"} |
|
{"current_steps": 275, "total_steps": 855, "loss": 0.0063, "lr": 8.582162935306999e-05, "epoch": 1.6011644832605532, "percentage": 32.16, "elapsed_time": "0:55:17", "remaining_time": "1:56:36"} |
|
{"current_steps": 275, "total_steps": 855, "eval_loss": 0.006565714720636606, "epoch": 1.6011644832605532, "percentage": 32.16, "elapsed_time": "0:55:22", "remaining_time": "1:56:48"} |
|
{"current_steps": 276, "total_steps": 855, "loss": 0.0066, "lr": 8.567882419367386e-05, "epoch": 1.6069868995633187, "percentage": 32.28, "elapsed_time": "0:55:33", "remaining_time": "1:56:32"} |
|
{"current_steps": 277, "total_steps": 855, "loss": 0.0069, "lr": 8.553542356824169e-05, "epoch": 1.6128093158660843, "percentage": 32.4, "elapsed_time": "0:55:43", "remaining_time": "1:56:17"} |
|
{"current_steps": 278, "total_steps": 855, "loss": 0.0068, "lr": 8.539142987007551e-05, "epoch": 1.6186317321688501, "percentage": 32.51, "elapsed_time": "0:55:54", "remaining_time": "1:56:01"} |
|
{"current_steps": 279, "total_steps": 855, "loss": 0.0067, "lr": 8.52468455023755e-05, "epoch": 1.6244541484716157, "percentage": 32.63, "elapsed_time": "0:56:04", "remaining_time": "1:55:45"} |
|
{"current_steps": 280, "total_steps": 855, "loss": 0.0064, "lr": 8.510167287819987e-05, "epoch": 1.6302765647743813, "percentage": 32.75, "elapsed_time": "0:56:14", "remaining_time": "1:55:29"} |
|
{"current_steps": 280, "total_steps": 855, "eval_loss": 0.006600580643862486, "epoch": 1.6302765647743813, "percentage": 32.75, "elapsed_time": "0:56:20", "remaining_time": "1:55:41"} |
|
{"current_steps": 281, "total_steps": 855, "loss": 0.0063, "lr": 8.495591442042464e-05, "epoch": 1.6360989810771471, "percentage": 32.87, "elapsed_time": "0:56:30", "remaining_time": "1:55:25"} |
|
{"current_steps": 282, "total_steps": 855, "loss": 0.0068, "lr": 8.480957256170315e-05, "epoch": 1.6419213973799127, "percentage": 32.98, "elapsed_time": "0:56:40", "remaining_time": "1:55:10"} |
|
{"current_steps": 283, "total_steps": 855, "loss": 0.0068, "lr": 8.466264974442548e-05, "epoch": 1.6477438136826783, "percentage": 33.1, "elapsed_time": "0:56:51", "remaining_time": "1:54:54"} |
|
{"current_steps": 284, "total_steps": 855, "loss": 0.0066, "lr": 8.451514842067771e-05, "epoch": 1.6535662299854441, "percentage": 33.22, "elapsed_time": "0:57:01", "remaining_time": "1:54:39"} |
|
{"current_steps": 285, "total_steps": 855, "loss": 0.0066, "lr": 8.436707105220096e-05, "epoch": 1.6593886462882095, "percentage": 33.33, "elapsed_time": "0:57:12", "remaining_time": "1:54:24"} |
|
{"current_steps": 285, "total_steps": 855, "eval_loss": 0.006613303907215595, "epoch": 1.6593886462882095, "percentage": 33.33, "elapsed_time": "0:57:17", "remaining_time": "1:54:35"} |
|
{"current_steps": 286, "total_steps": 855, "loss": 0.0068, "lr": 8.42184201103503e-05, "epoch": 1.6652110625909753, "percentage": 33.45, "elapsed_time": "0:57:28", "remaining_time": "1:54:20"} |
|
{"current_steps": 287, "total_steps": 855, "loss": 0.0063, "lr": 8.406919807605356e-05, "epoch": 1.6710334788937409, "percentage": 33.57, "elapsed_time": "0:57:38", "remaining_time": "1:54:04"} |
|
{"current_steps": 288, "total_steps": 855, "loss": 0.0062, "lr": 8.391940743976985e-05, "epoch": 1.6768558951965065, "percentage": 33.68, "elapsed_time": "0:57:48", "remaining_time": "1:53:49"} |
|
{"current_steps": 289, "total_steps": 855, "loss": 0.0066, "lr": 8.376905070144804e-05, "epoch": 1.6826783114992723, "percentage": 33.8, "elapsed_time": "0:57:59", "remaining_time": "1:53:34"} |
|
{"current_steps": 290, "total_steps": 855, "loss": 0.0068, "lr": 8.361813037048504e-05, "epoch": 1.6885007278020379, "percentage": 33.92, "elapsed_time": "0:58:09", "remaining_time": "1:53:19"} |
|
{"current_steps": 290, "total_steps": 855, "eval_loss": 0.006485569756478071, "epoch": 1.6885007278020379, "percentage": 33.92, "elapsed_time": "0:58:15", "remaining_time": "1:53:30"} |
|
{"current_steps": 291, "total_steps": 855, "loss": 0.0065, "lr": 8.346664896568389e-05, "epoch": 1.6943231441048034, "percentage": 34.04, "elapsed_time": "0:58:25", "remaining_time": "1:53:15"} |
|
{"current_steps": 292, "total_steps": 855, "loss": 0.0068, "lr": 8.331460901521178e-05, "epoch": 1.7001455604075693, "percentage": 34.15, "elapsed_time": "0:58:36", "remaining_time": "1:52:59"} |
|
{"current_steps": 293, "total_steps": 855, "loss": 0.0067, "lr": 8.316201305655775e-05, "epoch": 1.7059679767103348, "percentage": 34.27, "elapsed_time": "0:58:46", "remaining_time": "1:52:44"} |
|
{"current_steps": 294, "total_steps": 855, "loss": 0.0064, "lr": 8.300886363649048e-05, "epoch": 1.7117903930131004, "percentage": 34.39, "elapsed_time": "0:58:57", "remaining_time": "1:52:29"} |
|
{"current_steps": 295, "total_steps": 855, "loss": 0.0065, "lr": 8.285516331101562e-05, "epoch": 1.7176128093158662, "percentage": 34.5, "elapsed_time": "0:59:07", "remaining_time": "1:52:14"} |
|
{"current_steps": 295, "total_steps": 855, "eval_loss": 0.00643718708306551, "epoch": 1.7176128093158662, "percentage": 34.5, "elapsed_time": "0:59:13", "remaining_time": "1:52:24"} |
|
{"current_steps": 296, "total_steps": 855, "loss": 0.0063, "lr": 8.270091464533333e-05, "epoch": 1.7234352256186316, "percentage": 34.62, "elapsed_time": "0:59:23", "remaining_time": "1:52:09"} |
|
{"current_steps": 297, "total_steps": 855, "loss": 0.0068, "lr": 8.254612021379526e-05, "epoch": 1.7292576419213974, "percentage": 34.74, "elapsed_time": "0:59:33", "remaining_time": "1:51:54"} |
|
{"current_steps": 298, "total_steps": 855, "loss": 0.0064, "lr": 8.239078259986178e-05, "epoch": 1.735080058224163, "percentage": 34.85, "elapsed_time": "0:59:43", "remaining_time": "1:51:38"} |
|
{"current_steps": 299, "total_steps": 855, "loss": 0.0067, "lr": 8.223490439605865e-05, "epoch": 1.7409024745269286, "percentage": 34.97, "elapsed_time": "0:59:54", "remaining_time": "1:51:24"} |
|
{"current_steps": 300, "total_steps": 855, "loss": 0.0064, "lr": 8.2078488203934e-05, "epoch": 1.7467248908296944, "percentage": 35.09, "elapsed_time": "1:00:04", "remaining_time": "1:51:09"} |
|
{"current_steps": 300, "total_steps": 855, "eval_loss": 0.0063818395137786865, "epoch": 1.7467248908296944, "percentage": 35.09, "elapsed_time": "1:00:10", "remaining_time": "1:51:19"} |
|
{"current_steps": 301, "total_steps": 855, "loss": 0.0063, "lr": 8.192153663401467e-05, "epoch": 1.75254730713246, "percentage": 35.2, "elapsed_time": "1:00:46", "remaining_time": "1:51:51"} |
|
{"current_steps": 302, "total_steps": 855, "loss": 0.0067, "lr": 8.176405230576286e-05, "epoch": 1.7583697234352256, "percentage": 35.32, "elapsed_time": "1:00:57", "remaining_time": "1:51:36"} |
|
{"current_steps": 303, "total_steps": 855, "loss": 0.006, "lr": 8.160603784753217e-05, "epoch": 1.7641921397379914, "percentage": 35.44, "elapsed_time": "1:01:07", "remaining_time": "1:51:21"} |
|
{"current_steps": 304, "total_steps": 855, "loss": 0.0065, "lr": 8.144749589652398e-05, "epoch": 1.7700145560407567, "percentage": 35.56, "elapsed_time": "1:01:17", "remaining_time": "1:51:06"} |
|
{"current_steps": 305, "total_steps": 855, "loss": 0.0068, "lr": 8.12884290987433e-05, "epoch": 1.7758369723435226, "percentage": 35.67, "elapsed_time": "1:01:28", "remaining_time": "1:50:51"} |
|
{"current_steps": 305, "total_steps": 855, "eval_loss": 0.006364970467984676, "epoch": 1.7758369723435226, "percentage": 35.67, "elapsed_time": "1:01:33", "remaining_time": "1:51:01"} |
|
{"current_steps": 306, "total_steps": 855, "loss": 0.0065, "lr": 8.112884010895461e-05, "epoch": 1.7816593886462884, "percentage": 35.79, "elapsed_time": "1:01:44", "remaining_time": "1:50:45"} |
|
{"current_steps": 307, "total_steps": 855, "loss": 0.0062, "lr": 8.096873159063759e-05, "epoch": 1.7874818049490537, "percentage": 35.91, "elapsed_time": "1:01:54", "remaining_time": "1:50:30"} |
|
{"current_steps": 308, "total_steps": 855, "loss": 0.0068, "lr": 8.080810621594263e-05, "epoch": 1.7933042212518195, "percentage": 36.02, "elapsed_time": "1:02:04", "remaining_time": "1:50:15"} |
|
{"current_steps": 309, "total_steps": 855, "loss": 0.0065, "lr": 8.06469666656463e-05, "epoch": 1.7991266375545851, "percentage": 36.14, "elapsed_time": "1:02:15", "remaining_time": "1:50:00"} |
|
{"current_steps": 310, "total_steps": 855, "loss": 0.0063, "lr": 8.048531562910655e-05, "epoch": 1.8049490538573507, "percentage": 36.26, "elapsed_time": "1:02:25", "remaining_time": "1:49:44"} |
|
{"current_steps": 310, "total_steps": 855, "eval_loss": 0.006376221776008606, "epoch": 1.8049490538573507, "percentage": 36.26, "elapsed_time": "1:02:31", "remaining_time": "1:49:54"} |
|
{"current_steps": 311, "total_steps": 855, "loss": 0.0065, "lr": 8.03231558042178e-05, "epoch": 1.8107714701601165, "percentage": 36.37, "elapsed_time": "1:02:41", "remaining_time": "1:49:39"} |
|
{"current_steps": 312, "total_steps": 855, "loss": 0.0067, "lr": 8.016048989736602e-05, "epoch": 1.8165938864628821, "percentage": 36.49, "elapsed_time": "1:02:51", "remaining_time": "1:49:24"} |
|
{"current_steps": 313, "total_steps": 855, "loss": 0.0065, "lr": 7.999732062338347e-05, "epoch": 1.8224163027656477, "percentage": 36.61, "elapsed_time": "1:03:02", "remaining_time": "1:49:09"} |
|
{"current_steps": 314, "total_steps": 855, "loss": 0.0062, "lr": 7.983365070550339e-05, "epoch": 1.8282387190684135, "percentage": 36.73, "elapsed_time": "1:03:12", "remaining_time": "1:48:54"} |
|
{"current_steps": 315, "total_steps": 855, "loss": 0.0067, "lr": 7.96694828753146e-05, "epoch": 1.8340611353711789, "percentage": 36.84, "elapsed_time": "1:03:22", "remaining_time": "1:48:39"} |
|
{"current_steps": 315, "total_steps": 855, "eval_loss": 0.006389850750565529, "epoch": 1.8340611353711789, "percentage": 36.84, "elapsed_time": "1:03:28", "remaining_time": "1:48:48"} |
|
{"current_steps": 316, "total_steps": 855, "loss": 0.0067, "lr": 7.950481987271589e-05, "epoch": 1.8398835516739447, "percentage": 36.96, "elapsed_time": "1:03:38", "remaining_time": "1:48:33"} |
|
{"current_steps": 317, "total_steps": 855, "loss": 0.0064, "lr": 7.933966444587031e-05, "epoch": 1.8457059679767105, "percentage": 37.08, "elapsed_time": "1:03:49", "remaining_time": "1:48:18"} |
|
{"current_steps": 318, "total_steps": 855, "loss": 0.0066, "lr": 7.917401935115922e-05, "epoch": 1.8515283842794759, "percentage": 37.19, "elapsed_time": "1:03:59", "remaining_time": "1:48:03"} |
|
{"current_steps": 319, "total_steps": 855, "loss": 0.0068, "lr": 7.900788735313643e-05, "epoch": 1.8573508005822417, "percentage": 37.31, "elapsed_time": "1:04:10", "remaining_time": "1:47:49"} |
|
{"current_steps": 320, "total_steps": 855, "loss": 0.0065, "lr": 7.884127122448189e-05, "epoch": 1.8631732168850073, "percentage": 37.43, "elapsed_time": "1:04:20", "remaining_time": "1:47:34"} |
|
{"current_steps": 320, "total_steps": 855, "eval_loss": 0.006468661595135927, "epoch": 1.8631732168850073, "percentage": 37.43, "elapsed_time": "1:04:26", "remaining_time": "1:47:43"} |
|
{"current_steps": 321, "total_steps": 855, "loss": 0.0067, "lr": 7.867417374595561e-05, "epoch": 1.8689956331877728, "percentage": 37.54, "elapsed_time": "1:04:36", "remaining_time": "1:47:28"} |
|
{"current_steps": 322, "total_steps": 855, "loss": 0.0064, "lr": 7.850659770635104e-05, "epoch": 1.8748180494905387, "percentage": 37.66, "elapsed_time": "1:04:46", "remaining_time": "1:47:13"} |
|
{"current_steps": 323, "total_steps": 855, "loss": 0.0064, "lr": 7.833854590244876e-05, "epoch": 1.8806404657933042, "percentage": 37.78, "elapsed_time": "1:04:57", "remaining_time": "1:46:59"} |
|
{"current_steps": 324, "total_steps": 855, "loss": 0.0066, "lr": 7.817002113896954e-05, "epoch": 1.8864628820960698, "percentage": 37.89, "elapsed_time": "1:05:07", "remaining_time": "1:46:44"} |
|
{"current_steps": 325, "total_steps": 855, "loss": 0.006, "lr": 7.800102622852776e-05, "epoch": 1.8922852983988356, "percentage": 38.01, "elapsed_time": "1:05:18", "remaining_time": "1:46:29"} |
|
{"current_steps": 325, "total_steps": 855, "eval_loss": 0.006382644176483154, "epoch": 1.8922852983988356, "percentage": 38.01, "elapsed_time": "1:05:23", "remaining_time": "1:46:38"} |
|
{"current_steps": 326, "total_steps": 855, "loss": 0.0066, "lr": 7.783156399158433e-05, "epoch": 1.898107714701601, "percentage": 38.13, "elapsed_time": "1:05:34", "remaining_time": "1:46:24"} |
|
{"current_steps": 327, "total_steps": 855, "loss": 0.0069, "lr": 7.766163725639968e-05, "epoch": 1.9039301310043668, "percentage": 38.25, "elapsed_time": "1:05:44", "remaining_time": "1:46:09"} |
|
{"current_steps": 328, "total_steps": 855, "loss": 0.0062, "lr": 7.749124885898654e-05, "epoch": 1.9097525473071326, "percentage": 38.36, "elapsed_time": "1:05:55", "remaining_time": "1:45:54"} |
|
{"current_steps": 329, "total_steps": 855, "loss": 0.0068, "lr": 7.73204016430626e-05, "epoch": 1.915574963609898, "percentage": 38.48, "elapsed_time": "1:06:05", "remaining_time": "1:45:39"} |
|
{"current_steps": 330, "total_steps": 855, "loss": 0.0064, "lr": 7.714909846000304e-05, "epoch": 1.9213973799126638, "percentage": 38.6, "elapsed_time": "1:06:15", "remaining_time": "1:45:25"} |
|
{"current_steps": 330, "total_steps": 855, "eval_loss": 0.006392226554453373, "epoch": 1.9213973799126638, "percentage": 38.6, "elapsed_time": "1:06:21", "remaining_time": "1:45:34"} |
|
{"current_steps": 331, "total_steps": 855, "loss": 0.0068, "lr": 7.697734216879302e-05, "epoch": 1.9272197962154294, "percentage": 38.71, "elapsed_time": "1:06:31", "remaining_time": "1:45:19"} |
|
{"current_steps": 332, "total_steps": 855, "loss": 0.0068, "lr": 7.680513563597982e-05, "epoch": 1.933042212518195, "percentage": 38.83, "elapsed_time": "1:06:42", "remaining_time": "1:45:04"} |
|
{"current_steps": 333, "total_steps": 855, "loss": 0.0065, "lr": 7.663248173562514e-05, "epoch": 1.9388646288209608, "percentage": 38.95, "elapsed_time": "1:06:52", "remaining_time": "1:44:49"} |
|
{"current_steps": 334, "total_steps": 855, "loss": 0.0063, "lr": 7.645938334925704e-05, "epoch": 1.9446870451237264, "percentage": 39.06, "elapsed_time": "1:07:02", "remaining_time": "1:44:35"} |
|
{"current_steps": 335, "total_steps": 855, "loss": 0.0065, "lr": 7.628584336582191e-05, "epoch": 1.950509461426492, "percentage": 39.18, "elapsed_time": "1:07:13", "remaining_time": "1:44:20"} |
|
{"current_steps": 335, "total_steps": 855, "eval_loss": 0.006440624129027128, "epoch": 1.950509461426492, "percentage": 39.18, "elapsed_time": "1:07:18", "remaining_time": "1:44:29"} |
|
{"current_steps": 336, "total_steps": 855, "loss": 0.0064, "lr": 7.611186468163625e-05, "epoch": 1.9563318777292578, "percentage": 39.3, "elapsed_time": "1:07:29", "remaining_time": "1:44:14"} |
|
{"current_steps": 337, "total_steps": 855, "loss": 0.0061, "lr": 7.593745020033822e-05, "epoch": 1.9621542940320231, "percentage": 39.42, "elapsed_time": "1:07:39", "remaining_time": "1:44:00"} |
|
{"current_steps": 338, "total_steps": 855, "loss": 0.0062, "lr": 7.576260283283936e-05, "epoch": 1.967976710334789, "percentage": 39.53, "elapsed_time": "1:07:50", "remaining_time": "1:43:45"} |
|
{"current_steps": 339, "total_steps": 855, "loss": 0.0063, "lr": 7.558732549727587e-05, "epoch": 1.9737991266375547, "percentage": 39.65, "elapsed_time": "1:08:00", "remaining_time": "1:43:31"} |
|
{"current_steps": 340, "total_steps": 855, "loss": 0.0061, "lr": 7.541162111895994e-05, "epoch": 1.9796215429403201, "percentage": 39.77, "elapsed_time": "1:08:11", "remaining_time": "1:43:16"} |
|
{"current_steps": 340, "total_steps": 855, "eval_loss": 0.006306340917944908, "epoch": 1.9796215429403201, "percentage": 39.77, "elapsed_time": "1:08:16", "remaining_time": "1:43:25"} |
|
{"current_steps": 341, "total_steps": 855, "loss": 0.0066, "lr": 7.523549263033103e-05, "epoch": 1.985443959243086, "percentage": 39.88, "elapsed_time": "1:08:27", "remaining_time": "1:43:11"} |
|
{"current_steps": 342, "total_steps": 855, "loss": 0.0064, "lr": 7.50589429709067e-05, "epoch": 1.9912663755458515, "percentage": 40.0, "elapsed_time": "1:08:37", "remaining_time": "1:42:56"} |
|
{"current_steps": 343, "total_steps": 855, "loss": 0.0073, "lr": 7.488197508723383e-05, "epoch": 1.997088791848617, "percentage": 40.12, "elapsed_time": "1:08:47", "remaining_time": "1:42:41"} |
|
{"current_steps": 344, "total_steps": 855, "loss": 0.0072, "lr": 7.470459193283919e-05, "epoch": 2.002911208151383, "percentage": 40.23, "elapsed_time": "1:08:58", "remaining_time": "1:42:27"} |
|
{"current_steps": 345, "total_steps": 855, "loss": 0.006, "lr": 7.452679646818037e-05, "epoch": 2.0087336244541483, "percentage": 40.35, "elapsed_time": "1:09:08", "remaining_time": "1:42:12"} |
|
{"current_steps": 345, "total_steps": 855, "eval_loss": 0.006319982931017876, "epoch": 2.0087336244541483, "percentage": 40.35, "elapsed_time": "1:09:14", "remaining_time": "1:42:21"} |
|
{"current_steps": 346, "total_steps": 855, "loss": 0.0059, "lr": 7.434859166059615e-05, "epoch": 2.014556040756914, "percentage": 40.47, "elapsed_time": "1:09:24", "remaining_time": "1:42:06"} |
|
{"current_steps": 347, "total_steps": 855, "loss": 0.0059, "lr": 7.416998048425717e-05, "epoch": 2.02037845705968, "percentage": 40.58, "elapsed_time": "1:09:35", "remaining_time": "1:41:52"} |
|
{"current_steps": 348, "total_steps": 855, "loss": 0.0066, "lr": 7.399096592011616e-05, "epoch": 2.0262008733624453, "percentage": 40.7, "elapsed_time": "1:09:45", "remaining_time": "1:41:38"} |
|
{"current_steps": 349, "total_steps": 855, "loss": 0.006, "lr": 7.381155095585828e-05, "epoch": 2.032023289665211, "percentage": 40.82, "elapsed_time": "1:09:56", "remaining_time": "1:41:23"} |
|
{"current_steps": 350, "total_steps": 855, "loss": 0.0058, "lr": 7.36317385858512e-05, "epoch": 2.037845705967977, "percentage": 40.94, "elapsed_time": "1:10:06", "remaining_time": "1:41:09"} |
|
{"current_steps": 350, "total_steps": 855, "eval_loss": 0.006265893578529358, "epoch": 2.037845705967977, "percentage": 40.94, "elapsed_time": "1:10:12", "remaining_time": "1:41:17"} |
|
{"current_steps": 351, "total_steps": 855, "loss": 0.006, "lr": 7.345153181109512e-05, "epoch": 2.0436681222707422, "percentage": 41.05, "elapsed_time": "1:10:48", "remaining_time": "1:41:39"} |
|
{"current_steps": 352, "total_steps": 855, "loss": 0.006, "lr": 7.327093363917275e-05, "epoch": 2.049490538573508, "percentage": 41.17, "elapsed_time": "1:10:58", "remaining_time": "1:41:24"} |
|
{"current_steps": 353, "total_steps": 855, "loss": 0.0062, "lr": 7.3089947084199e-05, "epoch": 2.055312954876274, "percentage": 41.29, "elapsed_time": "1:11:08", "remaining_time": "1:41:10"} |
|
{"current_steps": 354, "total_steps": 855, "loss": 0.0062, "lr": 7.290857516677085e-05, "epoch": 2.061135371179039, "percentage": 41.4, "elapsed_time": "1:11:18", "remaining_time": "1:40:55"} |
|
{"current_steps": 355, "total_steps": 855, "loss": 0.0057, "lr": 7.272682091391671e-05, "epoch": 2.066957787481805, "percentage": 41.52, "elapsed_time": "1:11:29", "remaining_time": "1:40:40"} |
|
{"current_steps": 355, "total_steps": 855, "eval_loss": 0.006287863478064537, "epoch": 2.066957787481805, "percentage": 41.52, "elapsed_time": "1:11:34", "remaining_time": "1:40:48"} |
|
{"current_steps": 356, "total_steps": 855, "loss": 0.0061, "lr": 7.254468735904616e-05, "epoch": 2.0727802037845704, "percentage": 41.64, "elapsed_time": "1:11:44", "remaining_time": "1:40:34"} |
|
{"current_steps": 357, "total_steps": 855, "loss": 0.006, "lr": 7.236217754189904e-05, "epoch": 2.078602620087336, "percentage": 41.75, "elapsed_time": "1:11:55", "remaining_time": "1:40:19"} |
|
{"current_steps": 358, "total_steps": 855, "loss": 0.0063, "lr": 7.217929450849497e-05, "epoch": 2.084425036390102, "percentage": 41.87, "elapsed_time": "1:12:05", "remaining_time": "1:40:05"} |
|
{"current_steps": 359, "total_steps": 855, "loss": 0.0063, "lr": 7.199604131108237e-05, "epoch": 2.0902474526928674, "percentage": 41.99, "elapsed_time": "1:12:16", "remaining_time": "1:39:50"} |
|
{"current_steps": 360, "total_steps": 855, "loss": 0.0059, "lr": 7.181242100808759e-05, "epoch": 2.096069868995633, "percentage": 42.11, "elapsed_time": "1:12:26", "remaining_time": "1:39:36"} |
|
{"current_steps": 360, "total_steps": 855, "eval_loss": 0.0062352512031793594, "epoch": 2.096069868995633, "percentage": 42.11, "elapsed_time": "1:12:32", "remaining_time": "1:39:44"} |
|
{"current_steps": 361, "total_steps": 855, "loss": 0.0065, "lr": 7.162843666406377e-05, "epoch": 2.101892285298399, "percentage": 42.22, "elapsed_time": "1:12:42", "remaining_time": "1:39:29"} |
|
{"current_steps": 362, "total_steps": 855, "loss": 0.0064, "lr": 7.14440913496398e-05, "epoch": 2.1077147016011644, "percentage": 42.34, "elapsed_time": "1:12:52", "remaining_time": "1:39:15"} |
|
{"current_steps": 363, "total_steps": 855, "loss": 0.0059, "lr": 7.125938814146901e-05, "epoch": 2.11353711790393, "percentage": 42.46, "elapsed_time": "1:13:03", "remaining_time": "1:39:00"} |
|
{"current_steps": 364, "total_steps": 855, "loss": 0.0064, "lr": 7.107433012217788e-05, "epoch": 2.119359534206696, "percentage": 42.57, "elapsed_time": "1:13:13", "remaining_time": "1:38:46"} |
|
{"current_steps": 365, "total_steps": 855, "loss": 0.0061, "lr": 7.08889203803145e-05, "epoch": 2.1251819505094613, "percentage": 42.69, "elapsed_time": "1:13:23", "remaining_time": "1:38:31"} |
|
{"current_steps": 365, "total_steps": 855, "eval_loss": 0.006345388479530811, "epoch": 2.1251819505094613, "percentage": 42.69, "elapsed_time": "1:13:29", "remaining_time": "1:38:39"} |
|
{"current_steps": 366, "total_steps": 855, "loss": 0.0058, "lr": 7.070316201029712e-05, "epoch": 2.131004366812227, "percentage": 42.81, "elapsed_time": "1:13:39", "remaining_time": "1:38:25"} |
|
{"current_steps": 367, "total_steps": 855, "loss": 0.006, "lr": 7.05170581123624e-05, "epoch": 2.1368267831149925, "percentage": 42.92, "elapsed_time": "1:13:50", "remaining_time": "1:38:10"} |
|
{"current_steps": 368, "total_steps": 855, "loss": 0.0061, "lr": 7.033061179251385e-05, "epoch": 2.1426491994177583, "percentage": 43.04, "elapsed_time": "1:14:00", "remaining_time": "1:37:56"} |
|
{"current_steps": 369, "total_steps": 855, "loss": 0.006, "lr": 7.01438261624697e-05, "epoch": 2.148471615720524, "percentage": 43.16, "elapsed_time": "1:14:11", "remaining_time": "1:37:42"} |
|
{"current_steps": 370, "total_steps": 855, "loss": 0.006, "lr": 6.995670433961133e-05, "epoch": 2.1542940320232895, "percentage": 43.27, "elapsed_time": "1:14:21", "remaining_time": "1:37:28"} |
|
{"current_steps": 370, "total_steps": 855, "eval_loss": 0.006326164118945599, "epoch": 2.1542940320232895, "percentage": 43.27, "elapsed_time": "1:14:27", "remaining_time": "1:37:35"} |
|
{"current_steps": 371, "total_steps": 855, "loss": 0.0059, "lr": 6.976924944693086e-05, "epoch": 2.1601164483260553, "percentage": 43.39, "elapsed_time": "1:14:37", "remaining_time": "1:37:21"} |
|
{"current_steps": 372, "total_steps": 855, "loss": 0.0062, "lr": 6.958146461297938e-05, "epoch": 2.165938864628821, "percentage": 43.51, "elapsed_time": "1:14:47", "remaining_time": "1:37:07"} |
|
{"current_steps": 373, "total_steps": 855, "loss": 0.0064, "lr": 6.939335297181446e-05, "epoch": 2.1717612809315865, "percentage": 43.63, "elapsed_time": "1:14:58", "remaining_time": "1:36:52"} |
|
{"current_steps": 374, "total_steps": 855, "loss": 0.006, "lr": 6.920491766294803e-05, "epoch": 2.1775836972343523, "percentage": 43.74, "elapsed_time": "1:15:08", "remaining_time": "1:36:38"} |
|
{"current_steps": 375, "total_steps": 855, "loss": 0.0062, "lr": 6.901616183129387e-05, "epoch": 2.183406113537118, "percentage": 43.86, "elapsed_time": "1:15:19", "remaining_time": "1:36:24"} |
|
{"current_steps": 375, "total_steps": 855, "eval_loss": 0.006338266655802727, "epoch": 2.183406113537118, "percentage": 43.86, "elapsed_time": "1:15:25", "remaining_time": "1:36:32"} |
|
{"current_steps": 376, "total_steps": 855, "loss": 0.0062, "lr": 6.88270886271152e-05, "epoch": 2.1892285298398835, "percentage": 43.98, "elapsed_time": "1:15:35", "remaining_time": "1:36:17"} |
|
{"current_steps": 377, "total_steps": 855, "loss": 0.0061, "lr": 6.863770120597204e-05, "epoch": 2.1950509461426493, "percentage": 44.09, "elapsed_time": "1:15:45", "remaining_time": "1:36:03"} |
|
{"current_steps": 378, "total_steps": 855, "loss": 0.0065, "lr": 6.844800272866856e-05, "epoch": 2.2008733624454146, "percentage": 44.21, "elapsed_time": "1:15:55", "remaining_time": "1:35:49"} |
|
{"current_steps": 379, "total_steps": 855, "loss": 0.0063, "lr": 6.825799636120038e-05, "epoch": 2.2066957787481805, "percentage": 44.33, "elapsed_time": "1:16:06", "remaining_time": "1:35:34"} |
|
{"current_steps": 380, "total_steps": 855, "loss": 0.0064, "lr": 6.806768527470166e-05, "epoch": 2.2125181950509463, "percentage": 44.44, "elapsed_time": "1:16:16", "remaining_time": "1:35:20"} |
|
{"current_steps": 380, "total_steps": 855, "eval_loss": 0.0062924763187766075, "epoch": 2.2125181950509463, "percentage": 44.44, "elapsed_time": "1:16:22", "remaining_time": "1:35:27"} |
|
{"current_steps": 381, "total_steps": 855, "loss": 0.0064, "lr": 6.787707264539221e-05, "epoch": 2.2183406113537116, "percentage": 44.56, "elapsed_time": "1:16:32", "remaining_time": "1:35:13"} |
|
{"current_steps": 382, "total_steps": 855, "loss": 0.006, "lr": 6.768616165452447e-05, "epoch": 2.2241630276564774, "percentage": 44.68, "elapsed_time": "1:16:43", "remaining_time": "1:34:59"} |
|
{"current_steps": 383, "total_steps": 855, "loss": 0.0057, "lr": 6.749495548833045e-05, "epoch": 2.2299854439592433, "percentage": 44.8, "elapsed_time": "1:16:53", "remaining_time": "1:34:45"} |
|
{"current_steps": 384, "total_steps": 855, "loss": 0.0061, "lr": 6.730345733796848e-05, "epoch": 2.2358078602620086, "percentage": 44.91, "elapsed_time": "1:17:03", "remaining_time": "1:34:31"} |
|
{"current_steps": 385, "total_steps": 855, "loss": 0.006, "lr": 6.711167039947004e-05, "epoch": 2.2416302765647744, "percentage": 45.03, "elapsed_time": "1:17:14", "remaining_time": "1:34:17"} |
|
{"current_steps": 385, "total_steps": 855, "eval_loss": 0.006232730578631163, "epoch": 2.2416302765647744, "percentage": 45.03, "elapsed_time": "1:17:19", "remaining_time": "1:34:24"} |
|
{"current_steps": 386, "total_steps": 855, "loss": 0.0059, "lr": 6.691959787368634e-05, "epoch": 2.2474526928675402, "percentage": 45.15, "elapsed_time": "1:17:30", "remaining_time": "1:34:10"} |
|
{"current_steps": 387, "total_steps": 855, "loss": 0.0065, "lr": 6.672724296623493e-05, "epoch": 2.2532751091703056, "percentage": 45.26, "elapsed_time": "1:17:40", "remaining_time": "1:33:56"} |
|
{"current_steps": 388, "total_steps": 855, "loss": 0.0063, "lr": 6.653460888744625e-05, "epoch": 2.2590975254730714, "percentage": 45.38, "elapsed_time": "1:17:51", "remaining_time": "1:33:42"} |
|
{"current_steps": 389, "total_steps": 855, "loss": 0.0063, "lr": 6.634169885230995e-05, "epoch": 2.2649199417758368, "percentage": 45.5, "elapsed_time": "1:18:01", "remaining_time": "1:33:28"} |
|
{"current_steps": 390, "total_steps": 855, "loss": 0.0062, "lr": 6.614851608042131e-05, "epoch": 2.2707423580786026, "percentage": 45.61, "elapsed_time": "1:18:12", "remaining_time": "1:33:14"} |
|
{"current_steps": 390, "total_steps": 855, "eval_loss": 0.006138971075415611, "epoch": 2.2707423580786026, "percentage": 45.61, "elapsed_time": "1:18:17", "remaining_time": "1:33:21"} |
|
{"current_steps": 391, "total_steps": 855, "loss": 0.0061, "lr": 6.59550637959275e-05, "epoch": 2.2765647743813684, "percentage": 45.73, "elapsed_time": "1:18:28", "remaining_time": "1:33:07"} |
|
{"current_steps": 392, "total_steps": 855, "loss": 0.0066, "lr": 6.576134522747372e-05, "epoch": 2.2823871906841338, "percentage": 45.85, "elapsed_time": "1:18:38", "remaining_time": "1:32:53"} |
|
{"current_steps": 393, "total_steps": 855, "loss": 0.0061, "lr": 6.556736360814936e-05, "epoch": 2.2882096069868996, "percentage": 45.96, "elapsed_time": "1:18:49", "remaining_time": "1:32:39"} |
|
{"current_steps": 394, "total_steps": 855, "loss": 0.006, "lr": 6.537312217543405e-05, "epoch": 2.2940320232896654, "percentage": 46.08, "elapsed_time": "1:18:59", "remaining_time": "1:32:25"} |
|
{"current_steps": 395, "total_steps": 855, "loss": 0.0061, "lr": 6.517862417114357e-05, "epoch": 2.2998544395924307, "percentage": 46.2, "elapsed_time": "1:19:10", "remaining_time": "1:32:11"} |
|
{"current_steps": 395, "total_steps": 855, "eval_loss": 0.006199044641107321, "epoch": 2.2998544395924307, "percentage": 46.2, "elapsed_time": "1:19:15", "remaining_time": "1:32:18"} |
|
{"current_steps": 396, "total_steps": 855, "loss": 0.0059, "lr": 6.498387284137582e-05, "epoch": 2.3056768558951966, "percentage": 46.32, "elapsed_time": "1:19:26", "remaining_time": "1:32:04"} |
|
{"current_steps": 397, "total_steps": 855, "loss": 0.0059, "lr": 6.478887143645655e-05, "epoch": 2.3114992721979624, "percentage": 46.43, "elapsed_time": "1:19:36", "remaining_time": "1:31:50"} |
|
{"current_steps": 398, "total_steps": 855, "loss": 0.006, "lr": 6.459362321088526e-05, "epoch": 2.3173216885007277, "percentage": 46.55, "elapsed_time": "1:19:47", "remaining_time": "1:31:36"} |
|
{"current_steps": 399, "total_steps": 855, "loss": 0.0055, "lr": 6.439813142328071e-05, "epoch": 2.3231441048034935, "percentage": 46.67, "elapsed_time": "1:19:57", "remaining_time": "1:31:22"} |
|
{"current_steps": 400, "total_steps": 855, "loss": 0.0063, "lr": 6.420239933632665e-05, "epoch": 2.328966521106259, "percentage": 46.78, "elapsed_time": "1:20:07", "remaining_time": "1:31:08"} |
|
{"current_steps": 400, "total_steps": 855, "eval_loss": 0.006286091636866331, "epoch": 2.328966521106259, "percentage": 46.78, "elapsed_time": "1:20:13", "remaining_time": "1:31:15"} |
|
{"current_steps": 401, "total_steps": 855, "loss": 0.0058, "lr": 6.400643021671734e-05, "epoch": 2.3347889374090247, "percentage": 46.9, "elapsed_time": "1:20:52", "remaining_time": "1:31:33"} |
|
{"current_steps": 402, "total_steps": 855, "loss": 0.006, "lr": 6.3810227335103e-05, "epoch": 2.3406113537117905, "percentage": 47.02, "elapsed_time": "1:21:02", "remaining_time": "1:31:19"} |
|
{"current_steps": 403, "total_steps": 855, "loss": 0.006, "lr": 6.36137939660353e-05, "epoch": 2.346433770014556, "percentage": 47.13, "elapsed_time": "1:21:12", "remaining_time": "1:31:05"} |
|
{"current_steps": 404, "total_steps": 855, "loss": 0.0062, "lr": 6.341713338791259e-05, "epoch": 2.3522561863173217, "percentage": 47.25, "elapsed_time": "1:21:23", "remaining_time": "1:30:51"} |
|
{"current_steps": 405, "total_steps": 855, "loss": 0.006, "lr": 6.32202488829253e-05, "epoch": 2.3580786026200875, "percentage": 47.37, "elapsed_time": "1:21:33", "remaining_time": "1:30:37"} |
|
{"current_steps": 405, "total_steps": 855, "eval_loss": 0.0061913831159472466, "epoch": 2.3580786026200875, "percentage": 47.37, "elapsed_time": "1:21:38", "remaining_time": "1:30:43"} |
|
{"current_steps": 406, "total_steps": 855, "loss": 0.0063, "lr": 6.302314373700114e-05, "epoch": 2.363901018922853, "percentage": 47.49, "elapsed_time": "1:21:49", "remaining_time": "1:30:29"} |
|
{"current_steps": 407, "total_steps": 855, "loss": 0.006, "lr": 6.282582123975011e-05, "epoch": 2.3697234352256187, "percentage": 47.6, "elapsed_time": "1:21:59", "remaining_time": "1:30:15"} |
|
{"current_steps": 408, "total_steps": 855, "loss": 0.0059, "lr": 6.26282846844099e-05, "epoch": 2.3755458515283845, "percentage": 47.72, "elapsed_time": "1:22:10", "remaining_time": "1:30:01"} |
|
{"current_steps": 409, "total_steps": 855, "loss": 0.0059, "lr": 6.243053736779059e-05, "epoch": 2.38136826783115, "percentage": 47.84, "elapsed_time": "1:22:20", "remaining_time": "1:29:47"} |
|
{"current_steps": 410, "total_steps": 855, "loss": 0.006, "lr": 6.22325825902199e-05, "epoch": 2.3871906841339157, "percentage": 47.95, "elapsed_time": "1:22:30", "remaining_time": "1:29:33"} |
|
{"current_steps": 410, "total_steps": 855, "eval_loss": 0.006266340613365173, "epoch": 2.3871906841339157, "percentage": 47.95, "elapsed_time": "1:22:36", "remaining_time": "1:29:39"} |
|
{"current_steps": 411, "total_steps": 855, "loss": 0.006, "lr": 6.203442365548791e-05, "epoch": 2.393013100436681, "percentage": 48.07, "elapsed_time": "1:22:46", "remaining_time": "1:29:25"} |
|
{"current_steps": 412, "total_steps": 855, "loss": 0.0059, "lr": 6.183606387079205e-05, "epoch": 2.398835516739447, "percentage": 48.19, "elapsed_time": "1:22:57", "remaining_time": "1:29:11"} |
|
{"current_steps": 413, "total_steps": 855, "loss": 0.006, "lr": 6.163750654668186e-05, "epoch": 2.4046579330422126, "percentage": 48.3, "elapsed_time": "1:23:07", "remaining_time": "1:28:57"} |
|
{"current_steps": 414, "total_steps": 855, "loss": 0.006, "lr": 6.143875499700371e-05, "epoch": 2.410480349344978, "percentage": 48.42, "elapsed_time": "1:23:18", "remaining_time": "1:28:44"} |
|
{"current_steps": 415, "total_steps": 855, "loss": 0.0057, "lr": 6.123981253884556e-05, "epoch": 2.416302765647744, "percentage": 48.54, "elapsed_time": "1:23:28", "remaining_time": "1:28:30"} |
|
{"current_steps": 415, "total_steps": 855, "eval_loss": 0.0062265838496387005, "epoch": 2.416302765647744, "percentage": 48.54, "elapsed_time": "1:23:34", "remaining_time": "1:28:36"} |
|
{"current_steps": 416, "total_steps": 855, "loss": 0.0061, "lr": 6.104068249248154e-05, "epoch": 2.4221251819505096, "percentage": 48.65, "elapsed_time": "1:23:44", "remaining_time": "1:28:22"} |
|
{"current_steps": 417, "total_steps": 855, "loss": 0.0061, "lr": 6.084136818131654e-05, "epoch": 2.427947598253275, "percentage": 48.77, "elapsed_time": "1:23:54", "remaining_time": "1:28:08"} |
|
{"current_steps": 418, "total_steps": 855, "loss": 0.0058, "lr": 6.064187293183079e-05, "epoch": 2.433770014556041, "percentage": 48.89, "elapsed_time": "1:24:05", "remaining_time": "1:27:54"} |
|
{"current_steps": 419, "total_steps": 855, "loss": 0.006, "lr": 6.044220007352429e-05, "epoch": 2.4395924308588066, "percentage": 49.01, "elapsed_time": "1:24:15", "remaining_time": "1:27:41"} |
|
{"current_steps": 420, "total_steps": 855, "loss": 0.0063, "lr": 6.024235293886128e-05, "epoch": 2.445414847161572, "percentage": 49.12, "elapsed_time": "1:24:26", "remaining_time": "1:27:27"} |
|
{"current_steps": 420, "total_steps": 855, "eval_loss": 0.006302733905613422, "epoch": 2.445414847161572, "percentage": 49.12, "elapsed_time": "1:24:31", "remaining_time": "1:27:32"} |
|
{"current_steps": 421, "total_steps": 855, "loss": 0.0062, "lr": 6.00423348632146e-05, "epoch": 2.451237263464338, "percentage": 49.24, "elapsed_time": "1:24:42", "remaining_time": "1:27:19"} |
|
{"current_steps": 422, "total_steps": 855, "loss": 0.006, "lr": 5.9842149184809994e-05, "epoch": 2.457059679767103, "percentage": 49.36, "elapsed_time": "1:24:52", "remaining_time": "1:27:05"} |
|
{"current_steps": 423, "total_steps": 855, "loss": 0.0063, "lr": 5.96417992446705e-05, "epoch": 2.462882096069869, "percentage": 49.47, "elapsed_time": "1:25:03", "remaining_time": "1:26:51"} |
|
{"current_steps": 424, "total_steps": 855, "loss": 0.0062, "lr": 5.944128838656059e-05, "epoch": 2.4687045123726348, "percentage": 49.59, "elapsed_time": "1:25:13", "remaining_time": "1:26:37"} |
|
{"current_steps": 425, "total_steps": 855, "loss": 0.0065, "lr": 5.9240619956930365e-05, "epoch": 2.4745269286754, "percentage": 49.71, "elapsed_time": "1:25:23", "remaining_time": "1:26:24"} |
|
{"current_steps": 425, "total_steps": 855, "eval_loss": 0.006210055667907, "epoch": 2.4745269286754, "percentage": 49.71, "elapsed_time": "1:25:29", "remaining_time": "1:26:29"} |
|
{"current_steps": 426, "total_steps": 855, "loss": 0.0057, "lr": 5.903979730485979e-05, "epoch": 2.480349344978166, "percentage": 49.82, "elapsed_time": "1:25:40", "remaining_time": "1:26:16"} |
|
{"current_steps": 427, "total_steps": 855, "loss": 0.0061, "lr": 5.8838823782002704e-05, "epoch": 2.4861717612809318, "percentage": 49.94, "elapsed_time": "1:25:50", "remaining_time": "1:26:02"} |
|
{"current_steps": 428, "total_steps": 855, "loss": 0.0057, "lr": 5.863770274253095e-05, "epoch": 2.491994177583697, "percentage": 50.06, "elapsed_time": "1:26:00", "remaining_time": "1:25:48"} |
|
{"current_steps": 429, "total_steps": 855, "loss": 0.0059, "lr": 5.843643754307835e-05, "epoch": 2.497816593886463, "percentage": 50.18, "elapsed_time": "1:26:11", "remaining_time": "1:25:35"} |
|
{"current_steps": 430, "total_steps": 855, "loss": 0.006, "lr": 5.8235031542684684e-05, "epoch": 2.5036390101892287, "percentage": 50.29, "elapsed_time": "1:26:21", "remaining_time": "1:25:21"} |
|
{"current_steps": 430, "total_steps": 855, "eval_loss": 0.0061637284234166145, "epoch": 2.5036390101892287, "percentage": 50.29, "elapsed_time": "1:26:27", "remaining_time": "1:25:27"} |
|
{"current_steps": 431, "total_steps": 855, "loss": 0.0061, "lr": 5.8033488102739696e-05, "epoch": 2.509461426491994, "percentage": 50.41, "elapsed_time": "1:26:37", "remaining_time": "1:25:13"} |
|
{"current_steps": 432, "total_steps": 855, "loss": 0.0057, "lr": 5.7831810586926895e-05, "epoch": 2.51528384279476, "percentage": 50.53, "elapsed_time": "1:26:48", "remaining_time": "1:24:59"} |
|
{"current_steps": 433, "total_steps": 855, "loss": 0.0058, "lr": 5.7630002361167504e-05, "epoch": 2.5211062590975253, "percentage": 50.64, "elapsed_time": "1:26:58", "remaining_time": "1:24:46"} |
|
{"current_steps": 434, "total_steps": 855, "loss": 0.0059, "lr": 5.7428066793564196e-05, "epoch": 2.526928675400291, "percentage": 50.76, "elapsed_time": "1:27:09", "remaining_time": "1:24:32"} |
|
{"current_steps": 435, "total_steps": 855, "loss": 0.0059, "lr": 5.7226007254344997e-05, "epoch": 2.532751091703057, "percentage": 50.88, "elapsed_time": "1:27:19", "remaining_time": "1:24:18"} |
|
{"current_steps": 435, "total_steps": 855, "eval_loss": 0.006212435197085142, "epoch": 2.532751091703057, "percentage": 50.88, "elapsed_time": "1:27:25", "remaining_time": "1:24:24"} |
|
{"current_steps": 436, "total_steps": 855, "loss": 0.0055, "lr": 5.70238271158069e-05, "epoch": 2.5385735080058223, "percentage": 50.99, "elapsed_time": "1:27:35", "remaining_time": "1:24:10"} |
|
{"current_steps": 437, "total_steps": 855, "loss": 0.0058, "lr": 5.682152975225973e-05, "epoch": 2.544395924308588, "percentage": 51.11, "elapsed_time": "1:27:45", "remaining_time": "1:23:56"} |
|
{"current_steps": 438, "total_steps": 855, "loss": 0.0057, "lr": 5.6619118539969684e-05, "epoch": 2.5502183406113534, "percentage": 51.23, "elapsed_time": "1:27:56", "remaining_time": "1:23:43"} |
|
{"current_steps": 439, "total_steps": 855, "loss": 0.0057, "lr": 5.64165968571031e-05, "epoch": 2.5560407569141192, "percentage": 51.35, "elapsed_time": "1:28:06", "remaining_time": "1:23:29"} |
|
{"current_steps": 440, "total_steps": 855, "loss": 0.0058, "lr": 5.621396808367001e-05, "epoch": 2.561863173216885, "percentage": 51.46, "elapsed_time": "1:28:16", "remaining_time": "1:23:15"} |
|
{"current_steps": 440, "total_steps": 855, "eval_loss": 0.006226742640137672, "epoch": 2.561863173216885, "percentage": 51.46, "elapsed_time": "1:28:22", "remaining_time": "1:23:21"} |
|
{"current_steps": 441, "total_steps": 855, "loss": 0.0062, "lr": 5.601123560146774e-05, "epoch": 2.567685589519651, "percentage": 51.58, "elapsed_time": "1:28:33", "remaining_time": "1:23:07"} |
|
{"current_steps": 442, "total_steps": 855, "loss": 0.0059, "lr": 5.5808402794024485e-05, "epoch": 2.5735080058224162, "percentage": 51.7, "elapsed_time": "1:28:43", "remaining_time": "1:22:54"} |
|
{"current_steps": 443, "total_steps": 855, "loss": 0.006, "lr": 5.560547304654282e-05, "epoch": 2.579330422125182, "percentage": 51.81, "elapsed_time": "1:28:53", "remaining_time": "1:22:40"} |
|
{"current_steps": 444, "total_steps": 855, "loss": 0.006, "lr": 5.540244974584325e-05, "epoch": 2.5851528384279474, "percentage": 51.93, "elapsed_time": "1:29:04", "remaining_time": "1:22:26"} |
|
{"current_steps": 445, "total_steps": 855, "loss": 0.0061, "lr": 5.519933628030758e-05, "epoch": 2.590975254730713, "percentage": 52.05, "elapsed_time": "1:29:14", "remaining_time": "1:22:13"} |
|
{"current_steps": 445, "total_steps": 855, "eval_loss": 0.006126726977527142, "epoch": 2.590975254730713, "percentage": 52.05, "elapsed_time": "1:29:20", "remaining_time": "1:22:18"} |
|
{"current_steps": 446, "total_steps": 855, "loss": 0.0062, "lr": 5.49961360398225e-05, "epoch": 2.596797671033479, "percentage": 52.16, "elapsed_time": "1:29:30", "remaining_time": "1:22:04"} |
|
{"current_steps": 447, "total_steps": 855, "loss": 0.006, "lr": 5.479285241572289e-05, "epoch": 2.6026200873362444, "percentage": 52.28, "elapsed_time": "1:29:41", "remaining_time": "1:21:51"} |
|
{"current_steps": 448, "total_steps": 855, "loss": 0.0059, "lr": 5.45894888007353e-05, "epoch": 2.60844250363901, "percentage": 52.4, "elapsed_time": "1:29:51", "remaining_time": "1:21:38"} |
|
{"current_steps": 449, "total_steps": 855, "loss": 0.0059, "lr": 5.43860485889213e-05, "epoch": 2.6142649199417756, "percentage": 52.51, "elapsed_time": "1:30:02", "remaining_time": "1:21:24"} |
|
{"current_steps": 450, "total_steps": 855, "loss": 0.0061, "lr": 5.41825351756208e-05, "epoch": 2.6200873362445414, "percentage": 52.63, "elapsed_time": "1:30:12", "remaining_time": "1:21:11"} |
|
{"current_steps": 450, "total_steps": 855, "eval_loss": 0.006082773674279451, "epoch": 2.6200873362445414, "percentage": 52.63, "elapsed_time": "1:30:18", "remaining_time": "1:21:16"} |
|
{"current_steps": 451, "total_steps": 855, "loss": 0.0061, "lr": 5.397895195739545e-05, "epoch": 2.625909752547307, "percentage": 52.75, "elapsed_time": "1:31:18", "remaining_time": "1:21:47"} |
|
{"current_steps": 452, "total_steps": 855, "loss": 0.0059, "lr": 5.377530233197191e-05, "epoch": 2.631732168850073, "percentage": 52.87, "elapsed_time": "1:31:29", "remaining_time": "1:21:33"} |
|
{"current_steps": 453, "total_steps": 855, "loss": 0.006, "lr": 5.3571589698185146e-05, "epoch": 2.6375545851528384, "percentage": 52.98, "elapsed_time": "1:31:39", "remaining_time": "1:21:20"} |
|
{"current_steps": 454, "total_steps": 855, "loss": 0.0058, "lr": 5.33678174559217e-05, "epoch": 2.643377001455604, "percentage": 53.1, "elapsed_time": "1:31:49", "remaining_time": "1:21:06"} |
|
{"current_steps": 455, "total_steps": 855, "loss": 0.0059, "lr": 5.316398900606295e-05, "epoch": 2.6491994177583695, "percentage": 53.22, "elapsed_time": "1:32:00", "remaining_time": "1:20:52"} |
|
{"current_steps": 455, "total_steps": 855, "eval_loss": 0.006173258647322655, "epoch": 2.6491994177583695, "percentage": 53.22, "elapsed_time": "1:32:05", "remaining_time": "1:20:57"} |
|
{"current_steps": 456, "total_steps": 855, "loss": 0.006, "lr": 5.296010775042841e-05, "epoch": 2.6550218340611353, "percentage": 53.33, "elapsed_time": "1:32:16", "remaining_time": "1:20:44"} |
|
{"current_steps": 457, "total_steps": 855, "loss": 0.0059, "lr": 5.275617709171883e-05, "epoch": 2.660844250363901, "percentage": 53.45, "elapsed_time": "1:32:26", "remaining_time": "1:20:30"} |
|
{"current_steps": 458, "total_steps": 855, "loss": 0.0061, "lr": 5.255220043345955e-05, "epoch": 2.6666666666666665, "percentage": 53.57, "elapsed_time": "1:32:36", "remaining_time": "1:20:16"} |
|
{"current_steps": 459, "total_steps": 855, "loss": 0.0058, "lr": 5.234818117994355e-05, "epoch": 2.6724890829694323, "percentage": 53.68, "elapsed_time": "1:32:47", "remaining_time": "1:20:02"} |
|
{"current_steps": 460, "total_steps": 855, "loss": 0.0057, "lr": 5.214412273617478e-05, "epoch": 2.6783114992721977, "percentage": 53.8, "elapsed_time": "1:32:57", "remaining_time": "1:19:49"} |
|
{"current_steps": 460, "total_steps": 855, "eval_loss": 0.006224961020052433, "epoch": 2.6783114992721977, "percentage": 53.8, "elapsed_time": "1:33:03", "remaining_time": "1:19:54"} |
|
{"current_steps": 461, "total_steps": 855, "loss": 0.0059, "lr": 5.1940028507811225e-05, "epoch": 2.6841339155749635, "percentage": 53.92, "elapsed_time": "1:33:13", "remaining_time": "1:19:40"} |
|
{"current_steps": 462, "total_steps": 855, "loss": 0.0055, "lr": 5.173590190110808e-05, "epoch": 2.6899563318777293, "percentage": 54.04, "elapsed_time": "1:33:23", "remaining_time": "1:19:26"} |
|
{"current_steps": 463, "total_steps": 855, "loss": 0.0054, "lr": 5.153174632286097e-05, "epoch": 2.695778748180495, "percentage": 54.15, "elapsed_time": "1:33:34", "remaining_time": "1:19:13"} |
|
{"current_steps": 464, "total_steps": 855, "loss": 0.0056, "lr": 5.132756518034901e-05, "epoch": 2.7016011644832605, "percentage": 54.27, "elapsed_time": "1:33:44", "remaining_time": "1:18:59"} |
|
{"current_steps": 465, "total_steps": 855, "loss": 0.0059, "lr": 5.112336188127799e-05, "epoch": 2.7074235807860263, "percentage": 54.39, "elapsed_time": "1:33:55", "remaining_time": "1:18:46"} |
|
{"current_steps": 465, "total_steps": 855, "eval_loss": 0.006092175841331482, "epoch": 2.7074235807860263, "percentage": 54.39, "elapsed_time": "1:34:00", "remaining_time": "1:18:50"} |
|
{"current_steps": 466, "total_steps": 855, "loss": 0.0064, "lr": 5.091913983372347e-05, "epoch": 2.7132459970887917, "percentage": 54.5, "elapsed_time": "1:34:11", "remaining_time": "1:18:37"} |
|
{"current_steps": 467, "total_steps": 855, "loss": 0.0057, "lr": 5.071490244607394e-05, "epoch": 2.7190684133915575, "percentage": 54.62, "elapsed_time": "1:34:21", "remaining_time": "1:18:23"} |
|
{"current_steps": 468, "total_steps": 855, "loss": 0.0056, "lr": 5.051065312697387e-05, "epoch": 2.7248908296943233, "percentage": 54.74, "elapsed_time": "1:34:32", "remaining_time": "1:18:10"} |
|
{"current_steps": 469, "total_steps": 855, "loss": 0.0058, "lr": 5.030639528526693e-05, "epoch": 2.7307132459970886, "percentage": 54.85, "elapsed_time": "1:34:42", "remaining_time": "1:17:56"} |
|
{"current_steps": 470, "total_steps": 855, "loss": 0.0058, "lr": 5.010213232993891e-05, "epoch": 2.7365356622998545, "percentage": 54.97, "elapsed_time": "1:34:52", "remaining_time": "1:17:43"} |
|
{"current_steps": 470, "total_steps": 855, "eval_loss": 0.0061721946112811565, "epoch": 2.7365356622998545, "percentage": 54.97, "elapsed_time": "1:34:58", "remaining_time": "1:17:47"} |
|
{"current_steps": 471, "total_steps": 855, "loss": 0.0054, "lr": 4.9897867670061085e-05, "epoch": 2.74235807860262, "percentage": 55.09, "elapsed_time": "1:35:08", "remaining_time": "1:17:34"} |
|
{"current_steps": 472, "total_steps": 855, "loss": 0.006, "lr": 4.969360471473308e-05, "epoch": 2.7481804949053856, "percentage": 55.2, "elapsed_time": "1:35:19", "remaining_time": "1:17:20"} |
|
{"current_steps": 473, "total_steps": 855, "loss": 0.0056, "lr": 4.948934687302613e-05, "epoch": 2.7540029112081514, "percentage": 55.32, "elapsed_time": "1:35:29", "remaining_time": "1:17:07"} |
|
{"current_steps": 474, "total_steps": 855, "loss": 0.0059, "lr": 4.928509755392607e-05, "epoch": 2.7598253275109172, "percentage": 55.44, "elapsed_time": "1:35:40", "remaining_time": "1:16:53"} |
|
{"current_steps": 475, "total_steps": 855, "loss": 0.0057, "lr": 4.9080860166276535e-05, "epoch": 2.7656477438136826, "percentage": 55.56, "elapsed_time": "1:35:50", "remaining_time": "1:16:40"} |
|
{"current_steps": 475, "total_steps": 855, "eval_loss": 0.006066991947591305, "epoch": 2.7656477438136826, "percentage": 55.56, "elapsed_time": "1:35:56", "remaining_time": "1:16:44"} |
|
{"current_steps": 476, "total_steps": 855, "loss": 0.006, "lr": 4.887663811872201e-05, "epoch": 2.7714701601164484, "percentage": 55.67, "elapsed_time": "1:36:06", "remaining_time": "1:16:31"} |
|
{"current_steps": 477, "total_steps": 855, "loss": 0.0057, "lr": 4.8672434819651006e-05, "epoch": 2.777292576419214, "percentage": 55.79, "elapsed_time": "1:36:16", "remaining_time": "1:16:17"} |
|
{"current_steps": 478, "total_steps": 855, "loss": 0.0057, "lr": 4.846825367713904e-05, "epoch": 2.7831149927219796, "percentage": 55.91, "elapsed_time": "1:36:27", "remaining_time": "1:16:04"} |
|
{"current_steps": 479, "total_steps": 855, "loss": 0.006, "lr": 4.826409809889193e-05, "epoch": 2.7889374090247454, "percentage": 56.02, "elapsed_time": "1:36:37", "remaining_time": "1:15:51"} |
|
{"current_steps": 480, "total_steps": 855, "loss": 0.0058, "lr": 4.80599714921888e-05, "epoch": 2.7947598253275108, "percentage": 56.14, "elapsed_time": "1:36:48", "remaining_time": "1:15:37"} |
|
{"current_steps": 480, "total_steps": 855, "eval_loss": 0.006135060451924801, "epoch": 2.7947598253275108, "percentage": 56.14, "elapsed_time": "1:36:53", "remaining_time": "1:15:41"} |
|
{"current_steps": 481, "total_steps": 855, "loss": 0.0055, "lr": 4.7855877263825224e-05, "epoch": 2.8005822416302766, "percentage": 56.26, "elapsed_time": "1:37:04", "remaining_time": "1:15:28"} |
|
{"current_steps": 482, "total_steps": 855, "loss": 0.0062, "lr": 4.765181882005645e-05, "epoch": 2.806404657933042, "percentage": 56.37, "elapsed_time": "1:37:14", "remaining_time": "1:15:15"} |
|
{"current_steps": 483, "total_steps": 855, "loss": 0.0056, "lr": 4.744779956654046e-05, "epoch": 2.8122270742358078, "percentage": 56.49, "elapsed_time": "1:37:24", "remaining_time": "1:15:01"} |
|
{"current_steps": 484, "total_steps": 855, "loss": 0.0054, "lr": 4.7243822908281185e-05, "epoch": 2.8180494905385736, "percentage": 56.61, "elapsed_time": "1:37:35", "remaining_time": "1:14:48"} |
|
{"current_steps": 485, "total_steps": 855, "loss": 0.0057, "lr": 4.703989224957161e-05, "epoch": 2.8238719068413394, "percentage": 56.73, "elapsed_time": "1:37:45", "remaining_time": "1:14:34"} |
|
{"current_steps": 485, "total_steps": 855, "eval_loss": 0.006029130890965462, "epoch": 2.8238719068413394, "percentage": 56.73, "elapsed_time": "1:37:51", "remaining_time": "1:14:39"} |
|
{"current_steps": 486, "total_steps": 855, "loss": 0.0061, "lr": 4.6836010993937054e-05, "epoch": 2.8296943231441047, "percentage": 56.84, "elapsed_time": "1:38:01", "remaining_time": "1:14:25"} |
|
{"current_steps": 487, "total_steps": 855, "loss": 0.0055, "lr": 4.663218254407831e-05, "epoch": 2.8355167394468705, "percentage": 56.96, "elapsed_time": "1:38:11", "remaining_time": "1:14:12"} |
|
{"current_steps": 488, "total_steps": 855, "loss": 0.0059, "lr": 4.6428410301814866e-05, "epoch": 2.841339155749636, "percentage": 57.08, "elapsed_time": "1:38:22", "remaining_time": "1:13:58"} |
|
{"current_steps": 489, "total_steps": 855, "loss": 0.0057, "lr": 4.6224697668028095e-05, "epoch": 2.8471615720524017, "percentage": 57.19, "elapsed_time": "1:38:32", "remaining_time": "1:13:45"} |
|
{"current_steps": 490, "total_steps": 855, "loss": 0.0059, "lr": 4.602104804260456e-05, "epoch": 2.8529839883551675, "percentage": 57.31, "elapsed_time": "1:38:43", "remaining_time": "1:13:32"} |
|
{"current_steps": 490, "total_steps": 855, "eval_loss": 0.006049655843526125, "epoch": 2.8529839883551675, "percentage": 57.31, "elapsed_time": "1:38:48", "remaining_time": "1:13:36"} |
|
{"current_steps": 491, "total_steps": 855, "loss": 0.0055, "lr": 4.5817464824379195e-05, "epoch": 2.858806404657933, "percentage": 57.43, "elapsed_time": "1:38:59", "remaining_time": "1:13:22"} |
|
{"current_steps": 492, "total_steps": 855, "loss": 0.006, "lr": 4.5613951411078716e-05, "epoch": 2.8646288209606987, "percentage": 57.54, "elapsed_time": "1:39:09", "remaining_time": "1:13:09"} |
|
{"current_steps": 493, "total_steps": 855, "loss": 0.0057, "lr": 4.54105111992647e-05, "epoch": 2.870451237263464, "percentage": 57.66, "elapsed_time": "1:39:19", "remaining_time": "1:12:56"} |
|
{"current_steps": 494, "total_steps": 855, "loss": 0.0058, "lr": 4.520714758427713e-05, "epoch": 2.87627365356623, "percentage": 57.78, "elapsed_time": "1:39:30", "remaining_time": "1:12:43"} |
|
{"current_steps": 495, "total_steps": 855, "loss": 0.0058, "lr": 4.5003863960177525e-05, "epoch": 2.8820960698689957, "percentage": 57.89, "elapsed_time": "1:39:40", "remaining_time": "1:12:29"} |
|
{"current_steps": 495, "total_steps": 855, "eval_loss": 0.006072193384170532, "epoch": 2.8820960698689957, "percentage": 57.89, "elapsed_time": "1:39:46", "remaining_time": "1:12:33"} |
|
{"current_steps": 496, "total_steps": 855, "loss": 0.0057, "lr": 4.4800663719692425e-05, "epoch": 2.8879184861717615, "percentage": 58.01, "elapsed_time": "1:39:56", "remaining_time": "1:12:20"} |
|
{"current_steps": 497, "total_steps": 855, "loss": 0.0058, "lr": 4.4597550254156753e-05, "epoch": 2.893740902474527, "percentage": 58.13, "elapsed_time": "1:40:07", "remaining_time": "1:12:07"} |
|
{"current_steps": 498, "total_steps": 855, "loss": 0.006, "lr": 4.439452695345719e-05, "epoch": 2.8995633187772927, "percentage": 58.25, "elapsed_time": "1:40:17", "remaining_time": "1:11:53"} |
|
{"current_steps": 499, "total_steps": 855, "loss": 0.0059, "lr": 4.419159720597553e-05, "epoch": 2.905385735080058, "percentage": 58.36, "elapsed_time": "1:40:28", "remaining_time": "1:11:40"} |
|
{"current_steps": 500, "total_steps": 855, "loss": 0.0059, "lr": 4.398876439853227e-05, "epoch": 2.911208151382824, "percentage": 58.48, "elapsed_time": "1:40:38", "remaining_time": "1:11:27"} |
|
{"current_steps": 500, "total_steps": 855, "eval_loss": 0.006019276101142168, "epoch": 2.911208151382824, "percentage": 58.48, "elapsed_time": "1:40:44", "remaining_time": "1:11:31"} |
|
{"current_steps": 501, "total_steps": 855, "loss": 0.0058, "lr": 4.378603191632999e-05, "epoch": 2.9170305676855897, "percentage": 58.6, "elapsed_time": "1:41:43", "remaining_time": "1:11:52"} |
|
{"current_steps": 502, "total_steps": 855, "loss": 0.0057, "lr": 4.3583403142896906e-05, "epoch": 2.922852983988355, "percentage": 58.71, "elapsed_time": "1:41:53", "remaining_time": "1:11:39"} |
|
{"current_steps": 503, "total_steps": 855, "loss": 0.006, "lr": 4.338088146003033e-05, "epoch": 2.928675400291121, "percentage": 58.83, "elapsed_time": "1:42:04", "remaining_time": "1:11:25"} |
|
{"current_steps": 504, "total_steps": 855, "loss": 0.0059, "lr": 4.317847024774029e-05, "epoch": 2.934497816593886, "percentage": 58.95, "elapsed_time": "1:42:14", "remaining_time": "1:11:12"} |
|
{"current_steps": 505, "total_steps": 855, "loss": 0.0058, "lr": 4.297617288419312e-05, "epoch": 2.940320232896652, "percentage": 59.06, "elapsed_time": "1:42:24", "remaining_time": "1:10:58"} |
|
{"current_steps": 505, "total_steps": 855, "eval_loss": 0.006044932175427675, "epoch": 2.940320232896652, "percentage": 59.06, "elapsed_time": "1:42:30", "remaining_time": "1:11:02"} |
|
{"current_steps": 506, "total_steps": 855, "loss": 0.0058, "lr": 4.277399274565502e-05, "epoch": 2.946142649199418, "percentage": 59.18, "elapsed_time": "1:42:40", "remaining_time": "1:10:49"} |
|
{"current_steps": 507, "total_steps": 855, "loss": 0.0058, "lr": 4.2571933206435816e-05, "epoch": 2.9519650655021836, "percentage": 59.3, "elapsed_time": "1:42:51", "remaining_time": "1:10:35"} |
|
{"current_steps": 508, "total_steps": 855, "loss": 0.0061, "lr": 4.2369997638832514e-05, "epoch": 2.957787481804949, "percentage": 59.42, "elapsed_time": "1:43:01", "remaining_time": "1:10:22"} |
|
{"current_steps": 509, "total_steps": 855, "loss": 0.0055, "lr": 4.2168189413073124e-05, "epoch": 2.963609898107715, "percentage": 59.53, "elapsed_time": "1:43:12", "remaining_time": "1:10:09"} |
|
{"current_steps": 510, "total_steps": 855, "loss": 0.0057, "lr": 4.1966511897260316e-05, "epoch": 2.96943231441048, "percentage": 59.65, "elapsed_time": "1:43:22", "remaining_time": "1:09:55"} |
|
{"current_steps": 510, "total_steps": 855, "eval_loss": 0.006063099019229412, "epoch": 2.96943231441048, "percentage": 59.65, "elapsed_time": "1:43:28", "remaining_time": "1:09:59"} |
|
{"current_steps": 511, "total_steps": 855, "loss": 0.0057, "lr": 4.1764968457315314e-05, "epoch": 2.975254730713246, "percentage": 59.77, "elapsed_time": "1:43:38", "remaining_time": "1:09:46"} |
|
{"current_steps": 512, "total_steps": 855, "loss": 0.006, "lr": 4.1563562456921656e-05, "epoch": 2.981077147016012, "percentage": 59.88, "elapsed_time": "1:43:48", "remaining_time": "1:09:32"} |
|
{"current_steps": 513, "total_steps": 855, "loss": 0.0061, "lr": 4.1362297257469055e-05, "epoch": 2.986899563318777, "percentage": 60.0, "elapsed_time": "1:43:59", "remaining_time": "1:09:19"} |
|
{"current_steps": 514, "total_steps": 855, "loss": 0.006, "lr": 4.11611762179973e-05, "epoch": 2.992721979621543, "percentage": 60.12, "elapsed_time": "1:44:09", "remaining_time": "1:09:06"} |
|
{"current_steps": 515, "total_steps": 855, "loss": 0.0066, "lr": 4.0960202695140235e-05, "epoch": 2.9985443959243083, "percentage": 60.23, "elapsed_time": "1:44:19", "remaining_time": "1:08:52"} |
|
{"current_steps": 515, "total_steps": 855, "eval_loss": 0.006052407436072826, "epoch": 2.9985443959243083, "percentage": 60.23, "elapsed_time": "1:44:25", "remaining_time": "1:08:56"} |
|
{"current_steps": 516, "total_steps": 855, "loss": 0.0061, "lr": 4.075938004306963e-05, "epoch": 3.004366812227074, "percentage": 60.35, "elapsed_time": "1:44:35", "remaining_time": "1:08:43"} |
|
{"current_steps": 517, "total_steps": 855, "loss": 0.0056, "lr": 4.0558711613439426e-05, "epoch": 3.01018922852984, "percentage": 60.47, "elapsed_time": "1:44:46", "remaining_time": "1:08:29"} |
|
{"current_steps": 518, "total_steps": 855, "loss": 0.0053, "lr": 4.0358200755329504e-05, "epoch": 3.0160116448326058, "percentage": 60.58, "elapsed_time": "1:44:56", "remaining_time": "1:08:16"} |
|
{"current_steps": 519, "total_steps": 855, "loss": 0.0055, "lr": 4.0157850815190025e-05, "epoch": 3.021834061135371, "percentage": 60.7, "elapsed_time": "1:45:07", "remaining_time": "1:08:03"} |
|
{"current_steps": 520, "total_steps": 855, "loss": 0.0055, "lr": 3.995766513678543e-05, "epoch": 3.027656477438137, "percentage": 60.82, "elapsed_time": "1:45:17", "remaining_time": "1:07:49"} |
|
{"current_steps": 520, "total_steps": 855, "eval_loss": 0.005997630301862955, "epoch": 3.027656477438137, "percentage": 60.82, "elapsed_time": "1:45:23", "remaining_time": "1:07:53"} |
|
{"current_steps": 521, "total_steps": 855, "loss": 0.0055, "lr": 3.975764706113872e-05, "epoch": 3.0334788937409023, "percentage": 60.94, "elapsed_time": "1:45:33", "remaining_time": "1:07:40"} |
|
{"current_steps": 522, "total_steps": 855, "loss": 0.0055, "lr": 3.95577999264757e-05, "epoch": 3.039301310043668, "percentage": 61.05, "elapsed_time": "1:45:43", "remaining_time": "1:07:26"} |
|
{"current_steps": 523, "total_steps": 855, "loss": 0.0056, "lr": 3.935812706816922e-05, "epoch": 3.045123726346434, "percentage": 61.17, "elapsed_time": "1:45:53", "remaining_time": "1:07:13"} |
|
{"current_steps": 524, "total_steps": 855, "loss": 0.0053, "lr": 3.9158631818683466e-05, "epoch": 3.0509461426491993, "percentage": 61.29, "elapsed_time": "1:46:04", "remaining_time": "1:07:00"} |
|
{"current_steps": 525, "total_steps": 855, "loss": 0.005, "lr": 3.895931750751847e-05, "epoch": 3.056768558951965, "percentage": 61.4, "elapsed_time": "1:46:14", "remaining_time": "1:06:47"} |
|
{"current_steps": 525, "total_steps": 855, "eval_loss": 0.005964680574834347, "epoch": 3.056768558951965, "percentage": 61.4, "elapsed_time": "1:46:20", "remaining_time": "1:06:50"} |
|
{"current_steps": 526, "total_steps": 855, "loss": 0.0052, "lr": 3.876018746115444e-05, "epoch": 3.062590975254731, "percentage": 61.52, "elapsed_time": "1:46:31", "remaining_time": "1:06:37"} |
|
{"current_steps": 527, "total_steps": 855, "loss": 0.0053, "lr": 3.85612450029963e-05, "epoch": 3.0684133915574963, "percentage": 61.64, "elapsed_time": "1:46:41", "remaining_time": "1:06:24"} |
|
{"current_steps": 528, "total_steps": 855, "loss": 0.005, "lr": 3.836249345331816e-05, "epoch": 3.074235807860262, "percentage": 61.75, "elapsed_time": "1:46:51", "remaining_time": "1:06:10"} |
|
{"current_steps": 529, "total_steps": 855, "loss": 0.0057, "lr": 3.8163936129207965e-05, "epoch": 3.080058224163028, "percentage": 61.87, "elapsed_time": "1:47:01", "remaining_time": "1:05:57"} |
|
{"current_steps": 530, "total_steps": 855, "loss": 0.0055, "lr": 3.7965576344512114e-05, "epoch": 3.0858806404657932, "percentage": 61.99, "elapsed_time": "1:47:12", "remaining_time": "1:05:44"} |
|
{"current_steps": 530, "total_steps": 855, "eval_loss": 0.005973320920020342, "epoch": 3.0858806404657932, "percentage": 61.99, "elapsed_time": "1:47:17", "remaining_time": "1:05:47"} |
|
{"current_steps": 531, "total_steps": 855, "loss": 0.0052, "lr": 3.776741740978011e-05, "epoch": 3.091703056768559, "percentage": 62.11, "elapsed_time": "1:47:28", "remaining_time": "1:05:34"} |
|
{"current_steps": 532, "total_steps": 855, "loss": 0.0054, "lr": 3.756946263220941e-05, "epoch": 3.0975254730713244, "percentage": 62.22, "elapsed_time": "1:47:39", "remaining_time": "1:05:21"} |
|
{"current_steps": 533, "total_steps": 855, "loss": 0.0052, "lr": 3.737171531559011e-05, "epoch": 3.1033478893740902, "percentage": 62.34, "elapsed_time": "1:47:49", "remaining_time": "1:05:08"} |
|
{"current_steps": 534, "total_steps": 855, "loss": 0.0056, "lr": 3.71741787602499e-05, "epoch": 3.109170305676856, "percentage": 62.46, "elapsed_time": "1:48:00", "remaining_time": "1:04:55"} |
|
{"current_steps": 535, "total_steps": 855, "loss": 0.0054, "lr": 3.697685626299889e-05, "epoch": 3.1149927219796214, "percentage": 62.57, "elapsed_time": "1:48:10", "remaining_time": "1:04:42"} |
|
{"current_steps": 535, "total_steps": 855, "eval_loss": 0.0059963371604681015, "epoch": 3.1149927219796214, "percentage": 62.57, "elapsed_time": "1:48:16", "remaining_time": "1:04:45"} |
|
{"current_steps": 536, "total_steps": 855, "loss": 0.0053, "lr": 3.6779751117074694e-05, "epoch": 3.120815138282387, "percentage": 62.69, "elapsed_time": "1:48:26", "remaining_time": "1:04:32"} |
|
{"current_steps": 537, "total_steps": 855, "loss": 0.0055, "lr": 3.658286661208741e-05, "epoch": 3.126637554585153, "percentage": 62.81, "elapsed_time": "1:48:36", "remaining_time": "1:04:19"} |
|
{"current_steps": 538, "total_steps": 855, "loss": 0.0055, "lr": 3.638620603396472e-05, "epoch": 3.1324599708879184, "percentage": 62.92, "elapsed_time": "1:48:47", "remaining_time": "1:04:06"} |
|
{"current_steps": 539, "total_steps": 855, "loss": 0.0055, "lr": 3.6189772664897005e-05, "epoch": 3.138282387190684, "percentage": 63.04, "elapsed_time": "1:48:57", "remaining_time": "1:03:52"} |
|
{"current_steps": 540, "total_steps": 855, "loss": 0.0055, "lr": 3.599356978328269e-05, "epoch": 3.14410480349345, "percentage": 63.16, "elapsed_time": "1:49:08", "remaining_time": "1:03:39"} |
|
{"current_steps": 540, "total_steps": 855, "eval_loss": 0.006012990139424801, "epoch": 3.14410480349345, "percentage": 63.16, "elapsed_time": "1:49:13", "remaining_time": "1:03:43"} |
|
{"current_steps": 541, "total_steps": 855, "loss": 0.0056, "lr": 3.5797600663673344e-05, "epoch": 3.1499272197962154, "percentage": 63.27, "elapsed_time": "1:49:24", "remaining_time": "1:03:30"} |
|
{"current_steps": 542, "total_steps": 855, "loss": 0.0052, "lr": 3.56018685767193e-05, "epoch": 3.155749636098981, "percentage": 63.39, "elapsed_time": "1:49:34", "remaining_time": "1:03:16"} |
|
{"current_steps": 543, "total_steps": 855, "loss": 0.0053, "lr": 3.540637678911475e-05, "epoch": 3.1615720524017465, "percentage": 63.51, "elapsed_time": "1:49:45", "remaining_time": "1:03:03"} |
|
{"current_steps": 544, "total_steps": 855, "loss": 0.0053, "lr": 3.521112856354346e-05, "epoch": 3.1673944687045124, "percentage": 63.63, "elapsed_time": "1:49:55", "remaining_time": "1:02:50"} |
|
{"current_steps": 545, "total_steps": 855, "loss": 0.0056, "lr": 3.5016127158624205e-05, "epoch": 3.173216885007278, "percentage": 63.74, "elapsed_time": "1:50:06", "remaining_time": "1:02:37"} |
|
{"current_steps": 545, "total_steps": 855, "eval_loss": 0.006045662332326174, "epoch": 3.173216885007278, "percentage": 63.74, "elapsed_time": "1:50:11", "remaining_time": "1:02:40"} |
|
{"current_steps": 546, "total_steps": 855, "loss": 0.0054, "lr": 3.482137582885644e-05, "epoch": 3.1790393013100435, "percentage": 63.86, "elapsed_time": "1:50:22", "remaining_time": "1:02:27"} |
|
{"current_steps": 547, "total_steps": 855, "loss": 0.0053, "lr": 3.462687782456596e-05, "epoch": 3.1848617176128093, "percentage": 63.98, "elapsed_time": "1:50:32", "remaining_time": "1:02:14"} |
|
{"current_steps": 548, "total_steps": 855, "loss": 0.0052, "lr": 3.443263639185065e-05, "epoch": 3.190684133915575, "percentage": 64.09, "elapsed_time": "1:50:42", "remaining_time": "1:02:01"} |
|
{"current_steps": 549, "total_steps": 855, "loss": 0.0055, "lr": 3.4238654772526305e-05, "epoch": 3.1965065502183405, "percentage": 64.21, "elapsed_time": "1:50:53", "remaining_time": "1:01:48"} |
|
{"current_steps": 550, "total_steps": 855, "loss": 0.0057, "lr": 3.404493620407252e-05, "epoch": 3.2023289665211063, "percentage": 64.33, "elapsed_time": "1:51:03", "remaining_time": "1:01:35"} |
|
{"current_steps": 550, "total_steps": 855, "eval_loss": 0.006035549100488424, "epoch": 3.2023289665211063, "percentage": 64.33, "elapsed_time": "1:51:09", "remaining_time": "1:01:38"} |
|
{"current_steps": 551, "total_steps": 855, "loss": 0.0051, "lr": 3.385148391957869e-05, "epoch": 3.208151382823872, "percentage": 64.44, "elapsed_time": "1:51:45", "remaining_time": "1:01:39"} |
|
{"current_steps": 552, "total_steps": 855, "loss": 0.0053, "lr": 3.3658301147690066e-05, "epoch": 3.2139737991266375, "percentage": 64.56, "elapsed_time": "1:51:56", "remaining_time": "1:01:26"} |
|
{"current_steps": 553, "total_steps": 855, "loss": 0.0057, "lr": 3.346539111255377e-05, "epoch": 3.2197962154294033, "percentage": 64.68, "elapsed_time": "1:52:06", "remaining_time": "1:01:13"} |
|
{"current_steps": 554, "total_steps": 855, "loss": 0.0055, "lr": 3.3272757033765085e-05, "epoch": 3.2256186317321687, "percentage": 64.8, "elapsed_time": "1:52:16", "remaining_time": "1:01:00"} |
|
{"current_steps": 555, "total_steps": 855, "loss": 0.0058, "lr": 3.3080402126313695e-05, "epoch": 3.2314410480349345, "percentage": 64.91, "elapsed_time": "1:52:27", "remaining_time": "1:00:47"} |
|
{"current_steps": 555, "total_steps": 855, "eval_loss": 0.006002995651215315, "epoch": 3.2314410480349345, "percentage": 64.91, "elapsed_time": "1:52:32", "remaining_time": "1:00:50"} |
|
{"current_steps": 556, "total_steps": 855, "loss": 0.0054, "lr": 3.2888329600529975e-05, "epoch": 3.2372634643377003, "percentage": 65.03, "elapsed_time": "1:52:42", "remaining_time": "1:00:36"} |
|
{"current_steps": 557, "total_steps": 855, "loss": 0.0053, "lr": 3.269654266203153e-05, "epoch": 3.2430858806404657, "percentage": 65.15, "elapsed_time": "1:52:53", "remaining_time": "1:00:23"} |
|
{"current_steps": 558, "total_steps": 855, "loss": 0.0054, "lr": 3.250504451166956e-05, "epoch": 3.2489082969432315, "percentage": 65.26, "elapsed_time": "1:53:03", "remaining_time": "1:00:10"} |
|
{"current_steps": 559, "total_steps": 855, "loss": 0.0053, "lr": 3.2313838345475547e-05, "epoch": 3.2547307132459973, "percentage": 65.38, "elapsed_time": "1:53:13", "remaining_time": "0:59:57"} |
|
{"current_steps": 560, "total_steps": 855, "loss": 0.0052, "lr": 3.212292735460781e-05, "epoch": 3.2605531295487626, "percentage": 65.5, "elapsed_time": "1:53:24", "remaining_time": "0:59:44"} |
|
{"current_steps": 560, "total_steps": 855, "eval_loss": 0.00597412558272481, "epoch": 3.2605531295487626, "percentage": 65.5, "elapsed_time": "1:53:29", "remaining_time": "0:59:47"} |
|
{"current_steps": 561, "total_steps": 855, "loss": 0.0055, "lr": 3.1932314725298345e-05, "epoch": 3.2663755458515285, "percentage": 65.61, "elapsed_time": "1:53:40", "remaining_time": "0:59:34"} |
|
{"current_steps": 562, "total_steps": 855, "loss": 0.005, "lr": 3.1742003638799625e-05, "epoch": 3.2721979621542943, "percentage": 65.73, "elapsed_time": "1:53:50", "remaining_time": "0:59:21"} |
|
{"current_steps": 563, "total_steps": 855, "loss": 0.0054, "lr": 3.1551997271331444e-05, "epoch": 3.2780203784570596, "percentage": 65.85, "elapsed_time": "1:54:01", "remaining_time": "0:59:08"} |
|
{"current_steps": 564, "total_steps": 855, "loss": 0.0054, "lr": 3.136229879402798e-05, "epoch": 3.2838427947598254, "percentage": 65.96, "elapsed_time": "1:54:11", "remaining_time": "0:58:55"} |
|
{"current_steps": 565, "total_steps": 855, "loss": 0.0058, "lr": 3.1172911372884806e-05, "epoch": 3.289665211062591, "percentage": 66.08, "elapsed_time": "1:54:22", "remaining_time": "0:58:42"} |
|
{"current_steps": 565, "total_steps": 855, "eval_loss": 0.005954680498689413, "epoch": 3.289665211062591, "percentage": 66.08, "elapsed_time": "1:54:27", "remaining_time": "0:58:45"} |
|
{"current_steps": 566, "total_steps": 855, "loss": 0.0051, "lr": 3.0983838168706124e-05, "epoch": 3.2954876273653566, "percentage": 66.2, "elapsed_time": "1:54:38", "remaining_time": "0:58:32"} |
|
{"current_steps": 567, "total_steps": 855, "loss": 0.0051, "lr": 3.0795082337051984e-05, "epoch": 3.3013100436681224, "percentage": 66.32, "elapsed_time": "1:54:48", "remaining_time": "0:58:18"} |
|
{"current_steps": 568, "total_steps": 855, "loss": 0.0052, "lr": 3.060664702818555e-05, "epoch": 3.307132459970888, "percentage": 66.43, "elapsed_time": "1:54:58", "remaining_time": "0:58:05"} |
|
{"current_steps": 569, "total_steps": 855, "loss": 0.0056, "lr": 3.0418535387020642e-05, "epoch": 3.3129548762736536, "percentage": 66.55, "elapsed_time": "1:55:09", "remaining_time": "0:57:52"} |
|
{"current_steps": 570, "total_steps": 855, "loss": 0.0051, "lr": 3.0230750553069155e-05, "epoch": 3.3187772925764194, "percentage": 66.67, "elapsed_time": "1:55:20", "remaining_time": "0:57:40"} |
|
{"current_steps": 570, "total_steps": 855, "eval_loss": 0.005825328174978495, "epoch": 3.3187772925764194, "percentage": 66.67, "elapsed_time": "1:55:25", "remaining_time": "0:57:42"} |
|
{"current_steps": 571, "total_steps": 855, "loss": 0.0054, "lr": 3.00432956603887e-05, "epoch": 3.3245997088791848, "percentage": 66.78, "elapsed_time": "1:55:36", "remaining_time": "0:57:29"} |
|
{"current_steps": 572, "total_steps": 855, "loss": 0.0054, "lr": 2.9856173837530288e-05, "epoch": 3.3304221251819506, "percentage": 66.9, "elapsed_time": "1:55:46", "remaining_time": "0:57:16"} |
|
{"current_steps": 573, "total_steps": 855, "loss": 0.0055, "lr": 2.966938820748616e-05, "epoch": 3.3362445414847164, "percentage": 67.02, "elapsed_time": "1:55:57", "remaining_time": "0:57:03"} |
|
{"current_steps": 574, "total_steps": 855, "loss": 0.0052, "lr": 2.9482941887637593e-05, "epoch": 3.3420669577874818, "percentage": 67.13, "elapsed_time": "1:56:07", "remaining_time": "0:56:50"} |
|
{"current_steps": 575, "total_steps": 855, "loss": 0.0051, "lr": 2.9296837989702896e-05, "epoch": 3.3478893740902476, "percentage": 67.25, "elapsed_time": "1:56:17", "remaining_time": "0:56:37"} |
|
{"current_steps": 575, "total_steps": 855, "eval_loss": 0.005916123278439045, "epoch": 3.3478893740902476, "percentage": 67.25, "elapsed_time": "1:56:23", "remaining_time": "0:56:40"} |
|
{"current_steps": 576, "total_steps": 855, "loss": 0.0053, "lr": 2.9111079619685522e-05, "epoch": 3.353711790393013, "percentage": 67.37, "elapsed_time": "1:56:34", "remaining_time": "0:56:27"} |
|
{"current_steps": 577, "total_steps": 855, "loss": 0.0049, "lr": 2.8925669877822132e-05, "epoch": 3.3595342066957787, "percentage": 67.49, "elapsed_time": "1:56:44", "remaining_time": "0:56:14"} |
|
{"current_steps": 578, "total_steps": 855, "loss": 0.0053, "lr": 2.8740611858530987e-05, "epoch": 3.3653566229985445, "percentage": 67.6, "elapsed_time": "1:56:54", "remaining_time": "0:56:01"} |
|
{"current_steps": 579, "total_steps": 855, "loss": 0.0053, "lr": 2.855590865036022e-05, "epoch": 3.37117903930131, "percentage": 67.72, "elapsed_time": "1:57:04", "remaining_time": "0:55:48"} |
|
{"current_steps": 580, "total_steps": 855, "loss": 0.0053, "lr": 2.8371563335936252e-05, "epoch": 3.3770014556040757, "percentage": 67.84, "elapsed_time": "1:57:15", "remaining_time": "0:55:35"} |
|
{"current_steps": 580, "total_steps": 855, "eval_loss": 0.0059220860712230206, "epoch": 3.3770014556040757, "percentage": 67.84, "elapsed_time": "1:57:21", "remaining_time": "0:55:38"} |
|
{"current_steps": 581, "total_steps": 855, "loss": 0.0053, "lr": 2.8187578991912438e-05, "epoch": 3.3828238719068415, "percentage": 67.95, "elapsed_time": "1:57:31", "remaining_time": "0:55:25"} |
|
{"current_steps": 582, "total_steps": 855, "loss": 0.0055, "lr": 2.8003958688917615e-05, "epoch": 3.388646288209607, "percentage": 68.07, "elapsed_time": "1:57:41", "remaining_time": "0:55:12"} |
|
{"current_steps": 583, "total_steps": 855, "loss": 0.0054, "lr": 2.7820705491505026e-05, "epoch": 3.3944687045123727, "percentage": 68.19, "elapsed_time": "1:57:52", "remaining_time": "0:54:59"} |
|
{"current_steps": 584, "total_steps": 855, "loss": 0.0051, "lr": 2.7637822458100976e-05, "epoch": 3.4002911208151385, "percentage": 68.3, "elapsed_time": "1:58:02", "remaining_time": "0:54:46"} |
|
{"current_steps": 585, "total_steps": 855, "loss": 0.0053, "lr": 2.7455312640953874e-05, "epoch": 3.406113537117904, "percentage": 68.42, "elapsed_time": "1:58:12", "remaining_time": "0:54:33"} |
|
{"current_steps": 585, "total_steps": 855, "eval_loss": 0.005873468238860369, "epoch": 3.406113537117904, "percentage": 68.42, "elapsed_time": "1:58:18", "remaining_time": "0:54:36"} |
|
{"current_steps": 586, "total_steps": 855, "loss": 0.0051, "lr": 2.727317908608329e-05, "epoch": 3.4119359534206697, "percentage": 68.54, "elapsed_time": "1:58:28", "remaining_time": "0:54:23"} |
|
{"current_steps": 587, "total_steps": 855, "loss": 0.005, "lr": 2.7091424833229158e-05, "epoch": 3.417758369723435, "percentage": 68.65, "elapsed_time": "1:58:39", "remaining_time": "0:54:10"} |
|
{"current_steps": 588, "total_steps": 855, "loss": 0.0054, "lr": 2.6910052915801005e-05, "epoch": 3.423580786026201, "percentage": 68.77, "elapsed_time": "1:58:49", "remaining_time": "0:53:57"} |
|
{"current_steps": 589, "total_steps": 855, "loss": 0.0051, "lr": 2.6729066360827282e-05, "epoch": 3.4294032023289667, "percentage": 68.89, "elapsed_time": "1:58:59", "remaining_time": "0:53:44"} |
|
{"current_steps": 590, "total_steps": 855, "loss": 0.0055, "lr": 2.654846818890489e-05, "epoch": 3.435225618631732, "percentage": 69.01, "elapsed_time": "1:59:10", "remaining_time": "0:53:31"} |
|
{"current_steps": 590, "total_steps": 855, "eval_loss": 0.0058377580717206, "epoch": 3.435225618631732, "percentage": 69.01, "elapsed_time": "1:59:15", "remaining_time": "0:53:33"} |
|
{"current_steps": 591, "total_steps": 855, "loss": 0.0054, "lr": 2.636826141414882e-05, "epoch": 3.441048034934498, "percentage": 69.12, "elapsed_time": "1:59:26", "remaining_time": "0:53:21"} |
|
{"current_steps": 592, "total_steps": 855, "loss": 0.0055, "lr": 2.618844904414173e-05, "epoch": 3.4468704512372637, "percentage": 69.24, "elapsed_time": "1:59:36", "remaining_time": "0:53:08"} |
|
{"current_steps": 593, "total_steps": 855, "loss": 0.005, "lr": 2.600903407988386e-05, "epoch": 3.452692867540029, "percentage": 69.36, "elapsed_time": "1:59:47", "remaining_time": "0:52:55"} |
|
{"current_steps": 594, "total_steps": 855, "loss": 0.0052, "lr": 2.5830019515742844e-05, "epoch": 3.458515283842795, "percentage": 69.47, "elapsed_time": "1:59:57", "remaining_time": "0:52:42"} |
|
{"current_steps": 595, "total_steps": 855, "loss": 0.0051, "lr": 2.565140833940387e-05, "epoch": 3.4643377001455606, "percentage": 69.59, "elapsed_time": "2:00:08", "remaining_time": "0:52:29"} |
|
{"current_steps": 595, "total_steps": 855, "eval_loss": 0.005910491105169058, "epoch": 3.4643377001455606, "percentage": 69.59, "elapsed_time": "2:00:13", "remaining_time": "0:52:32"} |
|
{"current_steps": 596, "total_steps": 855, "loss": 0.0055, "lr": 2.5473203531819655e-05, "epoch": 3.470160116448326, "percentage": 69.71, "elapsed_time": "2:00:24", "remaining_time": "0:52:19"} |
|
{"current_steps": 597, "total_steps": 855, "loss": 0.0054, "lr": 2.529540806716081e-05, "epoch": 3.475982532751092, "percentage": 69.82, "elapsed_time": "2:00:34", "remaining_time": "0:52:06"} |
|
{"current_steps": 598, "total_steps": 855, "loss": 0.0053, "lr": 2.5118024912766175e-05, "epoch": 3.481804949053857, "percentage": 69.94, "elapsed_time": "2:00:44", "remaining_time": "0:51:53"} |
|
{"current_steps": 599, "total_steps": 855, "loss": 0.0052, "lr": 2.4941057029093308e-05, "epoch": 3.487627365356623, "percentage": 70.06, "elapsed_time": "2:00:55", "remaining_time": "0:51:40"} |
|
{"current_steps": 600, "total_steps": 855, "loss": 0.0051, "lr": 2.4764507369669e-05, "epoch": 3.493449781659389, "percentage": 70.18, "elapsed_time": "2:01:05", "remaining_time": "0:51:27"} |
|
{"current_steps": 600, "total_steps": 855, "eval_loss": 0.005931612569838762, "epoch": 3.493449781659389, "percentage": 70.18, "elapsed_time": "2:01:11", "remaining_time": "0:51:30"} |
|
{"current_steps": 601, "total_steps": 855, "loss": 0.0053, "lr": 2.4588378881040063e-05, "epoch": 3.499272197962154, "percentage": 70.29, "elapsed_time": "2:01:46", "remaining_time": "0:51:28"} |
|
{"current_steps": 602, "total_steps": 855, "loss": 0.0054, "lr": 2.4412674502724144e-05, "epoch": 3.50509461426492, "percentage": 70.41, "elapsed_time": "2:01:57", "remaining_time": "0:51:15"} |
|
{"current_steps": 603, "total_steps": 855, "loss": 0.0053, "lr": 2.4237397167160652e-05, "epoch": 3.5109170305676853, "percentage": 70.53, "elapsed_time": "2:02:07", "remaining_time": "0:51:02"} |
|
{"current_steps": 604, "total_steps": 855, "loss": 0.0055, "lr": 2.40625497996618e-05, "epoch": 3.516739446870451, "percentage": 70.64, "elapsed_time": "2:02:18", "remaining_time": "0:50:49"} |
|
{"current_steps": 605, "total_steps": 855, "loss": 0.0055, "lr": 2.3888135318363762e-05, "epoch": 3.522561863173217, "percentage": 70.76, "elapsed_time": "2:02:28", "remaining_time": "0:50:36"} |
|
{"current_steps": 605, "total_steps": 855, "eval_loss": 0.00587079394608736, "epoch": 3.522561863173217, "percentage": 70.76, "elapsed_time": "2:02:33", "remaining_time": "0:50:38"} |
|
{"current_steps": 606, "total_steps": 855, "loss": 0.0053, "lr": 2.371415663417809e-05, "epoch": 3.5283842794759828, "percentage": 70.88, "elapsed_time": "2:02:44", "remaining_time": "0:50:25"} |
|
{"current_steps": 607, "total_steps": 855, "loss": 0.0053, "lr": 2.3540616650742965e-05, "epoch": 3.534206695778748, "percentage": 70.99, "elapsed_time": "2:02:54", "remaining_time": "0:50:12"} |
|
{"current_steps": 608, "total_steps": 855, "loss": 0.0052, "lr": 2.3367518264374882e-05, "epoch": 3.540029112081514, "percentage": 71.11, "elapsed_time": "2:03:04", "remaining_time": "0:50:00"} |
|
{"current_steps": 609, "total_steps": 855, "loss": 0.0049, "lr": 2.319486436402019e-05, "epoch": 3.5458515283842793, "percentage": 71.23, "elapsed_time": "2:03:15", "remaining_time": "0:49:47"} |
|
{"current_steps": 610, "total_steps": 855, "loss": 0.0055, "lr": 2.3022657831207002e-05, "epoch": 3.551673944687045, "percentage": 71.35, "elapsed_time": "2:03:25", "remaining_time": "0:49:34"} |
|
{"current_steps": 610, "total_steps": 855, "eval_loss": 0.005807011388242245, "epoch": 3.551673944687045, "percentage": 71.35, "elapsed_time": "2:03:31", "remaining_time": "0:49:36"} |
|
{"current_steps": 611, "total_steps": 855, "loss": 0.0054, "lr": 2.2850901539996973e-05, "epoch": 3.557496360989811, "percentage": 71.46, "elapsed_time": "2:03:41", "remaining_time": "0:49:23"} |
|
{"current_steps": 612, "total_steps": 855, "loss": 0.005, "lr": 2.2679598356937414e-05, "epoch": 3.5633187772925763, "percentage": 71.58, "elapsed_time": "2:03:51", "remaining_time": "0:49:10"} |
|
{"current_steps": 613, "total_steps": 855, "loss": 0.0052, "lr": 2.2508751141013462e-05, "epoch": 3.569141193595342, "percentage": 71.7, "elapsed_time": "2:04:02", "remaining_time": "0:48:58"} |
|
{"current_steps": 614, "total_steps": 855, "loss": 0.0052, "lr": 2.2338362743600326e-05, "epoch": 3.5749636098981075, "percentage": 71.81, "elapsed_time": "2:04:12", "remaining_time": "0:48:45"} |
|
{"current_steps": 615, "total_steps": 855, "loss": 0.0055, "lr": 2.2168436008415687e-05, "epoch": 3.5807860262008733, "percentage": 71.93, "elapsed_time": "2:04:22", "remaining_time": "0:48:32"} |
|
{"current_steps": 615, "total_steps": 855, "eval_loss": 0.005797410383820534, "epoch": 3.5807860262008733, "percentage": 71.93, "elapsed_time": "2:04:28", "remaining_time": "0:48:34"} |
|
{"current_steps": 616, "total_steps": 855, "loss": 0.0053, "lr": 2.199897377147225e-05, "epoch": 3.586608442503639, "percentage": 72.05, "elapsed_time": "2:04:39", "remaining_time": "0:48:21"} |
|
{"current_steps": 617, "total_steps": 855, "loss": 0.0054, "lr": 2.182997886103046e-05, "epoch": 3.592430858806405, "percentage": 72.16, "elapsed_time": "2:04:49", "remaining_time": "0:48:08"} |
|
{"current_steps": 618, "total_steps": 855, "loss": 0.0053, "lr": 2.166145409755125e-05, "epoch": 3.5982532751091703, "percentage": 72.28, "elapsed_time": "2:04:59", "remaining_time": "0:47:56"} |
|
{"current_steps": 619, "total_steps": 855, "loss": 0.0054, "lr": 2.149340229364896e-05, "epoch": 3.604075691411936, "percentage": 72.4, "elapsed_time": "2:05:10", "remaining_time": "0:47:43"} |
|
{"current_steps": 620, "total_steps": 855, "loss": 0.0051, "lr": 2.13258262540444e-05, "epoch": 3.6098981077147014, "percentage": 72.51, "elapsed_time": "2:05:20", "remaining_time": "0:47:30"} |
|
{"current_steps": 620, "total_steps": 855, "eval_loss": 0.005762726999819279, "epoch": 3.6098981077147014, "percentage": 72.51, "elapsed_time": "2:05:26", "remaining_time": "0:47:32"} |
|
{"current_steps": 621, "total_steps": 855, "loss": 0.0051, "lr": 2.1158728775518123e-05, "epoch": 3.6157205240174672, "percentage": 72.63, "elapsed_time": "2:05:36", "remaining_time": "0:47:19"} |
|
{"current_steps": 622, "total_steps": 855, "loss": 0.0051, "lr": 2.0992112646863583e-05, "epoch": 3.621542940320233, "percentage": 72.75, "elapsed_time": "2:05:46", "remaining_time": "0:47:07"} |
|
{"current_steps": 623, "total_steps": 855, "loss": 0.0048, "lr": 2.0825980648840786e-05, "epoch": 3.6273653566229984, "percentage": 72.87, "elapsed_time": "2:05:57", "remaining_time": "0:46:54"} |
|
{"current_steps": 624, "total_steps": 855, "loss": 0.0054, "lr": 2.0660335554129695e-05, "epoch": 3.6331877729257642, "percentage": 72.98, "elapsed_time": "2:06:07", "remaining_time": "0:46:41"} |
|
{"current_steps": 625, "total_steps": 855, "loss": 0.0054, "lr": 2.0495180127284107e-05, "epoch": 3.6390101892285296, "percentage": 73.1, "elapsed_time": "2:06:17", "remaining_time": "0:46:28"} |
|
{"current_steps": 625, "total_steps": 855, "eval_loss": 0.005716984160244465, "epoch": 3.6390101892285296, "percentage": 73.1, "elapsed_time": "2:06:23", "remaining_time": "0:46:30"} |
|
{"current_steps": 626, "total_steps": 855, "loss": 0.005, "lr": 2.0330517124685416e-05, "epoch": 3.6448326055312954, "percentage": 73.22, "elapsed_time": "2:06:34", "remaining_time": "0:46:18"} |
|
{"current_steps": 627, "total_steps": 855, "loss": 0.0053, "lr": 2.0166349294496623e-05, "epoch": 3.650655021834061, "percentage": 73.33, "elapsed_time": "2:06:44", "remaining_time": "0:46:05"} |
|
{"current_steps": 628, "total_steps": 855, "loss": 0.0052, "lr": 2.0002679376616534e-05, "epoch": 3.656477438136827, "percentage": 73.45, "elapsed_time": "2:06:54", "remaining_time": "0:45:52"} |
|
{"current_steps": 629, "total_steps": 855, "loss": 0.0053, "lr": 1.9839510102633985e-05, "epoch": 3.6622998544395924, "percentage": 73.57, "elapsed_time": "2:07:05", "remaining_time": "0:45:39"} |
|
{"current_steps": 630, "total_steps": 855, "loss": 0.0053, "lr": 1.9676844195782218e-05, "epoch": 3.668122270742358, "percentage": 73.68, "elapsed_time": "2:07:15", "remaining_time": "0:45:26"} |
|
{"current_steps": 630, "total_steps": 855, "eval_loss": 0.005713089369237423, "epoch": 3.668122270742358, "percentage": 73.68, "elapsed_time": "2:07:21", "remaining_time": "0:45:28"} |
|
{"current_steps": 631, "total_steps": 855, "loss": 0.0054, "lr": 1.9514684370893465e-05, "epoch": 3.6739446870451236, "percentage": 73.8, "elapsed_time": "2:07:31", "remaining_time": "0:45:16"} |
|
{"current_steps": 632, "total_steps": 855, "loss": 0.0054, "lr": 1.93530333343537e-05, "epoch": 3.6797671033478894, "percentage": 73.92, "elapsed_time": "2:07:41", "remaining_time": "0:45:03"} |
|
{"current_steps": 633, "total_steps": 855, "loss": 0.0055, "lr": 1.9191893784057375e-05, "epoch": 3.685589519650655, "percentage": 74.04, "elapsed_time": "2:07:52", "remaining_time": "0:44:50"} |
|
{"current_steps": 634, "total_steps": 855, "loss": 0.0053, "lr": 1.903126840936243e-05, "epoch": 3.6914119359534205, "percentage": 74.15, "elapsed_time": "2:08:02", "remaining_time": "0:44:38"} |
|
{"current_steps": 635, "total_steps": 855, "loss": 0.0052, "lr": 1.8871159891045393e-05, "epoch": 3.6972343522561864, "percentage": 74.27, "elapsed_time": "2:08:13", "remaining_time": "0:44:25"} |
|
{"current_steps": 635, "total_steps": 855, "eval_loss": 0.005719096399843693, "epoch": 3.6972343522561864, "percentage": 74.27, "elapsed_time": "2:08:18", "remaining_time": "0:44:27"} |
|
{"current_steps": 636, "total_steps": 855, "loss": 0.0052, "lr": 1.871157090125671e-05, "epoch": 3.7030567685589517, "percentage": 74.39, "elapsed_time": "2:08:29", "remaining_time": "0:44:14"} |
|
{"current_steps": 637, "total_steps": 855, "loss": 0.0052, "lr": 1.8552504103476015e-05, "epoch": 3.7088791848617175, "percentage": 74.5, "elapsed_time": "2:08:39", "remaining_time": "0:44:01"} |
|
{"current_steps": 638, "total_steps": 855, "loss": 0.0052, "lr": 1.8393962152467848e-05, "epoch": 3.7147016011644833, "percentage": 74.62, "elapsed_time": "2:08:50", "remaining_time": "0:43:49"} |
|
{"current_steps": 639, "total_steps": 855, "loss": 0.0052, "lr": 1.823594769423716e-05, "epoch": 3.720524017467249, "percentage": 74.74, "elapsed_time": "2:09:00", "remaining_time": "0:43:36"} |
|
{"current_steps": 640, "total_steps": 855, "loss": 0.0052, "lr": 1.807846336598533e-05, "epoch": 3.7263464337700145, "percentage": 74.85, "elapsed_time": "2:09:10", "remaining_time": "0:43:23"} |
|
{"current_steps": 640, "total_steps": 855, "eval_loss": 0.005699502769857645, "epoch": 3.7263464337700145, "percentage": 74.85, "elapsed_time": "2:09:16", "remaining_time": "0:43:25"} |
|
{"current_steps": 641, "total_steps": 855, "loss": 0.0052, "lr": 1.792151179606602e-05, "epoch": 3.7321688500727803, "percentage": 74.97, "elapsed_time": "2:09:26", "remaining_time": "0:43:12"} |
|
{"current_steps": 642, "total_steps": 855, "loss": 0.0048, "lr": 1.7765095603941352e-05, "epoch": 3.7379912663755457, "percentage": 75.09, "elapsed_time": "2:09:37", "remaining_time": "0:43:00"} |
|
{"current_steps": 643, "total_steps": 855, "loss": 0.0048, "lr": 1.760921740013823e-05, "epoch": 3.7438136826783115, "percentage": 75.2, "elapsed_time": "2:09:47", "remaining_time": "0:42:47"} |
|
{"current_steps": 644, "total_steps": 855, "loss": 0.0052, "lr": 1.7453879786204735e-05, "epoch": 3.7496360989810773, "percentage": 75.32, "elapsed_time": "2:09:57", "remaining_time": "0:42:34"} |
|
{"current_steps": 645, "total_steps": 855, "loss": 0.0052, "lr": 1.7299085354666682e-05, "epoch": 3.7554585152838427, "percentage": 75.44, "elapsed_time": "2:10:08", "remaining_time": "0:42:22"} |
|
{"current_steps": 645, "total_steps": 855, "eval_loss": 0.00575040839612484, "epoch": 3.7554585152838427, "percentage": 75.44, "elapsed_time": "2:10:13", "remaining_time": "0:42:24"} |
|
{"current_steps": 646, "total_steps": 855, "loss": 0.0052, "lr": 1.7144836688984396e-05, "epoch": 3.7612809315866085, "percentage": 75.56, "elapsed_time": "2:10:24", "remaining_time": "0:42:11"} |
|
{"current_steps": 647, "total_steps": 855, "loss": 0.0052, "lr": 1.6991136363509525e-05, "epoch": 3.767103347889374, "percentage": 75.67, "elapsed_time": "2:10:34", "remaining_time": "0:41:58"} |
|
{"current_steps": 648, "total_steps": 855, "loss": 0.0052, "lr": 1.6837986943442253e-05, "epoch": 3.7729257641921397, "percentage": 75.79, "elapsed_time": "2:10:44", "remaining_time": "0:41:45"} |
|
{"current_steps": 649, "total_steps": 855, "loss": 0.0053, "lr": 1.6685390984788233e-05, "epoch": 3.7787481804949055, "percentage": 75.91, "elapsed_time": "2:10:55", "remaining_time": "0:41:33"} |
|
{"current_steps": 650, "total_steps": 855, "loss": 0.0049, "lr": 1.6533351034316126e-05, "epoch": 3.7845705967976713, "percentage": 76.02, "elapsed_time": "2:11:05", "remaining_time": "0:41:20"} |
|
{"current_steps": 650, "total_steps": 855, "eval_loss": 0.005719504784792662, "epoch": 3.7845705967976713, "percentage": 76.02, "elapsed_time": "2:11:11", "remaining_time": "0:41:22"} |
|
{"current_steps": 651, "total_steps": 855, "loss": 0.0054, "lr": 1.6381869629514973e-05, "epoch": 3.7903930131004366, "percentage": 76.14, "elapsed_time": "2:11:49", "remaining_time": "0:41:18"} |
|
{"current_steps": 652, "total_steps": 855, "loss": 0.0051, "lr": 1.6230949298551966e-05, "epoch": 3.7962154294032024, "percentage": 76.26, "elapsed_time": "2:11:59", "remaining_time": "0:41:05"} |
|
{"current_steps": 653, "total_steps": 855, "loss": 0.0053, "lr": 1.608059256023016e-05, "epoch": 3.802037845705968, "percentage": 76.37, "elapsed_time": "2:12:10", "remaining_time": "0:40:53"} |
|
{"current_steps": 654, "total_steps": 855, "loss": 0.005, "lr": 1.5930801923946452e-05, "epoch": 3.8078602620087336, "percentage": 76.49, "elapsed_time": "2:12:20", "remaining_time": "0:40:40"} |
|
{"current_steps": 655, "total_steps": 855, "loss": 0.0055, "lr": 1.5781579889649696e-05, "epoch": 3.8136826783114994, "percentage": 76.61, "elapsed_time": "2:12:30", "remaining_time": "0:40:27"} |
|
{"current_steps": 655, "total_steps": 855, "eval_loss": 0.005695061758160591, "epoch": 3.8136826783114994, "percentage": 76.61, "elapsed_time": "2:12:36", "remaining_time": "0:40:29"} |
|
{"current_steps": 656, "total_steps": 855, "loss": 0.005, "lr": 1.5632928947799047e-05, "epoch": 3.819505094614265, "percentage": 76.73, "elapsed_time": "2:12:46", "remaining_time": "0:40:16"} |
|
{"current_steps": 657, "total_steps": 855, "loss": 0.005, "lr": 1.548485157932229e-05, "epoch": 3.8253275109170306, "percentage": 76.84, "elapsed_time": "2:12:56", "remaining_time": "0:40:04"} |
|
{"current_steps": 658, "total_steps": 855, "loss": 0.005, "lr": 1.533735025557453e-05, "epoch": 3.831149927219796, "percentage": 76.96, "elapsed_time": "2:13:07", "remaining_time": "0:39:51"} |
|
{"current_steps": 659, "total_steps": 855, "loss": 0.0051, "lr": 1.5190427438296861e-05, "epoch": 3.836972343522562, "percentage": 77.08, "elapsed_time": "2:13:17", "remaining_time": "0:39:38"} |
|
{"current_steps": 660, "total_steps": 855, "loss": 0.0052, "lr": 1.5044085579575378e-05, "epoch": 3.8427947598253276, "percentage": 77.19, "elapsed_time": "2:13:28", "remaining_time": "0:39:26"} |
|
{"current_steps": 660, "total_steps": 855, "eval_loss": 0.005662932991981506, "epoch": 3.8427947598253276, "percentage": 77.19, "elapsed_time": "2:13:33", "remaining_time": "0:39:27"} |
|
{"current_steps": 661, "total_steps": 855, "loss": 0.0051, "lr": 1.4898327121800155e-05, "epoch": 3.8486171761280934, "percentage": 77.31, "elapsed_time": "2:13:44", "remaining_time": "0:39:15"} |
|
{"current_steps": 662, "total_steps": 855, "loss": 0.0054, "lr": 1.4753154497624517e-05, "epoch": 3.8544395924308588, "percentage": 77.43, "elapsed_time": "2:13:55", "remaining_time": "0:39:02"} |
|
{"current_steps": 663, "total_steps": 855, "loss": 0.0048, "lr": 1.4608570129924492e-05, "epoch": 3.8602620087336246, "percentage": 77.54, "elapsed_time": "2:14:05", "remaining_time": "0:38:49"} |
|
{"current_steps": 664, "total_steps": 855, "loss": 0.0051, "lr": 1.4464576431758314e-05, "epoch": 3.86608442503639, "percentage": 77.66, "elapsed_time": "2:14:15", "remaining_time": "0:38:37"} |
|
{"current_steps": 665, "total_steps": 855, "loss": 0.005, "lr": 1.432117580632616e-05, "epoch": 3.8719068413391557, "percentage": 77.78, "elapsed_time": "2:14:25", "remaining_time": "0:38:24"} |
|
{"current_steps": 665, "total_steps": 855, "eval_loss": 0.005684440489858389, "epoch": 3.8719068413391557, "percentage": 77.78, "elapsed_time": "2:14:31", "remaining_time": "0:38:26"} |
|
{"current_steps": 666, "total_steps": 855, "loss": 0.0049, "lr": 1.4178370646930017e-05, "epoch": 3.8777292576419216, "percentage": 77.89, "elapsed_time": "2:14:41", "remaining_time": "0:38:13"} |
|
{"current_steps": 667, "total_steps": 855, "loss": 0.005, "lr": 1.4036163336933833e-05, "epoch": 3.883551673944687, "percentage": 78.01, "elapsed_time": "2:14:52", "remaining_time": "0:38:00"} |
|
{"current_steps": 668, "total_steps": 855, "loss": 0.0051, "lr": 1.3894556249723657e-05, "epoch": 3.8893740902474527, "percentage": 78.13, "elapsed_time": "2:15:02", "remaining_time": "0:37:48"} |
|
{"current_steps": 669, "total_steps": 855, "loss": 0.005, "lr": 1.3753551748668008e-05, "epoch": 3.895196506550218, "percentage": 78.25, "elapsed_time": "2:15:13", "remaining_time": "0:37:35"} |
|
{"current_steps": 670, "total_steps": 855, "loss": 0.005, "lr": 1.3613152187078505e-05, "epoch": 3.901018922852984, "percentage": 78.36, "elapsed_time": "2:15:23", "remaining_time": "0:37:23"} |
|
{"current_steps": 670, "total_steps": 855, "eval_loss": 0.005713718011975288, "epoch": 3.901018922852984, "percentage": 78.36, "elapsed_time": "2:15:29", "remaining_time": "0:37:24"} |
|
{"current_steps": 671, "total_steps": 855, "loss": 0.005, "lr": 1.3473359908170562e-05, "epoch": 3.9068413391557497, "percentage": 78.48, "elapsed_time": "2:15:39", "remaining_time": "0:37:12"} |
|
{"current_steps": 672, "total_steps": 855, "loss": 0.0049, "lr": 1.3334177245024249e-05, "epoch": 3.9126637554585155, "percentage": 78.6, "elapsed_time": "2:15:50", "remaining_time": "0:36:59"} |
|
{"current_steps": 673, "total_steps": 855, "loss": 0.0056, "lr": 1.3195606520545412e-05, "epoch": 3.918486171761281, "percentage": 78.71, "elapsed_time": "2:16:00", "remaining_time": "0:36:46"} |
|
{"current_steps": 674, "total_steps": 855, "loss": 0.0051, "lr": 1.3057650047426834e-05, "epoch": 3.9243085880640467, "percentage": 78.83, "elapsed_time": "2:16:11", "remaining_time": "0:36:34"} |
|
{"current_steps": 675, "total_steps": 855, "loss": 0.0051, "lr": 1.292031012810973e-05, "epoch": 3.930131004366812, "percentage": 78.95, "elapsed_time": "2:16:21", "remaining_time": "0:36:21"} |
|
{"current_steps": 675, "total_steps": 855, "eval_loss": 0.0056921918876469135, "epoch": 3.930131004366812, "percentage": 78.95, "elapsed_time": "2:16:27", "remaining_time": "0:36:23"} |
|
{"current_steps": 676, "total_steps": 855, "loss": 0.0049, "lr": 1.2783589054745216e-05, "epoch": 3.935953420669578, "percentage": 79.06, "elapsed_time": "2:16:37", "remaining_time": "0:36:10"} |
|
{"current_steps": 677, "total_steps": 855, "loss": 0.0054, "lr": 1.2647489109156108e-05, "epoch": 3.9417758369723437, "percentage": 79.18, "elapsed_time": "2:16:47", "remaining_time": "0:35:58"} |
|
{"current_steps": 678, "total_steps": 855, "loss": 0.005, "lr": 1.2512012562798864e-05, "epoch": 3.947598253275109, "percentage": 79.3, "elapsed_time": "2:16:58", "remaining_time": "0:35:45"} |
|
{"current_steps": 679, "total_steps": 855, "loss": 0.005, "lr": 1.237716167672564e-05, "epoch": 3.953420669577875, "percentage": 79.42, "elapsed_time": "2:17:08", "remaining_time": "0:35:32"} |
|
{"current_steps": 680, "total_steps": 855, "loss": 0.0054, "lr": 1.2242938701546546e-05, "epoch": 3.9592430858806402, "percentage": 79.53, "elapsed_time": "2:17:19", "remaining_time": "0:35:20"} |
|
{"current_steps": 680, "total_steps": 855, "eval_loss": 0.005726697389036417, "epoch": 3.9592430858806402, "percentage": 79.53, "elapsed_time": "2:17:24", "remaining_time": "0:35:21"} |
|
{"current_steps": 681, "total_steps": 855, "loss": 0.005, "lr": 1.2109345877392081e-05, "epoch": 3.965065502183406, "percentage": 79.65, "elapsed_time": "2:17:35", "remaining_time": "0:35:09"} |
|
{"current_steps": 682, "total_steps": 855, "loss": 0.0054, "lr": 1.1976385433875797e-05, "epoch": 3.970887918486172, "percentage": 79.77, "elapsed_time": "2:17:45", "remaining_time": "0:34:56"} |
|
{"current_steps": 683, "total_steps": 855, "loss": 0.0051, "lr": 1.1844059590057054e-05, "epoch": 3.9767103347889377, "percentage": 79.88, "elapsed_time": "2:17:55", "remaining_time": "0:34:44"} |
|
{"current_steps": 684, "total_steps": 855, "loss": 0.0051, "lr": 1.1712370554403956e-05, "epoch": 3.982532751091703, "percentage": 80.0, "elapsed_time": "2:18:06", "remaining_time": "0:34:31"} |
|
{"current_steps": 685, "total_steps": 855, "loss": 0.0052, "lr": 1.1581320524756516e-05, "epoch": 3.988355167394469, "percentage": 80.12, "elapsed_time": "2:18:16", "remaining_time": "0:34:18"} |
|
{"current_steps": 685, "total_steps": 855, "eval_loss": 0.005665612407028675, "epoch": 3.988355167394469, "percentage": 80.12, "elapsed_time": "2:18:22", "remaining_time": "0:34:20"} |
|
{"current_steps": 686, "total_steps": 855, "loss": 0.0053, "lr": 1.1450911688290034e-05, "epoch": 3.994177583697234, "percentage": 80.23, "elapsed_time": "2:18:32", "remaining_time": "0:34:07"} |
|
{"current_steps": 687, "total_steps": 855, "loss": 0.0061, "lr": 1.1321146221478463e-05, "epoch": 4.0, "percentage": 80.35, "elapsed_time": "2:18:42", "remaining_time": "0:33:55"} |
|
{"current_steps": 688, "total_steps": 855, "loss": 0.0046, "lr": 1.1192026290058234e-05, "epoch": 4.005822416302766, "percentage": 80.47, "elapsed_time": "2:18:53", "remaining_time": "0:33:42"} |
|
{"current_steps": 689, "total_steps": 855, "loss": 0.0047, "lr": 1.1063554048991965e-05, "epoch": 4.011644832605532, "percentage": 80.58, "elapsed_time": "2:19:03", "remaining_time": "0:33:30"} |
|
{"current_steps": 690, "total_steps": 855, "loss": 0.0046, "lr": 1.0935731642432644e-05, "epoch": 4.0174672489082965, "percentage": 80.7, "elapsed_time": "2:19:14", "remaining_time": "0:33:17"} |
|
{"current_steps": 690, "total_steps": 855, "eval_loss": 0.0056965467520058155, "epoch": 4.0174672489082965, "percentage": 80.7, "elapsed_time": "2:19:19", "remaining_time": "0:33:19"} |
|
{"current_steps": 691, "total_steps": 855, "loss": 0.0052, "lr": 1.0808561203687712e-05, "epoch": 4.023289665211062, "percentage": 80.82, "elapsed_time": "2:19:30", "remaining_time": "0:33:06"} |
|
{"current_steps": 692, "total_steps": 855, "loss": 0.0051, "lr": 1.0682044855183521e-05, "epoch": 4.029112081513828, "percentage": 80.94, "elapsed_time": "2:19:40", "remaining_time": "0:32:54"} |
|
{"current_steps": 693, "total_steps": 855, "loss": 0.0046, "lr": 1.0556184708429922e-05, "epoch": 4.034934497816594, "percentage": 81.05, "elapsed_time": "2:19:51", "remaining_time": "0:32:41"} |
|
{"current_steps": 694, "total_steps": 855, "loss": 0.0048, "lr": 1.0430982863985022e-05, "epoch": 4.04075691411936, "percentage": 81.17, "elapsed_time": "2:20:01", "remaining_time": "0:32:29"} |
|
{"current_steps": 695, "total_steps": 855, "loss": 0.0047, "lr": 1.0306441411420076e-05, "epoch": 4.046579330422126, "percentage": 81.29, "elapsed_time": "2:20:12", "remaining_time": "0:32:16"} |
|
{"current_steps": 695, "total_steps": 855, "eval_loss": 0.005697253625839949, "epoch": 4.046579330422126, "percentage": 81.29, "elapsed_time": "2:20:17", "remaining_time": "0:32:17"} |
|
{"current_steps": 696, "total_steps": 855, "loss": 0.0046, "lr": 1.0182562429284649e-05, "epoch": 4.0524017467248905, "percentage": 81.4, "elapsed_time": "2:20:28", "remaining_time": "0:32:05"} |
|
{"current_steps": 697, "total_steps": 855, "loss": 0.0047, "lr": 1.0059347985071959e-05, "epoch": 4.058224163027656, "percentage": 81.52, "elapsed_time": "2:20:38", "remaining_time": "0:31:52"} |
|
{"current_steps": 698, "total_steps": 855, "loss": 0.005, "lr": 9.936800135184332e-06, "epoch": 4.064046579330422, "percentage": 81.64, "elapsed_time": "2:20:48", "remaining_time": "0:31:40"} |
|
{"current_steps": 699, "total_steps": 855, "loss": 0.0046, "lr": 9.814920924898868e-06, "epoch": 4.069868995633188, "percentage": 81.75, "elapsed_time": "2:20:59", "remaining_time": "0:31:27"} |
|
{"current_steps": 700, "total_steps": 855, "loss": 0.0044, "lr": 9.693712388333315e-06, "epoch": 4.075691411935954, "percentage": 81.87, "elapsed_time": "2:21:09", "remaining_time": "0:31:15"} |
|
{"current_steps": 700, "total_steps": 855, "eval_loss": 0.005716563202440739, "epoch": 4.075691411935954, "percentage": 81.87, "elapsed_time": "2:21:15", "remaining_time": "0:31:16"} |
|
{"current_steps": 701, "total_steps": 855, "loss": 0.0048, "lr": 9.573176548412182e-06, "epoch": 4.081513828238719, "percentage": 81.99, "elapsed_time": "2:21:51", "remaining_time": "0:31:09"} |
|
{"current_steps": 702, "total_steps": 855, "loss": 0.0047, "lr": 9.45331541683287e-06, "epoch": 4.0873362445414845, "percentage": 82.11, "elapsed_time": "2:22:01", "remaining_time": "0:30:57"} |
|
{"current_steps": 703, "total_steps": 855, "loss": 0.0048, "lr": 9.334130994032203e-06, "epoch": 4.09315866084425, "percentage": 82.22, "elapsed_time": "2:22:12", "remaining_time": "0:30:44"} |
|
{"current_steps": 704, "total_steps": 855, "loss": 0.0045, "lr": 9.215625269152939e-06, "epoch": 4.098981077147016, "percentage": 82.34, "elapsed_time": "2:22:22", "remaining_time": "0:30:32"} |
|
{"current_steps": 705, "total_steps": 855, "loss": 0.0047, "lr": 9.097800220010689e-06, "epoch": 4.104803493449782, "percentage": 82.46, "elapsed_time": "2:22:32", "remaining_time": "0:30:19"} |
|
{"current_steps": 705, "total_steps": 855, "eval_loss": 0.0056772115640342236, "epoch": 4.104803493449782, "percentage": 82.46, "elapsed_time": "2:22:38", "remaining_time": "0:30:20"} |
|
{"current_steps": 706, "total_steps": 855, "loss": 0.0049, "lr": 8.980657813060783e-06, "epoch": 4.110625909752548, "percentage": 82.57, "elapsed_time": "2:22:48", "remaining_time": "0:30:08"} |
|
{"current_steps": 707, "total_steps": 855, "loss": 0.0047, "lr": 8.864200003365542e-06, "epoch": 4.116448326055313, "percentage": 82.69, "elapsed_time": "2:22:59", "remaining_time": "0:29:55"} |
|
{"current_steps": 708, "total_steps": 855, "loss": 0.0048, "lr": 8.748428734561614e-06, "epoch": 4.122270742358078, "percentage": 82.81, "elapsed_time": "2:23:09", "remaining_time": "0:29:43"} |
|
{"current_steps": 709, "total_steps": 855, "loss": 0.0046, "lr": 8.633345938827563e-06, "epoch": 4.128093158660844, "percentage": 82.92, "elapsed_time": "2:23:19", "remaining_time": "0:29:30"} |
|
{"current_steps": 710, "total_steps": 855, "loss": 0.0046, "lr": 8.518953536851565e-06, "epoch": 4.13391557496361, "percentage": 83.04, "elapsed_time": "2:23:30", "remaining_time": "0:29:18"} |
|
{"current_steps": 710, "total_steps": 855, "eval_loss": 0.0056624929420650005, "epoch": 4.13391557496361, "percentage": 83.04, "elapsed_time": "2:23:35", "remaining_time": "0:29:19"} |
|
{"current_steps": 711, "total_steps": 855, "loss": 0.0047, "lr": 8.405253437799388e-06, "epoch": 4.139737991266376, "percentage": 83.16, "elapsed_time": "2:23:46", "remaining_time": "0:29:07"} |
|
{"current_steps": 712, "total_steps": 855, "loss": 0.0047, "lr": 8.292247539282522e-06, "epoch": 4.145560407569141, "percentage": 83.27, "elapsed_time": "2:23:56", "remaining_time": "0:28:54"} |
|
{"current_steps": 713, "total_steps": 855, "loss": 0.0046, "lr": 8.179937727326576e-06, "epoch": 4.151382823871907, "percentage": 83.39, "elapsed_time": "2:24:07", "remaining_time": "0:28:42"} |
|
{"current_steps": 714, "total_steps": 855, "loss": 0.0049, "lr": 8.068325876339666e-06, "epoch": 4.157205240174672, "percentage": 83.51, "elapsed_time": "2:24:17", "remaining_time": "0:28:29"} |
|
{"current_steps": 715, "total_steps": 855, "loss": 0.0046, "lr": 7.95741384908123e-06, "epoch": 4.163027656477438, "percentage": 83.63, "elapsed_time": "2:24:28", "remaining_time": "0:28:17"} |
|
{"current_steps": 715, "total_steps": 855, "eval_loss": 0.005712661426514387, "epoch": 4.163027656477438, "percentage": 83.63, "elapsed_time": "2:24:33", "remaining_time": "0:28:18"} |
|
{"current_steps": 716, "total_steps": 855, "loss": 0.0046, "lr": 7.847203496630896e-06, "epoch": 4.168850072780204, "percentage": 83.74, "elapsed_time": "2:24:43", "remaining_time": "0:28:05"} |
|
{"current_steps": 717, "total_steps": 855, "loss": 0.0047, "lr": 7.73769665835764e-06, "epoch": 4.17467248908297, "percentage": 83.86, "elapsed_time": "2:24:54", "remaining_time": "0:27:53"} |
|
{"current_steps": 718, "total_steps": 855, "loss": 0.0046, "lr": 7.628895161889049e-06, "epoch": 4.180494905385735, "percentage": 83.98, "elapsed_time": "2:25:04", "remaining_time": "0:27:40"} |
|
{"current_steps": 719, "total_steps": 855, "loss": 0.0048, "lr": 7.520800823080793e-06, "epoch": 4.186317321688501, "percentage": 84.09, "elapsed_time": "2:25:14", "remaining_time": "0:27:28"} |
|
{"current_steps": 720, "total_steps": 855, "loss": 0.0048, "lr": 7.413415445986355e-06, "epoch": 4.192139737991266, "percentage": 84.21, "elapsed_time": "2:25:25", "remaining_time": "0:27:15"} |
|
{"current_steps": 720, "total_steps": 855, "eval_loss": 0.005738519597798586, "epoch": 4.192139737991266, "percentage": 84.21, "elapsed_time": "2:25:31", "remaining_time": "0:27:17"} |
|
{"current_steps": 721, "total_steps": 855, "loss": 0.0047, "lr": 7.306740822826957e-06, "epoch": 4.197962154294032, "percentage": 84.33, "elapsed_time": "2:25:41", "remaining_time": "0:27:04"} |
|
{"current_steps": 722, "total_steps": 855, "loss": 0.0048, "lr": 7.200778733961544e-06, "epoch": 4.203784570596798, "percentage": 84.44, "elapsed_time": "2:25:51", "remaining_time": "0:26:52"} |
|
{"current_steps": 723, "total_steps": 855, "loss": 0.0048, "lr": 7.095530947857199e-06, "epoch": 4.209606986899563, "percentage": 84.56, "elapsed_time": "2:26:02", "remaining_time": "0:26:39"} |
|
{"current_steps": 724, "total_steps": 855, "loss": 0.0047, "lr": 6.9909992210595076e-06, "epoch": 4.215429403202329, "percentage": 84.68, "elapsed_time": "2:26:12", "remaining_time": "0:26:27"} |
|
{"current_steps": 725, "total_steps": 855, "loss": 0.0047, "lr": 6.88718529816334e-06, "epoch": 4.2212518195050945, "percentage": 84.8, "elapsed_time": "2:26:23", "remaining_time": "0:26:14"} |
|
{"current_steps": 725, "total_steps": 855, "eval_loss": 0.005722955800592899, "epoch": 4.2212518195050945, "percentage": 84.8, "elapsed_time": "2:26:28", "remaining_time": "0:26:15"} |
|
{"current_steps": 726, "total_steps": 855, "loss": 0.0046, "lr": 6.784090911783664e-06, "epoch": 4.22707423580786, "percentage": 84.91, "elapsed_time": "2:26:39", "remaining_time": "0:26:03"} |
|
{"current_steps": 727, "total_steps": 855, "loss": 0.0051, "lr": 6.681717782526658e-06, "epoch": 4.232896652110626, "percentage": 85.03, "elapsed_time": "2:26:49", "remaining_time": "0:25:51"} |
|
{"current_steps": 728, "total_steps": 855, "loss": 0.0047, "lr": 6.5800676189610054e-06, "epoch": 4.238719068413392, "percentage": 85.15, "elapsed_time": "2:26:59", "remaining_time": "0:25:38"} |
|
{"current_steps": 729, "total_steps": 855, "loss": 0.0045, "lr": 6.47914211758937e-06, "epoch": 4.244541484716157, "percentage": 85.26, "elapsed_time": "2:27:10", "remaining_time": "0:25:26"} |
|
{"current_steps": 730, "total_steps": 855, "loss": 0.0048, "lr": 6.3789429628200615e-06, "epoch": 4.250363901018923, "percentage": 85.38, "elapsed_time": "2:27:20", "remaining_time": "0:25:13"} |
|
{"current_steps": 730, "total_steps": 855, "eval_loss": 0.005725468508899212, "epoch": 4.250363901018923, "percentage": 85.38, "elapsed_time": "2:27:26", "remaining_time": "0:25:14"} |
|
{"current_steps": 731, "total_steps": 855, "loss": 0.0046, "lr": 6.279471826938943e-06, "epoch": 4.2561863173216885, "percentage": 85.5, "elapsed_time": "2:27:36", "remaining_time": "0:25:02"} |
|
{"current_steps": 732, "total_steps": 855, "loss": 0.0045, "lr": 6.1807303700815225e-06, "epoch": 4.262008733624454, "percentage": 85.61, "elapsed_time": "2:27:46", "remaining_time": "0:24:49"} |
|
{"current_steps": 733, "total_steps": 855, "loss": 0.0044, "lr": 6.08272024020527e-06, "epoch": 4.26783114992722, "percentage": 85.73, "elapsed_time": "2:27:57", "remaining_time": "0:24:37"} |
|
{"current_steps": 734, "total_steps": 855, "loss": 0.0049, "lr": 5.985443073062036e-06, "epoch": 4.273653566229985, "percentage": 85.85, "elapsed_time": "2:28:07", "remaining_time": "0:24:25"} |
|
{"current_steps": 735, "total_steps": 855, "loss": 0.0047, "lr": 5.888900492170818e-06, "epoch": 4.279475982532751, "percentage": 85.96, "elapsed_time": "2:28:17", "remaining_time": "0:24:12"} |
|
{"current_steps": 735, "total_steps": 855, "eval_loss": 0.005731714423745871, "epoch": 4.279475982532751, "percentage": 85.96, "elapsed_time": "2:28:23", "remaining_time": "0:24:13"} |
|
{"current_steps": 736, "total_steps": 855, "loss": 0.0048, "lr": 5.7930941087906695e-06, "epoch": 4.285298398835517, "percentage": 86.08, "elapsed_time": "2:28:33", "remaining_time": "0:24:01"} |
|
{"current_steps": 737, "total_steps": 855, "loss": 0.0045, "lr": 5.698025521893763e-06, "epoch": 4.2911208151382825, "percentage": 86.2, "elapsed_time": "2:28:44", "remaining_time": "0:23:48"} |
|
{"current_steps": 738, "total_steps": 855, "loss": 0.0047, "lr": 5.603696318138751e-06, "epoch": 4.296943231441048, "percentage": 86.32, "elapsed_time": "2:28:54", "remaining_time": "0:23:36"} |
|
{"current_steps": 739, "total_steps": 855, "loss": 0.0049, "lr": 5.510108071844222e-06, "epoch": 4.302765647743814, "percentage": 86.43, "elapsed_time": "2:29:05", "remaining_time": "0:23:24"} |
|
{"current_steps": 740, "total_steps": 855, "loss": 0.0047, "lr": 5.4172623449625144e-06, "epoch": 4.308588064046579, "percentage": 86.55, "elapsed_time": "2:29:15", "remaining_time": "0:23:11"} |
|
{"current_steps": 740, "total_steps": 855, "eval_loss": 0.005700558423995972, "epoch": 4.308588064046579, "percentage": 86.55, "elapsed_time": "2:29:21", "remaining_time": "0:23:12"} |
|
{"current_steps": 741, "total_steps": 855, "loss": 0.0044, "lr": 5.325160687053571e-06, "epoch": 4.314410480349345, "percentage": 86.67, "elapsed_time": "2:29:31", "remaining_time": "0:23:00"} |
|
{"current_steps": 742, "total_steps": 855, "loss": 0.0047, "lr": 5.233804635259093e-06, "epoch": 4.320232896652111, "percentage": 86.78, "elapsed_time": "2:29:42", "remaining_time": "0:22:47"} |
|
{"current_steps": 743, "total_steps": 855, "loss": 0.0044, "lr": 5.143195714276927e-06, "epoch": 4.326055312954876, "percentage": 86.9, "elapsed_time": "2:29:52", "remaining_time": "0:22:35"} |
|
{"current_steps": 744, "total_steps": 855, "loss": 0.0049, "lr": 5.053335436335593e-06, "epoch": 4.331877729257642, "percentage": 87.02, "elapsed_time": "2:30:02", "remaining_time": "0:22:23"} |
|
{"current_steps": 745, "total_steps": 855, "loss": 0.0046, "lr": 4.964225301169023e-06, "epoch": 4.337700145560407, "percentage": 87.13, "elapsed_time": "2:30:13", "remaining_time": "0:22:10"} |
|
{"current_steps": 745, "total_steps": 855, "eval_loss": 0.005712580401450396, "epoch": 4.337700145560407, "percentage": 87.13, "elapsed_time": "2:30:18", "remaining_time": "0:22:11"} |
|
{"current_steps": 746, "total_steps": 855, "loss": 0.0047, "lr": 4.875866795991535e-06, "epoch": 4.343522561863173, "percentage": 87.25, "elapsed_time": "2:30:29", "remaining_time": "0:21:59"} |
|
{"current_steps": 747, "total_steps": 855, "loss": 0.0045, "lr": 4.788261395473065e-06, "epoch": 4.349344978165939, "percentage": 87.37, "elapsed_time": "2:30:39", "remaining_time": "0:21:46"} |
|
{"current_steps": 748, "total_steps": 855, "loss": 0.0046, "lr": 4.701410561714509e-06, "epoch": 4.355167394468705, "percentage": 87.49, "elapsed_time": "2:30:50", "remaining_time": "0:21:34"} |
|
{"current_steps": 749, "total_steps": 855, "loss": 0.0046, "lr": 4.615315744223319e-06, "epoch": 4.36098981077147, "percentage": 87.6, "elapsed_time": "2:31:00", "remaining_time": "0:21:22"} |
|
{"current_steps": 750, "total_steps": 855, "loss": 0.0047, "lr": 4.529978379889315e-06, "epoch": 4.366812227074236, "percentage": 87.72, "elapsed_time": "2:31:11", "remaining_time": "0:21:09"} |
|
{"current_steps": 750, "total_steps": 855, "eval_loss": 0.0057135578244924545, "epoch": 4.366812227074236, "percentage": 87.72, "elapsed_time": "2:31:17", "remaining_time": "0:21:10"} |
|
{"current_steps": 751, "total_steps": 855, "loss": 0.0045, "lr": 4.4453998929607385e-06, "epoch": 4.372634643377001, "percentage": 87.84, "elapsed_time": "2:32:09", "remaining_time": "0:21:04"} |
|
{"current_steps": 752, "total_steps": 855, "loss": 0.0046, "lr": 4.361581695020428e-06, "epoch": 4.378457059679767, "percentage": 87.95, "elapsed_time": "2:32:19", "remaining_time": "0:20:51"} |
|
{"current_steps": 753, "total_steps": 855, "loss": 0.0046, "lr": 4.278525184962312e-06, "epoch": 4.384279475982533, "percentage": 88.07, "elapsed_time": "2:32:30", "remaining_time": "0:20:39"} |
|
{"current_steps": 754, "total_steps": 855, "loss": 0.0048, "lr": 4.1962317489680106e-06, "epoch": 4.390101892285299, "percentage": 88.19, "elapsed_time": "2:32:40", "remaining_time": "0:20:27"} |
|
{"current_steps": 755, "total_steps": 855, "loss": 0.005, "lr": 4.114702760483752e-06, "epoch": 4.395924308588064, "percentage": 88.3, "elapsed_time": "2:32:51", "remaining_time": "0:20:14"} |
|
{"current_steps": 755, "total_steps": 855, "eval_loss": 0.0057435426861047745, "epoch": 4.395924308588064, "percentage": 88.3, "elapsed_time": "2:32:56", "remaining_time": "0:20:15"} |
|
{"current_steps": 756, "total_steps": 855, "loss": 0.0049, "lr": 4.03393958019741e-06, "epoch": 4.401746724890829, "percentage": 88.42, "elapsed_time": "2:33:07", "remaining_time": "0:20:03"} |
|
{"current_steps": 757, "total_steps": 855, "loss": 0.0044, "lr": 3.953943556015804e-06, "epoch": 4.407569141193595, "percentage": 88.54, "elapsed_time": "2:33:17", "remaining_time": "0:19:50"} |
|
{"current_steps": 758, "total_steps": 855, "loss": 0.0047, "lr": 3.874716023042235e-06, "epoch": 4.413391557496361, "percentage": 88.65, "elapsed_time": "2:33:27", "remaining_time": "0:19:38"} |
|
{"current_steps": 759, "total_steps": 855, "loss": 0.0048, "lr": 3.796258303554162e-06, "epoch": 4.419213973799127, "percentage": 88.77, "elapsed_time": "2:33:38", "remaining_time": "0:19:25"} |
|
{"current_steps": 760, "total_steps": 855, "loss": 0.0043, "lr": 3.71857170698115e-06, "epoch": 4.4250363901018925, "percentage": 88.89, "elapsed_time": "2:33:48", "remaining_time": "0:19:13"} |
|
{"current_steps": 760, "total_steps": 855, "eval_loss": 0.005737999454140663, "epoch": 4.4250363901018925, "percentage": 88.89, "elapsed_time": "2:33:54", "remaining_time": "0:19:14"} |
|
{"current_steps": 761, "total_steps": 855, "loss": 0.005, "lr": 3.6416575298830024e-06, "epoch": 4.430858806404658, "percentage": 89.01, "elapsed_time": "2:34:04", "remaining_time": "0:19:01"} |
|
{"current_steps": 762, "total_steps": 855, "loss": 0.0048, "lr": 3.565517055928147e-06, "epoch": 4.436681222707423, "percentage": 89.12, "elapsed_time": "2:34:15", "remaining_time": "0:18:49"} |
|
{"current_steps": 763, "total_steps": 855, "loss": 0.0047, "lr": 3.490151555872212e-06, "epoch": 4.442503639010189, "percentage": 89.24, "elapsed_time": "2:34:25", "remaining_time": "0:18:37"} |
|
{"current_steps": 764, "total_steps": 855, "loss": 0.0042, "lr": 3.4155622875367886e-06, "epoch": 4.448326055312955, "percentage": 89.36, "elapsed_time": "2:34:35", "remaining_time": "0:18:24"} |
|
{"current_steps": 765, "total_steps": 855, "loss": 0.0047, "lr": 3.3417504957884594e-06, "epoch": 4.454148471615721, "percentage": 89.47, "elapsed_time": "2:34:45", "remaining_time": "0:18:12"} |
|
{"current_steps": 765, "total_steps": 855, "eval_loss": 0.005743493791669607, "epoch": 4.454148471615721, "percentage": 89.47, "elapsed_time": "2:34:51", "remaining_time": "0:18:13"} |
|
{"current_steps": 766, "total_steps": 855, "loss": 0.0047, "lr": 3.268717412518013e-06, "epoch": 4.4599708879184865, "percentage": 89.59, "elapsed_time": "2:35:01", "remaining_time": "0:18:00"} |
|
{"current_steps": 767, "total_steps": 855, "loss": 0.0048, "lr": 3.196464256619902e-06, "epoch": 4.465793304221251, "percentage": 89.71, "elapsed_time": "2:35:12", "remaining_time": "0:17:48"} |
|
{"current_steps": 768, "total_steps": 855, "loss": 0.0046, "lr": 3.1249922339718685e-06, "epoch": 4.471615720524017, "percentage": 89.82, "elapsed_time": "2:35:22", "remaining_time": "0:17:36"} |
|
{"current_steps": 769, "total_steps": 855, "loss": 0.0049, "lr": 3.0543025374148546e-06, "epoch": 4.477438136826783, "percentage": 89.94, "elapsed_time": "2:35:32", "remaining_time": "0:17:23"} |
|
{"current_steps": 770, "total_steps": 855, "loss": 0.0047, "lr": 2.9843963467330704e-06, "epoch": 4.483260553129549, "percentage": 90.06, "elapsed_time": "2:35:43", "remaining_time": "0:17:11"} |
|
{"current_steps": 770, "total_steps": 855, "eval_loss": 0.005732374265789986, "epoch": 4.483260553129549, "percentage": 90.06, "elapsed_time": "2:35:48", "remaining_time": "0:17:12"} |
|
{"current_steps": 771, "total_steps": 855, "loss": 0.005, "lr": 2.915274828634307e-06, "epoch": 4.489082969432315, "percentage": 90.18, "elapsed_time": "2:35:59", "remaining_time": "0:16:59"} |
|
{"current_steps": 772, "total_steps": 855, "loss": 0.0047, "lr": 2.8469391367304756e-06, "epoch": 4.4949053857350805, "percentage": 90.29, "elapsed_time": "2:36:09", "remaining_time": "0:16:47"} |
|
{"current_steps": 773, "total_steps": 855, "loss": 0.0044, "lr": 2.7793904115183288e-06, "epoch": 4.500727802037845, "percentage": 90.41, "elapsed_time": "2:36:19", "remaining_time": "0:16:35"} |
|
{"current_steps": 774, "total_steps": 855, "loss": 0.0049, "lr": 2.712629780360465e-06, "epoch": 4.506550218340611, "percentage": 90.53, "elapsed_time": "2:36:30", "remaining_time": "0:16:22"} |
|
{"current_steps": 775, "total_steps": 855, "loss": 0.0046, "lr": 2.6466583574664916e-06, "epoch": 4.512372634643377, "percentage": 90.64, "elapsed_time": "2:36:40", "remaining_time": "0:16:10"} |
|
{"current_steps": 775, "total_steps": 855, "eval_loss": 0.005725707393139601, "epoch": 4.512372634643377, "percentage": 90.64, "elapsed_time": "2:36:46", "remaining_time": "0:16:10"} |
|
{"current_steps": 776, "total_steps": 855, "loss": 0.0047, "lr": 2.581477243874414e-06, "epoch": 4.518195050946143, "percentage": 90.76, "elapsed_time": "2:36:56", "remaining_time": "0:15:58"} |
|
{"current_steps": 777, "total_steps": 855, "loss": 0.0047, "lr": 2.5170875274322657e-06, "epoch": 4.524017467248909, "percentage": 90.88, "elapsed_time": "2:37:06", "remaining_time": "0:15:46"} |
|
{"current_steps": 778, "total_steps": 855, "loss": 0.0044, "lr": 2.453490282780002e-06, "epoch": 4.5298398835516736, "percentage": 90.99, "elapsed_time": "2:37:17", "remaining_time": "0:15:34"} |
|
{"current_steps": 779, "total_steps": 855, "loss": 0.0046, "lr": 2.390686571331502e-06, "epoch": 4.535662299854439, "percentage": 91.11, "elapsed_time": "2:37:27", "remaining_time": "0:15:21"} |
|
{"current_steps": 780, "total_steps": 855, "loss": 0.0047, "lr": 2.3286774412568603e-06, "epoch": 4.541484716157205, "percentage": 91.23, "elapsed_time": "2:37:37", "remaining_time": "0:15:09"} |
|
{"current_steps": 780, "total_steps": 855, "eval_loss": 0.005723342299461365, "epoch": 4.541484716157205, "percentage": 91.23, "elapsed_time": "2:37:43", "remaining_time": "0:15:09"} |
|
{"current_steps": 781, "total_steps": 855, "loss": 0.0045, "lr": 2.2674639274649355e-06, "epoch": 4.547307132459971, "percentage": 91.35, "elapsed_time": "2:37:53", "remaining_time": "0:14:57"} |
|
{"current_steps": 782, "total_steps": 855, "loss": 0.0045, "lr": 2.207047051586042e-06, "epoch": 4.553129548762737, "percentage": 91.46, "elapsed_time": "2:38:04", "remaining_time": "0:14:45"} |
|
{"current_steps": 783, "total_steps": 855, "loss": 0.0047, "lr": 2.147427821954906e-06, "epoch": 4.558951965065502, "percentage": 91.58, "elapsed_time": "2:38:14", "remaining_time": "0:14:33"} |
|
{"current_steps": 784, "total_steps": 855, "loss": 0.0049, "lr": 2.088607233593853e-06, "epoch": 4.5647743813682675, "percentage": 91.7, "elapsed_time": "2:38:24", "remaining_time": "0:14:20"} |
|
{"current_steps": 785, "total_steps": 855, "loss": 0.0047, "lr": 2.030586268196172e-06, "epoch": 4.570596797671033, "percentage": 91.81, "elapsed_time": "2:38:35", "remaining_time": "0:14:08"} |
|
{"current_steps": 785, "total_steps": 855, "eval_loss": 0.00571979396045208, "epoch": 4.570596797671033, "percentage": 91.81, "elapsed_time": "2:38:40", "remaining_time": "0:14:08"} |
|
{"current_steps": 786, "total_steps": 855, "loss": 0.0046, "lr": 1.973365894109769e-06, "epoch": 4.576419213973799, "percentage": 91.93, "elapsed_time": "2:38:50", "remaining_time": "0:13:56"} |
|
{"current_steps": 787, "total_steps": 855, "loss": 0.0047, "lr": 1.9169470663209675e-06, "epoch": 4.582241630276565, "percentage": 92.05, "elapsed_time": "2:39:01", "remaining_time": "0:13:44"} |
|
{"current_steps": 788, "total_steps": 855, "loss": 0.0046, "lr": 1.8613307264385815e-06, "epoch": 4.588064046579331, "percentage": 92.16, "elapsed_time": "2:39:11", "remaining_time": "0:13:32"} |
|
{"current_steps": 789, "total_steps": 855, "loss": 0.0045, "lr": 1.8065178026782315e-06, "epoch": 4.593886462882097, "percentage": 92.28, "elapsed_time": "2:39:22", "remaining_time": "0:13:19"} |
|
{"current_steps": 790, "total_steps": 855, "loss": 0.0048, "lr": 1.7525092098468144e-06, "epoch": 4.5997088791848615, "percentage": 92.4, "elapsed_time": "2:39:32", "remaining_time": "0:13:07"} |
|
{"current_steps": 790, "total_steps": 855, "eval_loss": 0.005728148389607668, "epoch": 4.5997088791848615, "percentage": 92.4, "elapsed_time": "2:39:38", "remaining_time": "0:13:08"} |
|
{"current_steps": 791, "total_steps": 855, "loss": 0.0047, "lr": 1.6993058493272485e-06, "epoch": 4.605531295487627, "percentage": 92.51, "elapsed_time": "2:39:48", "remaining_time": "0:12:55"} |
|
{"current_steps": 792, "total_steps": 855, "loss": 0.0046, "lr": 1.6469086090634134e-06, "epoch": 4.611353711790393, "percentage": 92.63, "elapsed_time": "2:39:58", "remaining_time": "0:12:43"} |
|
{"current_steps": 793, "total_steps": 855, "loss": 0.0045, "lr": 1.595318363545384e-06, "epoch": 4.617176128093159, "percentage": 92.75, "elapsed_time": "2:40:09", "remaining_time": "0:12:31"} |
|
{"current_steps": 794, "total_steps": 855, "loss": 0.0046, "lr": 1.5445359737947807e-06, "epoch": 4.622998544395925, "percentage": 92.87, "elapsed_time": "2:40:19", "remaining_time": "0:12:19"} |
|
{"current_steps": 795, "total_steps": 855, "loss": 0.0045, "lr": 1.4945622873504094e-06, "epoch": 4.62882096069869, "percentage": 92.98, "elapsed_time": "2:40:30", "remaining_time": "0:12:06"} |
|
{"current_steps": 795, "total_steps": 855, "eval_loss": 0.005716807674616575, "epoch": 4.62882096069869, "percentage": 92.98, "elapsed_time": "2:40:35", "remaining_time": "0:12:07"} |
|
{"current_steps": 796, "total_steps": 855, "loss": 0.0044, "lr": 1.445398138254128e-06, "epoch": 4.6346433770014555, "percentage": 93.1, "elapsed_time": "2:40:45", "remaining_time": "0:11:54"} |
|
{"current_steps": 797, "total_steps": 855, "loss": 0.0046, "lr": 1.3970443470369355e-06, "epoch": 4.640465793304221, "percentage": 93.22, "elapsed_time": "2:40:56", "remaining_time": "0:11:42"} |
|
{"current_steps": 798, "total_steps": 855, "loss": 0.0045, "lr": 1.349501720705254e-06, "epoch": 4.646288209606987, "percentage": 93.33, "elapsed_time": "2:41:06", "remaining_time": "0:11:30"} |
|
{"current_steps": 799, "total_steps": 855, "loss": 0.0048, "lr": 1.3027710527274807e-06, "epoch": 4.652110625909753, "percentage": 93.45, "elapsed_time": "2:41:16", "remaining_time": "0:11:18"} |
|
{"current_steps": 800, "total_steps": 855, "loss": 0.0045, "lr": 1.2568531230207236e-06, "epoch": 4.657933042212518, "percentage": 93.57, "elapsed_time": "2:41:27", "remaining_time": "0:11:06"} |
|
{"current_steps": 800, "total_steps": 855, "eval_loss": 0.005702358204871416, "epoch": 4.657933042212518, "percentage": 93.57, "elapsed_time": "2:41:33", "remaining_time": "0:11:06"} |
|
{"current_steps": 801, "total_steps": 855, "loss": 0.0047, "lr": 1.211748697937809e-06, "epoch": 4.663755458515284, "percentage": 93.68, "elapsed_time": "2:42:09", "remaining_time": "0:10:55"} |
|
{"current_steps": 802, "total_steps": 855, "loss": 0.0048, "lr": 1.1674585302544728e-06, "epoch": 4.669577874818049, "percentage": 93.8, "elapsed_time": "2:42:19", "remaining_time": "0:10:43"} |
|
{"current_steps": 803, "total_steps": 855, "loss": 0.0047, "lr": 1.1239833591567994e-06, "epoch": 4.675400291120815, "percentage": 93.92, "elapsed_time": "2:42:29", "remaining_time": "0:10:31"} |
|
{"current_steps": 804, "total_steps": 855, "loss": 0.0048, "lr": 1.0813239102289041e-06, "epoch": 4.681222707423581, "percentage": 94.04, "elapsed_time": "2:42:40", "remaining_time": "0:10:19"} |
|
{"current_steps": 805, "total_steps": 855, "loss": 0.0049, "lr": 1.0394808954408032e-06, "epoch": 4.687045123726346, "percentage": 94.15, "elapsed_time": "2:42:50", "remaining_time": "0:10:06"} |
|
{"current_steps": 805, "total_steps": 855, "eval_loss": 0.005704755429178476, "epoch": 4.687045123726346, "percentage": 94.15, "elapsed_time": "2:42:56", "remaining_time": "0:10:07"} |
|
{"current_steps": 806, "total_steps": 855, "loss": 0.0044, "lr": 9.984550131365288e-07, "epoch": 4.692867540029112, "percentage": 94.27, "elapsed_time": "2:43:06", "remaining_time": "0:09:54"} |
|
{"current_steps": 807, "total_steps": 855, "loss": 0.0046, "lr": 9.582469480224843e-07, "epoch": 4.698689956331878, "percentage": 94.39, "elapsed_time": "2:43:16", "remaining_time": "0:09:42"} |
|
{"current_steps": 808, "total_steps": 855, "loss": 0.0047, "lr": 9.188573711560233e-07, "epoch": 4.704512372634643, "percentage": 94.5, "elapsed_time": "2:43:27", "remaining_time": "0:09:30"} |
|
{"current_steps": 809, "total_steps": 855, "loss": 0.0048, "lr": 8.802869399342384e-07, "epoch": 4.710334788937409, "percentage": 94.62, "elapsed_time": "2:43:37", "remaining_time": "0:09:18"} |
|
{"current_steps": 810, "total_steps": 855, "loss": 0.0045, "lr": 8.42536298082991e-07, "epoch": 4.716157205240175, "percentage": 94.74, "elapsed_time": "2:43:47", "remaining_time": "0:09:05"} |
|
{"current_steps": 810, "total_steps": 855, "eval_loss": 0.0056949155405163765, "epoch": 4.716157205240175, "percentage": 94.74, "elapsed_time": "2:43:53", "remaining_time": "0:09:06"} |
|
{"current_steps": 811, "total_steps": 855, "loss": 0.0047, "lr": 8.056060756461537e-07, "epoch": 4.721979621542941, "percentage": 94.85, "elapsed_time": "2:44:03", "remaining_time": "0:08:54"} |
|
{"current_steps": 812, "total_steps": 855, "loss": 0.0047, "lr": 7.694968889751408e-07, "epoch": 4.727802037845706, "percentage": 94.97, "elapsed_time": "2:44:14", "remaining_time": "0:08:41"} |
|
{"current_steps": 813, "total_steps": 855, "loss": 0.0048, "lr": 7.342093407185613e-07, "epoch": 4.7336244541484715, "percentage": 95.09, "elapsed_time": "2:44:24", "remaining_time": "0:08:29"} |
|
{"current_steps": 814, "total_steps": 855, "loss": 0.0043, "lr": 6.997440198122152e-07, "epoch": 4.739446870451237, "percentage": 95.2, "elapsed_time": "2:44:35", "remaining_time": "0:08:17"} |
|
{"current_steps": 815, "total_steps": 855, "loss": 0.0045, "lr": 6.661015014692185e-07, "epoch": 4.745269286754003, "percentage": 95.32, "elapsed_time": "2:44:45", "remaining_time": "0:08:05"} |
|
{"current_steps": 815, "total_steps": 855, "eval_loss": 0.005708808079361916, "epoch": 4.745269286754003, "percentage": 95.32, "elapsed_time": "2:44:50", "remaining_time": "0:08:05"} |
|
{"current_steps": 816, "total_steps": 855, "loss": 0.0048, "lr": 6.332823471704441e-07, "epoch": 4.751091703056769, "percentage": 95.44, "elapsed_time": "2:45:01", "remaining_time": "0:07:53"} |
|
{"current_steps": 817, "total_steps": 855, "loss": 0.0043, "lr": 6.012871046551239e-07, "epoch": 4.756914119359534, "percentage": 95.56, "elapsed_time": "2:45:11", "remaining_time": "0:07:41"} |
|
{"current_steps": 818, "total_steps": 855, "loss": 0.0045, "lr": 5.701163079117e-07, "epoch": 4.7627365356623, "percentage": 95.67, "elapsed_time": "2:45:21", "remaining_time": "0:07:28"} |
|
{"current_steps": 819, "total_steps": 855, "loss": 0.0046, "lr": 5.397704771689549e-07, "epoch": 4.7685589519650655, "percentage": 95.79, "elapsed_time": "2:45:32", "remaining_time": "0:07:16"} |
|
{"current_steps": 820, "total_steps": 855, "loss": 0.0044, "lr": 5.102501188872899e-07, "epoch": 4.774381368267831, "percentage": 95.91, "elapsed_time": "2:45:42", "remaining_time": "0:07:04"} |
|
{"current_steps": 820, "total_steps": 855, "eval_loss": 0.005696544889360666, "epoch": 4.774381368267831, "percentage": 95.91, "elapsed_time": "2:45:48", "remaining_time": "0:07:04"} |
|
{"current_steps": 821, "total_steps": 855, "loss": 0.0049, "lr": 4.815557257502712e-07, "epoch": 4.780203784570597, "percentage": 96.02, "elapsed_time": "2:45:58", "remaining_time": "0:06:52"} |
|
{"current_steps": 822, "total_steps": 855, "loss": 0.0045, "lr": 4.5368777665643625e-07, "epoch": 4.786026200873362, "percentage": 96.14, "elapsed_time": "2:46:09", "remaining_time": "0:06:40"} |
|
{"current_steps": 823, "total_steps": 855, "loss": 0.0046, "lr": 4.266467367112725e-07, "epoch": 4.791848617176128, "percentage": 96.26, "elapsed_time": "2:46:19", "remaining_time": "0:06:28"} |
|
{"current_steps": 824, "total_steps": 855, "loss": 0.0045, "lr": 4.004330572194903e-07, "epoch": 4.797671033478894, "percentage": 96.37, "elapsed_time": "2:46:29", "remaining_time": "0:06:15"} |
|
{"current_steps": 825, "total_steps": 855, "loss": 0.0045, "lr": 3.7504717567743983e-07, "epoch": 4.8034934497816595, "percentage": 96.49, "elapsed_time": "2:46:39", "remaining_time": "0:06:03"} |
|
{"current_steps": 825, "total_steps": 855, "eval_loss": 0.005708719603717327, "epoch": 4.8034934497816595, "percentage": 96.49, "elapsed_time": "2:46:45", "remaining_time": "0:06:03"} |
|
{"current_steps": 826, "total_steps": 855, "loss": 0.0046, "lr": 3.504895157658561e-07, "epoch": 4.809315866084425, "percentage": 96.61, "elapsed_time": "2:46:56", "remaining_time": "0:05:51"} |
|
{"current_steps": 827, "total_steps": 855, "loss": 0.0047, "lr": 3.267604873427532e-07, "epoch": 4.81513828238719, "percentage": 96.73, "elapsed_time": "2:47:06", "remaining_time": "0:05:39"} |
|
{"current_steps": 828, "total_steps": 855, "loss": 0.0047, "lr": 3.0386048643662456e-07, "epoch": 4.820960698689956, "percentage": 96.84, "elapsed_time": "2:47:16", "remaining_time": "0:05:27"} |
|
{"current_steps": 829, "total_steps": 855, "loss": 0.0047, "lr": 2.8178989523979235e-07, "epoch": 4.826783114992722, "percentage": 96.96, "elapsed_time": "2:47:27", "remaining_time": "0:05:15"} |
|
{"current_steps": 830, "total_steps": 855, "loss": 0.0046, "lr": 2.605490821020462e-07, "epoch": 4.832605531295488, "percentage": 97.08, "elapsed_time": "2:47:37", "remaining_time": "0:05:02"} |
|
{"current_steps": 830, "total_steps": 855, "eval_loss": 0.005707500036805868, "epoch": 4.832605531295488, "percentage": 97.08, "elapsed_time": "2:47:43", "remaining_time": "0:05:03"} |
|
{"current_steps": 831, "total_steps": 855, "loss": 0.0044, "lr": 2.401384015244867e-07, "epoch": 4.8384279475982535, "percentage": 97.19, "elapsed_time": "2:47:54", "remaining_time": "0:04:50"} |
|
{"current_steps": 832, "total_steps": 855, "loss": 0.0046, "lr": 2.205581941536472e-07, "epoch": 4.844250363901019, "percentage": 97.31, "elapsed_time": "2:48:04", "remaining_time": "0:04:38"} |
|
{"current_steps": 833, "total_steps": 855, "loss": 0.0042, "lr": 2.0180878677573678e-07, "epoch": 4.850072780203784, "percentage": 97.43, "elapsed_time": "2:48:15", "remaining_time": "0:04:26"} |
|
{"current_steps": 834, "total_steps": 855, "loss": 0.0044, "lr": 1.8389049231126722e-07, "epoch": 4.85589519650655, "percentage": 97.54, "elapsed_time": "2:48:25", "remaining_time": "0:04:14"} |
|
{"current_steps": 835, "total_steps": 855, "loss": 0.0044, "lr": 1.6680360980976252e-07, "epoch": 4.861717612809316, "percentage": 97.66, "elapsed_time": "2:48:35", "remaining_time": "0:04:02"} |
|
{"current_steps": 835, "total_steps": 855, "eval_loss": 0.0056949337013065815, "epoch": 4.861717612809316, "percentage": 97.66, "elapsed_time": "2:48:41", "remaining_time": "0:04:02"} |
|
{"current_steps": 836, "total_steps": 855, "loss": 0.0048, "lr": 1.5054842444480742e-07, "epoch": 4.867540029112082, "percentage": 97.78, "elapsed_time": "2:48:51", "remaining_time": "0:03:50"} |
|
{"current_steps": 837, "total_steps": 855, "loss": 0.0044, "lr": 1.351252075092846e-07, "epoch": 4.873362445414847, "percentage": 97.89, "elapsed_time": "2:49:02", "remaining_time": "0:03:38"} |
|
{"current_steps": 838, "total_steps": 855, "loss": 0.0047, "lr": 1.2053421641082808e-07, "epoch": 4.879184861717613, "percentage": 98.01, "elapsed_time": "2:49:12", "remaining_time": "0:03:25"} |
|
{"current_steps": 839, "total_steps": 855, "loss": 0.0046, "lr": 1.06775694667538e-07, "epoch": 4.885007278020378, "percentage": 98.13, "elapsed_time": "2:49:23", "remaining_time": "0:03:13"} |
|
{"current_steps": 840, "total_steps": 855, "loss": 0.0044, "lr": 9.384987190392269e-08, "epoch": 4.890829694323144, "percentage": 98.25, "elapsed_time": "2:49:33", "remaining_time": "0:03:01"} |
|
{"current_steps": 840, "total_steps": 855, "eval_loss": 0.005698781926184893, "epoch": 4.890829694323144, "percentage": 98.25, "elapsed_time": "2:49:39", "remaining_time": "0:03:01"} |
|
{"current_steps": 841, "total_steps": 855, "loss": 0.0046, "lr": 8.175696384706277e-08, "epoch": 4.89665211062591, "percentage": 98.36, "elapsed_time": "2:49:49", "remaining_time": "0:02:49"} |
|
{"current_steps": 842, "total_steps": 855, "loss": 0.0043, "lr": 7.049717232300302e-08, "epoch": 4.902474526928676, "percentage": 98.48, "elapsed_time": "2:49:59", "remaining_time": "0:02:37"} |
|
{"current_steps": 843, "total_steps": 855, "loss": 0.0045, "lr": 6.007068525338832e-08, "epoch": 4.908296943231441, "percentage": 98.6, "elapsed_time": "2:50:10", "remaining_time": "0:02:25"} |
|
{"current_steps": 844, "total_steps": 855, "loss": 0.0046, "lr": 5.047767665233849e-08, "epoch": 4.914119359534206, "percentage": 98.71, "elapsed_time": "2:50:20", "remaining_time": "0:02:13"} |
|
{"current_steps": 845, "total_steps": 855, "loss": 0.0048, "lr": 4.171830662351717e-08, "epoch": 4.919941775836972, "percentage": 98.83, "elapsed_time": "2:50:30", "remaining_time": "0:02:01"} |
|
{"current_steps": 845, "total_steps": 855, "eval_loss": 0.005693158134818077, "epoch": 4.919941775836972, "percentage": 98.83, "elapsed_time": "2:50:36", "remaining_time": "0:02:01"} |
|
{"current_steps": 846, "total_steps": 855, "loss": 0.0046, "lr": 3.3792721357489565e-08, "epoch": 4.925764192139738, "percentage": 98.95, "elapsed_time": "2:50:46", "remaining_time": "0:01:49"} |
|
{"current_steps": 847, "total_steps": 855, "loss": 0.0045, "lr": 2.670105312926885e-08, "epoch": 4.931586608442504, "percentage": 99.06, "elapsed_time": "2:50:57", "remaining_time": "0:01:36"} |
|
{"current_steps": 848, "total_steps": 855, "loss": 0.0047, "lr": 2.0443420296101246e-08, "epoch": 4.9374090247452695, "percentage": 99.18, "elapsed_time": "2:51:07", "remaining_time": "0:01:24"} |
|
{"current_steps": 849, "total_steps": 855, "loss": 0.0047, "lr": 1.5019927295506497e-08, "epoch": 4.9432314410480345, "percentage": 99.3, "elapsed_time": "2:51:18", "remaining_time": "0:01:12"} |
|
{"current_steps": 850, "total_steps": 855, "loss": 0.0047, "lr": 1.0430664643529265e-08, "epoch": 4.9490538573508, "percentage": 99.42, "elapsed_time": "2:51:28", "remaining_time": "0:01:00"} |
|
{"current_steps": 850, "total_steps": 855, "eval_loss": 0.005704044830054045, "epoch": 4.9490538573508, "percentage": 99.42, "elapsed_time": "2:51:34", "remaining_time": "0:01:00"} |
|
{"current_steps": 851, "total_steps": 855, "loss": 0.0042, "lr": 6.675708933212566e-09, "epoch": 4.954876273653566, "percentage": 99.53, "elapsed_time": "2:52:35", "remaining_time": "0:00:48"} |
|
{"current_steps": 852, "total_steps": 855, "loss": 0.0045, "lr": 3.75512283335433e-09, "epoch": 4.960698689956332, "percentage": 99.65, "elapsed_time": "2:52:45", "remaining_time": "0:00:36"} |
|
{"current_steps": 853, "total_steps": 855, "loss": 0.0047, "lr": 1.668955087413826e-09, "epoch": 4.966521106259098, "percentage": 99.77, "elapsed_time": "2:52:55", "remaining_time": "0:00:24"} |
|
{"current_steps": 854, "total_steps": 855, "loss": 0.0047, "lr": 4.1724051275116027e-10, "epoch": 4.9723435225618635, "percentage": 99.88, "elapsed_time": "2:53:06", "remaining_time": "0:00:12"} |
|
{"current_steps": 855, "total_steps": 855, "loss": 0.0044, "lr": 0.0, "epoch": 4.978165938864628, "percentage": 100.0, "elapsed_time": "2:53:16", "remaining_time": "0:00:00"} |
|
{"current_steps": 855, "total_steps": 855, "eval_loss": 0.005699900444597006, "epoch": 4.978165938864628, "percentage": 100.0, "elapsed_time": "2:53:22", "remaining_time": "0:00:00"} |
|
{"current_steps": 855, "total_steps": 855, "epoch": 4.978165938864628, "percentage": 100.0, "elapsed_time": "2:53:48", "remaining_time": "0:00:00"} |
|
|