SKNahin commited on
Commit
5c5f9ff
1 Parent(s): 72cb103

Training in progress, step 1600

Browse files
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b611eaa12c86199fb759562b68ddf8fc8045d34f4cec519507f8497625934838
3
  size 4988025760
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:862d68c8006a4fbdd0323284c813809aa4fd77bc46faa1a4fd5ec47e178eb47c
3
  size 4988025760
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8093a616bf606c1984df70055bc021359d7dfe4b78a50adfed86be2da4a0d02e
3
  size 240691728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65b2a08317c67e89b0d39a2cfc3a47c493676cf5759947401a9325c00e94b7a0
3
  size 240691728
trainer_log.jsonl CHANGED
@@ -1210,3 +1210,403 @@
1210
  {"current_steps": 1210, "total_steps": 3906, "loss": 1.3978, "learning_rate": 3.162118822615485e-05, "epoch": 0.30976, "percentage": 30.98, "elapsed_time": "4:26:55", "remaining_time": "9:54:44"}
1211
  {"current_steps": 1211, "total_steps": 3906, "loss": 1.3983, "learning_rate": 3.1607957178003874e-05, "epoch": 0.310016, "percentage": 31.0, "elapsed_time": "4:27:08", "remaining_time": "9:54:31"}
1212
  {"current_steps": 1212, "total_steps": 3906, "loss": 1.4291, "learning_rate": 3.1594718464505896e-05, "epoch": 0.310272, "percentage": 31.03, "elapsed_time": "4:27:22", "remaining_time": "9:54:18"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1210
  {"current_steps": 1210, "total_steps": 3906, "loss": 1.3978, "learning_rate": 3.162118822615485e-05, "epoch": 0.30976, "percentage": 30.98, "elapsed_time": "4:26:55", "remaining_time": "9:54:44"}
1211
  {"current_steps": 1211, "total_steps": 3906, "loss": 1.3983, "learning_rate": 3.1607957178003874e-05, "epoch": 0.310016, "percentage": 31.0, "elapsed_time": "4:27:08", "remaining_time": "9:54:31"}
1212
  {"current_steps": 1212, "total_steps": 3906, "loss": 1.4291, "learning_rate": 3.1594718464505896e-05, "epoch": 0.310272, "percentage": 31.03, "elapsed_time": "4:27:22", "remaining_time": "9:54:18"}
1213
+ {"current_steps": 1213, "total_steps": 3906, "loss": 1.4169, "learning_rate": 3.158147209440315e-05, "epoch": 0.310528, "percentage": 31.05, "elapsed_time": "4:27:35", "remaining_time": "9:54:04"}
1214
+ {"current_steps": 1214, "total_steps": 3906, "loss": 1.4024, "learning_rate": 3.1568218076442904e-05, "epoch": 0.310784, "percentage": 31.08, "elapsed_time": "4:27:48", "remaining_time": "9:53:51"}
1215
+ {"current_steps": 1215, "total_steps": 3906, "loss": 1.3848, "learning_rate": 3.1554956419377476e-05, "epoch": 0.31104, "percentage": 31.11, "elapsed_time": "4:28:01", "remaining_time": "9:53:38"}
1216
+ {"current_steps": 1216, "total_steps": 3906, "loss": 1.3952, "learning_rate": 3.154168713196426e-05, "epoch": 0.311296, "percentage": 31.13, "elapsed_time": "4:28:14", "remaining_time": "9:53:24"}
1217
+ {"current_steps": 1217, "total_steps": 3906, "loss": 1.4513, "learning_rate": 3.1528410222965664e-05, "epoch": 0.311552, "percentage": 31.16, "elapsed_time": "4:28:28", "remaining_time": "9:53:11"}
1218
+ {"current_steps": 1218, "total_steps": 3906, "loss": 1.4055, "learning_rate": 3.151512570114911e-05, "epoch": 0.311808, "percentage": 31.18, "elapsed_time": "4:28:41", "remaining_time": "9:52:57"}
1219
+ {"current_steps": 1219, "total_steps": 3906, "loss": 1.3911, "learning_rate": 3.150183357528709e-05, "epoch": 0.312064, "percentage": 31.21, "elapsed_time": "4:28:54", "remaining_time": "9:52:44"}
1220
+ {"current_steps": 1220, "total_steps": 3906, "loss": 1.4421, "learning_rate": 3.1488533854157096e-05, "epoch": 0.31232, "percentage": 31.23, "elapsed_time": "4:29:07", "remaining_time": "9:52:31"}
1221
+ {"current_steps": 1221, "total_steps": 3906, "loss": 1.4059, "learning_rate": 3.1475226546541624e-05, "epoch": 0.312576, "percentage": 31.26, "elapsed_time": "4:29:20", "remaining_time": "9:52:17"}
1222
+ {"current_steps": 1222, "total_steps": 3906, "loss": 1.3935, "learning_rate": 3.14619116612282e-05, "epoch": 0.312832, "percentage": 31.29, "elapsed_time": "4:29:33", "remaining_time": "9:52:04"}
1223
+ {"current_steps": 1223, "total_steps": 3906, "loss": 1.367, "learning_rate": 3.144858920700935e-05, "epoch": 0.313088, "percentage": 31.31, "elapsed_time": "4:29:47", "remaining_time": "9:51:51"}
1224
+ {"current_steps": 1224, "total_steps": 3906, "loss": 1.3806, "learning_rate": 3.1435259192682575e-05, "epoch": 0.313344, "percentage": 31.34, "elapsed_time": "4:30:00", "remaining_time": "9:51:37"}
1225
+ {"current_steps": 1225, "total_steps": 3906, "loss": 1.3536, "learning_rate": 3.1421921627050416e-05, "epoch": 0.3136, "percentage": 31.36, "elapsed_time": "4:30:13", "remaining_time": "9:51:24"}
1226
+ {"current_steps": 1226, "total_steps": 3906, "loss": 1.3924, "learning_rate": 3.1408576518920346e-05, "epoch": 0.313856, "percentage": 31.39, "elapsed_time": "4:30:26", "remaining_time": "9:51:10"}
1227
+ {"current_steps": 1227, "total_steps": 3906, "loss": 1.3767, "learning_rate": 3.139522387710485e-05, "epoch": 0.314112, "percentage": 31.41, "elapsed_time": "4:30:39", "remaining_time": "9:50:57"}
1228
+ {"current_steps": 1228, "total_steps": 3906, "loss": 1.4227, "learning_rate": 3.13818637104214e-05, "epoch": 0.314368, "percentage": 31.44, "elapsed_time": "4:30:52", "remaining_time": "9:50:43"}
1229
+ {"current_steps": 1229, "total_steps": 3906, "loss": 1.3923, "learning_rate": 3.13684960276924e-05, "epoch": 0.314624, "percentage": 31.46, "elapsed_time": "4:31:05", "remaining_time": "9:50:30"}
1230
+ {"current_steps": 1230, "total_steps": 3906, "loss": 1.4874, "learning_rate": 3.135512083774524e-05, "epoch": 0.31488, "percentage": 31.49, "elapsed_time": "4:31:19", "remaining_time": "9:50:17"}
1231
+ {"current_steps": 1231, "total_steps": 3906, "loss": 1.434, "learning_rate": 3.134173814941227e-05, "epoch": 0.315136, "percentage": 31.52, "elapsed_time": "4:31:32", "remaining_time": "9:50:03"}
1232
+ {"current_steps": 1232, "total_steps": 3906, "loss": 1.4046, "learning_rate": 3.132834797153079e-05, "epoch": 0.315392, "percentage": 31.54, "elapsed_time": "4:31:45", "remaining_time": "9:49:50"}
1233
+ {"current_steps": 1233, "total_steps": 3906, "loss": 1.4447, "learning_rate": 3.131495031294303e-05, "epoch": 0.315648, "percentage": 31.57, "elapsed_time": "4:31:58", "remaining_time": "9:49:37"}
1234
+ {"current_steps": 1234, "total_steps": 3906, "loss": 1.4225, "learning_rate": 3.130154518249617e-05, "epoch": 0.315904, "percentage": 31.59, "elapsed_time": "4:32:11", "remaining_time": "9:49:23"}
1235
+ {"current_steps": 1235, "total_steps": 3906, "loss": 1.4147, "learning_rate": 3.1288132589042335e-05, "epoch": 0.31616, "percentage": 31.62, "elapsed_time": "4:32:25", "remaining_time": "9:49:10"}
1236
+ {"current_steps": 1236, "total_steps": 3906, "loss": 1.4012, "learning_rate": 3.1274712541438564e-05, "epoch": 0.316416, "percentage": 31.64, "elapsed_time": "4:32:38", "remaining_time": "9:48:57"}
1237
+ {"current_steps": 1237, "total_steps": 3906, "loss": 1.4041, "learning_rate": 3.126128504854682e-05, "epoch": 0.316672, "percentage": 31.67, "elapsed_time": "4:32:51", "remaining_time": "9:48:43"}
1238
+ {"current_steps": 1238, "total_steps": 3906, "loss": 1.4056, "learning_rate": 3.1247850119233995e-05, "epoch": 0.316928, "percentage": 31.69, "elapsed_time": "4:33:04", "remaining_time": "9:48:30"}
1239
+ {"current_steps": 1239, "total_steps": 3906, "loss": 1.41, "learning_rate": 3.1234407762371875e-05, "epoch": 0.317184, "percentage": 31.72, "elapsed_time": "4:33:17", "remaining_time": "9:48:16"}
1240
+ {"current_steps": 1240, "total_steps": 3906, "loss": 1.4256, "learning_rate": 3.1220957986837165e-05, "epoch": 0.31744, "percentage": 31.75, "elapsed_time": "4:33:30", "remaining_time": "9:48:03"}
1241
+ {"current_steps": 1241, "total_steps": 3906, "loss": 1.3845, "learning_rate": 3.120750080151145e-05, "epoch": 0.317696, "percentage": 31.77, "elapsed_time": "4:33:44", "remaining_time": "9:47:50"}
1242
+ {"current_steps": 1242, "total_steps": 3906, "loss": 1.3805, "learning_rate": 3.119403621528122e-05, "epoch": 0.317952, "percentage": 31.8, "elapsed_time": "4:33:57", "remaining_time": "9:47:36"}
1243
+ {"current_steps": 1243, "total_steps": 3906, "loss": 1.4314, "learning_rate": 3.118056423703787e-05, "epoch": 0.318208, "percentage": 31.82, "elapsed_time": "4:34:10", "remaining_time": "9:47:23"}
1244
+ {"current_steps": 1244, "total_steps": 3906, "loss": 1.4102, "learning_rate": 3.116708487567764e-05, "epoch": 0.318464, "percentage": 31.85, "elapsed_time": "4:34:23", "remaining_time": "9:47:10"}
1245
+ {"current_steps": 1245, "total_steps": 3906, "loss": 1.3789, "learning_rate": 3.1153598140101676e-05, "epoch": 0.31872, "percentage": 31.87, "elapsed_time": "4:34:36", "remaining_time": "9:46:57"}
1246
+ {"current_steps": 1246, "total_steps": 3906, "loss": 1.4489, "learning_rate": 3.114010403921597e-05, "epoch": 0.318976, "percentage": 31.9, "elapsed_time": "4:34:50", "remaining_time": "9:46:43"}
1247
+ {"current_steps": 1247, "total_steps": 3906, "loss": 1.4098, "learning_rate": 3.11266025819314e-05, "epoch": 0.319232, "percentage": 31.93, "elapsed_time": "4:35:03", "remaining_time": "9:46:30"}
1248
+ {"current_steps": 1248, "total_steps": 3906, "loss": 1.4293, "learning_rate": 3.1113093777163686e-05, "epoch": 0.319488, "percentage": 31.95, "elapsed_time": "4:35:16", "remaining_time": "9:46:17"}
1249
+ {"current_steps": 1249, "total_steps": 3906, "loss": 1.364, "learning_rate": 3.1099577633833406e-05, "epoch": 0.319744, "percentage": 31.98, "elapsed_time": "4:35:29", "remaining_time": "9:46:03"}
1250
+ {"current_steps": 1250, "total_steps": 3906, "loss": 1.4582, "learning_rate": 3.1086054160865985e-05, "epoch": 0.32, "percentage": 32.0, "elapsed_time": "4:35:42", "remaining_time": "9:45:50"}
1251
+ {"current_steps": 1251, "total_steps": 3906, "loss": 1.4147, "learning_rate": 3.107252336719168e-05, "epoch": 0.320256, "percentage": 32.03, "elapsed_time": "4:35:55", "remaining_time": "9:45:36"}
1252
+ {"current_steps": 1252, "total_steps": 3906, "loss": 1.4306, "learning_rate": 3.1058985261745596e-05, "epoch": 0.320512, "percentage": 32.05, "elapsed_time": "4:36:09", "remaining_time": "9:45:23"}
1253
+ {"current_steps": 1253, "total_steps": 3906, "loss": 1.4376, "learning_rate": 3.104543985346765e-05, "epoch": 0.320768, "percentage": 32.08, "elapsed_time": "4:36:22", "remaining_time": "9:45:09"}
1254
+ {"current_steps": 1254, "total_steps": 3906, "loss": 1.4405, "learning_rate": 3.10318871513026e-05, "epoch": 0.321024, "percentage": 32.1, "elapsed_time": "4:36:35", "remaining_time": "9:44:56"}
1255
+ {"current_steps": 1255, "total_steps": 3906, "loss": 1.4103, "learning_rate": 3.101832716420001e-05, "epoch": 0.32128, "percentage": 32.13, "elapsed_time": "4:36:48", "remaining_time": "9:44:43"}
1256
+ {"current_steps": 1256, "total_steps": 3906, "loss": 1.4084, "learning_rate": 3.1004759901114245e-05, "epoch": 0.321536, "percentage": 32.16, "elapsed_time": "4:37:01", "remaining_time": "9:44:30"}
1257
+ {"current_steps": 1257, "total_steps": 3906, "loss": 1.3816, "learning_rate": 3.09911853710045e-05, "epoch": 0.321792, "percentage": 32.18, "elapsed_time": "4:37:15", "remaining_time": "9:44:16"}
1258
+ {"current_steps": 1258, "total_steps": 3906, "loss": 1.3757, "learning_rate": 3.097760358283473e-05, "epoch": 0.322048, "percentage": 32.21, "elapsed_time": "4:37:28", "remaining_time": "9:44:03"}
1259
+ {"current_steps": 1259, "total_steps": 3906, "loss": 1.4663, "learning_rate": 3.096401454557374e-05, "epoch": 0.322304, "percentage": 32.23, "elapsed_time": "4:37:41", "remaining_time": "9:43:50"}
1260
+ {"current_steps": 1260, "total_steps": 3906, "loss": 1.4102, "learning_rate": 3.095041826819506e-05, "epoch": 0.32256, "percentage": 32.26, "elapsed_time": "4:37:54", "remaining_time": "9:43:36"}
1261
+ {"current_steps": 1261, "total_steps": 3906, "loss": 1.3755, "learning_rate": 3.093681475967705e-05, "epoch": 0.322816, "percentage": 32.28, "elapsed_time": "4:38:07", "remaining_time": "9:43:23"}
1262
+ {"current_steps": 1262, "total_steps": 3906, "loss": 1.4312, "learning_rate": 3.0923204029002815e-05, "epoch": 0.323072, "percentage": 32.31, "elapsed_time": "4:38:20", "remaining_time": "9:43:09"}
1263
+ {"current_steps": 1263, "total_steps": 3906, "loss": 1.3619, "learning_rate": 3.090958608516023e-05, "epoch": 0.323328, "percentage": 32.33, "elapsed_time": "4:38:34", "remaining_time": "9:42:56"}
1264
+ {"current_steps": 1264, "total_steps": 3906, "loss": 1.4412, "learning_rate": 3.089596093714196e-05, "epoch": 0.323584, "percentage": 32.36, "elapsed_time": "4:38:47", "remaining_time": "9:42:43"}
1265
+ {"current_steps": 1265, "total_steps": 3906, "loss": 1.3637, "learning_rate": 3.088232859394541e-05, "epoch": 0.32384, "percentage": 32.39, "elapsed_time": "4:39:00", "remaining_time": "9:42:29"}
1266
+ {"current_steps": 1266, "total_steps": 3906, "loss": 1.4028, "learning_rate": 3.086868906457271e-05, "epoch": 0.324096, "percentage": 32.41, "elapsed_time": "4:39:13", "remaining_time": "9:42:16"}
1267
+ {"current_steps": 1267, "total_steps": 3906, "loss": 1.3657, "learning_rate": 3.0855042358030795e-05, "epoch": 0.324352, "percentage": 32.44, "elapsed_time": "4:39:26", "remaining_time": "9:42:03"}
1268
+ {"current_steps": 1268, "total_steps": 3906, "loss": 1.3671, "learning_rate": 3.0841388483331284e-05, "epoch": 0.324608, "percentage": 32.46, "elapsed_time": "4:39:40", "remaining_time": "9:41:49"}
1269
+ {"current_steps": 1269, "total_steps": 3906, "loss": 1.3774, "learning_rate": 3.082772744949056e-05, "epoch": 0.324864, "percentage": 32.49, "elapsed_time": "4:39:53", "remaining_time": "9:41:36"}
1270
+ {"current_steps": 1270, "total_steps": 3906, "loss": 1.3822, "learning_rate": 3.0814059265529726e-05, "epoch": 0.32512, "percentage": 32.51, "elapsed_time": "4:40:06", "remaining_time": "9:41:22"}
1271
+ {"current_steps": 1271, "total_steps": 3906, "loss": 1.4003, "learning_rate": 3.08003839404746e-05, "epoch": 0.325376, "percentage": 32.54, "elapsed_time": "4:40:19", "remaining_time": "9:41:09"}
1272
+ {"current_steps": 1272, "total_steps": 3906, "loss": 1.4432, "learning_rate": 3.0786701483355716e-05, "epoch": 0.325632, "percentage": 32.57, "elapsed_time": "4:40:32", "remaining_time": "9:40:56"}
1273
+ {"current_steps": 1273, "total_steps": 3906, "loss": 1.4062, "learning_rate": 3.077301190320834e-05, "epoch": 0.325888, "percentage": 32.59, "elapsed_time": "4:40:45", "remaining_time": "9:40:42"}
1274
+ {"current_steps": 1274, "total_steps": 3906, "loss": 1.4306, "learning_rate": 3.075931520907241e-05, "epoch": 0.326144, "percentage": 32.62, "elapsed_time": "4:40:58", "remaining_time": "9:40:29"}
1275
+ {"current_steps": 1275, "total_steps": 3906, "loss": 1.4227, "learning_rate": 3.074561140999258e-05, "epoch": 0.3264, "percentage": 32.64, "elapsed_time": "4:41:12", "remaining_time": "9:40:16"}
1276
+ {"current_steps": 1276, "total_steps": 3906, "loss": 1.4058, "learning_rate": 3.073190051501819e-05, "epoch": 0.326656, "percentage": 32.67, "elapsed_time": "4:41:25", "remaining_time": "9:40:02"}
1277
+ {"current_steps": 1277, "total_steps": 3906, "loss": 1.4032, "learning_rate": 3.071818253320328e-05, "epoch": 0.326912, "percentage": 32.69, "elapsed_time": "4:41:38", "remaining_time": "9:39:49"}
1278
+ {"current_steps": 1278, "total_steps": 3906, "loss": 1.4103, "learning_rate": 3.070445747360654e-05, "epoch": 0.327168, "percentage": 32.72, "elapsed_time": "4:41:51", "remaining_time": "9:39:36"}
1279
+ {"current_steps": 1279, "total_steps": 3906, "loss": 1.459, "learning_rate": 3.0690725345291364e-05, "epoch": 0.327424, "percentage": 32.74, "elapsed_time": "4:42:05", "remaining_time": "9:39:23"}
1280
+ {"current_steps": 1280, "total_steps": 3906, "loss": 1.4052, "learning_rate": 3.06769861573258e-05, "epoch": 0.32768, "percentage": 32.77, "elapsed_time": "4:42:18", "remaining_time": "9:39:09"}
1281
+ {"current_steps": 1281, "total_steps": 3906, "loss": 1.4315, "learning_rate": 3.0663239918782555e-05, "epoch": 0.327936, "percentage": 32.8, "elapsed_time": "4:42:31", "remaining_time": "9:38:56"}
1282
+ {"current_steps": 1282, "total_steps": 3906, "loss": 1.3906, "learning_rate": 3.0649486638738994e-05, "epoch": 0.328192, "percentage": 32.82, "elapsed_time": "4:42:44", "remaining_time": "9:38:43"}
1283
+ {"current_steps": 1283, "total_steps": 3906, "loss": 1.4242, "learning_rate": 3.0635726326277145e-05, "epoch": 0.328448, "percentage": 32.85, "elapsed_time": "4:42:58", "remaining_time": "9:38:30"}
1284
+ {"current_steps": 1284, "total_steps": 3906, "loss": 1.4153, "learning_rate": 3.062195899048365e-05, "epoch": 0.328704, "percentage": 32.87, "elapsed_time": "4:43:11", "remaining_time": "9:38:18"}
1285
+ {"current_steps": 1285, "total_steps": 3906, "loss": 1.3687, "learning_rate": 3.060818464044984e-05, "epoch": 0.32896, "percentage": 32.9, "elapsed_time": "4:43:24", "remaining_time": "9:38:04"}
1286
+ {"current_steps": 1286, "total_steps": 3906, "loss": 1.4451, "learning_rate": 3.0594403285271604e-05, "epoch": 0.329216, "percentage": 32.92, "elapsed_time": "4:43:38", "remaining_time": "9:37:51"}
1287
+ {"current_steps": 1287, "total_steps": 3906, "loss": 1.4418, "learning_rate": 3.0580614934049524e-05, "epoch": 0.329472, "percentage": 32.95, "elapsed_time": "4:43:51", "remaining_time": "9:37:38"}
1288
+ {"current_steps": 1288, "total_steps": 3906, "loss": 1.3672, "learning_rate": 3.0566819595888775e-05, "epoch": 0.329728, "percentage": 32.97, "elapsed_time": "4:44:04", "remaining_time": "9:37:25"}
1289
+ {"current_steps": 1289, "total_steps": 3906, "loss": 1.3802, "learning_rate": 3.055301727989914e-05, "epoch": 0.329984, "percentage": 33.0, "elapsed_time": "4:44:18", "remaining_time": "9:37:12"}
1290
+ {"current_steps": 1290, "total_steps": 3906, "loss": 1.4245, "learning_rate": 3.053920799519502e-05, "epoch": 0.33024, "percentage": 33.03, "elapsed_time": "4:44:31", "remaining_time": "9:36:59"}
1291
+ {"current_steps": 1291, "total_steps": 3906, "loss": 1.4043, "learning_rate": 3.0525391750895426e-05, "epoch": 0.330496, "percentage": 33.05, "elapsed_time": "4:44:44", "remaining_time": "9:36:45"}
1292
+ {"current_steps": 1292, "total_steps": 3906, "loss": 1.4273, "learning_rate": 3.0511568556123934e-05, "epoch": 0.330752, "percentage": 33.08, "elapsed_time": "4:44:57", "remaining_time": "9:36:32"}
1293
+ {"current_steps": 1293, "total_steps": 3906, "loss": 1.4695, "learning_rate": 3.049773842000874e-05, "epoch": 0.331008, "percentage": 33.1, "elapsed_time": "4:45:10", "remaining_time": "9:36:19"}
1294
+ {"current_steps": 1294, "total_steps": 3906, "loss": 1.3931, "learning_rate": 3.0483901351682612e-05, "epoch": 0.331264, "percentage": 33.13, "elapsed_time": "4:45:24", "remaining_time": "9:36:05"}
1295
+ {"current_steps": 1295, "total_steps": 3906, "loss": 1.4059, "learning_rate": 3.0470057360282896e-05, "epoch": 0.33152, "percentage": 33.15, "elapsed_time": "4:45:37", "remaining_time": "9:35:52"}
1296
+ {"current_steps": 1296, "total_steps": 3906, "loss": 1.4334, "learning_rate": 3.0456206454951514e-05, "epoch": 0.331776, "percentage": 33.18, "elapsed_time": "4:45:50", "remaining_time": "9:35:39"}
1297
+ {"current_steps": 1297, "total_steps": 3906, "loss": 1.4683, "learning_rate": 3.0442348644834944e-05, "epoch": 0.332032, "percentage": 33.21, "elapsed_time": "4:46:03", "remaining_time": "9:35:26"}
1298
+ {"current_steps": 1298, "total_steps": 3906, "loss": 1.3984, "learning_rate": 3.042848393908423e-05, "epoch": 0.332288, "percentage": 33.23, "elapsed_time": "4:46:16", "remaining_time": "9:35:12"}
1299
+ {"current_steps": 1299, "total_steps": 3906, "loss": 1.4095, "learning_rate": 3.0414612346854972e-05, "epoch": 0.332544, "percentage": 33.26, "elapsed_time": "4:46:30", "remaining_time": "9:34:59"}
1300
+ {"current_steps": 1300, "total_steps": 3906, "loss": 1.4433, "learning_rate": 3.0400733877307316e-05, "epoch": 0.3328, "percentage": 33.28, "elapsed_time": "4:46:43", "remaining_time": "9:34:46"}
1301
+ {"current_steps": 1301, "total_steps": 3906, "loss": 1.3945, "learning_rate": 3.0386848539605947e-05, "epoch": 0.333056, "percentage": 33.31, "elapsed_time": "4:46:56", "remaining_time": "9:34:33"}
1302
+ {"current_steps": 1302, "total_steps": 3906, "loss": 1.4524, "learning_rate": 3.0372956342920088e-05, "epoch": 0.333312, "percentage": 33.33, "elapsed_time": "4:47:10", "remaining_time": "9:34:20"}
1303
+ {"current_steps": 1303, "total_steps": 3906, "loss": 1.3809, "learning_rate": 3.0359057296423487e-05, "epoch": 0.333568, "percentage": 33.36, "elapsed_time": "4:47:23", "remaining_time": "9:34:07"}
1304
+ {"current_steps": 1304, "total_steps": 3906, "loss": 1.3242, "learning_rate": 3.034515140929442e-05, "epoch": 0.333824, "percentage": 33.38, "elapsed_time": "4:47:36", "remaining_time": "9:33:54"}
1305
+ {"current_steps": 1305, "total_steps": 3906, "loss": 1.3987, "learning_rate": 3.0331238690715676e-05, "epoch": 0.33408, "percentage": 33.41, "elapsed_time": "4:47:49", "remaining_time": "9:33:40"}
1306
+ {"current_steps": 1306, "total_steps": 3906, "loss": 1.3937, "learning_rate": 3.0317319149874556e-05, "epoch": 0.334336, "percentage": 33.44, "elapsed_time": "4:48:02", "remaining_time": "9:33:27"}
1307
+ {"current_steps": 1307, "total_steps": 3906, "loss": 1.4053, "learning_rate": 3.0303392795962878e-05, "epoch": 0.334592, "percentage": 33.46, "elapsed_time": "4:48:16", "remaining_time": "9:33:13"}
1308
+ {"current_steps": 1308, "total_steps": 3906, "loss": 1.3845, "learning_rate": 3.028945963817694e-05, "epoch": 0.334848, "percentage": 33.49, "elapsed_time": "4:48:29", "remaining_time": "9:33:00"}
1309
+ {"current_steps": 1309, "total_steps": 3906, "loss": 1.4014, "learning_rate": 3.0275519685717546e-05, "epoch": 0.335104, "percentage": 33.51, "elapsed_time": "4:48:42", "remaining_time": "9:32:46"}
1310
+ {"current_steps": 1310, "total_steps": 3906, "loss": 1.3781, "learning_rate": 3.0261572947789975e-05, "epoch": 0.33536, "percentage": 33.54, "elapsed_time": "4:48:55", "remaining_time": "9:32:33"}
1311
+ {"current_steps": 1311, "total_steps": 3906, "loss": 1.4144, "learning_rate": 3.0247619433604e-05, "epoch": 0.335616, "percentage": 33.56, "elapsed_time": "4:49:08", "remaining_time": "9:32:20"}
1312
+ {"current_steps": 1312, "total_steps": 3906, "loss": 1.4027, "learning_rate": 3.0233659152373868e-05, "epoch": 0.335872, "percentage": 33.59, "elapsed_time": "4:49:21", "remaining_time": "9:32:06"}
1313
+ {"current_steps": 1313, "total_steps": 3906, "loss": 1.4412, "learning_rate": 3.0219692113318283e-05, "epoch": 0.336128, "percentage": 33.61, "elapsed_time": "4:49:35", "remaining_time": "9:31:53"}
1314
+ {"current_steps": 1314, "total_steps": 3906, "loss": 1.4148, "learning_rate": 3.0205718325660414e-05, "epoch": 0.336384, "percentage": 33.64, "elapsed_time": "4:49:48", "remaining_time": "9:31:39"}
1315
+ {"current_steps": 1315, "total_steps": 3906, "loss": 1.4019, "learning_rate": 3.01917377986279e-05, "epoch": 0.33664, "percentage": 33.67, "elapsed_time": "4:50:01", "remaining_time": "9:31:26"}
1316
+ {"current_steps": 1316, "total_steps": 3906, "loss": 1.3879, "learning_rate": 3.0177750541452826e-05, "epoch": 0.336896, "percentage": 33.69, "elapsed_time": "4:50:14", "remaining_time": "9:31:12"}
1317
+ {"current_steps": 1317, "total_steps": 3906, "loss": 1.3705, "learning_rate": 3.0163756563371697e-05, "epoch": 0.337152, "percentage": 33.72, "elapsed_time": "4:50:27", "remaining_time": "9:30:59"}
1318
+ {"current_steps": 1318, "total_steps": 3906, "loss": 1.4404, "learning_rate": 3.0149755873625486e-05, "epoch": 0.337408, "percentage": 33.74, "elapsed_time": "4:50:40", "remaining_time": "9:30:46"}
1319
+ {"current_steps": 1319, "total_steps": 3906, "loss": 1.4013, "learning_rate": 3.01357484814596e-05, "epoch": 0.337664, "percentage": 33.77, "elapsed_time": "4:50:53", "remaining_time": "9:30:32"}
1320
+ {"current_steps": 1320, "total_steps": 3906, "loss": 1.3926, "learning_rate": 3.0121734396123848e-05, "epoch": 0.33792, "percentage": 33.79, "elapsed_time": "4:51:07", "remaining_time": "9:30:19"}
1321
+ {"current_steps": 1321, "total_steps": 3906, "loss": 1.4442, "learning_rate": 3.010771362687246e-05, "epoch": 0.338176, "percentage": 33.82, "elapsed_time": "4:51:20", "remaining_time": "9:30:06"}
1322
+ {"current_steps": 1322, "total_steps": 3906, "loss": 1.4205, "learning_rate": 3.0093686182964102e-05, "epoch": 0.338432, "percentage": 33.85, "elapsed_time": "4:51:33", "remaining_time": "9:29:53"}
1323
+ {"current_steps": 1323, "total_steps": 3906, "loss": 1.3799, "learning_rate": 3.0079652073661846e-05, "epoch": 0.338688, "percentage": 33.87, "elapsed_time": "4:51:46", "remaining_time": "9:29:39"}
1324
+ {"current_steps": 1324, "total_steps": 3906, "loss": 1.475, "learning_rate": 3.0065611308233134e-05, "epoch": 0.338944, "percentage": 33.9, "elapsed_time": "4:51:59", "remaining_time": "9:29:26"}
1325
+ {"current_steps": 1325, "total_steps": 3906, "loss": 1.3881, "learning_rate": 3.0051563895949836e-05, "epoch": 0.3392, "percentage": 33.92, "elapsed_time": "4:52:13", "remaining_time": "9:29:12"}
1326
+ {"current_steps": 1326, "total_steps": 3906, "loss": 1.4598, "learning_rate": 3.0037509846088197e-05, "epoch": 0.339456, "percentage": 33.95, "elapsed_time": "4:52:26", "remaining_time": "9:28:59"}
1327
+ {"current_steps": 1327, "total_steps": 3906, "loss": 1.3696, "learning_rate": 3.0023449167928854e-05, "epoch": 0.339712, "percentage": 33.97, "elapsed_time": "4:52:39", "remaining_time": "9:28:46"}
1328
+ {"current_steps": 1328, "total_steps": 3906, "loss": 1.3955, "learning_rate": 3.0009381870756808e-05, "epoch": 0.339968, "percentage": 34.0, "elapsed_time": "4:52:52", "remaining_time": "9:28:32"}
1329
+ {"current_steps": 1329, "total_steps": 3906, "loss": 1.4023, "learning_rate": 2.9995307963861443e-05, "epoch": 0.340224, "percentage": 34.02, "elapsed_time": "4:53:05", "remaining_time": "9:28:19"}
1330
+ {"current_steps": 1330, "total_steps": 3906, "loss": 1.3582, "learning_rate": 2.9981227456536502e-05, "epoch": 0.34048, "percentage": 34.05, "elapsed_time": "4:53:18", "remaining_time": "9:28:06"}
1331
+ {"current_steps": 1331, "total_steps": 3906, "loss": 1.3384, "learning_rate": 2.996714035808008e-05, "epoch": 0.340736, "percentage": 34.08, "elapsed_time": "4:53:32", "remaining_time": "9:27:52"}
1332
+ {"current_steps": 1332, "total_steps": 3906, "loss": 1.3892, "learning_rate": 2.9953046677794648e-05, "epoch": 0.340992, "percentage": 34.1, "elapsed_time": "4:53:45", "remaining_time": "9:27:39"}
1333
+ {"current_steps": 1333, "total_steps": 3906, "loss": 1.3885, "learning_rate": 2.993894642498699e-05, "epoch": 0.341248, "percentage": 34.13, "elapsed_time": "4:53:58", "remaining_time": "9:27:26"}
1334
+ {"current_steps": 1334, "total_steps": 3906, "loss": 1.3966, "learning_rate": 2.9924839608968254e-05, "epoch": 0.341504, "percentage": 34.15, "elapsed_time": "4:54:11", "remaining_time": "9:27:12"}
1335
+ {"current_steps": 1335, "total_steps": 3906, "loss": 1.3983, "learning_rate": 2.991072623905392e-05, "epoch": 0.34176, "percentage": 34.18, "elapsed_time": "4:54:24", "remaining_time": "9:26:59"}
1336
+ {"current_steps": 1336, "total_steps": 3906, "loss": 1.4132, "learning_rate": 2.989660632456379e-05, "epoch": 0.342016, "percentage": 34.2, "elapsed_time": "4:54:37", "remaining_time": "9:26:46"}
1337
+ {"current_steps": 1337, "total_steps": 3906, "loss": 1.3827, "learning_rate": 2.988247987482198e-05, "epoch": 0.342272, "percentage": 34.23, "elapsed_time": "4:54:51", "remaining_time": "9:26:32"}
1338
+ {"current_steps": 1338, "total_steps": 3906, "loss": 1.3821, "learning_rate": 2.9868346899156938e-05, "epoch": 0.342528, "percentage": 34.25, "elapsed_time": "4:55:04", "remaining_time": "9:26:19"}
1339
+ {"current_steps": 1339, "total_steps": 3906, "loss": 1.4158, "learning_rate": 2.9854207406901413e-05, "epoch": 0.342784, "percentage": 34.28, "elapsed_time": "4:55:17", "remaining_time": "9:26:06"}
1340
+ {"current_steps": 1340, "total_steps": 3906, "loss": 1.3897, "learning_rate": 2.984006140739246e-05, "epoch": 0.34304, "percentage": 34.31, "elapsed_time": "4:55:30", "remaining_time": "9:25:52"}
1341
+ {"current_steps": 1341, "total_steps": 3906, "loss": 1.4366, "learning_rate": 2.982590890997143e-05, "epoch": 0.343296, "percentage": 34.33, "elapsed_time": "4:55:43", "remaining_time": "9:25:39"}
1342
+ {"current_steps": 1342, "total_steps": 3906, "loss": 1.4035, "learning_rate": 2.9811749923983958e-05, "epoch": 0.343552, "percentage": 34.36, "elapsed_time": "4:55:56", "remaining_time": "9:25:26"}
1343
+ {"current_steps": 1343, "total_steps": 3906, "loss": 1.418, "learning_rate": 2.9797584458779973e-05, "epoch": 0.343808, "percentage": 34.38, "elapsed_time": "4:56:10", "remaining_time": "9:25:12"}
1344
+ {"current_steps": 1344, "total_steps": 3906, "loss": 1.366, "learning_rate": 2.9783412523713688e-05, "epoch": 0.344064, "percentage": 34.41, "elapsed_time": "4:56:23", "remaining_time": "9:24:59"}
1345
+ {"current_steps": 1345, "total_steps": 3906, "loss": 1.428, "learning_rate": 2.9769234128143565e-05, "epoch": 0.34432, "percentage": 34.43, "elapsed_time": "4:56:36", "remaining_time": "9:24:46"}
1346
+ {"current_steps": 1346, "total_steps": 3906, "loss": 1.3757, "learning_rate": 2.9755049281432354e-05, "epoch": 0.344576, "percentage": 34.46, "elapsed_time": "4:56:49", "remaining_time": "9:24:32"}
1347
+ {"current_steps": 1347, "total_steps": 3906, "loss": 1.4476, "learning_rate": 2.974085799294707e-05, "epoch": 0.344832, "percentage": 34.49, "elapsed_time": "4:57:02", "remaining_time": "9:24:19"}
1348
+ {"current_steps": 1348, "total_steps": 3906, "loss": 1.3657, "learning_rate": 2.9726660272058948e-05, "epoch": 0.345088, "percentage": 34.51, "elapsed_time": "4:57:15", "remaining_time": "9:24:05"}
1349
+ {"current_steps": 1349, "total_steps": 3906, "loss": 1.3682, "learning_rate": 2.97124561281435e-05, "epoch": 0.345344, "percentage": 34.54, "elapsed_time": "4:57:28", "remaining_time": "9:23:52"}
1350
+ {"current_steps": 1350, "total_steps": 3906, "loss": 1.3964, "learning_rate": 2.9698245570580488e-05, "epoch": 0.3456, "percentage": 34.56, "elapsed_time": "4:57:42", "remaining_time": "9:23:39"}
1351
+ {"current_steps": 1351, "total_steps": 3906, "loss": 1.4048, "learning_rate": 2.9684028608753874e-05, "epoch": 0.345856, "percentage": 34.59, "elapsed_time": "4:57:55", "remaining_time": "9:23:25"}
1352
+ {"current_steps": 1352, "total_steps": 3906, "loss": 1.3801, "learning_rate": 2.9669805252051884e-05, "epoch": 0.346112, "percentage": 34.61, "elapsed_time": "4:58:08", "remaining_time": "9:23:12"}
1353
+ {"current_steps": 1353, "total_steps": 3906, "loss": 1.3964, "learning_rate": 2.9655575509866935e-05, "epoch": 0.346368, "percentage": 34.64, "elapsed_time": "4:58:21", "remaining_time": "9:22:58"}
1354
+ {"current_steps": 1354, "total_steps": 3906, "loss": 1.393, "learning_rate": 2.9641339391595685e-05, "epoch": 0.346624, "percentage": 34.66, "elapsed_time": "4:58:34", "remaining_time": "9:22:45"}
1355
+ {"current_steps": 1355, "total_steps": 3906, "loss": 1.4146, "learning_rate": 2.9627096906639e-05, "epoch": 0.34688, "percentage": 34.69, "elapsed_time": "4:58:47", "remaining_time": "9:22:32"}
1356
+ {"current_steps": 1356, "total_steps": 3906, "loss": 1.3954, "learning_rate": 2.9612848064401934e-05, "epoch": 0.347136, "percentage": 34.72, "elapsed_time": "4:59:00", "remaining_time": "9:22:18"}
1357
+ {"current_steps": 1357, "total_steps": 3906, "loss": 1.3973, "learning_rate": 2.959859287429376e-05, "epoch": 0.347392, "percentage": 34.74, "elapsed_time": "4:59:14", "remaining_time": "9:22:05"}
1358
+ {"current_steps": 1358, "total_steps": 3906, "loss": 1.3594, "learning_rate": 2.9584331345727924e-05, "epoch": 0.347648, "percentage": 34.77, "elapsed_time": "4:59:27", "remaining_time": "9:21:51"}
1359
+ {"current_steps": 1359, "total_steps": 3906, "loss": 1.3644, "learning_rate": 2.9570063488122077e-05, "epoch": 0.347904, "percentage": 34.79, "elapsed_time": "4:59:40", "remaining_time": "9:21:38"}
1360
+ {"current_steps": 1360, "total_steps": 3906, "loss": 1.3972, "learning_rate": 2.9555789310898025e-05, "epoch": 0.34816, "percentage": 34.82, "elapsed_time": "4:59:53", "remaining_time": "9:21:25"}
1361
+ {"current_steps": 1361, "total_steps": 3906, "loss": 1.3761, "learning_rate": 2.954150882348177e-05, "epoch": 0.348416, "percentage": 34.84, "elapsed_time": "5:00:06", "remaining_time": "9:21:12"}
1362
+ {"current_steps": 1362, "total_steps": 3906, "loss": 1.4657, "learning_rate": 2.952722203530347e-05, "epoch": 0.348672, "percentage": 34.87, "elapsed_time": "5:00:20", "remaining_time": "9:20:58"}
1363
+ {"current_steps": 1363, "total_steps": 3906, "loss": 1.3721, "learning_rate": 2.9512928955797443e-05, "epoch": 0.348928, "percentage": 34.9, "elapsed_time": "5:00:33", "remaining_time": "9:20:45"}
1364
+ {"current_steps": 1364, "total_steps": 3906, "loss": 1.3842, "learning_rate": 2.9498629594402167e-05, "epoch": 0.349184, "percentage": 34.92, "elapsed_time": "5:00:46", "remaining_time": "9:20:31"}
1365
+ {"current_steps": 1365, "total_steps": 3906, "loss": 1.407, "learning_rate": 2.9484323960560273e-05, "epoch": 0.34944, "percentage": 34.95, "elapsed_time": "5:00:59", "remaining_time": "9:20:18"}
1366
+ {"current_steps": 1366, "total_steps": 3906, "loss": 1.4074, "learning_rate": 2.9470012063718508e-05, "epoch": 0.349696, "percentage": 34.97, "elapsed_time": "5:01:12", "remaining_time": "9:20:05"}
1367
+ {"current_steps": 1367, "total_steps": 3906, "loss": 1.3886, "learning_rate": 2.9455693913327788e-05, "epoch": 0.349952, "percentage": 35.0, "elapsed_time": "5:01:25", "remaining_time": "9:19:51"}
1368
+ {"current_steps": 1368, "total_steps": 3906, "loss": 1.421, "learning_rate": 2.9441369518843138e-05, "epoch": 0.350208, "percentage": 35.02, "elapsed_time": "5:01:38", "remaining_time": "9:19:38"}
1369
+ {"current_steps": 1369, "total_steps": 3906, "loss": 1.4226, "learning_rate": 2.9427038889723708e-05, "epoch": 0.350464, "percentage": 35.05, "elapsed_time": "5:01:52", "remaining_time": "9:19:25"}
1370
+ {"current_steps": 1370, "total_steps": 3906, "loss": 1.386, "learning_rate": 2.941270203543278e-05, "epoch": 0.35072, "percentage": 35.07, "elapsed_time": "5:02:05", "remaining_time": "9:19:11"}
1371
+ {"current_steps": 1371, "total_steps": 3906, "loss": 1.3876, "learning_rate": 2.9398358965437726e-05, "epoch": 0.350976, "percentage": 35.1, "elapsed_time": "5:02:18", "remaining_time": "9:18:58"}
1372
+ {"current_steps": 1372, "total_steps": 3906, "loss": 1.4214, "learning_rate": 2.9384009689210038e-05, "epoch": 0.351232, "percentage": 35.13, "elapsed_time": "5:02:31", "remaining_time": "9:18:45"}
1373
+ {"current_steps": 1373, "total_steps": 3906, "loss": 1.3733, "learning_rate": 2.9369654216225294e-05, "epoch": 0.351488, "percentage": 35.15, "elapsed_time": "5:02:44", "remaining_time": "9:18:31"}
1374
+ {"current_steps": 1374, "total_steps": 3906, "loss": 1.4051, "learning_rate": 2.9355292555963185e-05, "epoch": 0.351744, "percentage": 35.18, "elapsed_time": "5:02:58", "remaining_time": "9:18:18"}
1375
+ {"current_steps": 1375, "total_steps": 3906, "loss": 1.3585, "learning_rate": 2.9340924717907455e-05, "epoch": 0.352, "percentage": 35.2, "elapsed_time": "5:03:11", "remaining_time": "9:18:05"}
1376
+ {"current_steps": 1376, "total_steps": 3906, "loss": 1.3668, "learning_rate": 2.932655071154596e-05, "epoch": 0.352256, "percentage": 35.23, "elapsed_time": "5:03:24", "remaining_time": "9:17:51"}
1377
+ {"current_steps": 1377, "total_steps": 3906, "loss": 1.3845, "learning_rate": 2.9312170546370605e-05, "epoch": 0.352512, "percentage": 35.25, "elapsed_time": "5:03:37", "remaining_time": "9:17:38"}
1378
+ {"current_steps": 1378, "total_steps": 3906, "loss": 1.3894, "learning_rate": 2.9297784231877382e-05, "epoch": 0.352768, "percentage": 35.28, "elapsed_time": "5:03:50", "remaining_time": "9:17:25"}
1379
+ {"current_steps": 1379, "total_steps": 3906, "loss": 1.3088, "learning_rate": 2.9283391777566325e-05, "epoch": 0.353024, "percentage": 35.3, "elapsed_time": "5:04:04", "remaining_time": "9:17:11"}
1380
+ {"current_steps": 1380, "total_steps": 3906, "loss": 1.4052, "learning_rate": 2.9268993192941547e-05, "epoch": 0.35328, "percentage": 35.33, "elapsed_time": "5:04:17", "remaining_time": "9:16:58"}
1381
+ {"current_steps": 1381, "total_steps": 3906, "loss": 1.4289, "learning_rate": 2.9254588487511175e-05, "epoch": 0.353536, "percentage": 35.36, "elapsed_time": "5:04:30", "remaining_time": "9:16:45"}
1382
+ {"current_steps": 1382, "total_steps": 3906, "loss": 1.4168, "learning_rate": 2.9240177670787406e-05, "epoch": 0.353792, "percentage": 35.38, "elapsed_time": "5:04:43", "remaining_time": "9:16:32"}
1383
+ {"current_steps": 1383, "total_steps": 3906, "loss": 1.3699, "learning_rate": 2.9225760752286452e-05, "epoch": 0.354048, "percentage": 35.41, "elapsed_time": "5:04:56", "remaining_time": "9:16:18"}
1384
+ {"current_steps": 1384, "total_steps": 3906, "loss": 1.4088, "learning_rate": 2.9211337741528587e-05, "epoch": 0.354304, "percentage": 35.43, "elapsed_time": "5:05:10", "remaining_time": "9:16:05"}
1385
+ {"current_steps": 1385, "total_steps": 3906, "loss": 1.392, "learning_rate": 2.9196908648038067e-05, "epoch": 0.35456, "percentage": 35.46, "elapsed_time": "5:05:23", "remaining_time": "9:15:52"}
1386
+ {"current_steps": 1386, "total_steps": 3906, "loss": 1.3823, "learning_rate": 2.91824734813432e-05, "epoch": 0.354816, "percentage": 35.48, "elapsed_time": "5:05:36", "remaining_time": "9:15:39"}
1387
+ {"current_steps": 1387, "total_steps": 3906, "loss": 1.363, "learning_rate": 2.9168032250976276e-05, "epoch": 0.355072, "percentage": 35.51, "elapsed_time": "5:05:49", "remaining_time": "9:15:25"}
1388
+ {"current_steps": 1388, "total_steps": 3906, "loss": 1.4184, "learning_rate": 2.9153584966473603e-05, "epoch": 0.355328, "percentage": 35.54, "elapsed_time": "5:06:02", "remaining_time": "9:15:12"}
1389
+ {"current_steps": 1389, "total_steps": 3906, "loss": 1.3679, "learning_rate": 2.913913163737549e-05, "epoch": 0.355584, "percentage": 35.56, "elapsed_time": "5:06:16", "remaining_time": "9:14:59"}
1390
+ {"current_steps": 1390, "total_steps": 3906, "loss": 1.386, "learning_rate": 2.9124672273226235e-05, "epoch": 0.35584, "percentage": 35.59, "elapsed_time": "5:06:29", "remaining_time": "9:14:45"}
1391
+ {"current_steps": 1391, "total_steps": 3906, "loss": 1.4224, "learning_rate": 2.9110206883574116e-05, "epoch": 0.356096, "percentage": 35.61, "elapsed_time": "5:06:42", "remaining_time": "9:14:32"}
1392
+ {"current_steps": 1392, "total_steps": 3906, "loss": 1.392, "learning_rate": 2.9095735477971394e-05, "epoch": 0.356352, "percentage": 35.64, "elapsed_time": "5:06:55", "remaining_time": "9:14:19"}
1393
+ {"current_steps": 1393, "total_steps": 3906, "loss": 1.4451, "learning_rate": 2.908125806597431e-05, "epoch": 0.356608, "percentage": 35.66, "elapsed_time": "5:07:08", "remaining_time": "9:14:05"}
1394
+ {"current_steps": 1394, "total_steps": 3906, "loss": 1.3578, "learning_rate": 2.9066774657143044e-05, "epoch": 0.356864, "percentage": 35.69, "elapsed_time": "5:07:21", "remaining_time": "9:13:52"}
1395
+ {"current_steps": 1395, "total_steps": 3906, "loss": 1.3947, "learning_rate": 2.905228526104177e-05, "epoch": 0.35712, "percentage": 35.71, "elapsed_time": "5:07:35", "remaining_time": "9:13:39"}
1396
+ {"current_steps": 1396, "total_steps": 3906, "loss": 1.3946, "learning_rate": 2.9037789887238604e-05, "epoch": 0.357376, "percentage": 35.74, "elapsed_time": "5:07:48", "remaining_time": "9:13:26"}
1397
+ {"current_steps": 1397, "total_steps": 3906, "loss": 1.3639, "learning_rate": 2.9023288545305603e-05, "epoch": 0.357632, "percentage": 35.77, "elapsed_time": "5:08:01", "remaining_time": "9:13:12"}
1398
+ {"current_steps": 1398, "total_steps": 3906, "loss": 1.3902, "learning_rate": 2.9008781244818757e-05, "epoch": 0.357888, "percentage": 35.79, "elapsed_time": "5:08:14", "remaining_time": "9:12:59"}
1399
+ {"current_steps": 1399, "total_steps": 3906, "loss": 1.3904, "learning_rate": 2.8994267995358023e-05, "epoch": 0.358144, "percentage": 35.82, "elapsed_time": "5:08:27", "remaining_time": "9:12:45"}
1400
+ {"current_steps": 1400, "total_steps": 3906, "loss": 1.3436, "learning_rate": 2.8979748806507246e-05, "epoch": 0.3584, "percentage": 35.84, "elapsed_time": "5:08:40", "remaining_time": "9:12:32"}
1401
+ {"current_steps": 1401, "total_steps": 3906, "loss": 1.4263, "learning_rate": 2.8965223687854228e-05, "epoch": 0.358656, "percentage": 35.87, "elapsed_time": "5:08:54", "remaining_time": "9:12:19"}
1402
+ {"current_steps": 1402, "total_steps": 3906, "loss": 1.4104, "learning_rate": 2.895069264899067e-05, "epoch": 0.358912, "percentage": 35.89, "elapsed_time": "5:09:07", "remaining_time": "9:12:05"}
1403
+ {"current_steps": 1403, "total_steps": 3906, "loss": 1.3894, "learning_rate": 2.8936155699512177e-05, "epoch": 0.359168, "percentage": 35.92, "elapsed_time": "5:09:20", "remaining_time": "9:11:52"}
1404
+ {"current_steps": 1404, "total_steps": 3906, "loss": 1.4188, "learning_rate": 2.8921612849018264e-05, "epoch": 0.359424, "percentage": 35.94, "elapsed_time": "5:09:33", "remaining_time": "9:11:39"}
1405
+ {"current_steps": 1405, "total_steps": 3906, "loss": 1.4038, "learning_rate": 2.8907064107112352e-05, "epoch": 0.35968, "percentage": 35.97, "elapsed_time": "5:09:46", "remaining_time": "9:11:26"}
1406
+ {"current_steps": 1406, "total_steps": 3906, "loss": 1.3864, "learning_rate": 2.8892509483401733e-05, "epoch": 0.359936, "percentage": 36.0, "elapsed_time": "5:10:00", "remaining_time": "9:11:12"}
1407
+ {"current_steps": 1407, "total_steps": 3906, "loss": 1.3794, "learning_rate": 2.88779489874976e-05, "epoch": 0.360192, "percentage": 36.02, "elapsed_time": "5:10:13", "remaining_time": "9:10:59"}
1408
+ {"current_steps": 1408, "total_steps": 3906, "loss": 1.4033, "learning_rate": 2.886338262901502e-05, "epoch": 0.360448, "percentage": 36.05, "elapsed_time": "5:10:26", "remaining_time": "9:10:46"}
1409
+ {"current_steps": 1409, "total_steps": 3906, "loss": 1.3653, "learning_rate": 2.8848810417572926e-05, "epoch": 0.360704, "percentage": 36.07, "elapsed_time": "5:10:39", "remaining_time": "9:10:32"}
1410
+ {"current_steps": 1410, "total_steps": 3906, "loss": 1.3987, "learning_rate": 2.883423236279411e-05, "epoch": 0.36096, "percentage": 36.1, "elapsed_time": "5:10:52", "remaining_time": "9:10:19"}
1411
+ {"current_steps": 1411, "total_steps": 3906, "loss": 1.3528, "learning_rate": 2.8819648474305242e-05, "epoch": 0.361216, "percentage": 36.12, "elapsed_time": "5:11:05", "remaining_time": "9:10:06"}
1412
+ {"current_steps": 1412, "total_steps": 3906, "loss": 1.4338, "learning_rate": 2.8805058761736826e-05, "epoch": 0.361472, "percentage": 36.15, "elapsed_time": "5:11:19", "remaining_time": "9:09:52"}
1413
+ {"current_steps": 1413, "total_steps": 3906, "loss": 1.3277, "learning_rate": 2.8790463234723228e-05, "epoch": 0.361728, "percentage": 36.18, "elapsed_time": "5:11:32", "remaining_time": "9:09:39"}
1414
+ {"current_steps": 1414, "total_steps": 3906, "loss": 1.4364, "learning_rate": 2.8775861902902637e-05, "epoch": 0.361984, "percentage": 36.2, "elapsed_time": "5:11:45", "remaining_time": "9:09:26"}
1415
+ {"current_steps": 1415, "total_steps": 3906, "loss": 1.3876, "learning_rate": 2.876125477591709e-05, "epoch": 0.36224, "percentage": 36.23, "elapsed_time": "5:11:58", "remaining_time": "9:09:12"}
1416
+ {"current_steps": 1416, "total_steps": 3906, "loss": 1.4215, "learning_rate": 2.8746641863412442e-05, "epoch": 0.362496, "percentage": 36.25, "elapsed_time": "5:12:11", "remaining_time": "9:08:59"}
1417
+ {"current_steps": 1417, "total_steps": 3906, "loss": 1.4017, "learning_rate": 2.8732023175038367e-05, "epoch": 0.362752, "percentage": 36.28, "elapsed_time": "5:12:25", "remaining_time": "9:08:46"}
1418
+ {"current_steps": 1418, "total_steps": 3906, "loss": 1.4023, "learning_rate": 2.8717398720448354e-05, "epoch": 0.363008, "percentage": 36.3, "elapsed_time": "5:12:38", "remaining_time": "9:08:32"}
1419
+ {"current_steps": 1419, "total_steps": 3906, "loss": 1.3576, "learning_rate": 2.8702768509299713e-05, "epoch": 0.363264, "percentage": 36.33, "elapsed_time": "5:12:51", "remaining_time": "9:08:19"}
1420
+ {"current_steps": 1420, "total_steps": 3906, "loss": 1.3771, "learning_rate": 2.8688132551253546e-05, "epoch": 0.36352, "percentage": 36.35, "elapsed_time": "5:13:04", "remaining_time": "9:08:06"}
1421
+ {"current_steps": 1421, "total_steps": 3906, "loss": 1.3749, "learning_rate": 2.8673490855974734e-05, "epoch": 0.363776, "percentage": 36.38, "elapsed_time": "5:13:17", "remaining_time": "9:07:52"}
1422
+ {"current_steps": 1422, "total_steps": 3906, "loss": 1.3891, "learning_rate": 2.865884343313197e-05, "epoch": 0.364032, "percentage": 36.41, "elapsed_time": "5:13:30", "remaining_time": "9:07:39"}
1423
+ {"current_steps": 1423, "total_steps": 3906, "loss": 1.4419, "learning_rate": 2.8644190292397724e-05, "epoch": 0.364288, "percentage": 36.43, "elapsed_time": "5:13:44", "remaining_time": "9:07:26"}
1424
+ {"current_steps": 1424, "total_steps": 3906, "loss": 1.3506, "learning_rate": 2.8629531443448235e-05, "epoch": 0.364544, "percentage": 36.46, "elapsed_time": "5:13:57", "remaining_time": "9:07:12"}
1425
+ {"current_steps": 1425, "total_steps": 3906, "loss": 1.3921, "learning_rate": 2.8614866895963516e-05, "epoch": 0.3648, "percentage": 36.48, "elapsed_time": "5:14:10", "remaining_time": "9:06:59"}
1426
+ {"current_steps": 1426, "total_steps": 3906, "loss": 1.3865, "learning_rate": 2.8600196659627338e-05, "epoch": 0.365056, "percentage": 36.51, "elapsed_time": "5:14:23", "remaining_time": "9:06:46"}
1427
+ {"current_steps": 1427, "total_steps": 3906, "loss": 1.3525, "learning_rate": 2.8585520744127237e-05, "epoch": 0.365312, "percentage": 36.53, "elapsed_time": "5:14:36", "remaining_time": "9:06:33"}
1428
+ {"current_steps": 1428, "total_steps": 3906, "loss": 1.3653, "learning_rate": 2.857083915915449e-05, "epoch": 0.365568, "percentage": 36.56, "elapsed_time": "5:14:50", "remaining_time": "9:06:19"}
1429
+ {"current_steps": 1429, "total_steps": 3906, "loss": 1.4021, "learning_rate": 2.8556151914404134e-05, "epoch": 0.365824, "percentage": 36.58, "elapsed_time": "5:15:03", "remaining_time": "9:06:06"}
1430
+ {"current_steps": 1430, "total_steps": 3906, "loss": 1.3832, "learning_rate": 2.8541459019574917e-05, "epoch": 0.36608, "percentage": 36.61, "elapsed_time": "5:15:16", "remaining_time": "9:05:53"}
1431
+ {"current_steps": 1431, "total_steps": 3906, "loss": 1.4137, "learning_rate": 2.8526760484369343e-05, "epoch": 0.366336, "percentage": 36.64, "elapsed_time": "5:15:29", "remaining_time": "9:05:40"}
1432
+ {"current_steps": 1432, "total_steps": 3906, "loss": 1.4292, "learning_rate": 2.851205631849363e-05, "epoch": 0.366592, "percentage": 36.66, "elapsed_time": "5:15:42", "remaining_time": "9:05:26"}
1433
+ {"current_steps": 1433, "total_steps": 3906, "loss": 1.3847, "learning_rate": 2.8497346531657707e-05, "epoch": 0.366848, "percentage": 36.69, "elapsed_time": "5:15:56", "remaining_time": "9:05:13"}
1434
+ {"current_steps": 1434, "total_steps": 3906, "loss": 1.3454, "learning_rate": 2.8482631133575234e-05, "epoch": 0.367104, "percentage": 36.71, "elapsed_time": "5:16:09", "remaining_time": "9:05:00"}
1435
+ {"current_steps": 1435, "total_steps": 3906, "loss": 1.4246, "learning_rate": 2.8467910133963563e-05, "epoch": 0.36736, "percentage": 36.74, "elapsed_time": "5:16:22", "remaining_time": "9:04:46"}
1436
+ {"current_steps": 1436, "total_steps": 3906, "loss": 1.394, "learning_rate": 2.8453183542543743e-05, "epoch": 0.367616, "percentage": 36.76, "elapsed_time": "5:16:35", "remaining_time": "9:04:33"}
1437
+ {"current_steps": 1437, "total_steps": 3906, "loss": 1.3712, "learning_rate": 2.8438451369040517e-05, "epoch": 0.367872, "percentage": 36.79, "elapsed_time": "5:16:48", "remaining_time": "9:04:20"}
1438
+ {"current_steps": 1438, "total_steps": 3906, "loss": 1.4022, "learning_rate": 2.8423713623182335e-05, "epoch": 0.368128, "percentage": 36.82, "elapsed_time": "5:17:02", "remaining_time": "9:04:06"}
1439
+ {"current_steps": 1439, "total_steps": 3906, "loss": 1.3992, "learning_rate": 2.840897031470128e-05, "epoch": 0.368384, "percentage": 36.84, "elapsed_time": "5:17:15", "remaining_time": "9:03:53"}
1440
+ {"current_steps": 1440, "total_steps": 3906, "loss": 1.4011, "learning_rate": 2.8394221453333156e-05, "epoch": 0.36864, "percentage": 36.87, "elapsed_time": "5:17:28", "remaining_time": "9:03:40"}
1441
+ {"current_steps": 1441, "total_steps": 3906, "loss": 1.39, "learning_rate": 2.8379467048817417e-05, "epoch": 0.368896, "percentage": 36.89, "elapsed_time": "5:17:41", "remaining_time": "9:03:27"}
1442
+ {"current_steps": 1442, "total_steps": 3906, "loss": 1.3279, "learning_rate": 2.8364707110897164e-05, "epoch": 0.369152, "percentage": 36.92, "elapsed_time": "5:17:54", "remaining_time": "9:03:13"}
1443
+ {"current_steps": 1443, "total_steps": 3906, "loss": 1.4148, "learning_rate": 2.8349941649319177e-05, "epoch": 0.369408, "percentage": 36.94, "elapsed_time": "5:18:07", "remaining_time": "9:03:00"}
1444
+ {"current_steps": 1444, "total_steps": 3906, "loss": 1.4042, "learning_rate": 2.8335170673833853e-05, "epoch": 0.369664, "percentage": 36.97, "elapsed_time": "5:18:21", "remaining_time": "9:02:47"}
1445
+ {"current_steps": 1445, "total_steps": 3906, "loss": 1.3894, "learning_rate": 2.832039419419526e-05, "epoch": 0.36992, "percentage": 36.99, "elapsed_time": "5:18:34", "remaining_time": "9:02:33"}
1446
+ {"current_steps": 1446, "total_steps": 3906, "loss": 1.4065, "learning_rate": 2.8305612220161083e-05, "epoch": 0.370176, "percentage": 37.02, "elapsed_time": "5:18:47", "remaining_time": "9:02:20"}
1447
+ {"current_steps": 1447, "total_steps": 3906, "loss": 1.4355, "learning_rate": 2.8290824761492638e-05, "epoch": 0.370432, "percentage": 37.05, "elapsed_time": "5:19:00", "remaining_time": "9:02:07"}
1448
+ {"current_steps": 1448, "total_steps": 3906, "loss": 1.3782, "learning_rate": 2.827603182795487e-05, "epoch": 0.370688, "percentage": 37.07, "elapsed_time": "5:19:13", "remaining_time": "9:01:54"}
1449
+ {"current_steps": 1449, "total_steps": 3906, "loss": 1.4379, "learning_rate": 2.8261233429316332e-05, "epoch": 0.370944, "percentage": 37.1, "elapsed_time": "5:19:27", "remaining_time": "9:01:40"}
1450
+ {"current_steps": 1450, "total_steps": 3906, "loss": 1.4362, "learning_rate": 2.824642957534918e-05, "epoch": 0.3712, "percentage": 37.12, "elapsed_time": "5:19:40", "remaining_time": "9:01:27"}
1451
+ {"current_steps": 1451, "total_steps": 3906, "loss": 1.407, "learning_rate": 2.8231620275829195e-05, "epoch": 0.371456, "percentage": 37.15, "elapsed_time": "5:19:53", "remaining_time": "9:01:14"}
1452
+ {"current_steps": 1452, "total_steps": 3906, "loss": 1.4066, "learning_rate": 2.8216805540535726e-05, "epoch": 0.371712, "percentage": 37.17, "elapsed_time": "5:20:06", "remaining_time": "9:01:01"}
1453
+ {"current_steps": 1453, "total_steps": 3906, "loss": 1.3865, "learning_rate": 2.820198537925174e-05, "epoch": 0.371968, "percentage": 37.2, "elapsed_time": "5:20:19", "remaining_time": "9:00:47"}
1454
+ {"current_steps": 1454, "total_steps": 3906, "loss": 1.3869, "learning_rate": 2.818715980176376e-05, "epoch": 0.372224, "percentage": 37.22, "elapsed_time": "5:20:33", "remaining_time": "9:00:34"}
1455
+ {"current_steps": 1455, "total_steps": 3906, "loss": 1.3704, "learning_rate": 2.8172328817861893e-05, "epoch": 0.37248, "percentage": 37.25, "elapsed_time": "5:20:46", "remaining_time": "9:00:21"}
1456
+ {"current_steps": 1456, "total_steps": 3906, "loss": 1.4013, "learning_rate": 2.815749243733983e-05, "epoch": 0.372736, "percentage": 37.28, "elapsed_time": "5:20:59", "remaining_time": "9:00:07"}
1457
+ {"current_steps": 1457, "total_steps": 3906, "loss": 1.3887, "learning_rate": 2.8142650669994815e-05, "epoch": 0.372992, "percentage": 37.3, "elapsed_time": "5:21:12", "remaining_time": "8:59:54"}
1458
+ {"current_steps": 1458, "total_steps": 3906, "loss": 1.4167, "learning_rate": 2.812780352562765e-05, "epoch": 0.373248, "percentage": 37.33, "elapsed_time": "5:21:25", "remaining_time": "8:59:41"}
1459
+ {"current_steps": 1459, "total_steps": 3906, "loss": 1.4529, "learning_rate": 2.811295101404269e-05, "epoch": 0.373504, "percentage": 37.35, "elapsed_time": "5:21:39", "remaining_time": "8:59:27"}
1460
+ {"current_steps": 1460, "total_steps": 3906, "loss": 1.3363, "learning_rate": 2.8098093145047835e-05, "epoch": 0.37376, "percentage": 37.38, "elapsed_time": "5:21:52", "remaining_time": "8:59:14"}
1461
+ {"current_steps": 1461, "total_steps": 3906, "loss": 1.4158, "learning_rate": 2.808322992845451e-05, "epoch": 0.374016, "percentage": 37.4, "elapsed_time": "5:22:05", "remaining_time": "8:59:01"}
1462
+ {"current_steps": 1462, "total_steps": 3906, "loss": 1.3325, "learning_rate": 2.8068361374077685e-05, "epoch": 0.374272, "percentage": 37.43, "elapsed_time": "5:22:18", "remaining_time": "8:58:47"}
1463
+ {"current_steps": 1463, "total_steps": 3906, "loss": 1.4214, "learning_rate": 2.805348749173586e-05, "epoch": 0.374528, "percentage": 37.46, "elapsed_time": "5:22:31", "remaining_time": "8:58:34"}
1464
+ {"current_steps": 1464, "total_steps": 3906, "loss": 1.4046, "learning_rate": 2.8038608291251034e-05, "epoch": 0.374784, "percentage": 37.48, "elapsed_time": "5:22:45", "remaining_time": "8:58:21"}
1465
+ {"current_steps": 1465, "total_steps": 3906, "loss": 1.3418, "learning_rate": 2.802372378244874e-05, "epoch": 0.37504, "percentage": 37.51, "elapsed_time": "5:22:58", "remaining_time": "8:58:08"}
1466
+ {"current_steps": 1466, "total_steps": 3906, "loss": 1.4432, "learning_rate": 2.8008833975158e-05, "epoch": 0.375296, "percentage": 37.53, "elapsed_time": "5:23:11", "remaining_time": "8:57:54"}
1467
+ {"current_steps": 1467, "total_steps": 3906, "loss": 1.3388, "learning_rate": 2.7993938879211326e-05, "epoch": 0.375552, "percentage": 37.56, "elapsed_time": "5:23:24", "remaining_time": "8:57:41"}
1468
+ {"current_steps": 1468, "total_steps": 3906, "loss": 1.3599, "learning_rate": 2.7979038504444758e-05, "epoch": 0.375808, "percentage": 37.58, "elapsed_time": "5:23:37", "remaining_time": "8:57:28"}
1469
+ {"current_steps": 1469, "total_steps": 3906, "loss": 1.361, "learning_rate": 2.796413286069779e-05, "epoch": 0.376064, "percentage": 37.61, "elapsed_time": "5:23:50", "remaining_time": "8:57:14"}
1470
+ {"current_steps": 1470, "total_steps": 3906, "loss": 1.3837, "learning_rate": 2.794922195781341e-05, "epoch": 0.37632, "percentage": 37.63, "elapsed_time": "5:24:04", "remaining_time": "8:57:01"}
1471
+ {"current_steps": 1471, "total_steps": 3906, "loss": 1.3832, "learning_rate": 2.793430580563807e-05, "epoch": 0.376576, "percentage": 37.66, "elapsed_time": "5:24:17", "remaining_time": "8:56:48"}
1472
+ {"current_steps": 1472, "total_steps": 3906, "loss": 1.3845, "learning_rate": 2.7919384414021694e-05, "epoch": 0.376832, "percentage": 37.69, "elapsed_time": "5:24:30", "remaining_time": "8:56:35"}
1473
+ {"current_steps": 1473, "total_steps": 3906, "loss": 1.4441, "learning_rate": 2.7904457792817657e-05, "epoch": 0.377088, "percentage": 37.71, "elapsed_time": "5:24:43", "remaining_time": "8:56:21"}
1474
+ {"current_steps": 1474, "total_steps": 3906, "loss": 1.3828, "learning_rate": 2.788952595188281e-05, "epoch": 0.377344, "percentage": 37.74, "elapsed_time": "5:24:56", "remaining_time": "8:56:08"}
1475
+ {"current_steps": 1475, "total_steps": 3906, "loss": 1.401, "learning_rate": 2.7874588901077423e-05, "epoch": 0.3776, "percentage": 37.76, "elapsed_time": "5:25:09", "remaining_time": "8:55:54"}
1476
+ {"current_steps": 1476, "total_steps": 3906, "loss": 1.4609, "learning_rate": 2.7859646650265234e-05, "epoch": 0.377856, "percentage": 37.79, "elapsed_time": "5:25:23", "remaining_time": "8:55:41"}
1477
+ {"current_steps": 1477, "total_steps": 3906, "loss": 1.3666, "learning_rate": 2.7844699209313386e-05, "epoch": 0.378112, "percentage": 37.81, "elapsed_time": "5:25:36", "remaining_time": "8:55:28"}
1478
+ {"current_steps": 1478, "total_steps": 3906, "loss": 1.3902, "learning_rate": 2.782974658809247e-05, "epoch": 0.378368, "percentage": 37.84, "elapsed_time": "5:25:49", "remaining_time": "8:55:15"}
1479
+ {"current_steps": 1479, "total_steps": 3906, "loss": 1.3568, "learning_rate": 2.7814788796476485e-05, "epoch": 0.378624, "percentage": 37.86, "elapsed_time": "5:26:02", "remaining_time": "8:55:01"}
1480
+ {"current_steps": 1480, "total_steps": 3906, "loss": 1.3763, "learning_rate": 2.7799825844342855e-05, "epoch": 0.37888, "percentage": 37.89, "elapsed_time": "5:26:15", "remaining_time": "8:54:48"}
1481
+ {"current_steps": 1481, "total_steps": 3906, "loss": 1.4173, "learning_rate": 2.7784857741572417e-05, "epoch": 0.379136, "percentage": 37.92, "elapsed_time": "5:26:29", "remaining_time": "8:54:35"}
1482
+ {"current_steps": 1482, "total_steps": 3906, "loss": 1.4141, "learning_rate": 2.7769884498049386e-05, "epoch": 0.379392, "percentage": 37.94, "elapsed_time": "5:26:42", "remaining_time": "8:54:21"}
1483
+ {"current_steps": 1483, "total_steps": 3906, "loss": 1.3913, "learning_rate": 2.7754906123661387e-05, "epoch": 0.379648, "percentage": 37.97, "elapsed_time": "5:26:55", "remaining_time": "8:54:08"}
1484
+ {"current_steps": 1484, "total_steps": 3906, "loss": 1.3699, "learning_rate": 2.7739922628299437e-05, "epoch": 0.379904, "percentage": 37.99, "elapsed_time": "5:27:08", "remaining_time": "8:53:55"}
1485
+ {"current_steps": 1485, "total_steps": 3906, "loss": 1.4148, "learning_rate": 2.7724934021857918e-05, "epoch": 0.38016, "percentage": 38.02, "elapsed_time": "5:27:21", "remaining_time": "8:53:42"}
1486
+ {"current_steps": 1486, "total_steps": 3906, "loss": 1.4123, "learning_rate": 2.770994031423461e-05, "epoch": 0.380416, "percentage": 38.04, "elapsed_time": "5:27:34", "remaining_time": "8:53:28"}
1487
+ {"current_steps": 1487, "total_steps": 3906, "loss": 1.3344, "learning_rate": 2.7694941515330647e-05, "epoch": 0.380672, "percentage": 38.07, "elapsed_time": "5:27:48", "remaining_time": "8:53:15"}
1488
+ {"current_steps": 1488, "total_steps": 3906, "loss": 1.3952, "learning_rate": 2.7679937635050528e-05, "epoch": 0.380928, "percentage": 38.1, "elapsed_time": "5:28:01", "remaining_time": "8:53:02"}
1489
+ {"current_steps": 1489, "total_steps": 3906, "loss": 1.4183, "learning_rate": 2.7664928683302105e-05, "epoch": 0.381184, "percentage": 38.12, "elapsed_time": "5:28:14", "remaining_time": "8:52:49"}
1490
+ {"current_steps": 1490, "total_steps": 3906, "loss": 1.3933, "learning_rate": 2.7649914669996586e-05, "epoch": 0.38144, "percentage": 38.15, "elapsed_time": "5:28:27", "remaining_time": "8:52:35"}
1491
+ {"current_steps": 1491, "total_steps": 3906, "loss": 1.3949, "learning_rate": 2.7634895605048507e-05, "epoch": 0.381696, "percentage": 38.17, "elapsed_time": "5:28:40", "remaining_time": "8:52:22"}
1492
+ {"current_steps": 1492, "total_steps": 3906, "loss": 1.3958, "learning_rate": 2.761987149837576e-05, "epoch": 0.381952, "percentage": 38.2, "elapsed_time": "5:28:54", "remaining_time": "8:52:09"}
1493
+ {"current_steps": 1493, "total_steps": 3906, "loss": 1.4421, "learning_rate": 2.7604842359899548e-05, "epoch": 0.382208, "percentage": 38.22, "elapsed_time": "5:29:07", "remaining_time": "8:51:55"}
1494
+ {"current_steps": 1494, "total_steps": 3906, "loss": 1.3611, "learning_rate": 2.758980819954441e-05, "epoch": 0.382464, "percentage": 38.25, "elapsed_time": "5:29:20", "remaining_time": "8:51:42"}
1495
+ {"current_steps": 1495, "total_steps": 3906, "loss": 1.4051, "learning_rate": 2.7574769027238192e-05, "epoch": 0.38272, "percentage": 38.27, "elapsed_time": "5:29:33", "remaining_time": "8:51:29"}
1496
+ {"current_steps": 1496, "total_steps": 3906, "loss": 1.3822, "learning_rate": 2.755972485291206e-05, "epoch": 0.382976, "percentage": 38.3, "elapsed_time": "5:29:46", "remaining_time": "8:51:15"}
1497
+ {"current_steps": 1497, "total_steps": 3906, "loss": 1.4076, "learning_rate": 2.7544675686500463e-05, "epoch": 0.383232, "percentage": 38.33, "elapsed_time": "5:30:00", "remaining_time": "8:51:02"}
1498
+ {"current_steps": 1498, "total_steps": 3906, "loss": 1.388, "learning_rate": 2.7529621537941178e-05, "epoch": 0.383488, "percentage": 38.35, "elapsed_time": "5:30:13", "remaining_time": "8:50:49"}
1499
+ {"current_steps": 1499, "total_steps": 3906, "loss": 1.3904, "learning_rate": 2.7514562417175245e-05, "epoch": 0.383744, "percentage": 38.38, "elapsed_time": "5:30:26", "remaining_time": "8:50:36"}
1500
+ {"current_steps": 1500, "total_steps": 3906, "loss": 1.3692, "learning_rate": 2.749949833414699e-05, "epoch": 0.384, "percentage": 38.4, "elapsed_time": "5:30:39", "remaining_time": "8:50:22"}
1501
+ {"current_steps": 1501, "total_steps": 3906, "loss": 1.3961, "learning_rate": 2.7484429298804035e-05, "epoch": 0.384256, "percentage": 38.43, "elapsed_time": "5:30:52", "remaining_time": "8:50:09"}
1502
+ {"current_steps": 1502, "total_steps": 3906, "loss": 1.3988, "learning_rate": 2.746935532109725e-05, "epoch": 0.384512, "percentage": 38.45, "elapsed_time": "5:31:06", "remaining_time": "8:49:56"}
1503
+ {"current_steps": 1503, "total_steps": 3906, "loss": 1.3943, "learning_rate": 2.7454276410980782e-05, "epoch": 0.384768, "percentage": 38.48, "elapsed_time": "5:31:19", "remaining_time": "8:49:42"}
1504
+ {"current_steps": 1504, "total_steps": 3906, "loss": 1.354, "learning_rate": 2.7439192578412038e-05, "epoch": 0.385024, "percentage": 38.5, "elapsed_time": "5:31:32", "remaining_time": "8:49:29"}
1505
+ {"current_steps": 1505, "total_steps": 3906, "loss": 1.3905, "learning_rate": 2.742410383335166e-05, "epoch": 0.38528, "percentage": 38.53, "elapsed_time": "5:31:45", "remaining_time": "8:49:16"}
1506
+ {"current_steps": 1506, "total_steps": 3906, "loss": 1.3959, "learning_rate": 2.740901018576354e-05, "epoch": 0.385536, "percentage": 38.56, "elapsed_time": "5:31:58", "remaining_time": "8:49:03"}
1507
+ {"current_steps": 1507, "total_steps": 3906, "loss": 1.3791, "learning_rate": 2.7393911645614823e-05, "epoch": 0.385792, "percentage": 38.58, "elapsed_time": "5:32:12", "remaining_time": "8:48:49"}
1508
+ {"current_steps": 1508, "total_steps": 3906, "loss": 1.4195, "learning_rate": 2.7378808222875857e-05, "epoch": 0.386048, "percentage": 38.61, "elapsed_time": "5:32:25", "remaining_time": "8:48:36"}
1509
+ {"current_steps": 1509, "total_steps": 3906, "loss": 1.3876, "learning_rate": 2.7363699927520245e-05, "epoch": 0.386304, "percentage": 38.63, "elapsed_time": "5:32:38", "remaining_time": "8:48:23"}
1510
+ {"current_steps": 1510, "total_steps": 3906, "loss": 1.4114, "learning_rate": 2.7348586769524787e-05, "epoch": 0.38656, "percentage": 38.66, "elapsed_time": "5:32:51", "remaining_time": "8:48:09"}
1511
+ {"current_steps": 1511, "total_steps": 3906, "loss": 1.4232, "learning_rate": 2.733346875886949e-05, "epoch": 0.386816, "percentage": 38.68, "elapsed_time": "5:33:04", "remaining_time": "8:47:56"}
1512
+ {"current_steps": 1512, "total_steps": 3906, "loss": 1.3488, "learning_rate": 2.7318345905537586e-05, "epoch": 0.387072, "percentage": 38.71, "elapsed_time": "5:33:17", "remaining_time": "8:47:43"}
1513
+ {"current_steps": 1513, "total_steps": 3906, "loss": 1.4452, "learning_rate": 2.730321821951549e-05, "epoch": 0.387328, "percentage": 38.74, "elapsed_time": "5:33:30", "remaining_time": "8:47:29"}
1514
+ {"current_steps": 1514, "total_steps": 3906, "loss": 1.3529, "learning_rate": 2.7288085710792803e-05, "epoch": 0.387584, "percentage": 38.76, "elapsed_time": "5:33:44", "remaining_time": "8:47:16"}
1515
+ {"current_steps": 1515, "total_steps": 3906, "loss": 1.3757, "learning_rate": 2.7272948389362336e-05, "epoch": 0.38784, "percentage": 38.79, "elapsed_time": "5:33:57", "remaining_time": "8:47:03"}
1516
+ {"current_steps": 1516, "total_steps": 3906, "loss": 1.3908, "learning_rate": 2.7257806265220054e-05, "epoch": 0.388096, "percentage": 38.81, "elapsed_time": "5:34:10", "remaining_time": "8:46:49"}
1517
+ {"current_steps": 1517, "total_steps": 3906, "loss": 1.3961, "learning_rate": 2.7242659348365095e-05, "epoch": 0.388352, "percentage": 38.84, "elapsed_time": "5:34:23", "remaining_time": "8:46:36"}
1518
+ {"current_steps": 1518, "total_steps": 3906, "loss": 1.3795, "learning_rate": 2.722750764879978e-05, "epoch": 0.388608, "percentage": 38.86, "elapsed_time": "5:34:36", "remaining_time": "8:46:23"}
1519
+ {"current_steps": 1519, "total_steps": 3906, "loss": 1.3808, "learning_rate": 2.721235117652956e-05, "epoch": 0.388864, "percentage": 38.89, "elapsed_time": "5:34:50", "remaining_time": "8:46:10"}
1520
+ {"current_steps": 1520, "total_steps": 3906, "loss": 1.3983, "learning_rate": 2.7197189941563062e-05, "epoch": 0.38912, "percentage": 38.91, "elapsed_time": "5:35:03", "remaining_time": "8:45:56"}
1521
+ {"current_steps": 1521, "total_steps": 3906, "loss": 1.3985, "learning_rate": 2.7182023953912064e-05, "epoch": 0.389376, "percentage": 38.94, "elapsed_time": "5:35:16", "remaining_time": "8:45:43"}
1522
+ {"current_steps": 1522, "total_steps": 3906, "loss": 1.3647, "learning_rate": 2.7166853223591443e-05, "epoch": 0.389632, "percentage": 38.97, "elapsed_time": "5:35:29", "remaining_time": "8:45:30"}
1523
+ {"current_steps": 1523, "total_steps": 3906, "loss": 1.3027, "learning_rate": 2.715167776061925e-05, "epoch": 0.389888, "percentage": 38.99, "elapsed_time": "5:35:42", "remaining_time": "8:45:16"}
1524
+ {"current_steps": 1524, "total_steps": 3906, "loss": 1.4065, "learning_rate": 2.713649757501664e-05, "epoch": 0.390144, "percentage": 39.02, "elapsed_time": "5:35:55", "remaining_time": "8:45:03"}
1525
+ {"current_steps": 1525, "total_steps": 3906, "loss": 1.4002, "learning_rate": 2.712131267680789e-05, "epoch": 0.3904, "percentage": 39.04, "elapsed_time": "5:36:09", "remaining_time": "8:44:50"}
1526
+ {"current_steps": 1526, "total_steps": 3906, "loss": 1.4001, "learning_rate": 2.7106123076020395e-05, "epoch": 0.390656, "percentage": 39.07, "elapsed_time": "5:36:22", "remaining_time": "8:44:36"}
1527
+ {"current_steps": 1527, "total_steps": 3906, "loss": 1.3776, "learning_rate": 2.7090928782684645e-05, "epoch": 0.390912, "percentage": 39.09, "elapsed_time": "5:36:35", "remaining_time": "8:44:23"}
1528
+ {"current_steps": 1528, "total_steps": 3906, "loss": 1.3806, "learning_rate": 2.707572980683423e-05, "epoch": 0.391168, "percentage": 39.12, "elapsed_time": "5:36:48", "remaining_time": "8:44:10"}
1529
+ {"current_steps": 1529, "total_steps": 3906, "loss": 1.3759, "learning_rate": 2.7060526158505842e-05, "epoch": 0.391424, "percentage": 39.14, "elapsed_time": "5:37:01", "remaining_time": "8:43:57"}
1530
+ {"current_steps": 1530, "total_steps": 3906, "loss": 1.388, "learning_rate": 2.7045317847739257e-05, "epoch": 0.39168, "percentage": 39.17, "elapsed_time": "5:37:14", "remaining_time": "8:43:43"}
1531
+ {"current_steps": 1531, "total_steps": 3906, "loss": 1.3558, "learning_rate": 2.7030104884577318e-05, "epoch": 0.391936, "percentage": 39.2, "elapsed_time": "5:37:28", "remaining_time": "8:43:30"}
1532
+ {"current_steps": 1532, "total_steps": 3906, "loss": 1.3405, "learning_rate": 2.7014887279065957e-05, "epoch": 0.392192, "percentage": 39.22, "elapsed_time": "5:37:41", "remaining_time": "8:43:17"}
1533
+ {"current_steps": 1533, "total_steps": 3906, "loss": 1.3942, "learning_rate": 2.6999665041254153e-05, "epoch": 0.392448, "percentage": 39.25, "elapsed_time": "5:37:54", "remaining_time": "8:43:03"}
1534
+ {"current_steps": 1534, "total_steps": 3906, "loss": 1.3786, "learning_rate": 2.6984438181193953e-05, "epoch": 0.392704, "percentage": 39.27, "elapsed_time": "5:38:07", "remaining_time": "8:42:50"}
1535
+ {"current_steps": 1535, "total_steps": 3906, "loss": 1.3364, "learning_rate": 2.696920670894046e-05, "epoch": 0.39296, "percentage": 39.3, "elapsed_time": "5:38:20", "remaining_time": "8:42:37"}
1536
+ {"current_steps": 1536, "total_steps": 3906, "loss": 1.405, "learning_rate": 2.6953970634551826e-05, "epoch": 0.393216, "percentage": 39.32, "elapsed_time": "5:38:34", "remaining_time": "8:42:23"}
1537
+ {"current_steps": 1537, "total_steps": 3906, "loss": 1.3948, "learning_rate": 2.693872996808922e-05, "epoch": 0.393472, "percentage": 39.35, "elapsed_time": "5:38:47", "remaining_time": "8:42:10"}
1538
+ {"current_steps": 1538, "total_steps": 3906, "loss": 1.4086, "learning_rate": 2.692348471961687e-05, "epoch": 0.393728, "percentage": 39.38, "elapsed_time": "5:39:00", "remaining_time": "8:41:57"}
1539
+ {"current_steps": 1539, "total_steps": 3906, "loss": 1.4199, "learning_rate": 2.6908234899202022e-05, "epoch": 0.393984, "percentage": 39.4, "elapsed_time": "5:39:13", "remaining_time": "8:41:44"}
1540
+ {"current_steps": 1540, "total_steps": 3906, "loss": 1.4126, "learning_rate": 2.6892980516914928e-05, "epoch": 0.39424, "percentage": 39.43, "elapsed_time": "5:39:26", "remaining_time": "8:41:30"}
1541
+ {"current_steps": 1541, "total_steps": 3906, "loss": 1.3923, "learning_rate": 2.6877721582828866e-05, "epoch": 0.394496, "percentage": 39.45, "elapsed_time": "5:39:40", "remaining_time": "8:41:17"}
1542
+ {"current_steps": 1542, "total_steps": 3906, "loss": 1.3315, "learning_rate": 2.686245810702011e-05, "epoch": 0.394752, "percentage": 39.48, "elapsed_time": "5:39:53", "remaining_time": "8:41:04"}
1543
+ {"current_steps": 1543, "total_steps": 3906, "loss": 1.4146, "learning_rate": 2.684719009956795e-05, "epoch": 0.395008, "percentage": 39.5, "elapsed_time": "5:40:06", "remaining_time": "8:40:51"}
1544
+ {"current_steps": 1544, "total_steps": 3906, "loss": 1.3387, "learning_rate": 2.683191757055465e-05, "epoch": 0.395264, "percentage": 39.53, "elapsed_time": "5:40:19", "remaining_time": "8:40:37"}
1545
+ {"current_steps": 1545, "total_steps": 3906, "loss": 1.3829, "learning_rate": 2.6816640530065473e-05, "epoch": 0.39552, "percentage": 39.55, "elapsed_time": "5:40:32", "remaining_time": "8:40:24"}
1546
+ {"current_steps": 1546, "total_steps": 3906, "loss": 1.3765, "learning_rate": 2.680135898818865e-05, "epoch": 0.395776, "percentage": 39.58, "elapsed_time": "5:40:46", "remaining_time": "8:40:11"}
1547
+ {"current_steps": 1547, "total_steps": 3906, "loss": 1.3892, "learning_rate": 2.6786072955015385e-05, "epoch": 0.396032, "percentage": 39.61, "elapsed_time": "5:40:59", "remaining_time": "8:39:57"}
1548
+ {"current_steps": 1548, "total_steps": 3906, "loss": 1.3874, "learning_rate": 2.6770782440639863e-05, "epoch": 0.396288, "percentage": 39.63, "elapsed_time": "5:41:12", "remaining_time": "8:39:44"}
1549
+ {"current_steps": 1549, "total_steps": 3906, "loss": 1.3757, "learning_rate": 2.675548745515922e-05, "epoch": 0.396544, "percentage": 39.66, "elapsed_time": "5:41:25", "remaining_time": "8:39:31"}
1550
+ {"current_steps": 1550, "total_steps": 3906, "loss": 1.3744, "learning_rate": 2.674018800867353e-05, "epoch": 0.3968, "percentage": 39.68, "elapsed_time": "5:41:38", "remaining_time": "8:39:17"}
1551
+ {"current_steps": 1551, "total_steps": 3906, "loss": 1.3824, "learning_rate": 2.6724884111285833e-05, "epoch": 0.397056, "percentage": 39.71, "elapsed_time": "5:41:51", "remaining_time": "8:39:04"}
1552
+ {"current_steps": 1552, "total_steps": 3906, "loss": 1.3769, "learning_rate": 2.67095757731021e-05, "epoch": 0.397312, "percentage": 39.73, "elapsed_time": "5:42:05", "remaining_time": "8:38:51"}
1553
+ {"current_steps": 1553, "total_steps": 3906, "loss": 1.3533, "learning_rate": 2.6694263004231233e-05, "epoch": 0.397568, "percentage": 39.76, "elapsed_time": "5:42:18", "remaining_time": "8:38:38"}
1554
+ {"current_steps": 1554, "total_steps": 3906, "loss": 1.4029, "learning_rate": 2.6678945814785064e-05, "epoch": 0.397824, "percentage": 39.78, "elapsed_time": "5:42:31", "remaining_time": "8:38:24"}
1555
+ {"current_steps": 1555, "total_steps": 3906, "loss": 1.3579, "learning_rate": 2.6663624214878346e-05, "epoch": 0.39808, "percentage": 39.81, "elapsed_time": "5:42:44", "remaining_time": "8:38:11"}
1556
+ {"current_steps": 1556, "total_steps": 3906, "loss": 1.3966, "learning_rate": 2.664829821462872e-05, "epoch": 0.398336, "percentage": 39.84, "elapsed_time": "5:42:57", "remaining_time": "8:37:58"}
1557
+ {"current_steps": 1557, "total_steps": 3906, "loss": 1.3776, "learning_rate": 2.6632967824156787e-05, "epoch": 0.398592, "percentage": 39.86, "elapsed_time": "5:43:10", "remaining_time": "8:37:44"}
1558
+ {"current_steps": 1558, "total_steps": 3906, "loss": 1.3969, "learning_rate": 2.6617633053585982e-05, "epoch": 0.398848, "percentage": 39.89, "elapsed_time": "5:43:24", "remaining_time": "8:37:31"}
1559
+ {"current_steps": 1559, "total_steps": 3906, "loss": 1.3499, "learning_rate": 2.660229391304268e-05, "epoch": 0.399104, "percentage": 39.91, "elapsed_time": "5:43:37", "remaining_time": "8:37:18"}
1560
+ {"current_steps": 1560, "total_steps": 3906, "loss": 1.3468, "learning_rate": 2.6586950412656123e-05, "epoch": 0.39936, "percentage": 39.94, "elapsed_time": "5:43:50", "remaining_time": "8:37:05"}
1561
+ {"current_steps": 1561, "total_steps": 3906, "loss": 1.371, "learning_rate": 2.6571602562558437e-05, "epoch": 0.399616, "percentage": 39.96, "elapsed_time": "5:44:03", "remaining_time": "8:36:51"}
1562
+ {"current_steps": 1562, "total_steps": 3906, "loss": 1.3778, "learning_rate": 2.6556250372884607e-05, "epoch": 0.399872, "percentage": 39.99, "elapsed_time": "5:44:16", "remaining_time": "8:36:38"}
1563
+ {"current_steps": 1563, "total_steps": 3906, "loss": 1.3992, "learning_rate": 2.6540893853772503e-05, "epoch": 0.400128, "percentage": 40.02, "elapsed_time": "5:44:30", "remaining_time": "8:36:25"}
1564
+ {"current_steps": 1564, "total_steps": 3906, "loss": 1.4196, "learning_rate": 2.6525533015362842e-05, "epoch": 0.400384, "percentage": 40.04, "elapsed_time": "5:44:43", "remaining_time": "8:36:12"}
1565
+ {"current_steps": 1565, "total_steps": 3906, "loss": 1.4068, "learning_rate": 2.65101678677992e-05, "epoch": 0.40064, "percentage": 40.07, "elapsed_time": "5:44:56", "remaining_time": "8:35:58"}
1566
+ {"current_steps": 1566, "total_steps": 3906, "loss": 1.3798, "learning_rate": 2.6494798421227998e-05, "epoch": 0.400896, "percentage": 40.09, "elapsed_time": "5:45:09", "remaining_time": "8:35:45"}
1567
+ {"current_steps": 1567, "total_steps": 3906, "loss": 1.3898, "learning_rate": 2.6479424685798486e-05, "epoch": 0.401152, "percentage": 40.12, "elapsed_time": "5:45:22", "remaining_time": "8:35:32"}
1568
+ {"current_steps": 1568, "total_steps": 3906, "loss": 1.4504, "learning_rate": 2.646404667166275e-05, "epoch": 0.401408, "percentage": 40.14, "elapsed_time": "5:45:36", "remaining_time": "8:35:18"}
1569
+ {"current_steps": 1569, "total_steps": 3906, "loss": 1.363, "learning_rate": 2.6448664388975715e-05, "epoch": 0.401664, "percentage": 40.17, "elapsed_time": "5:45:49", "remaining_time": "8:35:05"}
1570
+ {"current_steps": 1570, "total_steps": 3906, "loss": 1.3656, "learning_rate": 2.6433277847895112e-05, "epoch": 0.40192, "percentage": 40.19, "elapsed_time": "5:46:02", "remaining_time": "8:34:52"}
1571
+ {"current_steps": 1571, "total_steps": 3906, "loss": 1.4309, "learning_rate": 2.6417887058581477e-05, "epoch": 0.402176, "percentage": 40.22, "elapsed_time": "5:46:15", "remaining_time": "8:34:39"}
1572
+ {"current_steps": 1572, "total_steps": 3906, "loss": 1.3955, "learning_rate": 2.640249203119817e-05, "epoch": 0.402432, "percentage": 40.25, "elapsed_time": "5:46:28", "remaining_time": "8:34:25"}
1573
+ {"current_steps": 1573, "total_steps": 3906, "loss": 1.39, "learning_rate": 2.6387092775911346e-05, "epoch": 0.402688, "percentage": 40.27, "elapsed_time": "5:46:42", "remaining_time": "8:34:12"}
1574
+ {"current_steps": 1574, "total_steps": 3906, "loss": 1.3903, "learning_rate": 2.6371689302889932e-05, "epoch": 0.402944, "percentage": 40.3, "elapsed_time": "5:46:55", "remaining_time": "8:33:59"}
1575
+ {"current_steps": 1575, "total_steps": 3906, "loss": 1.3853, "learning_rate": 2.635628162230566e-05, "epoch": 0.4032, "percentage": 40.32, "elapsed_time": "5:47:08", "remaining_time": "8:33:46"}
1576
+ {"current_steps": 1576, "total_steps": 3906, "loss": 1.3685, "learning_rate": 2.634086974433304e-05, "epoch": 0.403456, "percentage": 40.35, "elapsed_time": "5:47:21", "remaining_time": "8:33:32"}
1577
+ {"current_steps": 1577, "total_steps": 3906, "loss": 1.3827, "learning_rate": 2.6325453679149345e-05, "epoch": 0.403712, "percentage": 40.37, "elapsed_time": "5:47:34", "remaining_time": "8:33:19"}
1578
+ {"current_steps": 1578, "total_steps": 3906, "loss": 1.3764, "learning_rate": 2.631003343693461e-05, "epoch": 0.403968, "percentage": 40.4, "elapsed_time": "5:47:48", "remaining_time": "8:33:06"}
1579
+ {"current_steps": 1579, "total_steps": 3906, "loss": 1.3928, "learning_rate": 2.629460902787165e-05, "epoch": 0.404224, "percentage": 40.42, "elapsed_time": "5:48:01", "remaining_time": "8:32:53"}
1580
+ {"current_steps": 1580, "total_steps": 3906, "loss": 1.3821, "learning_rate": 2.6279180462146007e-05, "epoch": 0.40448, "percentage": 40.45, "elapsed_time": "5:48:14", "remaining_time": "8:32:39"}
1581
+ {"current_steps": 1581, "total_steps": 3906, "loss": 1.3775, "learning_rate": 2.626374774994597e-05, "epoch": 0.404736, "percentage": 40.48, "elapsed_time": "5:48:27", "remaining_time": "8:32:26"}
1582
+ {"current_steps": 1582, "total_steps": 3906, "loss": 1.3775, "learning_rate": 2.624831090146259e-05, "epoch": 0.404992, "percentage": 40.5, "elapsed_time": "5:48:40", "remaining_time": "8:32:13"}
1583
+ {"current_steps": 1583, "total_steps": 3906, "loss": 1.3865, "learning_rate": 2.623286992688963e-05, "epoch": 0.405248, "percentage": 40.53, "elapsed_time": "5:48:53", "remaining_time": "8:31:59"}
1584
+ {"current_steps": 1584, "total_steps": 3906, "loss": 1.3765, "learning_rate": 2.6217424836423568e-05, "epoch": 0.405504, "percentage": 40.55, "elapsed_time": "5:49:07", "remaining_time": "8:31:46"}
1585
+ {"current_steps": 1585, "total_steps": 3906, "loss": 1.3837, "learning_rate": 2.620197564026363e-05, "epoch": 0.40576, "percentage": 40.58, "elapsed_time": "5:49:20", "remaining_time": "8:31:33"}
1586
+ {"current_steps": 1586, "total_steps": 3906, "loss": 1.3902, "learning_rate": 2.618652234861172e-05, "epoch": 0.406016, "percentage": 40.6, "elapsed_time": "5:49:33", "remaining_time": "8:31:19"}
1587
+ {"current_steps": 1587, "total_steps": 3906, "loss": 1.3846, "learning_rate": 2.617106497167247e-05, "epoch": 0.406272, "percentage": 40.63, "elapsed_time": "5:49:46", "remaining_time": "8:31:06"}
1588
+ {"current_steps": 1588, "total_steps": 3906, "loss": 1.4024, "learning_rate": 2.6155603519653204e-05, "epoch": 0.406528, "percentage": 40.66, "elapsed_time": "5:49:59", "remaining_time": "8:30:53"}
1589
+ {"current_steps": 1589, "total_steps": 3906, "loss": 1.3798, "learning_rate": 2.6140138002763934e-05, "epoch": 0.406784, "percentage": 40.68, "elapsed_time": "5:50:12", "remaining_time": "8:30:39"}
1590
+ {"current_steps": 1590, "total_steps": 3906, "loss": 1.3504, "learning_rate": 2.6124668431217348e-05, "epoch": 0.40704, "percentage": 40.71, "elapsed_time": "5:50:26", "remaining_time": "8:30:26"}
1591
+ {"current_steps": 1591, "total_steps": 3906, "loss": 1.4077, "learning_rate": 2.610919481522884e-05, "epoch": 0.407296, "percentage": 40.73, "elapsed_time": "5:50:39", "remaining_time": "8:30:13"}
1592
+ {"current_steps": 1592, "total_steps": 3906, "loss": 1.3901, "learning_rate": 2.6093717165016435e-05, "epoch": 0.407552, "percentage": 40.76, "elapsed_time": "5:50:52", "remaining_time": "8:30:00"}
1593
+ {"current_steps": 1593, "total_steps": 3906, "loss": 1.3998, "learning_rate": 2.6078235490800854e-05, "epoch": 0.407808, "percentage": 40.78, "elapsed_time": "5:51:05", "remaining_time": "8:29:46"}
1594
+ {"current_steps": 1594, "total_steps": 3906, "loss": 1.3429, "learning_rate": 2.606274980280547e-05, "epoch": 0.408064, "percentage": 40.81, "elapsed_time": "5:51:18", "remaining_time": "8:29:33"}
1595
+ {"current_steps": 1595, "total_steps": 3906, "loss": 1.3918, "learning_rate": 2.6047260111256285e-05, "epoch": 0.40832, "percentage": 40.83, "elapsed_time": "5:51:31", "remaining_time": "8:29:20"}
1596
+ {"current_steps": 1596, "total_steps": 3906, "loss": 1.3521, "learning_rate": 2.6031766426381966e-05, "epoch": 0.408576, "percentage": 40.86, "elapsed_time": "5:51:45", "remaining_time": "8:29:06"}
1597
+ {"current_steps": 1597, "total_steps": 3906, "loss": 1.3826, "learning_rate": 2.601626875841382e-05, "epoch": 0.408832, "percentage": 40.89, "elapsed_time": "5:51:58", "remaining_time": "8:28:53"}
1598
+ {"current_steps": 1598, "total_steps": 3906, "loss": 1.3647, "learning_rate": 2.6000767117585757e-05, "epoch": 0.409088, "percentage": 40.91, "elapsed_time": "5:52:11", "remaining_time": "8:28:40"}
1599
+ {"current_steps": 1599, "total_steps": 3906, "loss": 1.3888, "learning_rate": 2.598526151413435e-05, "epoch": 0.409344, "percentage": 40.94, "elapsed_time": "5:52:24", "remaining_time": "8:28:27"}
1600
+ {"current_steps": 1600, "total_steps": 3906, "loss": 1.3756, "learning_rate": 2.5969751958298757e-05, "epoch": 0.4096, "percentage": 40.96, "elapsed_time": "5:52:37", "remaining_time": "8:28:13"}
1601
+ {"current_steps": 1601, "total_steps": 3906, "loss": 1.3564, "learning_rate": 2.595423846032075e-05, "epoch": 0.409856, "percentage": 40.99, "elapsed_time": "5:53:08", "remaining_time": "8:28:26"}
1602
+ {"current_steps": 1602, "total_steps": 3906, "loss": 1.3446, "learning_rate": 2.593872103044472e-05, "epoch": 0.410112, "percentage": 41.01, "elapsed_time": "5:53:22", "remaining_time": "8:28:12"}
1603
+ {"current_steps": 1603, "total_steps": 3906, "loss": 1.4168, "learning_rate": 2.592319967891765e-05, "epoch": 0.410368, "percentage": 41.04, "elapsed_time": "5:53:35", "remaining_time": "8:27:59"}
1604
+ {"current_steps": 1604, "total_steps": 3906, "loss": 1.4139, "learning_rate": 2.5907674415989093e-05, "epoch": 0.410624, "percentage": 41.07, "elapsed_time": "5:53:48", "remaining_time": "8:27:46"}
1605
+ {"current_steps": 1605, "total_steps": 3906, "loss": 1.3831, "learning_rate": 2.5892145251911212e-05, "epoch": 0.41088, "percentage": 41.09, "elapsed_time": "5:54:01", "remaining_time": "8:27:33"}
1606
+ {"current_steps": 1606, "total_steps": 3906, "loss": 1.3645, "learning_rate": 2.5876612196938733e-05, "epoch": 0.411136, "percentage": 41.12, "elapsed_time": "5:54:14", "remaining_time": "8:27:19"}
1607
+ {"current_steps": 1607, "total_steps": 3906, "loss": 1.3982, "learning_rate": 2.586107526132894e-05, "epoch": 0.411392, "percentage": 41.14, "elapsed_time": "5:54:28", "remaining_time": "8:27:06"}
1608
+ {"current_steps": 1608, "total_steps": 3906, "loss": 1.3901, "learning_rate": 2.584553445534171e-05, "epoch": 0.411648, "percentage": 41.17, "elapsed_time": "5:54:41", "remaining_time": "8:26:53"}
1609
+ {"current_steps": 1609, "total_steps": 3906, "loss": 1.4044, "learning_rate": 2.5829989789239444e-05, "epoch": 0.411904, "percentage": 41.19, "elapsed_time": "5:54:54", "remaining_time": "8:26:39"}
1610
+ {"current_steps": 1610, "total_steps": 3906, "loss": 1.3526, "learning_rate": 2.5814441273287107e-05, "epoch": 0.41216, "percentage": 41.22, "elapsed_time": "5:55:07", "remaining_time": "8:26:26"}
1611
+ {"current_steps": 1611, "total_steps": 3906, "loss": 1.3944, "learning_rate": 2.5798888917752214e-05, "epoch": 0.412416, "percentage": 41.24, "elapsed_time": "5:55:20", "remaining_time": "8:26:13"}
1612
+ {"current_steps": 1612, "total_steps": 3906, "loss": 1.374, "learning_rate": 2.5783332732904804e-05, "epoch": 0.412672, "percentage": 41.27, "elapsed_time": "5:55:34", "remaining_time": "8:26:00"}