SKNahin commited on
Commit
6404de3
1 Parent(s): 44c4bce

Training in progress, step 2400

Browse files
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd537c093919489f9a1e66f9c98b5be0ca4df2f0212dcf0cf24cb248eedeb35a
3
  size 4988025760
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8c77cf17dea767cc4f7b498feab491b3b874d62d162959417c8fbe05f28a498
3
  size 4988025760
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0a6e4517c3c68803e809227a19afe812d00f20c5215c95f45853dba6989b698
3
  size 240691728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4977dad605682261de9a7688a772be6b3079114c51773ba52d2180f8ddc74279
3
  size 240691728
trainer_log.jsonl CHANGED
@@ -2010,3 +2010,404 @@
2010
  {"current_steps": 2010, "total_steps": 3906, "loss": 1.3442, "learning_rate": 1.9398751085377947e-05, "epoch": 0.51456, "percentage": 51.46, "elapsed_time": "7:23:19", "remaining_time": "6:58:11"}
2011
  {"current_steps": 2011, "total_steps": 3906, "loss": 1.3587, "learning_rate": 1.9382506212096314e-05, "epoch": 0.514816, "percentage": 51.48, "elapsed_time": "7:23:33", "remaining_time": "6:57:58"}
2012
  {"current_steps": 2012, "total_steps": 3906, "loss": 1.3568, "learning_rate": 1.9366261746578436e-05, "epoch": 0.515072, "percentage": 51.51, "elapsed_time": "7:23:46", "remaining_time": "6:57:44"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2010
  {"current_steps": 2010, "total_steps": 3906, "loss": 1.3442, "learning_rate": 1.9398751085377947e-05, "epoch": 0.51456, "percentage": 51.46, "elapsed_time": "7:23:19", "remaining_time": "6:58:11"}
2011
  {"current_steps": 2011, "total_steps": 3906, "loss": 1.3587, "learning_rate": 1.9382506212096314e-05, "epoch": 0.514816, "percentage": 51.48, "elapsed_time": "7:23:33", "remaining_time": "6:57:58"}
2012
  {"current_steps": 2012, "total_steps": 3906, "loss": 1.3568, "learning_rate": 1.9366261746578436e-05, "epoch": 0.515072, "percentage": 51.51, "elapsed_time": "7:23:46", "remaining_time": "6:57:44"}
2013
+ {"current_steps": 2013, "total_steps": 3906, "loss": 1.3751, "learning_rate": 1.9350017699551388e-05, "epoch": 0.515328, "percentage": 51.54, "elapsed_time": "7:23:59", "remaining_time": "6:57:31"}
2014
+ {"current_steps": 2014, "total_steps": 3906, "loss": 1.3767, "learning_rate": 1.9333774081741966e-05, "epoch": 0.515584, "percentage": 51.56, "elapsed_time": "7:24:12", "remaining_time": "6:57:18"}
2015
+ {"current_steps": 2015, "total_steps": 3906, "loss": 1.3392, "learning_rate": 1.9317530903876693e-05, "epoch": 0.51584, "percentage": 51.59, "elapsed_time": "7:24:25", "remaining_time": "6:57:04"}
2016
+ {"current_steps": 2016, "total_steps": 3906, "loss": 1.3351, "learning_rate": 1.9301288176681804e-05, "epoch": 0.516096, "percentage": 51.61, "elapsed_time": "7:24:39", "remaining_time": "6:56:51"}
2017
+ {"current_steps": 2017, "total_steps": 3906, "loss": 1.36, "learning_rate": 1.9285045910883215e-05, "epoch": 0.516352, "percentage": 51.64, "elapsed_time": "7:24:52", "remaining_time": "6:56:38"}
2018
+ {"current_steps": 2018, "total_steps": 3906, "loss": 1.3456, "learning_rate": 1.926880411720656e-05, "epoch": 0.516608, "percentage": 51.66, "elapsed_time": "7:25:05", "remaining_time": "6:56:25"}
2019
+ {"current_steps": 2019, "total_steps": 3906, "loss": 1.3694, "learning_rate": 1.9252562806377157e-05, "epoch": 0.516864, "percentage": 51.69, "elapsed_time": "7:25:18", "remaining_time": "6:56:11"}
2020
+ {"current_steps": 2020, "total_steps": 3906, "loss": 1.3526, "learning_rate": 1.923632198911999e-05, "epoch": 0.51712, "percentage": 51.72, "elapsed_time": "7:25:32", "remaining_time": "6:55:58"}
2021
+ {"current_steps": 2021, "total_steps": 3906, "loss": 1.3277, "learning_rate": 1.9220081676159734e-05, "epoch": 0.517376, "percentage": 51.74, "elapsed_time": "7:25:45", "remaining_time": "6:55:45"}
2022
+ {"current_steps": 2022, "total_steps": 3906, "loss": 1.3522, "learning_rate": 1.920384187822073e-05, "epoch": 0.517632, "percentage": 51.77, "elapsed_time": "7:25:58", "remaining_time": "6:55:32"}
2023
+ {"current_steps": 2023, "total_steps": 3906, "loss": 1.35, "learning_rate": 1.9187602606026962e-05, "epoch": 0.517888, "percentage": 51.79, "elapsed_time": "7:26:11", "remaining_time": "6:55:18"}
2024
+ {"current_steps": 2024, "total_steps": 3906, "loss": 1.305, "learning_rate": 1.917136387030209e-05, "epoch": 0.518144, "percentage": 51.82, "elapsed_time": "7:26:24", "remaining_time": "6:55:05"}
2025
+ {"current_steps": 2025, "total_steps": 3906, "loss": 1.3668, "learning_rate": 1.915512568176941e-05, "epoch": 0.5184, "percentage": 51.84, "elapsed_time": "7:26:37", "remaining_time": "6:54:52"}
2026
+ {"current_steps": 2026, "total_steps": 3906, "loss": 1.3753, "learning_rate": 1.9138888051151843e-05, "epoch": 0.518656, "percentage": 51.87, "elapsed_time": "7:26:51", "remaining_time": "6:54:39"}
2027
+ {"current_steps": 2027, "total_steps": 3906, "loss": 1.3586, "learning_rate": 1.9122650989171963e-05, "epoch": 0.518912, "percentage": 51.89, "elapsed_time": "7:27:04", "remaining_time": "6:54:25"}
2028
+ {"current_steps": 2028, "total_steps": 3906, "loss": 1.3504, "learning_rate": 1.9106414506551953e-05, "epoch": 0.519168, "percentage": 51.92, "elapsed_time": "7:27:17", "remaining_time": "6:54:12"}
2029
+ {"current_steps": 2029, "total_steps": 3906, "loss": 1.3402, "learning_rate": 1.9090178614013623e-05, "epoch": 0.519424, "percentage": 51.95, "elapsed_time": "7:27:30", "remaining_time": "6:53:59"}
2030
+ {"current_steps": 2030, "total_steps": 3906, "loss": 1.3564, "learning_rate": 1.9073943322278392e-05, "epoch": 0.51968, "percentage": 51.97, "elapsed_time": "7:27:43", "remaining_time": "6:53:46"}
2031
+ {"current_steps": 2031, "total_steps": 3906, "loss": 1.3531, "learning_rate": 1.905770864206729e-05, "epoch": 0.519936, "percentage": 52.0, "elapsed_time": "7:27:57", "remaining_time": "6:53:32"}
2032
+ {"current_steps": 2032, "total_steps": 3906, "loss": 1.3843, "learning_rate": 1.9041474584100906e-05, "epoch": 0.520192, "percentage": 52.02, "elapsed_time": "7:28:10", "remaining_time": "6:53:19"}
2033
+ {"current_steps": 2033, "total_steps": 3906, "loss": 1.3479, "learning_rate": 1.9025241159099473e-05, "epoch": 0.520448, "percentage": 52.05, "elapsed_time": "7:28:23", "remaining_time": "6:53:06"}
2034
+ {"current_steps": 2034, "total_steps": 3906, "loss": 1.3615, "learning_rate": 1.900900837778276e-05, "epoch": 0.520704, "percentage": 52.07, "elapsed_time": "7:28:36", "remaining_time": "6:52:52"}
2035
+ {"current_steps": 2035, "total_steps": 3906, "loss": 1.3461, "learning_rate": 1.899277625087014e-05, "epoch": 0.52096, "percentage": 52.1, "elapsed_time": "7:28:49", "remaining_time": "6:52:39"}
2036
+ {"current_steps": 2036, "total_steps": 3906, "loss": 1.3601, "learning_rate": 1.897654478908054e-05, "epoch": 0.521216, "percentage": 52.12, "elapsed_time": "7:29:03", "remaining_time": "6:52:26"}
2037
+ {"current_steps": 2037, "total_steps": 3906, "loss": 1.3343, "learning_rate": 1.8960314003132454e-05, "epoch": 0.521472, "percentage": 52.15, "elapsed_time": "7:29:16", "remaining_time": "6:52:13"}
2038
+ {"current_steps": 2038, "total_steps": 3906, "loss": 1.4035, "learning_rate": 1.8944083903743925e-05, "epoch": 0.521728, "percentage": 52.18, "elapsed_time": "7:29:29", "remaining_time": "6:51:59"}
2039
+ {"current_steps": 2039, "total_steps": 3906, "loss": 1.3427, "learning_rate": 1.8927854501632545e-05, "epoch": 0.521984, "percentage": 52.2, "elapsed_time": "7:29:42", "remaining_time": "6:51:46"}
2040
+ {"current_steps": 2040, "total_steps": 3906, "loss": 1.3646, "learning_rate": 1.891162580751544e-05, "epoch": 0.52224, "percentage": 52.23, "elapsed_time": "7:29:55", "remaining_time": "6:51:33"}
2041
+ {"current_steps": 2041, "total_steps": 3906, "loss": 1.3281, "learning_rate": 1.8895397832109278e-05, "epoch": 0.522496, "percentage": 52.25, "elapsed_time": "7:30:09", "remaining_time": "6:51:19"}
2042
+ {"current_steps": 2042, "total_steps": 3906, "loss": 1.3353, "learning_rate": 1.887917058613025e-05, "epoch": 0.522752, "percentage": 52.28, "elapsed_time": "7:30:22", "remaining_time": "6:51:06"}
2043
+ {"current_steps": 2043, "total_steps": 3906, "loss": 1.3523, "learning_rate": 1.8862944080294064e-05, "epoch": 0.523008, "percentage": 52.3, "elapsed_time": "7:30:35", "remaining_time": "6:50:53"}
2044
+ {"current_steps": 2044, "total_steps": 3906, "loss": 1.3524, "learning_rate": 1.8846718325315932e-05, "epoch": 0.523264, "percentage": 52.33, "elapsed_time": "7:30:48", "remaining_time": "6:50:40"}
2045
+ {"current_steps": 2045, "total_steps": 3906, "loss": 1.3624, "learning_rate": 1.8830493331910585e-05, "epoch": 0.52352, "percentage": 52.36, "elapsed_time": "7:31:01", "remaining_time": "6:50:26"}
2046
+ {"current_steps": 2046, "total_steps": 3906, "loss": 1.3303, "learning_rate": 1.881426911079223e-05, "epoch": 0.523776, "percentage": 52.38, "elapsed_time": "7:31:15", "remaining_time": "6:50:13"}
2047
+ {"current_steps": 2047, "total_steps": 3906, "loss": 1.3459, "learning_rate": 1.879804567267459e-05, "epoch": 0.524032, "percentage": 52.41, "elapsed_time": "7:31:28", "remaining_time": "6:50:00"}
2048
+ {"current_steps": 2048, "total_steps": 3906, "loss": 1.4168, "learning_rate": 1.878182302827085e-05, "epoch": 0.524288, "percentage": 52.43, "elapsed_time": "7:31:41", "remaining_time": "6:49:47"}
2049
+ {"current_steps": 2049, "total_steps": 3906, "loss": 1.3732, "learning_rate": 1.8765601188293684e-05, "epoch": 0.524544, "percentage": 52.46, "elapsed_time": "7:31:54", "remaining_time": "6:49:33"}
2050
+ {"current_steps": 2050, "total_steps": 3906, "loss": 1.3402, "learning_rate": 1.8749380163455233e-05, "epoch": 0.5248, "percentage": 52.48, "elapsed_time": "7:32:07", "remaining_time": "6:49:20"}
2051
+ {"current_steps": 2051, "total_steps": 3906, "loss": 1.331, "learning_rate": 1.873315996446708e-05, "epoch": 0.525056, "percentage": 52.51, "elapsed_time": "7:32:20", "remaining_time": "6:49:07"}
2052
+ {"current_steps": 2052, "total_steps": 3906, "loss": 1.3486, "learning_rate": 1.8716940602040288e-05, "epoch": 0.525312, "percentage": 52.53, "elapsed_time": "7:32:34", "remaining_time": "6:48:54"}
2053
+ {"current_steps": 2053, "total_steps": 3906, "loss": 1.3656, "learning_rate": 1.8700722086885362e-05, "epoch": 0.525568, "percentage": 52.56, "elapsed_time": "7:32:47", "remaining_time": "6:48:40"}
2054
+ {"current_steps": 2054, "total_steps": 3906, "loss": 1.3516, "learning_rate": 1.8684504429712243e-05, "epoch": 0.525824, "percentage": 52.59, "elapsed_time": "7:33:00", "remaining_time": "6:48:27"}
2055
+ {"current_steps": 2055, "total_steps": 3906, "loss": 1.3475, "learning_rate": 1.8668287641230297e-05, "epoch": 0.52608, "percentage": 52.61, "elapsed_time": "7:33:13", "remaining_time": "6:48:14"}
2056
+ {"current_steps": 2056, "total_steps": 3906, "loss": 1.3993, "learning_rate": 1.865207173214835e-05, "epoch": 0.526336, "percentage": 52.64, "elapsed_time": "7:33:26", "remaining_time": "6:48:00"}
2057
+ {"current_steps": 2057, "total_steps": 3906, "loss": 1.3511, "learning_rate": 1.863585671317459e-05, "epoch": 0.526592, "percentage": 52.66, "elapsed_time": "7:33:40", "remaining_time": "6:47:47"}
2058
+ {"current_steps": 2058, "total_steps": 3906, "loss": 1.4097, "learning_rate": 1.8619642595016666e-05, "epoch": 0.526848, "percentage": 52.69, "elapsed_time": "7:33:53", "remaining_time": "6:47:34"}
2059
+ {"current_steps": 2059, "total_steps": 3906, "loss": 1.3908, "learning_rate": 1.8603429388381616e-05, "epoch": 0.527104, "percentage": 52.71, "elapsed_time": "7:34:06", "remaining_time": "6:47:21"}
2060
+ {"current_steps": 2060, "total_steps": 3906, "loss": 1.3498, "learning_rate": 1.8587217103975883e-05, "epoch": 0.52736, "percentage": 52.74, "elapsed_time": "7:34:19", "remaining_time": "6:47:07"}
2061
+ {"current_steps": 2061, "total_steps": 3906, "loss": 1.3535, "learning_rate": 1.8571005752505283e-05, "epoch": 0.527616, "percentage": 52.76, "elapsed_time": "7:34:32", "remaining_time": "6:46:54"}
2062
+ {"current_steps": 2062, "total_steps": 3906, "loss": 1.3504, "learning_rate": 1.855479534467504e-05, "epoch": 0.527872, "percentage": 52.79, "elapsed_time": "7:34:46", "remaining_time": "6:46:41"}
2063
+ {"current_steps": 2063, "total_steps": 3906, "loss": 1.3613, "learning_rate": 1.8538585891189728e-05, "epoch": 0.528128, "percentage": 52.82, "elapsed_time": "7:34:59", "remaining_time": "6:46:28"}
2064
+ {"current_steps": 2064, "total_steps": 3906, "loss": 1.3569, "learning_rate": 1.852237740275331e-05, "epoch": 0.528384, "percentage": 52.84, "elapsed_time": "7:35:12", "remaining_time": "6:46:14"}
2065
+ {"current_steps": 2065, "total_steps": 3906, "loss": 1.3432, "learning_rate": 1.8506169890069107e-05, "epoch": 0.52864, "percentage": 52.87, "elapsed_time": "7:35:25", "remaining_time": "6:46:01"}
2066
+ {"current_steps": 2066, "total_steps": 3906, "loss": 1.3722, "learning_rate": 1.84899633638398e-05, "epoch": 0.528896, "percentage": 52.89, "elapsed_time": "7:35:38", "remaining_time": "6:45:48"}
2067
+ {"current_steps": 2067, "total_steps": 3906, "loss": 1.3679, "learning_rate": 1.8473757834767407e-05, "epoch": 0.529152, "percentage": 52.92, "elapsed_time": "7:35:52", "remaining_time": "6:45:35"}
2068
+ {"current_steps": 2068, "total_steps": 3906, "loss": 1.3502, "learning_rate": 1.8457553313553307e-05, "epoch": 0.529408, "percentage": 52.94, "elapsed_time": "7:36:05", "remaining_time": "6:45:21"}
2069
+ {"current_steps": 2069, "total_steps": 3906, "loss": 1.343, "learning_rate": 1.8441349810898183e-05, "epoch": 0.529664, "percentage": 52.97, "elapsed_time": "7:36:18", "remaining_time": "6:45:08"}
2070
+ {"current_steps": 2070, "total_steps": 3906, "loss": 1.3621, "learning_rate": 1.842514733750207e-05, "epoch": 0.52992, "percentage": 53.0, "elapsed_time": "7:36:31", "remaining_time": "6:44:55"}
2071
+ {"current_steps": 2071, "total_steps": 3906, "loss": 1.3442, "learning_rate": 1.8408945904064318e-05, "epoch": 0.530176, "percentage": 53.02, "elapsed_time": "7:36:44", "remaining_time": "6:44:41"}
2072
+ {"current_steps": 2072, "total_steps": 3906, "loss": 1.3835, "learning_rate": 1.8392745521283595e-05, "epoch": 0.530432, "percentage": 53.05, "elapsed_time": "7:36:58", "remaining_time": "6:44:28"}
2073
+ {"current_steps": 2073, "total_steps": 3906, "loss": 1.3116, "learning_rate": 1.8376546199857863e-05, "epoch": 0.530688, "percentage": 53.07, "elapsed_time": "7:37:11", "remaining_time": "6:44:15"}
2074
+ {"current_steps": 2074, "total_steps": 3906, "loss": 1.371, "learning_rate": 1.8360347950484394e-05, "epoch": 0.530944, "percentage": 53.1, "elapsed_time": "7:37:24", "remaining_time": "6:44:02"}
2075
+ {"current_steps": 2075, "total_steps": 3906, "loss": 1.4056, "learning_rate": 1.8344150783859735e-05, "epoch": 0.5312, "percentage": 53.12, "elapsed_time": "7:37:37", "remaining_time": "6:43:48"}
2076
+ {"current_steps": 2076, "total_steps": 3906, "loss": 1.3839, "learning_rate": 1.832795471067974e-05, "epoch": 0.531456, "percentage": 53.15, "elapsed_time": "7:37:50", "remaining_time": "6:43:35"}
2077
+ {"current_steps": 2077, "total_steps": 3906, "loss": 1.3924, "learning_rate": 1.8311759741639532e-05, "epoch": 0.531712, "percentage": 53.17, "elapsed_time": "7:38:03", "remaining_time": "6:43:22"}
2078
+ {"current_steps": 2078, "total_steps": 3906, "loss": 1.3829, "learning_rate": 1.82955658874335e-05, "epoch": 0.531968, "percentage": 53.2, "elapsed_time": "7:38:17", "remaining_time": "6:43:09"}
2079
+ {"current_steps": 2079, "total_steps": 3906, "loss": 1.3909, "learning_rate": 1.8279373158755302e-05, "epoch": 0.532224, "percentage": 53.23, "elapsed_time": "7:38:30", "remaining_time": "6:42:55"}
2080
+ {"current_steps": 2080, "total_steps": 3906, "loss": 1.3399, "learning_rate": 1.826318156629786e-05, "epoch": 0.53248, "percentage": 53.25, "elapsed_time": "7:38:43", "remaining_time": "6:42:42"}
2081
+ {"current_steps": 2081, "total_steps": 3906, "loss": 1.3282, "learning_rate": 1.824699112075332e-05, "epoch": 0.532736, "percentage": 53.28, "elapsed_time": "7:38:56", "remaining_time": "6:42:29"}
2082
+ {"current_steps": 2082, "total_steps": 3906, "loss": 1.3958, "learning_rate": 1.8230801832813098e-05, "epoch": 0.532992, "percentage": 53.3, "elapsed_time": "7:39:09", "remaining_time": "6:42:15"}
2083
+ {"current_steps": 2083, "total_steps": 3906, "loss": 1.3397, "learning_rate": 1.821461371316784e-05, "epoch": 0.533248, "percentage": 53.33, "elapsed_time": "7:39:23", "remaining_time": "6:42:02"}
2084
+ {"current_steps": 2084, "total_steps": 3906, "loss": 1.3969, "learning_rate": 1.8198426772507403e-05, "epoch": 0.533504, "percentage": 53.35, "elapsed_time": "7:39:36", "remaining_time": "6:41:49"}
2085
+ {"current_steps": 2085, "total_steps": 3906, "loss": 1.3497, "learning_rate": 1.8182241021520894e-05, "epoch": 0.53376, "percentage": 53.38, "elapsed_time": "7:39:49", "remaining_time": "6:41:36"}
2086
+ {"current_steps": 2086, "total_steps": 3906, "loss": 1.3405, "learning_rate": 1.816605647089662e-05, "epoch": 0.534016, "percentage": 53.41, "elapsed_time": "7:40:02", "remaining_time": "6:41:22"}
2087
+ {"current_steps": 2087, "total_steps": 3906, "loss": 1.3528, "learning_rate": 1.8149873131322074e-05, "epoch": 0.534272, "percentage": 53.43, "elapsed_time": "7:40:15", "remaining_time": "6:41:09"}
2088
+ {"current_steps": 2088, "total_steps": 3906, "loss": 1.3704, "learning_rate": 1.813369101348398e-05, "epoch": 0.534528, "percentage": 53.46, "elapsed_time": "7:40:28", "remaining_time": "6:40:56"}
2089
+ {"current_steps": 2089, "total_steps": 3906, "loss": 1.3744, "learning_rate": 1.8117510128068256e-05, "epoch": 0.534784, "percentage": 53.48, "elapsed_time": "7:40:42", "remaining_time": "6:40:42"}
2090
+ {"current_steps": 2090, "total_steps": 3906, "loss": 1.3815, "learning_rate": 1.810133048575998e-05, "epoch": 0.53504, "percentage": 53.51, "elapsed_time": "7:40:55", "remaining_time": "6:40:29"}
2091
+ {"current_steps": 2091, "total_steps": 3906, "loss": 1.3317, "learning_rate": 1.8085152097243427e-05, "epoch": 0.535296, "percentage": 53.53, "elapsed_time": "7:41:08", "remaining_time": "6:40:16"}
2092
+ {"current_steps": 2092, "total_steps": 3906, "loss": 1.3553, "learning_rate": 1.8068974973202054e-05, "epoch": 0.535552, "percentage": 53.56, "elapsed_time": "7:41:21", "remaining_time": "6:40:03"}
2093
+ {"current_steps": 2093, "total_steps": 3906, "loss": 1.3624, "learning_rate": 1.805279912431845e-05, "epoch": 0.535808, "percentage": 53.58, "elapsed_time": "7:41:34", "remaining_time": "6:39:49"}
2094
+ {"current_steps": 2094, "total_steps": 3906, "loss": 1.3477, "learning_rate": 1.803662456127439e-05, "epoch": 0.536064, "percentage": 53.61, "elapsed_time": "7:41:48", "remaining_time": "6:39:36"}
2095
+ {"current_steps": 2095, "total_steps": 3906, "loss": 1.3367, "learning_rate": 1.8020451294750803e-05, "epoch": 0.53632, "percentage": 53.64, "elapsed_time": "7:42:01", "remaining_time": "6:39:23"}
2096
+ {"current_steps": 2096, "total_steps": 3906, "loss": 1.3699, "learning_rate": 1.8004279335427736e-05, "epoch": 0.536576, "percentage": 53.66, "elapsed_time": "7:42:14", "remaining_time": "6:39:10"}
2097
+ {"current_steps": 2097, "total_steps": 3906, "loss": 1.3528, "learning_rate": 1.798810869398439e-05, "epoch": 0.536832, "percentage": 53.69, "elapsed_time": "7:42:27", "remaining_time": "6:38:56"}
2098
+ {"current_steps": 2098, "total_steps": 3906, "loss": 1.3731, "learning_rate": 1.7971939381099096e-05, "epoch": 0.537088, "percentage": 53.71, "elapsed_time": "7:42:40", "remaining_time": "6:38:43"}
2099
+ {"current_steps": 2099, "total_steps": 3906, "loss": 1.3312, "learning_rate": 1.7955771407449318e-05, "epoch": 0.537344, "percentage": 53.74, "elapsed_time": "7:42:54", "remaining_time": "6:38:30"}
2100
+ {"current_steps": 2100, "total_steps": 3906, "loss": 1.3421, "learning_rate": 1.7939604783711604e-05, "epoch": 0.5376, "percentage": 53.76, "elapsed_time": "7:43:07", "remaining_time": "6:38:17"}
2101
+ {"current_steps": 2101, "total_steps": 3906, "loss": 1.4153, "learning_rate": 1.7923439520561633e-05, "epoch": 0.537856, "percentage": 53.79, "elapsed_time": "7:43:20", "remaining_time": "6:38:03"}
2102
+ {"current_steps": 2102, "total_steps": 3906, "loss": 1.376, "learning_rate": 1.790727562867418e-05, "epoch": 0.538112, "percentage": 53.81, "elapsed_time": "7:43:33", "remaining_time": "6:37:50"}
2103
+ {"current_steps": 2103, "total_steps": 3906, "loss": 1.3764, "learning_rate": 1.7891113118723124e-05, "epoch": 0.538368, "percentage": 53.84, "elapsed_time": "7:43:46", "remaining_time": "6:37:37"}
2104
+ {"current_steps": 2104, "total_steps": 3906, "loss": 1.3311, "learning_rate": 1.7874952001381422e-05, "epoch": 0.538624, "percentage": 53.87, "elapsed_time": "7:44:00", "remaining_time": "6:37:24"}
2105
+ {"current_steps": 2105, "total_steps": 3906, "loss": 1.3523, "learning_rate": 1.7858792287321115e-05, "epoch": 0.53888, "percentage": 53.89, "elapsed_time": "7:44:13", "remaining_time": "6:37:10"}
2106
+ {"current_steps": 2106, "total_steps": 3906, "loss": 1.3881, "learning_rate": 1.7842633987213306e-05, "epoch": 0.539136, "percentage": 53.92, "elapsed_time": "7:44:26", "remaining_time": "6:36:57"}
2107
+ {"current_steps": 2107, "total_steps": 3906, "loss": 1.3757, "learning_rate": 1.782647711172818e-05, "epoch": 0.539392, "percentage": 53.94, "elapsed_time": "7:44:39", "remaining_time": "6:36:44"}
2108
+ {"current_steps": 2108, "total_steps": 3906, "loss": 1.3342, "learning_rate": 1.781032167153497e-05, "epoch": 0.539648, "percentage": 53.97, "elapsed_time": "7:44:52", "remaining_time": "6:36:30"}
2109
+ {"current_steps": 2109, "total_steps": 3906, "loss": 1.3521, "learning_rate": 1.779416767730197e-05, "epoch": 0.539904, "percentage": 53.99, "elapsed_time": "7:45:06", "remaining_time": "6:36:17"}
2110
+ {"current_steps": 2110, "total_steps": 3906, "loss": 1.3714, "learning_rate": 1.7778015139696522e-05, "epoch": 0.54016, "percentage": 54.02, "elapsed_time": "7:45:19", "remaining_time": "6:36:04"}
2111
+ {"current_steps": 2111, "total_steps": 3906, "loss": 1.3271, "learning_rate": 1.776186406938499e-05, "epoch": 0.540416, "percentage": 54.05, "elapsed_time": "7:45:32", "remaining_time": "6:35:51"}
2112
+ {"current_steps": 2112, "total_steps": 3906, "loss": 1.3768, "learning_rate": 1.7745714477032785e-05, "epoch": 0.540672, "percentage": 54.07, "elapsed_time": "7:45:45", "remaining_time": "6:35:37"}
2113
+ {"current_steps": 2113, "total_steps": 3906, "loss": 1.3495, "learning_rate": 1.7729566373304324e-05, "epoch": 0.540928, "percentage": 54.1, "elapsed_time": "7:45:58", "remaining_time": "6:35:24"}
2114
+ {"current_steps": 2114, "total_steps": 3906, "loss": 1.3245, "learning_rate": 1.7713419768863062e-05, "epoch": 0.541184, "percentage": 54.12, "elapsed_time": "7:46:12", "remaining_time": "6:35:11"}
2115
+ {"current_steps": 2115, "total_steps": 3906, "loss": 1.3773, "learning_rate": 1.769727467437145e-05, "epoch": 0.54144, "percentage": 54.15, "elapsed_time": "7:46:25", "remaining_time": "6:34:58"}
2116
+ {"current_steps": 2116, "total_steps": 3906, "loss": 1.3765, "learning_rate": 1.768113110049096e-05, "epoch": 0.541696, "percentage": 54.17, "elapsed_time": "7:46:38", "remaining_time": "6:34:44"}
2117
+ {"current_steps": 2117, "total_steps": 3906, "loss": 1.3747, "learning_rate": 1.7664989057882028e-05, "epoch": 0.541952, "percentage": 54.2, "elapsed_time": "7:46:51", "remaining_time": "6:34:31"}
2118
+ {"current_steps": 2118, "total_steps": 3906, "loss": 1.36, "learning_rate": 1.7648848557204108e-05, "epoch": 0.542208, "percentage": 54.22, "elapsed_time": "7:47:04", "remaining_time": "6:34:18"}
2119
+ {"current_steps": 2119, "total_steps": 3906, "loss": 1.3599, "learning_rate": 1.7632709609115615e-05, "epoch": 0.542464, "percentage": 54.25, "elapsed_time": "7:47:17", "remaining_time": "6:34:05"}
2120
+ {"current_steps": 2120, "total_steps": 3906, "loss": 1.3774, "learning_rate": 1.7616572224273955e-05, "epoch": 0.54272, "percentage": 54.28, "elapsed_time": "7:47:31", "remaining_time": "6:33:51"}
2121
+ {"current_steps": 2121, "total_steps": 3906, "loss": 1.3385, "learning_rate": 1.7600436413335497e-05, "epoch": 0.542976, "percentage": 54.3, "elapsed_time": "7:47:44", "remaining_time": "6:33:38"}
2122
+ {"current_steps": 2122, "total_steps": 3906, "loss": 1.3637, "learning_rate": 1.7584302186955566e-05, "epoch": 0.543232, "percentage": 54.33, "elapsed_time": "7:47:57", "remaining_time": "6:33:25"}
2123
+ {"current_steps": 2123, "total_steps": 3906, "loss": 1.3277, "learning_rate": 1.7568169555788452e-05, "epoch": 0.543488, "percentage": 54.35, "elapsed_time": "7:48:10", "remaining_time": "6:33:11"}
2124
+ {"current_steps": 2124, "total_steps": 3906, "loss": 1.3606, "learning_rate": 1.7552038530487365e-05, "epoch": 0.543744, "percentage": 54.38, "elapsed_time": "7:48:23", "remaining_time": "6:32:58"}
2125
+ {"current_steps": 2125, "total_steps": 3906, "loss": 1.3797, "learning_rate": 1.7535909121704483e-05, "epoch": 0.544, "percentage": 54.4, "elapsed_time": "7:48:37", "remaining_time": "6:32:45"}
2126
+ {"current_steps": 2126, "total_steps": 3906, "loss": 1.3541, "learning_rate": 1.7519781340090907e-05, "epoch": 0.544256, "percentage": 54.43, "elapsed_time": "7:48:50", "remaining_time": "6:32:32"}
2127
+ {"current_steps": 2127, "total_steps": 3906, "loss": 1.3499, "learning_rate": 1.7503655196296663e-05, "epoch": 0.544512, "percentage": 54.45, "elapsed_time": "7:49:03", "remaining_time": "6:32:18"}
2128
+ {"current_steps": 2128, "total_steps": 3906, "loss": 1.3275, "learning_rate": 1.7487530700970695e-05, "epoch": 0.544768, "percentage": 54.48, "elapsed_time": "7:49:16", "remaining_time": "6:32:05"}
2129
+ {"current_steps": 2129, "total_steps": 3906, "loss": 1.3549, "learning_rate": 1.7471407864760865e-05, "epoch": 0.545024, "percentage": 54.51, "elapsed_time": "7:49:29", "remaining_time": "6:31:52"}
2130
+ {"current_steps": 2130, "total_steps": 3906, "loss": 1.336, "learning_rate": 1.7455286698313915e-05, "epoch": 0.54528, "percentage": 54.53, "elapsed_time": "7:49:43", "remaining_time": "6:31:39"}
2131
+ {"current_steps": 2131, "total_steps": 3906, "loss": 1.3661, "learning_rate": 1.7439167212275513e-05, "epoch": 0.545536, "percentage": 54.56, "elapsed_time": "7:49:56", "remaining_time": "6:31:25"}
2132
+ {"current_steps": 2132, "total_steps": 3906, "loss": 1.369, "learning_rate": 1.742304941729021e-05, "epoch": 0.545792, "percentage": 54.58, "elapsed_time": "7:50:09", "remaining_time": "6:31:12"}
2133
+ {"current_steps": 2133, "total_steps": 3906, "loss": 1.3936, "learning_rate": 1.7406933324001434e-05, "epoch": 0.546048, "percentage": 54.61, "elapsed_time": "7:50:22", "remaining_time": "6:30:59"}
2134
+ {"current_steps": 2134, "total_steps": 3906, "loss": 1.3731, "learning_rate": 1.739081894305149e-05, "epoch": 0.546304, "percentage": 54.63, "elapsed_time": "7:50:35", "remaining_time": "6:30:46"}
2135
+ {"current_steps": 2135, "total_steps": 3906, "loss": 1.3835, "learning_rate": 1.737470628508156e-05, "epoch": 0.54656, "percentage": 54.66, "elapsed_time": "7:50:49", "remaining_time": "6:30:32"}
2136
+ {"current_steps": 2136, "total_steps": 3906, "loss": 1.3355, "learning_rate": 1.7358595360731677e-05, "epoch": 0.546816, "percentage": 54.69, "elapsed_time": "7:51:02", "remaining_time": "6:30:19"}
2137
+ {"current_steps": 2137, "total_steps": 3906, "loss": 1.3516, "learning_rate": 1.7342486180640734e-05, "epoch": 0.547072, "percentage": 54.71, "elapsed_time": "7:51:15", "remaining_time": "6:30:06"}
2138
+ {"current_steps": 2138, "total_steps": 3906, "loss": 1.3693, "learning_rate": 1.7326378755446477e-05, "epoch": 0.547328, "percentage": 54.74, "elapsed_time": "7:51:28", "remaining_time": "6:29:53"}
2139
+ {"current_steps": 2139, "total_steps": 3906, "loss": 1.3627, "learning_rate": 1.7310273095785493e-05, "epoch": 0.547584, "percentage": 54.76, "elapsed_time": "7:51:41", "remaining_time": "6:29:39"}
2140
+ {"current_steps": 2140, "total_steps": 3906, "loss": 1.3267, "learning_rate": 1.729416921229319e-05, "epoch": 0.54784, "percentage": 54.79, "elapsed_time": "7:51:55", "remaining_time": "6:29:26"}
2141
+ {"current_steps": 2141, "total_steps": 3906, "loss": 1.3315, "learning_rate": 1.727806711560383e-05, "epoch": 0.548096, "percentage": 54.81, "elapsed_time": "7:52:08", "remaining_time": "6:29:13"}
2142
+ {"current_steps": 2142, "total_steps": 3906, "loss": 1.356, "learning_rate": 1.726196681635045e-05, "epoch": 0.548352, "percentage": 54.84, "elapsed_time": "7:52:21", "remaining_time": "6:29:00"}
2143
+ {"current_steps": 2143, "total_steps": 3906, "loss": 1.3255, "learning_rate": 1.724586832516495e-05, "epoch": 0.548608, "percentage": 54.86, "elapsed_time": "7:52:34", "remaining_time": "6:28:46"}
2144
+ {"current_steps": 2144, "total_steps": 3906, "loss": 1.3442, "learning_rate": 1.7229771652678e-05, "epoch": 0.548864, "percentage": 54.89, "elapsed_time": "7:52:47", "remaining_time": "6:28:33"}
2145
+ {"current_steps": 2145, "total_steps": 3906, "loss": 1.391, "learning_rate": 1.7213676809519097e-05, "epoch": 0.54912, "percentage": 54.92, "elapsed_time": "7:53:01", "remaining_time": "6:28:20"}
2146
+ {"current_steps": 2146, "total_steps": 3906, "loss": 1.4232, "learning_rate": 1.7197583806316503e-05, "epoch": 0.549376, "percentage": 54.94, "elapsed_time": "7:53:14", "remaining_time": "6:28:06"}
2147
+ {"current_steps": 2147, "total_steps": 3906, "loss": 1.3693, "learning_rate": 1.7181492653697294e-05, "epoch": 0.549632, "percentage": 54.97, "elapsed_time": "7:53:27", "remaining_time": "6:27:53"}
2148
+ {"current_steps": 2148, "total_steps": 3906, "loss": 1.3803, "learning_rate": 1.7165403362287282e-05, "epoch": 0.549888, "percentage": 54.99, "elapsed_time": "7:53:40", "remaining_time": "6:27:40"}
2149
+ {"current_steps": 2149, "total_steps": 3906, "loss": 1.3494, "learning_rate": 1.7149315942711095e-05, "epoch": 0.550144, "percentage": 55.02, "elapsed_time": "7:53:53", "remaining_time": "6:27:27"}
2150
+ {"current_steps": 2150, "total_steps": 3906, "loss": 1.3613, "learning_rate": 1.7133230405592104e-05, "epoch": 0.5504, "percentage": 55.04, "elapsed_time": "7:54:07", "remaining_time": "6:27:13"}
2151
+ {"current_steps": 2151, "total_steps": 3906, "loss": 1.3612, "learning_rate": 1.7117146761552427e-05, "epoch": 0.550656, "percentage": 55.07, "elapsed_time": "7:54:20", "remaining_time": "6:27:00"}
2152
+ {"current_steps": 2152, "total_steps": 3906, "loss": 1.3333, "learning_rate": 1.7101065021212953e-05, "epoch": 0.550912, "percentage": 55.09, "elapsed_time": "7:54:33", "remaining_time": "6:26:47"}
2153
+ {"current_steps": 2153, "total_steps": 3906, "loss": 1.3175, "learning_rate": 1.7084985195193314e-05, "epoch": 0.551168, "percentage": 55.12, "elapsed_time": "7:54:46", "remaining_time": "6:26:34"}
2154
+ {"current_steps": 2154, "total_steps": 3906, "loss": 1.3723, "learning_rate": 1.7068907294111846e-05, "epoch": 0.551424, "percentage": 55.15, "elapsed_time": "7:54:59", "remaining_time": "6:26:20"}
2155
+ {"current_steps": 2155, "total_steps": 3906, "loss": 1.3116, "learning_rate": 1.7052831328585644e-05, "epoch": 0.55168, "percentage": 55.17, "elapsed_time": "7:55:12", "remaining_time": "6:26:07"}
2156
+ {"current_steps": 2156, "total_steps": 3906, "loss": 1.3333, "learning_rate": 1.7036757309230528e-05, "epoch": 0.551936, "percentage": 55.2, "elapsed_time": "7:55:26", "remaining_time": "6:25:54"}
2157
+ {"current_steps": 2157, "total_steps": 3906, "loss": 1.3806, "learning_rate": 1.7020685246661005e-05, "epoch": 0.552192, "percentage": 55.22, "elapsed_time": "7:55:39", "remaining_time": "6:25:41"}
2158
+ {"current_steps": 2158, "total_steps": 3906, "loss": 1.3389, "learning_rate": 1.7004615151490315e-05, "epoch": 0.552448, "percentage": 55.25, "elapsed_time": "7:55:52", "remaining_time": "6:25:27"}
2159
+ {"current_steps": 2159, "total_steps": 3906, "loss": 1.3684, "learning_rate": 1.6988547034330398e-05, "epoch": 0.552704, "percentage": 55.27, "elapsed_time": "7:56:05", "remaining_time": "6:25:14"}
2160
+ {"current_steps": 2160, "total_steps": 3906, "loss": 1.4162, "learning_rate": 1.6972480905791866e-05, "epoch": 0.55296, "percentage": 55.3, "elapsed_time": "7:56:18", "remaining_time": "6:25:01"}
2161
+ {"current_steps": 2161, "total_steps": 3906, "loss": 1.3494, "learning_rate": 1.6956416776484033e-05, "epoch": 0.553216, "percentage": 55.33, "elapsed_time": "7:56:32", "remaining_time": "6:24:48"}
2162
+ {"current_steps": 2162, "total_steps": 3906, "loss": 1.3229, "learning_rate": 1.6940354657014904e-05, "epoch": 0.553472, "percentage": 55.35, "elapsed_time": "7:56:45", "remaining_time": "6:24:34"}
2163
+ {"current_steps": 2163, "total_steps": 3906, "loss": 1.365, "learning_rate": 1.6924294557991133e-05, "epoch": 0.553728, "percentage": 55.38, "elapsed_time": "7:56:58", "remaining_time": "6:24:21"}
2164
+ {"current_steps": 2164, "total_steps": 3906, "loss": 1.3528, "learning_rate": 1.6908236490018057e-05, "epoch": 0.553984, "percentage": 55.4, "elapsed_time": "7:57:11", "remaining_time": "6:24:08"}
2165
+ {"current_steps": 2165, "total_steps": 3906, "loss": 1.3367, "learning_rate": 1.6892180463699662e-05, "epoch": 0.55424, "percentage": 55.43, "elapsed_time": "7:57:24", "remaining_time": "6:23:54"}
2166
+ {"current_steps": 2166, "total_steps": 3906, "loss": 1.3526, "learning_rate": 1.68761264896386e-05, "epoch": 0.554496, "percentage": 55.45, "elapsed_time": "7:57:37", "remaining_time": "6:23:41"}
2167
+ {"current_steps": 2167, "total_steps": 3906, "loss": 1.3682, "learning_rate": 1.6860074578436144e-05, "epoch": 0.554752, "percentage": 55.48, "elapsed_time": "7:57:51", "remaining_time": "6:23:28"}
2168
+ {"current_steps": 2168, "total_steps": 3906, "loss": 1.3064, "learning_rate": 1.6844024740692225e-05, "epoch": 0.555008, "percentage": 55.5, "elapsed_time": "7:58:04", "remaining_time": "6:23:15"}
2169
+ {"current_steps": 2169, "total_steps": 3906, "loss": 1.3327, "learning_rate": 1.6827976987005396e-05, "epoch": 0.555264, "percentage": 55.53, "elapsed_time": "7:58:17", "remaining_time": "6:23:01"}
2170
+ {"current_steps": 2170, "total_steps": 3906, "loss": 1.3625, "learning_rate": 1.681193132797284e-05, "epoch": 0.55552, "percentage": 55.56, "elapsed_time": "7:58:30", "remaining_time": "6:22:48"}
2171
+ {"current_steps": 2171, "total_steps": 3906, "loss": 1.3689, "learning_rate": 1.6795887774190347e-05, "epoch": 0.555776, "percentage": 55.58, "elapsed_time": "7:58:43", "remaining_time": "6:22:35"}
2172
+ {"current_steps": 2172, "total_steps": 3906, "loss": 1.401, "learning_rate": 1.6779846336252338e-05, "epoch": 0.556032, "percentage": 55.61, "elapsed_time": "7:58:57", "remaining_time": "6:22:22"}
2173
+ {"current_steps": 2173, "total_steps": 3906, "loss": 1.3743, "learning_rate": 1.6763807024751803e-05, "epoch": 0.556288, "percentage": 55.63, "elapsed_time": "7:59:10", "remaining_time": "6:22:08"}
2174
+ {"current_steps": 2174, "total_steps": 3906, "loss": 1.363, "learning_rate": 1.6747769850280347e-05, "epoch": 0.556544, "percentage": 55.66, "elapsed_time": "7:59:23", "remaining_time": "6:21:55"}
2175
+ {"current_steps": 2175, "total_steps": 3906, "loss": 1.3428, "learning_rate": 1.6731734823428173e-05, "epoch": 0.5568, "percentage": 55.68, "elapsed_time": "7:59:36", "remaining_time": "6:21:42"}
2176
+ {"current_steps": 2176, "total_steps": 3906, "loss": 1.3512, "learning_rate": 1.671570195478405e-05, "epoch": 0.557056, "percentage": 55.71, "elapsed_time": "7:59:49", "remaining_time": "6:21:29"}
2177
+ {"current_steps": 2177, "total_steps": 3906, "loss": 1.3465, "learning_rate": 1.6699671254935327e-05, "epoch": 0.557312, "percentage": 55.73, "elapsed_time": "8:00:03", "remaining_time": "6:21:15"}
2178
+ {"current_steps": 2178, "total_steps": 3906, "loss": 1.3848, "learning_rate": 1.668364273446794e-05, "epoch": 0.557568, "percentage": 55.76, "elapsed_time": "8:00:16", "remaining_time": "6:21:02"}
2179
+ {"current_steps": 2179, "total_steps": 3906, "loss": 1.3168, "learning_rate": 1.6667616403966336e-05, "epoch": 0.557824, "percentage": 55.79, "elapsed_time": "8:00:29", "remaining_time": "6:20:49"}
2180
+ {"current_steps": 2180, "total_steps": 3906, "loss": 1.3396, "learning_rate": 1.6651592274013566e-05, "epoch": 0.55808, "percentage": 55.81, "elapsed_time": "8:00:42", "remaining_time": "6:20:35"}
2181
+ {"current_steps": 2181, "total_steps": 3906, "loss": 1.3504, "learning_rate": 1.6635570355191203e-05, "epoch": 0.558336, "percentage": 55.84, "elapsed_time": "8:00:55", "remaining_time": "6:20:22"}
2182
+ {"current_steps": 2182, "total_steps": 3906, "loss": 1.3529, "learning_rate": 1.6619550658079367e-05, "epoch": 0.558592, "percentage": 55.86, "elapsed_time": "8:01:08", "remaining_time": "6:20:09"}
2183
+ {"current_steps": 2183, "total_steps": 3906, "loss": 1.382, "learning_rate": 1.660353319325672e-05, "epoch": 0.558848, "percentage": 55.89, "elapsed_time": "8:01:22", "remaining_time": "6:19:56"}
2184
+ {"current_steps": 2184, "total_steps": 3906, "loss": 1.3172, "learning_rate": 1.6587517971300426e-05, "epoch": 0.559104, "percentage": 55.91, "elapsed_time": "8:01:35", "remaining_time": "6:19:42"}
2185
+ {"current_steps": 2185, "total_steps": 3906, "loss": 1.3763, "learning_rate": 1.657150500278619e-05, "epoch": 0.55936, "percentage": 55.94, "elapsed_time": "8:01:48", "remaining_time": "6:19:29"}
2186
+ {"current_steps": 2186, "total_steps": 3906, "loss": 1.3703, "learning_rate": 1.6555494298288214e-05, "epoch": 0.559616, "percentage": 55.97, "elapsed_time": "8:02:01", "remaining_time": "6:19:16"}
2187
+ {"current_steps": 2187, "total_steps": 3906, "loss": 1.331, "learning_rate": 1.653948586837921e-05, "epoch": 0.559872, "percentage": 55.99, "elapsed_time": "8:02:14", "remaining_time": "6:19:03"}
2188
+ {"current_steps": 2188, "total_steps": 3906, "loss": 1.3676, "learning_rate": 1.6523479723630395e-05, "epoch": 0.560128, "percentage": 56.02, "elapsed_time": "8:02:28", "remaining_time": "6:18:49"}
2189
+ {"current_steps": 2189, "total_steps": 3906, "loss": 1.3251, "learning_rate": 1.650747587461148e-05, "epoch": 0.560384, "percentage": 56.04, "elapsed_time": "8:02:41", "remaining_time": "6:18:36"}
2190
+ {"current_steps": 2190, "total_steps": 3906, "loss": 1.3768, "learning_rate": 1.6491474331890635e-05, "epoch": 0.56064, "percentage": 56.07, "elapsed_time": "8:02:54", "remaining_time": "6:18:23"}
2191
+ {"current_steps": 2191, "total_steps": 3906, "loss": 1.3708, "learning_rate": 1.6475475106034532e-05, "epoch": 0.560896, "percentage": 56.09, "elapsed_time": "8:03:07", "remaining_time": "6:18:10"}
2192
+ {"current_steps": 2192, "total_steps": 3906, "loss": 1.3586, "learning_rate": 1.64594782076083e-05, "epoch": 0.561152, "percentage": 56.12, "elapsed_time": "8:03:20", "remaining_time": "6:17:56"}
2193
+ {"current_steps": 2193, "total_steps": 3906, "loss": 1.367, "learning_rate": 1.6443483647175543e-05, "epoch": 0.561408, "percentage": 56.14, "elapsed_time": "8:03:34", "remaining_time": "6:17:43"}
2194
+ {"current_steps": 2194, "total_steps": 3906, "loss": 1.3716, "learning_rate": 1.6427491435298302e-05, "epoch": 0.561664, "percentage": 56.17, "elapsed_time": "8:03:47", "remaining_time": "6:17:30"}
2195
+ {"current_steps": 2195, "total_steps": 3906, "loss": 1.328, "learning_rate": 1.6411501582537094e-05, "epoch": 0.56192, "percentage": 56.2, "elapsed_time": "8:04:00", "remaining_time": "6:17:16"}
2196
+ {"current_steps": 2196, "total_steps": 3906, "loss": 1.379, "learning_rate": 1.639551409945086e-05, "epoch": 0.562176, "percentage": 56.22, "elapsed_time": "8:04:13", "remaining_time": "6:17:03"}
2197
+ {"current_steps": 2197, "total_steps": 3906, "loss": 1.3494, "learning_rate": 1.6379528996596968e-05, "epoch": 0.562432, "percentage": 56.25, "elapsed_time": "8:04:26", "remaining_time": "6:16:50"}
2198
+ {"current_steps": 2198, "total_steps": 3906, "loss": 1.3327, "learning_rate": 1.6363546284531228e-05, "epoch": 0.562688, "percentage": 56.27, "elapsed_time": "8:04:40", "remaining_time": "6:16:37"}
2199
+ {"current_steps": 2199, "total_steps": 3906, "loss": 1.3932, "learning_rate": 1.6347565973807874e-05, "epoch": 0.562944, "percentage": 56.3, "elapsed_time": "8:04:53", "remaining_time": "6:16:23"}
2200
+ {"current_steps": 2200, "total_steps": 3906, "loss": 1.3683, "learning_rate": 1.6331588074979548e-05, "epoch": 0.5632, "percentage": 56.32, "elapsed_time": "8:05:06", "remaining_time": "6:16:10"}
2201
+ {"current_steps": 2201, "total_steps": 3906, "loss": 1.321, "learning_rate": 1.6315612598597303e-05, "epoch": 0.563456, "percentage": 56.35, "elapsed_time": "8:05:19", "remaining_time": "6:15:57"}
2202
+ {"current_steps": 2202, "total_steps": 3906, "loss": 1.4058, "learning_rate": 1.629963955521059e-05, "epoch": 0.563712, "percentage": 56.37, "elapsed_time": "8:05:32", "remaining_time": "6:15:44"}
2203
+ {"current_steps": 2203, "total_steps": 3906, "loss": 1.3838, "learning_rate": 1.6283668955367242e-05, "epoch": 0.563968, "percentage": 56.4, "elapsed_time": "8:05:46", "remaining_time": "6:15:31"}
2204
+ {"current_steps": 2204, "total_steps": 3906, "loss": 1.3624, "learning_rate": 1.6267700809613495e-05, "epoch": 0.564224, "percentage": 56.43, "elapsed_time": "8:05:59", "remaining_time": "6:15:17"}
2205
+ {"current_steps": 2205, "total_steps": 3906, "loss": 1.381, "learning_rate": 1.625173512849396e-05, "epoch": 0.56448, "percentage": 56.45, "elapsed_time": "8:06:12", "remaining_time": "6:15:04"}
2206
+ {"current_steps": 2206, "total_steps": 3906, "loss": 1.3357, "learning_rate": 1.6235771922551625e-05, "epoch": 0.564736, "percentage": 56.48, "elapsed_time": "8:06:25", "remaining_time": "6:14:51"}
2207
+ {"current_steps": 2207, "total_steps": 3906, "loss": 1.3705, "learning_rate": 1.6219811202327823e-05, "epoch": 0.564992, "percentage": 56.5, "elapsed_time": "8:06:38", "remaining_time": "6:14:38"}
2208
+ {"current_steps": 2208, "total_steps": 3906, "loss": 1.3923, "learning_rate": 1.6203852978362283e-05, "epoch": 0.565248, "percentage": 56.53, "elapsed_time": "8:06:52", "remaining_time": "6:14:24"}
2209
+ {"current_steps": 2209, "total_steps": 3906, "loss": 1.3149, "learning_rate": 1.618789726119304e-05, "epoch": 0.565504, "percentage": 56.55, "elapsed_time": "8:07:05", "remaining_time": "6:14:11"}
2210
+ {"current_steps": 2210, "total_steps": 3906, "loss": 1.3817, "learning_rate": 1.6171944061356502e-05, "epoch": 0.56576, "percentage": 56.58, "elapsed_time": "8:07:18", "remaining_time": "6:13:58"}
2211
+ {"current_steps": 2211, "total_steps": 3906, "loss": 1.3732, "learning_rate": 1.6155993389387416e-05, "epoch": 0.566016, "percentage": 56.61, "elapsed_time": "8:07:31", "remaining_time": "6:13:44"}
2212
+ {"current_steps": 2212, "total_steps": 3906, "loss": 1.33, "learning_rate": 1.6140045255818852e-05, "epoch": 0.566272, "percentage": 56.63, "elapsed_time": "8:07:44", "remaining_time": "6:13:31"}
2213
+ {"current_steps": 2213, "total_steps": 3906, "loss": 1.3505, "learning_rate": 1.61240996711822e-05, "epoch": 0.566528, "percentage": 56.66, "elapsed_time": "8:07:58", "remaining_time": "6:13:18"}
2214
+ {"current_steps": 2214, "total_steps": 3906, "loss": 1.3703, "learning_rate": 1.610815664600718e-05, "epoch": 0.566784, "percentage": 56.68, "elapsed_time": "8:08:11", "remaining_time": "6:13:05"}
2215
+ {"current_steps": 2215, "total_steps": 3906, "loss": 1.3803, "learning_rate": 1.6092216190821797e-05, "epoch": 0.56704, "percentage": 56.71, "elapsed_time": "8:08:24", "remaining_time": "6:12:51"}
2216
+ {"current_steps": 2216, "total_steps": 3906, "loss": 1.3786, "learning_rate": 1.6076278316152385e-05, "epoch": 0.567296, "percentage": 56.73, "elapsed_time": "8:08:37", "remaining_time": "6:12:38"}
2217
+ {"current_steps": 2217, "total_steps": 3906, "loss": 1.3512, "learning_rate": 1.6060343032523565e-05, "epoch": 0.567552, "percentage": 56.76, "elapsed_time": "8:08:50", "remaining_time": "6:12:25"}
2218
+ {"current_steps": 2218, "total_steps": 3906, "loss": 1.3677, "learning_rate": 1.604441035045825e-05, "epoch": 0.567808, "percentage": 56.78, "elapsed_time": "8:09:04", "remaining_time": "6:12:12"}
2219
+ {"current_steps": 2219, "total_steps": 3906, "loss": 1.3184, "learning_rate": 1.6028480280477623e-05, "epoch": 0.568064, "percentage": 56.81, "elapsed_time": "8:09:17", "remaining_time": "6:11:58"}
2220
+ {"current_steps": 2220, "total_steps": 3906, "loss": 1.3418, "learning_rate": 1.601255283310116e-05, "epoch": 0.56832, "percentage": 56.84, "elapsed_time": "8:09:30", "remaining_time": "6:11:45"}
2221
+ {"current_steps": 2221, "total_steps": 3906, "loss": 1.3196, "learning_rate": 1.5996628018846583e-05, "epoch": 0.568576, "percentage": 56.86, "elapsed_time": "8:09:43", "remaining_time": "6:11:32"}
2222
+ {"current_steps": 2222, "total_steps": 3906, "loss": 1.3615, "learning_rate": 1.598070584822989e-05, "epoch": 0.568832, "percentage": 56.89, "elapsed_time": "8:09:56", "remaining_time": "6:11:19"}
2223
+ {"current_steps": 2223, "total_steps": 3906, "loss": 1.3322, "learning_rate": 1.5964786331765338e-05, "epoch": 0.569088, "percentage": 56.91, "elapsed_time": "8:10:09", "remaining_time": "6:11:05"}
2224
+ {"current_steps": 2224, "total_steps": 3906, "loss": 1.3349, "learning_rate": 1.5948869479965427e-05, "epoch": 0.569344, "percentage": 56.94, "elapsed_time": "8:10:23", "remaining_time": "6:10:52"}
2225
+ {"current_steps": 2225, "total_steps": 3906, "loss": 1.3141, "learning_rate": 1.593295530334088e-05, "epoch": 0.5696, "percentage": 56.96, "elapsed_time": "8:10:36", "remaining_time": "6:10:39"}
2226
+ {"current_steps": 2226, "total_steps": 3906, "loss": 1.4244, "learning_rate": 1.5917043812400675e-05, "epoch": 0.569856, "percentage": 56.99, "elapsed_time": "8:10:49", "remaining_time": "6:10:26"}
2227
+ {"current_steps": 2227, "total_steps": 3906, "loss": 1.3505, "learning_rate": 1.5901135017652026e-05, "epoch": 0.570112, "percentage": 57.01, "elapsed_time": "8:11:02", "remaining_time": "6:10:12"}
2228
+ {"current_steps": 2228, "total_steps": 3906, "loss": 1.3875, "learning_rate": 1.588522892960032e-05, "epoch": 0.570368, "percentage": 57.04, "elapsed_time": "8:11:16", "remaining_time": "6:09:59"}
2229
+ {"current_steps": 2229, "total_steps": 3906, "loss": 1.3402, "learning_rate": 1.5869325558749213e-05, "epoch": 0.570624, "percentage": 57.07, "elapsed_time": "8:11:29", "remaining_time": "6:09:46"}
2230
+ {"current_steps": 2230, "total_steps": 3906, "loss": 1.3343, "learning_rate": 1.585342491560052e-05, "epoch": 0.57088, "percentage": 57.09, "elapsed_time": "8:11:42", "remaining_time": "6:09:33"}
2231
+ {"current_steps": 2231, "total_steps": 3906, "loss": 1.3379, "learning_rate": 1.5837527010654288e-05, "epoch": 0.571136, "percentage": 57.12, "elapsed_time": "8:11:55", "remaining_time": "6:09:19"}
2232
+ {"current_steps": 2232, "total_steps": 3906, "loss": 1.3892, "learning_rate": 1.5821631854408737e-05, "epoch": 0.571392, "percentage": 57.14, "elapsed_time": "8:12:08", "remaining_time": "6:09:06"}
2233
+ {"current_steps": 2233, "total_steps": 3906, "loss": 1.3419, "learning_rate": 1.580573945736029e-05, "epoch": 0.571648, "percentage": 57.17, "elapsed_time": "8:12:22", "remaining_time": "6:08:53"}
2234
+ {"current_steps": 2234, "total_steps": 3906, "loss": 1.3713, "learning_rate": 1.578984983000352e-05, "epoch": 0.571904, "percentage": 57.19, "elapsed_time": "8:12:35", "remaining_time": "6:08:40"}
2235
+ {"current_steps": 2235, "total_steps": 3906, "loss": 1.3715, "learning_rate": 1.5773962982831195e-05, "epoch": 0.57216, "percentage": 57.22, "elapsed_time": "8:12:48", "remaining_time": "6:08:26"}
2236
+ {"current_steps": 2236, "total_steps": 3906, "loss": 1.3236, "learning_rate": 1.575807892633423e-05, "epoch": 0.572416, "percentage": 57.25, "elapsed_time": "8:13:01", "remaining_time": "6:08:13"}
2237
+ {"current_steps": 2237, "total_steps": 3906, "loss": 1.3278, "learning_rate": 1.5742197671001718e-05, "epoch": 0.572672, "percentage": 57.27, "elapsed_time": "8:13:14", "remaining_time": "6:08:00"}
2238
+ {"current_steps": 2238, "total_steps": 3906, "loss": 1.2887, "learning_rate": 1.5726319227320886e-05, "epoch": 0.572928, "percentage": 57.3, "elapsed_time": "8:13:28", "remaining_time": "6:07:47"}
2239
+ {"current_steps": 2239, "total_steps": 3906, "loss": 1.3717, "learning_rate": 1.5710443605777116e-05, "epoch": 0.573184, "percentage": 57.32, "elapsed_time": "8:13:41", "remaining_time": "6:07:33"}
2240
+ {"current_steps": 2240, "total_steps": 3906, "loss": 1.3713, "learning_rate": 1.56945708168539e-05, "epoch": 0.57344, "percentage": 57.35, "elapsed_time": "8:13:54", "remaining_time": "6:07:20"}
2241
+ {"current_steps": 2241, "total_steps": 3906, "loss": 1.3657, "learning_rate": 1.5678700871032897e-05, "epoch": 0.573696, "percentage": 57.37, "elapsed_time": "8:14:07", "remaining_time": "6:07:07"}
2242
+ {"current_steps": 2242, "total_steps": 3906, "loss": 1.3797, "learning_rate": 1.566283377879386e-05, "epoch": 0.573952, "percentage": 57.4, "elapsed_time": "8:14:20", "remaining_time": "6:06:54"}
2243
+ {"current_steps": 2243, "total_steps": 3906, "loss": 1.3173, "learning_rate": 1.5646969550614668e-05, "epoch": 0.574208, "percentage": 57.42, "elapsed_time": "8:14:33", "remaining_time": "6:06:40"}
2244
+ {"current_steps": 2244, "total_steps": 3906, "loss": 1.367, "learning_rate": 1.5631108196971314e-05, "epoch": 0.574464, "percentage": 57.45, "elapsed_time": "8:14:47", "remaining_time": "6:06:27"}
2245
+ {"current_steps": 2245, "total_steps": 3906, "loss": 1.3432, "learning_rate": 1.561524972833789e-05, "epoch": 0.57472, "percentage": 57.48, "elapsed_time": "8:15:00", "remaining_time": "6:06:14"}
2246
+ {"current_steps": 2246, "total_steps": 3906, "loss": 1.3482, "learning_rate": 1.5599394155186572e-05, "epoch": 0.574976, "percentage": 57.5, "elapsed_time": "8:15:13", "remaining_time": "6:06:01"}
2247
+ {"current_steps": 2247, "total_steps": 3906, "loss": 1.3893, "learning_rate": 1.5583541487987634e-05, "epoch": 0.575232, "percentage": 57.53, "elapsed_time": "8:15:26", "remaining_time": "6:05:47"}
2248
+ {"current_steps": 2248, "total_steps": 3906, "loss": 1.355, "learning_rate": 1.5567691737209426e-05, "epoch": 0.575488, "percentage": 57.55, "elapsed_time": "8:15:39", "remaining_time": "6:05:34"}
2249
+ {"current_steps": 2249, "total_steps": 3906, "loss": 1.3098, "learning_rate": 1.5551844913318384e-05, "epoch": 0.575744, "percentage": 57.58, "elapsed_time": "8:15:53", "remaining_time": "6:05:21"}
2250
+ {"current_steps": 2250, "total_steps": 3906, "loss": 1.3581, "learning_rate": 1.5536001026778995e-05, "epoch": 0.576, "percentage": 57.6, "elapsed_time": "8:16:06", "remaining_time": "6:05:07"}
2251
+ {"current_steps": 2251, "total_steps": 3906, "loss": 1.3517, "learning_rate": 1.5520160088053823e-05, "epoch": 0.576256, "percentage": 57.63, "elapsed_time": "8:16:19", "remaining_time": "6:04:54"}
2252
+ {"current_steps": 2252, "total_steps": 3906, "loss": 1.355, "learning_rate": 1.5504322107603468e-05, "epoch": 0.576512, "percentage": 57.65, "elapsed_time": "8:16:32", "remaining_time": "6:04:41"}
2253
+ {"current_steps": 2253, "total_steps": 3906, "loss": 1.3108, "learning_rate": 1.5488487095886583e-05, "epoch": 0.576768, "percentage": 57.68, "elapsed_time": "8:16:45", "remaining_time": "6:04:28"}
2254
+ {"current_steps": 2254, "total_steps": 3906, "loss": 1.3729, "learning_rate": 1.5472655063359866e-05, "epoch": 0.577024, "percentage": 57.71, "elapsed_time": "8:16:58", "remaining_time": "6:04:14"}
2255
+ {"current_steps": 2255, "total_steps": 3906, "loss": 1.3094, "learning_rate": 1.545682602047804e-05, "epoch": 0.57728, "percentage": 57.73, "elapsed_time": "8:17:12", "remaining_time": "6:04:01"}
2256
+ {"current_steps": 2256, "total_steps": 3906, "loss": 1.3735, "learning_rate": 1.544099997769387e-05, "epoch": 0.577536, "percentage": 57.76, "elapsed_time": "8:17:25", "remaining_time": "6:03:48"}
2257
+ {"current_steps": 2257, "total_steps": 3906, "loss": 1.3552, "learning_rate": 1.5425176945458115e-05, "epoch": 0.577792, "percentage": 57.78, "elapsed_time": "8:17:38", "remaining_time": "6:03:35"}
2258
+ {"current_steps": 2258, "total_steps": 3906, "loss": 1.3407, "learning_rate": 1.5409356934219565e-05, "epoch": 0.578048, "percentage": 57.81, "elapsed_time": "8:17:51", "remaining_time": "6:03:21"}
2259
+ {"current_steps": 2259, "total_steps": 3906, "loss": 1.3326, "learning_rate": 1.5393539954425003e-05, "epoch": 0.578304, "percentage": 57.83, "elapsed_time": "8:18:04", "remaining_time": "6:03:08"}
2260
+ {"current_steps": 2260, "total_steps": 3906, "loss": 1.3641, "learning_rate": 1.5377726016519217e-05, "epoch": 0.57856, "percentage": 57.86, "elapsed_time": "8:18:18", "remaining_time": "6:02:55"}
2261
+ {"current_steps": 2261, "total_steps": 3906, "loss": 1.3214, "learning_rate": 1.5361915130944992e-05, "epoch": 0.578816, "percentage": 57.89, "elapsed_time": "8:18:31", "remaining_time": "6:02:42"}
2262
+ {"current_steps": 2262, "total_steps": 3906, "loss": 1.3015, "learning_rate": 1.5346107308143086e-05, "epoch": 0.579072, "percentage": 57.91, "elapsed_time": "8:18:44", "remaining_time": "6:02:28"}
2263
+ {"current_steps": 2263, "total_steps": 3906, "loss": 1.3588, "learning_rate": 1.533030255855224e-05, "epoch": 0.579328, "percentage": 57.94, "elapsed_time": "8:18:57", "remaining_time": "6:02:15"}
2264
+ {"current_steps": 2264, "total_steps": 3906, "loss": 1.3524, "learning_rate": 1.5314500892609165e-05, "epoch": 0.579584, "percentage": 57.96, "elapsed_time": "8:19:10", "remaining_time": "6:02:02"}
2265
+ {"current_steps": 2265, "total_steps": 3906, "loss": 1.359, "learning_rate": 1.529870232074853e-05, "epoch": 0.57984, "percentage": 57.99, "elapsed_time": "8:19:24", "remaining_time": "6:01:49"}
2266
+ {"current_steps": 2266, "total_steps": 3906, "loss": 1.3428, "learning_rate": 1.528290685340297e-05, "epoch": 0.580096, "percentage": 58.01, "elapsed_time": "8:19:37", "remaining_time": "6:01:35"}
2267
+ {"current_steps": 2267, "total_steps": 3906, "loss": 1.3668, "learning_rate": 1.526711450100306e-05, "epoch": 0.580352, "percentage": 58.04, "elapsed_time": "8:19:50", "remaining_time": "6:01:22"}
2268
+ {"current_steps": 2268, "total_steps": 3906, "loss": 1.3572, "learning_rate": 1.525132527397734e-05, "epoch": 0.580608, "percentage": 58.06, "elapsed_time": "8:20:03", "remaining_time": "6:01:09"}
2269
+ {"current_steps": 2269, "total_steps": 3906, "loss": 1.3532, "learning_rate": 1.523553918275226e-05, "epoch": 0.580864, "percentage": 58.09, "elapsed_time": "8:20:16", "remaining_time": "6:00:56"}
2270
+ {"current_steps": 2270, "total_steps": 3906, "loss": 1.3868, "learning_rate": 1.5219756237752208e-05, "epoch": 0.58112, "percentage": 58.12, "elapsed_time": "8:20:29", "remaining_time": "6:00:42"}
2271
+ {"current_steps": 2271, "total_steps": 3906, "loss": 1.3344, "learning_rate": 1.5203976449399496e-05, "epoch": 0.581376, "percentage": 58.14, "elapsed_time": "8:20:43", "remaining_time": "6:00:29"}
2272
+ {"current_steps": 2272, "total_steps": 3906, "loss": 1.3113, "learning_rate": 1.5188199828114351e-05, "epoch": 0.581632, "percentage": 58.17, "elapsed_time": "8:20:56", "remaining_time": "6:00:16"}
2273
+ {"current_steps": 2273, "total_steps": 3906, "loss": 1.3474, "learning_rate": 1.5172426384314913e-05, "epoch": 0.581888, "percentage": 58.19, "elapsed_time": "8:21:09", "remaining_time": "6:00:02"}
2274
+ {"current_steps": 2274, "total_steps": 3906, "loss": 1.2984, "learning_rate": 1.5156656128417222e-05, "epoch": 0.582144, "percentage": 58.22, "elapsed_time": "8:21:22", "remaining_time": "5:59:49"}
2275
+ {"current_steps": 2275, "total_steps": 3906, "loss": 1.3228, "learning_rate": 1.514088907083521e-05, "epoch": 0.5824, "percentage": 58.24, "elapsed_time": "8:21:35", "remaining_time": "5:59:36"}
2276
+ {"current_steps": 2276, "total_steps": 3906, "loss": 1.3492, "learning_rate": 1.5125125221980685e-05, "epoch": 0.582656, "percentage": 58.27, "elapsed_time": "8:21:49", "remaining_time": "5:59:23"}
2277
+ {"current_steps": 2277, "total_steps": 3906, "loss": 1.3123, "learning_rate": 1.5109364592263358e-05, "epoch": 0.582912, "percentage": 58.29, "elapsed_time": "8:22:02", "remaining_time": "5:59:09"}
2278
+ {"current_steps": 2278, "total_steps": 3906, "loss": 1.3163, "learning_rate": 1.5093607192090804e-05, "epoch": 0.583168, "percentage": 58.32, "elapsed_time": "8:22:15", "remaining_time": "5:58:56"}
2279
+ {"current_steps": 2279, "total_steps": 3906, "loss": 1.3353, "learning_rate": 1.5077853031868474e-05, "epoch": 0.583424, "percentage": 58.35, "elapsed_time": "8:22:28", "remaining_time": "5:58:43"}
2280
+ {"current_steps": 2280, "total_steps": 3906, "loss": 1.3698, "learning_rate": 1.506210212199966e-05, "epoch": 0.58368, "percentage": 58.37, "elapsed_time": "8:22:41", "remaining_time": "5:58:30"}
2281
+ {"current_steps": 2281, "total_steps": 3906, "loss": 1.3625, "learning_rate": 1.5046354472885531e-05, "epoch": 0.583936, "percentage": 58.4, "elapsed_time": "8:22:55", "remaining_time": "5:58:16"}
2282
+ {"current_steps": 2282, "total_steps": 3906, "loss": 1.3391, "learning_rate": 1.5030610094925075e-05, "epoch": 0.584192, "percentage": 58.42, "elapsed_time": "8:23:08", "remaining_time": "5:58:03"}
2283
+ {"current_steps": 2283, "total_steps": 3906, "loss": 1.3507, "learning_rate": 1.5014868998515149e-05, "epoch": 0.584448, "percentage": 58.45, "elapsed_time": "8:23:21", "remaining_time": "5:57:50"}
2284
+ {"current_steps": 2284, "total_steps": 3906, "loss": 1.369, "learning_rate": 1.4999131194050422e-05, "epoch": 0.584704, "percentage": 58.47, "elapsed_time": "8:23:34", "remaining_time": "5:57:37"}
2285
+ {"current_steps": 2285, "total_steps": 3906, "loss": 1.4044, "learning_rate": 1.4983396691923409e-05, "epoch": 0.58496, "percentage": 58.5, "elapsed_time": "8:23:47", "remaining_time": "5:57:23"}
2286
+ {"current_steps": 2286, "total_steps": 3906, "loss": 1.3208, "learning_rate": 1.496766550252442e-05, "epoch": 0.585216, "percentage": 58.53, "elapsed_time": "8:24:01", "remaining_time": "5:57:10"}
2287
+ {"current_steps": 2287, "total_steps": 3906, "loss": 1.3933, "learning_rate": 1.4951937636241596e-05, "epoch": 0.585472, "percentage": 58.55, "elapsed_time": "8:24:14", "remaining_time": "5:56:57"}
2288
+ {"current_steps": 2288, "total_steps": 3906, "loss": 1.3382, "learning_rate": 1.4936213103460887e-05, "epoch": 0.585728, "percentage": 58.58, "elapsed_time": "8:24:27", "remaining_time": "5:56:44"}
2289
+ {"current_steps": 2289, "total_steps": 3906, "loss": 1.3235, "learning_rate": 1.4920491914566006e-05, "epoch": 0.585984, "percentage": 58.6, "elapsed_time": "8:24:40", "remaining_time": "5:56:30"}
2290
+ {"current_steps": 2290, "total_steps": 3906, "loss": 1.2912, "learning_rate": 1.4904774079938506e-05, "epoch": 0.58624, "percentage": 58.63, "elapsed_time": "8:24:53", "remaining_time": "5:56:17"}
2291
+ {"current_steps": 2291, "total_steps": 3906, "loss": 1.3203, "learning_rate": 1.4889059609957701e-05, "epoch": 0.586496, "percentage": 58.65, "elapsed_time": "8:25:07", "remaining_time": "5:56:04"}
2292
+ {"current_steps": 2292, "total_steps": 3906, "loss": 1.3967, "learning_rate": 1.4873348515000674e-05, "epoch": 0.586752, "percentage": 58.68, "elapsed_time": "8:25:20", "remaining_time": "5:55:51"}
2293
+ {"current_steps": 2293, "total_steps": 3906, "loss": 1.3399, "learning_rate": 1.4857640805442299e-05, "epoch": 0.587008, "percentage": 58.7, "elapsed_time": "8:25:33", "remaining_time": "5:55:37"}
2294
+ {"current_steps": 2294, "total_steps": 3906, "loss": 1.3304, "learning_rate": 1.4841936491655214e-05, "epoch": 0.587264, "percentage": 58.73, "elapsed_time": "8:25:46", "remaining_time": "5:55:24"}
2295
+ {"current_steps": 2295, "total_steps": 3906, "loss": 1.3443, "learning_rate": 1.4826235584009787e-05, "epoch": 0.58752, "percentage": 58.76, "elapsed_time": "8:25:59", "remaining_time": "5:55:11"}
2296
+ {"current_steps": 2296, "total_steps": 3906, "loss": 1.3429, "learning_rate": 1.4810538092874166e-05, "epoch": 0.587776, "percentage": 58.78, "elapsed_time": "8:26:12", "remaining_time": "5:54:58"}
2297
+ {"current_steps": 2297, "total_steps": 3906, "loss": 1.3952, "learning_rate": 1.4794844028614241e-05, "epoch": 0.588032, "percentage": 58.81, "elapsed_time": "8:26:26", "remaining_time": "5:54:44"}
2298
+ {"current_steps": 2298, "total_steps": 3906, "loss": 1.4048, "learning_rate": 1.4779153401593615e-05, "epoch": 0.588288, "percentage": 58.83, "elapsed_time": "8:26:39", "remaining_time": "5:54:31"}
2299
+ {"current_steps": 2299, "total_steps": 3906, "loss": 1.3477, "learning_rate": 1.4763466222173651e-05, "epoch": 0.588544, "percentage": 58.86, "elapsed_time": "8:26:52", "remaining_time": "5:54:18"}
2300
+ {"current_steps": 2300, "total_steps": 3906, "loss": 1.3468, "learning_rate": 1.4747782500713424e-05, "epoch": 0.5888, "percentage": 58.88, "elapsed_time": "8:27:05", "remaining_time": "5:54:05"}
2301
+ {"current_steps": 2301, "total_steps": 3906, "loss": 1.3561, "learning_rate": 1.4732102247569707e-05, "epoch": 0.589056, "percentage": 58.91, "elapsed_time": "8:27:18", "remaining_time": "5:53:51"}
2302
+ {"current_steps": 2302, "total_steps": 3906, "loss": 1.3202, "learning_rate": 1.4716425473097014e-05, "epoch": 0.589312, "percentage": 58.93, "elapsed_time": "8:27:32", "remaining_time": "5:53:38"}
2303
+ {"current_steps": 2303, "total_steps": 3906, "loss": 1.3332, "learning_rate": 1.4700752187647536e-05, "epoch": 0.589568, "percentage": 58.96, "elapsed_time": "8:27:45", "remaining_time": "5:53:25"}
2304
+ {"current_steps": 2304, "total_steps": 3906, "loss": 1.3379, "learning_rate": 1.4685082401571175e-05, "epoch": 0.589824, "percentage": 58.99, "elapsed_time": "8:27:58", "remaining_time": "5:53:12"}
2305
+ {"current_steps": 2305, "total_steps": 3906, "loss": 1.3686, "learning_rate": 1.4669416125215521e-05, "epoch": 0.59008, "percentage": 59.01, "elapsed_time": "8:28:11", "remaining_time": "5:52:58"}
2306
+ {"current_steps": 2306, "total_steps": 3906, "loss": 1.3453, "learning_rate": 1.4653753368925849e-05, "epoch": 0.590336, "percentage": 59.04, "elapsed_time": "8:28:24", "remaining_time": "5:52:45"}
2307
+ {"current_steps": 2307, "total_steps": 3906, "loss": 1.333, "learning_rate": 1.463809414304509e-05, "epoch": 0.590592, "percentage": 59.06, "elapsed_time": "8:28:37", "remaining_time": "5:52:32"}
2308
+ {"current_steps": 2308, "total_steps": 3906, "loss": 1.347, "learning_rate": 1.4622438457913868e-05, "epoch": 0.590848, "percentage": 59.09, "elapsed_time": "8:28:51", "remaining_time": "5:52:18"}
2309
+ {"current_steps": 2309, "total_steps": 3906, "loss": 1.3266, "learning_rate": 1.4606786323870453e-05, "epoch": 0.591104, "percentage": 59.11, "elapsed_time": "8:29:04", "remaining_time": "5:52:05"}
2310
+ {"current_steps": 2310, "total_steps": 3906, "loss": 1.3701, "learning_rate": 1.4591137751250773e-05, "epoch": 0.59136, "percentage": 59.14, "elapsed_time": "8:29:17", "remaining_time": "5:51:52"}
2311
+ {"current_steps": 2311, "total_steps": 3906, "loss": 1.355, "learning_rate": 1.4575492750388414e-05, "epoch": 0.591616, "percentage": 59.17, "elapsed_time": "8:29:30", "remaining_time": "5:51:39"}
2312
+ {"current_steps": 2312, "total_steps": 3906, "loss": 1.3478, "learning_rate": 1.4559851331614599e-05, "epoch": 0.591872, "percentage": 59.19, "elapsed_time": "8:29:43", "remaining_time": "5:51:25"}
2313
+ {"current_steps": 2313, "total_steps": 3906, "loss": 1.3624, "learning_rate": 1.454421350525817e-05, "epoch": 0.592128, "percentage": 59.22, "elapsed_time": "8:29:57", "remaining_time": "5:51:12"}
2314
+ {"current_steps": 2314, "total_steps": 3906, "loss": 1.324, "learning_rate": 1.452857928164562e-05, "epoch": 0.592384, "percentage": 59.24, "elapsed_time": "8:30:10", "remaining_time": "5:50:59"}
2315
+ {"current_steps": 2315, "total_steps": 3906, "loss": 1.3658, "learning_rate": 1.4512948671101044e-05, "epoch": 0.59264, "percentage": 59.27, "elapsed_time": "8:30:23", "remaining_time": "5:50:46"}
2316
+ {"current_steps": 2316, "total_steps": 3906, "loss": 1.3169, "learning_rate": 1.4497321683946164e-05, "epoch": 0.592896, "percentage": 59.29, "elapsed_time": "8:30:36", "remaining_time": "5:50:32"}
2317
+ {"current_steps": 2317, "total_steps": 3906, "loss": 1.3617, "learning_rate": 1.4481698330500305e-05, "epoch": 0.593152, "percentage": 59.32, "elapsed_time": "8:30:49", "remaining_time": "5:50:19"}
2318
+ {"current_steps": 2318, "total_steps": 3906, "loss": 1.3367, "learning_rate": 1.44660786210804e-05, "epoch": 0.593408, "percentage": 59.34, "elapsed_time": "8:31:03", "remaining_time": "5:50:06"}
2319
+ {"current_steps": 2319, "total_steps": 3906, "loss": 1.3634, "learning_rate": 1.4450462566000949e-05, "epoch": 0.593664, "percentage": 59.37, "elapsed_time": "8:31:16", "remaining_time": "5:49:53"}
2320
+ {"current_steps": 2320, "total_steps": 3906, "loss": 1.344, "learning_rate": 1.4434850175574075e-05, "epoch": 0.59392, "percentage": 59.4, "elapsed_time": "8:31:29", "remaining_time": "5:49:39"}
2321
+ {"current_steps": 2321, "total_steps": 3906, "loss": 1.3282, "learning_rate": 1.441924146010945e-05, "epoch": 0.594176, "percentage": 59.42, "elapsed_time": "8:31:42", "remaining_time": "5:49:26"}
2322
+ {"current_steps": 2322, "total_steps": 3906, "loss": 1.3412, "learning_rate": 1.4403636429914341e-05, "epoch": 0.594432, "percentage": 59.45, "elapsed_time": "8:31:55", "remaining_time": "5:49:13"}
2323
+ {"current_steps": 2323, "total_steps": 3906, "loss": 1.3116, "learning_rate": 1.4388035095293574e-05, "epoch": 0.594688, "percentage": 59.47, "elapsed_time": "8:32:09", "remaining_time": "5:49:00"}
2324
+ {"current_steps": 2324, "total_steps": 3906, "loss": 1.3449, "learning_rate": 1.4372437466549538e-05, "epoch": 0.594944, "percentage": 59.5, "elapsed_time": "8:32:22", "remaining_time": "5:48:46"}
2325
+ {"current_steps": 2325, "total_steps": 3906, "loss": 1.3284, "learning_rate": 1.435684355398216e-05, "epoch": 0.5952, "percentage": 59.52, "elapsed_time": "8:32:35", "remaining_time": "5:48:33"}
2326
+ {"current_steps": 2326, "total_steps": 3906, "loss": 1.3818, "learning_rate": 1.4341253367888927e-05, "epoch": 0.595456, "percentage": 59.55, "elapsed_time": "8:32:48", "remaining_time": "5:48:20"}
2327
+ {"current_steps": 2327, "total_steps": 3906, "loss": 1.3511, "learning_rate": 1.4325666918564864e-05, "epoch": 0.595712, "percentage": 59.58, "elapsed_time": "8:33:01", "remaining_time": "5:48:07"}
2328
+ {"current_steps": 2328, "total_steps": 3906, "loss": 1.3277, "learning_rate": 1.4310084216302525e-05, "epoch": 0.595968, "percentage": 59.6, "elapsed_time": "8:33:15", "remaining_time": "5:47:53"}
2329
+ {"current_steps": 2329, "total_steps": 3906, "loss": 1.3383, "learning_rate": 1.4294505271391996e-05, "epoch": 0.596224, "percentage": 59.63, "elapsed_time": "8:33:28", "remaining_time": "5:47:40"}
2330
+ {"current_steps": 2330, "total_steps": 3906, "loss": 1.3407, "learning_rate": 1.4278930094120873e-05, "epoch": 0.59648, "percentage": 59.65, "elapsed_time": "8:33:41", "remaining_time": "5:47:27"}
2331
+ {"current_steps": 2331, "total_steps": 3906, "loss": 1.3526, "learning_rate": 1.4263358694774265e-05, "epoch": 0.596736, "percentage": 59.68, "elapsed_time": "8:33:54", "remaining_time": "5:47:14"}
2332
+ {"current_steps": 2332, "total_steps": 3906, "loss": 1.333, "learning_rate": 1.4247791083634793e-05, "epoch": 0.596992, "percentage": 59.7, "elapsed_time": "8:34:07", "remaining_time": "5:47:00"}
2333
+ {"current_steps": 2333, "total_steps": 3906, "loss": 1.3408, "learning_rate": 1.4232227270982568e-05, "epoch": 0.597248, "percentage": 59.73, "elapsed_time": "8:34:20", "remaining_time": "5:46:47"}
2334
+ {"current_steps": 2334, "total_steps": 3906, "loss": 1.4125, "learning_rate": 1.4216667267095201e-05, "epoch": 0.597504, "percentage": 59.75, "elapsed_time": "8:34:33", "remaining_time": "5:46:34"}
2335
+ {"current_steps": 2335, "total_steps": 3906, "loss": 1.2867, "learning_rate": 1.4201111082247789e-05, "epoch": 0.59776, "percentage": 59.78, "elapsed_time": "8:34:47", "remaining_time": "5:46:21"}
2336
+ {"current_steps": 2336, "total_steps": 3906, "loss": 1.326, "learning_rate": 1.4185558726712897e-05, "epoch": 0.598016, "percentage": 59.81, "elapsed_time": "8:35:00", "remaining_time": "5:46:07"}
2337
+ {"current_steps": 2337, "total_steps": 3906, "loss": 1.3442, "learning_rate": 1.4170010210760565e-05, "epoch": 0.598272, "percentage": 59.83, "elapsed_time": "8:35:13", "remaining_time": "5:45:54"}
2338
+ {"current_steps": 2338, "total_steps": 3906, "loss": 1.3752, "learning_rate": 1.41544655446583e-05, "epoch": 0.598528, "percentage": 59.86, "elapsed_time": "8:35:26", "remaining_time": "5:45:41"}
2339
+ {"current_steps": 2339, "total_steps": 3906, "loss": 1.3174, "learning_rate": 1.4138924738671062e-05, "epoch": 0.598784, "percentage": 59.88, "elapsed_time": "8:35:39", "remaining_time": "5:45:28"}
2340
+ {"current_steps": 2340, "total_steps": 3906, "loss": 1.344, "learning_rate": 1.4123387803061272e-05, "epoch": 0.59904, "percentage": 59.91, "elapsed_time": "8:35:53", "remaining_time": "5:45:14"}
2341
+ {"current_steps": 2341, "total_steps": 3906, "loss": 1.3694, "learning_rate": 1.4107854748088793e-05, "epoch": 0.599296, "percentage": 59.93, "elapsed_time": "8:36:06", "remaining_time": "5:45:01"}
2342
+ {"current_steps": 2342, "total_steps": 3906, "loss": 1.3005, "learning_rate": 1.409232558401091e-05, "epoch": 0.599552, "percentage": 59.96, "elapsed_time": "8:36:19", "remaining_time": "5:44:48"}
2343
+ {"current_steps": 2343, "total_steps": 3906, "loss": 1.3493, "learning_rate": 1.407680032108236e-05, "epoch": 0.599808, "percentage": 59.98, "elapsed_time": "8:36:32", "remaining_time": "5:44:34"}
2344
+ {"current_steps": 2344, "total_steps": 3906, "loss": 1.3569, "learning_rate": 1.4061278969555282e-05, "epoch": 0.600064, "percentage": 60.01, "elapsed_time": "8:36:45", "remaining_time": "5:44:21"}
2345
+ {"current_steps": 2345, "total_steps": 3906, "loss": 1.3337, "learning_rate": 1.4045761539679252e-05, "epoch": 0.60032, "percentage": 60.04, "elapsed_time": "8:36:59", "remaining_time": "5:44:08"}
2346
+ {"current_steps": 2346, "total_steps": 3906, "loss": 1.3501, "learning_rate": 1.403024804170125e-05, "epoch": 0.600576, "percentage": 60.06, "elapsed_time": "8:37:12", "remaining_time": "5:43:55"}
2347
+ {"current_steps": 2347, "total_steps": 3906, "loss": 1.338, "learning_rate": 1.4014738485865653e-05, "epoch": 0.600832, "percentage": 60.09, "elapsed_time": "8:37:25", "remaining_time": "5:43:42"}
2348
+ {"current_steps": 2348, "total_steps": 3906, "loss": 1.3361, "learning_rate": 1.3999232882414243e-05, "epoch": 0.601088, "percentage": 60.11, "elapsed_time": "8:37:38", "remaining_time": "5:43:28"}
2349
+ {"current_steps": 2349, "total_steps": 3906, "loss": 1.3227, "learning_rate": 1.3983731241586191e-05, "epoch": 0.601344, "percentage": 60.14, "elapsed_time": "8:37:51", "remaining_time": "5:43:15"}
2350
+ {"current_steps": 2350, "total_steps": 3906, "loss": 1.3499, "learning_rate": 1.3968233573618037e-05, "epoch": 0.6016, "percentage": 60.16, "elapsed_time": "8:38:05", "remaining_time": "5:43:02"}
2351
+ {"current_steps": 2351, "total_steps": 3906, "loss": 1.3698, "learning_rate": 1.395273988874372e-05, "epoch": 0.601856, "percentage": 60.19, "elapsed_time": "8:38:18", "remaining_time": "5:42:49"}
2352
+ {"current_steps": 2352, "total_steps": 3906, "loss": 1.32, "learning_rate": 1.3937250197194538e-05, "epoch": 0.602112, "percentage": 60.22, "elapsed_time": "8:38:31", "remaining_time": "5:42:35"}
2353
+ {"current_steps": 2353, "total_steps": 3906, "loss": 1.3726, "learning_rate": 1.3921764509199144e-05, "epoch": 0.602368, "percentage": 60.24, "elapsed_time": "8:38:44", "remaining_time": "5:42:22"}
2354
+ {"current_steps": 2354, "total_steps": 3906, "loss": 1.3179, "learning_rate": 1.3906282834983565e-05, "epoch": 0.602624, "percentage": 60.27, "elapsed_time": "8:38:57", "remaining_time": "5:42:09"}
2355
+ {"current_steps": 2355, "total_steps": 3906, "loss": 1.3654, "learning_rate": 1.3890805184771172e-05, "epoch": 0.60288, "percentage": 60.29, "elapsed_time": "8:39:10", "remaining_time": "5:41:55"}
2356
+ {"current_steps": 2356, "total_steps": 3906, "loss": 1.3314, "learning_rate": 1.3875331568782655e-05, "epoch": 0.603136, "percentage": 60.32, "elapsed_time": "8:39:24", "remaining_time": "5:41:42"}
2357
+ {"current_steps": 2357, "total_steps": 3906, "loss": 1.3368, "learning_rate": 1.3859861997236072e-05, "epoch": 0.603392, "percentage": 60.34, "elapsed_time": "8:39:37", "remaining_time": "5:41:29"}
2358
+ {"current_steps": 2358, "total_steps": 3906, "loss": 1.3414, "learning_rate": 1.3844396480346802e-05, "epoch": 0.603648, "percentage": 60.37, "elapsed_time": "8:39:50", "remaining_time": "5:41:16"}
2359
+ {"current_steps": 2359, "total_steps": 3906, "loss": 1.3797, "learning_rate": 1.3828935028327534e-05, "epoch": 0.603904, "percentage": 60.39, "elapsed_time": "8:40:03", "remaining_time": "5:41:02"}
2360
+ {"current_steps": 2360, "total_steps": 3906, "loss": 1.3844, "learning_rate": 1.3813477651388284e-05, "epoch": 0.60416, "percentage": 60.42, "elapsed_time": "8:40:16", "remaining_time": "5:40:49"}
2361
+ {"current_steps": 2361, "total_steps": 3906, "loss": 1.3276, "learning_rate": 1.379802435973638e-05, "epoch": 0.604416, "percentage": 60.45, "elapsed_time": "8:40:30", "remaining_time": "5:40:36"}
2362
+ {"current_steps": 2362, "total_steps": 3906, "loss": 1.35, "learning_rate": 1.3782575163576435e-05, "epoch": 0.604672, "percentage": 60.47, "elapsed_time": "8:40:43", "remaining_time": "5:40:23"}
2363
+ {"current_steps": 2363, "total_steps": 3906, "loss": 1.3307, "learning_rate": 1.3767130073110376e-05, "epoch": 0.604928, "percentage": 60.5, "elapsed_time": "8:40:56", "remaining_time": "5:40:09"}
2364
+ {"current_steps": 2364, "total_steps": 3906, "loss": 1.3843, "learning_rate": 1.3751689098537414e-05, "epoch": 0.605184, "percentage": 60.52, "elapsed_time": "8:41:09", "remaining_time": "5:39:56"}
2365
+ {"current_steps": 2365, "total_steps": 3906, "loss": 1.348, "learning_rate": 1.373625225005403e-05, "epoch": 0.60544, "percentage": 60.55, "elapsed_time": "8:41:22", "remaining_time": "5:39:43"}
2366
+ {"current_steps": 2366, "total_steps": 3906, "loss": 1.3397, "learning_rate": 1.3720819537853998e-05, "epoch": 0.605696, "percentage": 60.57, "elapsed_time": "8:41:35", "remaining_time": "5:39:30"}
2367
+ {"current_steps": 2367, "total_steps": 3906, "loss": 1.3603, "learning_rate": 1.370539097212836e-05, "epoch": 0.605952, "percentage": 60.6, "elapsed_time": "8:41:49", "remaining_time": "5:39:16"}
2368
+ {"current_steps": 2368, "total_steps": 3906, "loss": 1.3604, "learning_rate": 1.3689966563065394e-05, "epoch": 0.606208, "percentage": 60.62, "elapsed_time": "8:42:02", "remaining_time": "5:39:03"}
2369
+ {"current_steps": 2369, "total_steps": 3906, "loss": 1.3065, "learning_rate": 1.3674546320850661e-05, "epoch": 0.606464, "percentage": 60.65, "elapsed_time": "8:42:15", "remaining_time": "5:38:50"}
2370
+ {"current_steps": 2370, "total_steps": 3906, "loss": 1.3772, "learning_rate": 1.3659130255666968e-05, "epoch": 0.60672, "percentage": 60.68, "elapsed_time": "8:42:28", "remaining_time": "5:38:37"}
2371
+ {"current_steps": 2371, "total_steps": 3906, "loss": 1.322, "learning_rate": 1.3643718377694341e-05, "epoch": 0.606976, "percentage": 60.7, "elapsed_time": "8:42:41", "remaining_time": "5:38:23"}
2372
+ {"current_steps": 2372, "total_steps": 3906, "loss": 1.3018, "learning_rate": 1.3628310697110073e-05, "epoch": 0.607232, "percentage": 60.73, "elapsed_time": "8:42:55", "remaining_time": "5:38:10"}
2373
+ {"current_steps": 2373, "total_steps": 3906, "loss": 1.3251, "learning_rate": 1.3612907224088665e-05, "epoch": 0.607488, "percentage": 60.75, "elapsed_time": "8:43:08", "remaining_time": "5:37:57"}
2374
+ {"current_steps": 2374, "total_steps": 3906, "loss": 1.3011, "learning_rate": 1.3597507968801834e-05, "epoch": 0.607744, "percentage": 60.78, "elapsed_time": "8:43:21", "remaining_time": "5:37:44"}
2375
+ {"current_steps": 2375, "total_steps": 3906, "loss": 1.3177, "learning_rate": 1.3582112941418531e-05, "epoch": 0.608, "percentage": 60.8, "elapsed_time": "8:43:34", "remaining_time": "5:37:30"}
2376
+ {"current_steps": 2376, "total_steps": 3906, "loss": 1.3316, "learning_rate": 1.3566722152104897e-05, "epoch": 0.608256, "percentage": 60.83, "elapsed_time": "8:43:47", "remaining_time": "5:37:17"}
2377
+ {"current_steps": 2377, "total_steps": 3906, "loss": 1.3337, "learning_rate": 1.355133561102429e-05, "epoch": 0.608512, "percentage": 60.86, "elapsed_time": "8:44:01", "remaining_time": "5:37:04"}
2378
+ {"current_steps": 2378, "total_steps": 3906, "loss": 1.3536, "learning_rate": 1.353595332833725e-05, "epoch": 0.608768, "percentage": 60.88, "elapsed_time": "8:44:14", "remaining_time": "5:36:51"}
2379
+ {"current_steps": 2379, "total_steps": 3906, "loss": 1.3612, "learning_rate": 1.3520575314201524e-05, "epoch": 0.609024, "percentage": 60.91, "elapsed_time": "8:44:27", "remaining_time": "5:36:37"}
2380
+ {"current_steps": 2380, "total_steps": 3906, "loss": 1.3037, "learning_rate": 1.3505201578772009e-05, "epoch": 0.60928, "percentage": 60.93, "elapsed_time": "8:44:40", "remaining_time": "5:36:24"}
2381
+ {"current_steps": 2381, "total_steps": 3906, "loss": 1.3915, "learning_rate": 1.3489832132200804e-05, "epoch": 0.609536, "percentage": 60.96, "elapsed_time": "8:44:53", "remaining_time": "5:36:11"}
2382
+ {"current_steps": 2382, "total_steps": 3906, "loss": 1.3088, "learning_rate": 1.347446698463716e-05, "epoch": 0.609792, "percentage": 60.98, "elapsed_time": "8:45:07", "remaining_time": "5:35:58"}
2383
+ {"current_steps": 2383, "total_steps": 3906, "loss": 1.3407, "learning_rate": 1.34591061462275e-05, "epoch": 0.610048, "percentage": 61.01, "elapsed_time": "8:45:20", "remaining_time": "5:35:45"}
2384
+ {"current_steps": 2384, "total_steps": 3906, "loss": 1.3676, "learning_rate": 1.3443749627115397e-05, "epoch": 0.610304, "percentage": 61.03, "elapsed_time": "8:45:33", "remaining_time": "5:35:31"}
2385
+ {"current_steps": 2385, "total_steps": 3906, "loss": 1.3701, "learning_rate": 1.3428397437441573e-05, "epoch": 0.61056, "percentage": 61.06, "elapsed_time": "8:45:46", "remaining_time": "5:35:18"}
2386
+ {"current_steps": 2386, "total_steps": 3906, "loss": 1.3546, "learning_rate": 1.341304958734388e-05, "epoch": 0.610816, "percentage": 61.09, "elapsed_time": "8:45:59", "remaining_time": "5:35:05"}
2387
+ {"current_steps": 2387, "total_steps": 3906, "loss": 1.3407, "learning_rate": 1.3397706086957328e-05, "epoch": 0.611072, "percentage": 61.11, "elapsed_time": "8:46:12", "remaining_time": "5:34:51"}
2388
+ {"current_steps": 2388, "total_steps": 3906, "loss": 1.3157, "learning_rate": 1.3382366946414023e-05, "epoch": 0.611328, "percentage": 61.14, "elapsed_time": "8:46:26", "remaining_time": "5:34:38"}
2389
+ {"current_steps": 2389, "total_steps": 3906, "loss": 1.3468, "learning_rate": 1.336703217584322e-05, "epoch": 0.611584, "percentage": 61.16, "elapsed_time": "8:46:39", "remaining_time": "5:34:25"}
2390
+ {"current_steps": 2390, "total_steps": 3906, "loss": 1.3113, "learning_rate": 1.3351701785371275e-05, "epoch": 0.61184, "percentage": 61.19, "elapsed_time": "8:46:52", "remaining_time": "5:34:12"}
2391
+ {"current_steps": 2391, "total_steps": 3906, "loss": 1.3478, "learning_rate": 1.3336375785121667e-05, "epoch": 0.612096, "percentage": 61.21, "elapsed_time": "8:47:05", "remaining_time": "5:33:58"}
2392
+ {"current_steps": 2392, "total_steps": 3906, "loss": 1.4023, "learning_rate": 1.3321054185214941e-05, "epoch": 0.612352, "percentage": 61.24, "elapsed_time": "8:47:18", "remaining_time": "5:33:45"}
2393
+ {"current_steps": 2393, "total_steps": 3906, "loss": 1.3113, "learning_rate": 1.3305736995768774e-05, "epoch": 0.612608, "percentage": 61.26, "elapsed_time": "8:47:31", "remaining_time": "5:33:32"}
2394
+ {"current_steps": 2394, "total_steps": 3906, "loss": 1.3419, "learning_rate": 1.3290424226897907e-05, "epoch": 0.612864, "percentage": 61.29, "elapsed_time": "8:47:45", "remaining_time": "5:33:19"}
2395
+ {"current_steps": 2395, "total_steps": 3906, "loss": 1.3816, "learning_rate": 1.327511588871417e-05, "epoch": 0.61312, "percentage": 61.32, "elapsed_time": "8:47:58", "remaining_time": "5:33:05"}
2396
+ {"current_steps": 2396, "total_steps": 3906, "loss": 1.3036, "learning_rate": 1.3259811991326472e-05, "epoch": 0.613376, "percentage": 61.34, "elapsed_time": "8:48:11", "remaining_time": "5:32:52"}
2397
+ {"current_steps": 2397, "total_steps": 3906, "loss": 1.3585, "learning_rate": 1.324451254484079e-05, "epoch": 0.613632, "percentage": 61.37, "elapsed_time": "8:48:24", "remaining_time": "5:32:39"}
2398
+ {"current_steps": 2398, "total_steps": 3906, "loss": 1.3528, "learning_rate": 1.3229217559360143e-05, "epoch": 0.613888, "percentage": 61.39, "elapsed_time": "8:48:37", "remaining_time": "5:32:25"}
2399
+ {"current_steps": 2399, "total_steps": 3906, "loss": 1.3494, "learning_rate": 1.3213927044984622e-05, "epoch": 0.614144, "percentage": 61.42, "elapsed_time": "8:48:50", "remaining_time": "5:32:12"}
2400
+ {"current_steps": 2400, "total_steps": 3906, "loss": 1.364, "learning_rate": 1.319864101181136e-05, "epoch": 0.6144, "percentage": 61.44, "elapsed_time": "8:49:04", "remaining_time": "5:31:59"}
2401
+ {"current_steps": 2401, "total_steps": 3906, "loss": 1.3237, "learning_rate": 1.318335946993453e-05, "epoch": 0.614656, "percentage": 61.47, "elapsed_time": "8:49:37", "remaining_time": "5:31:58"}
2402
+ {"current_steps": 2402, "total_steps": 3906, "loss": 1.356, "learning_rate": 1.3168082429445348e-05, "epoch": 0.614912, "percentage": 61.5, "elapsed_time": "8:49:50", "remaining_time": "5:31:45"}
2403
+ {"current_steps": 2403, "total_steps": 3906, "loss": 1.3067, "learning_rate": 1.3152809900432058e-05, "epoch": 0.615168, "percentage": 61.52, "elapsed_time": "8:50:03", "remaining_time": "5:31:32"}
2404
+ {"current_steps": 2404, "total_steps": 3906, "loss": 1.3554, "learning_rate": 1.3137541892979897e-05, "epoch": 0.615424, "percentage": 61.55, "elapsed_time": "8:50:16", "remaining_time": "5:31:18"}
2405
+ {"current_steps": 2405, "total_steps": 3906, "loss": 1.3321, "learning_rate": 1.3122278417171144e-05, "epoch": 0.61568, "percentage": 61.57, "elapsed_time": "8:50:29", "remaining_time": "5:31:05"}
2406
+ {"current_steps": 2406, "total_steps": 3906, "loss": 1.3395, "learning_rate": 1.3107019483085077e-05, "epoch": 0.615936, "percentage": 61.6, "elapsed_time": "8:50:43", "remaining_time": "5:30:52"}
2407
+ {"current_steps": 2407, "total_steps": 3906, "loss": 1.383, "learning_rate": 1.3091765100797981e-05, "epoch": 0.616192, "percentage": 61.62, "elapsed_time": "8:50:56", "remaining_time": "5:30:39"}
2408
+ {"current_steps": 2408, "total_steps": 3906, "loss": 1.322, "learning_rate": 1.307651528038313e-05, "epoch": 0.616448, "percentage": 61.65, "elapsed_time": "8:51:09", "remaining_time": "5:30:25"}
2409
+ {"current_steps": 2409, "total_steps": 3906, "loss": 1.3924, "learning_rate": 1.3061270031910787e-05, "epoch": 0.616704, "percentage": 61.67, "elapsed_time": "8:51:22", "remaining_time": "5:30:12"}
2410
+ {"current_steps": 2410, "total_steps": 3906, "loss": 1.321, "learning_rate": 1.3046029365448187e-05, "epoch": 0.61696, "percentage": 61.7, "elapsed_time": "8:51:35", "remaining_time": "5:29:59"}
2411
+ {"current_steps": 2411, "total_steps": 3906, "loss": 1.3785, "learning_rate": 1.3030793291059545e-05, "epoch": 0.617216, "percentage": 61.73, "elapsed_time": "8:51:49", "remaining_time": "5:29:46"}
2412
+ {"current_steps": 2412, "total_steps": 3906, "loss": 1.3771, "learning_rate": 1.3015561818806055e-05, "epoch": 0.617472, "percentage": 61.75, "elapsed_time": "8:52:02", "remaining_time": "5:29:32"}
2413
+ {"current_steps": 2413, "total_steps": 3906, "loss": 1.3389, "learning_rate": 1.3000334958745856e-05, "epoch": 0.617728, "percentage": 61.78, "elapsed_time": "8:52:15", "remaining_time": "5:29:19"}